1 // SPDX-License-Identifier: GPL-2.0 2 /* 3 * This file contains instructions for testing by the test titled: 4 * 5 * "Test x86 instruction decoder - new instructions" 6 * 7 * Note that the 'Expecting' comment lines are consumed by the 8 * gen-insn-x86-dat.awk script and have the format: 9 * 10 * Expecting: <op> <branch> <rel> 11 * 12 * If this file is changed, remember to run the gen-insn-x86-dat.sh 13 * script and commit the result. 14 * 15 * Refer to insn-x86.c for more details. 16 */ 17 18 int main(void) 19 { 20 /* Following line is a marker for the awk script - do not change */ 21 asm volatile("rdtsc"); /* Start here */ 22 23 /* Test fix for vcvtph2ps in x86-opcode-map.txt */ 24 25 asm volatile("vcvtph2ps %xmm3,%ymm5"); 26 27 #ifdef __x86_64__ 28 29 /* AVX-512: Instructions with the same op codes as Mask Instructions */ 30 31 asm volatile("cmovno %rax,%rbx"); 32 asm volatile("cmovno 0x12345678(%rax),%rcx"); 33 asm volatile("cmovno 0x12345678(%rax),%cx"); 34 35 asm volatile("cmove %rax,%rbx"); 36 asm volatile("cmove 0x12345678(%rax),%rcx"); 37 asm volatile("cmove 0x12345678(%rax),%cx"); 38 39 asm volatile("seto 0x12345678(%rax)"); 40 asm volatile("setno 0x12345678(%rax)"); 41 asm volatile("setb 0x12345678(%rax)"); 42 asm volatile("setc 0x12345678(%rax)"); 43 asm volatile("setnae 0x12345678(%rax)"); 44 asm volatile("setae 0x12345678(%rax)"); 45 asm volatile("setnb 0x12345678(%rax)"); 46 asm volatile("setnc 0x12345678(%rax)"); 47 asm volatile("sets 0x12345678(%rax)"); 48 asm volatile("setns 0x12345678(%rax)"); 49 50 /* AVX-512: Mask Instructions */ 51 52 asm volatile("kandw %k7,%k6,%k5"); 53 asm volatile("kandq %k7,%k6,%k5"); 54 asm volatile("kandb %k7,%k6,%k5"); 55 asm volatile("kandd %k7,%k6,%k5"); 56 57 asm volatile("kandnw %k7,%k6,%k5"); 58 asm volatile("kandnq %k7,%k6,%k5"); 59 asm volatile("kandnb %k7,%k6,%k5"); 60 asm volatile("kandnd %k7,%k6,%k5"); 61 62 asm volatile("knotw %k7,%k6"); 63 asm volatile("knotq %k7,%k6"); 64 asm volatile("knotb %k7,%k6"); 65 
asm volatile("knotd %k7,%k6"); 66 67 asm volatile("korw %k7,%k6,%k5"); 68 asm volatile("korq %k7,%k6,%k5"); 69 asm volatile("korb %k7,%k6,%k5"); 70 asm volatile("kord %k7,%k6,%k5"); 71 72 asm volatile("kxnorw %k7,%k6,%k5"); 73 asm volatile("kxnorq %k7,%k6,%k5"); 74 asm volatile("kxnorb %k7,%k6,%k5"); 75 asm volatile("kxnord %k7,%k6,%k5"); 76 77 asm volatile("kxorw %k7,%k6,%k5"); 78 asm volatile("kxorq %k7,%k6,%k5"); 79 asm volatile("kxorb %k7,%k6,%k5"); 80 asm volatile("kxord %k7,%k6,%k5"); 81 82 asm volatile("kaddw %k7,%k6,%k5"); 83 asm volatile("kaddq %k7,%k6,%k5"); 84 asm volatile("kaddb %k7,%k6,%k5"); 85 asm volatile("kaddd %k7,%k6,%k5"); 86 87 asm volatile("kunpckbw %k7,%k6,%k5"); 88 asm volatile("kunpckwd %k7,%k6,%k5"); 89 asm volatile("kunpckdq %k7,%k6,%k5"); 90 91 asm volatile("kmovw %k6,%k5"); 92 asm volatile("kmovw (%rcx),%k5"); 93 asm volatile("kmovw 0x123(%rax,%r14,8),%k5"); 94 asm volatile("kmovw %k5,(%rcx)"); 95 asm volatile("kmovw %k5,0x123(%rax,%r14,8)"); 96 asm volatile("kmovw %eax,%k5"); 97 asm volatile("kmovw %ebp,%k5"); 98 asm volatile("kmovw %r13d,%k5"); 99 asm volatile("kmovw %k5,%eax"); 100 asm volatile("kmovw %k5,%ebp"); 101 asm volatile("kmovw %k5,%r13d"); 102 103 asm volatile("kmovq %k6,%k5"); 104 asm volatile("kmovq (%rcx),%k5"); 105 asm volatile("kmovq 0x123(%rax,%r14,8),%k5"); 106 asm volatile("kmovq %k5,(%rcx)"); 107 asm volatile("kmovq %k5,0x123(%rax,%r14,8)"); 108 asm volatile("kmovq %rax,%k5"); 109 asm volatile("kmovq %rbp,%k5"); 110 asm volatile("kmovq %r13,%k5"); 111 asm volatile("kmovq %k5,%rax"); 112 asm volatile("kmovq %k5,%rbp"); 113 asm volatile("kmovq %k5,%r13"); 114 115 asm volatile("kmovb %k6,%k5"); 116 asm volatile("kmovb (%rcx),%k5"); 117 asm volatile("kmovb 0x123(%rax,%r14,8),%k5"); 118 asm volatile("kmovb %k5,(%rcx)"); 119 asm volatile("kmovb %k5,0x123(%rax,%r14,8)"); 120 asm volatile("kmovb %eax,%k5"); 121 asm volatile("kmovb %ebp,%k5"); 122 asm volatile("kmovb %r13d,%k5"); 123 asm volatile("kmovb %k5,%eax"); 124 asm 
volatile("kmovb %k5,%ebp"); 125 asm volatile("kmovb %k5,%r13d"); 126 127 asm volatile("kmovd %k6,%k5"); 128 asm volatile("kmovd (%rcx),%k5"); 129 asm volatile("kmovd 0x123(%rax,%r14,8),%k5"); 130 asm volatile("kmovd %k5,(%rcx)"); 131 asm volatile("kmovd %k5,0x123(%rax,%r14,8)"); 132 asm volatile("kmovd %eax,%k5"); 133 asm volatile("kmovd %ebp,%k5"); 134 asm volatile("kmovd %r13d,%k5"); 135 asm volatile("kmovd %k5,%eax"); 136 asm volatile("kmovd %k5,%ebp"); 137 asm volatile("kmovd %k5,%r13d"); 138 139 asm volatile("kortestw %k6,%k5"); 140 asm volatile("kortestq %k6,%k5"); 141 asm volatile("kortestb %k6,%k5"); 142 asm volatile("kortestd %k6,%k5"); 143 144 asm volatile("ktestw %k6,%k5"); 145 asm volatile("ktestq %k6,%k5"); 146 asm volatile("ktestb %k6,%k5"); 147 asm volatile("ktestd %k6,%k5"); 148 149 asm volatile("kshiftrw $0x12,%k6,%k5"); 150 asm volatile("kshiftrq $0x5b,%k6,%k5"); 151 asm volatile("kshiftlw $0x12,%k6,%k5"); 152 asm volatile("kshiftlq $0x5b,%k6,%k5"); 153 154 /* AVX-512: Op code 0f 5b */ 155 asm volatile("vcvtdq2ps %xmm5,%xmm6"); 156 asm volatile("vcvtqq2ps %zmm29,%ymm6{%k7}"); 157 asm volatile("vcvtps2dq %xmm5,%xmm6"); 158 asm volatile("vcvttps2dq %xmm5,%xmm6"); 159 160 /* AVX-512: Op code 0f 6f */ 161 162 asm volatile("movq %mm0,%mm4"); 163 asm volatile("vmovdqa %ymm4,%ymm6"); 164 asm volatile("vmovdqa32 %zmm25,%zmm26"); 165 asm volatile("vmovdqa64 %zmm25,%zmm26"); 166 asm volatile("vmovdqu %ymm4,%ymm6"); 167 asm volatile("vmovdqu32 %zmm29,%zmm30"); 168 asm volatile("vmovdqu64 %zmm25,%zmm26"); 169 asm volatile("vmovdqu8 %zmm29,%zmm30"); 170 asm volatile("vmovdqu16 %zmm25,%zmm26"); 171 172 /* AVX-512: Op code 0f 78 */ 173 174 asm volatile("vmread %rax,%rbx"); 175 asm volatile("vcvttps2udq %zmm25,%zmm26"); 176 asm volatile("vcvttpd2udq %zmm29,%ymm6{%k7}"); 177 asm volatile("vcvttsd2usi %xmm6,%rax"); 178 asm volatile("vcvttss2usi %xmm6,%rax"); 179 asm volatile("vcvttps2uqq %ymm5,%zmm26{%k7}"); 180 asm volatile("vcvttpd2uqq %zmm29,%zmm30"); 181 182 /* 
AVX-512: Op code 0f 79 */ 183 184 asm volatile("vmwrite %rax,%rbx"); 185 asm volatile("vcvtps2udq %zmm25,%zmm26"); 186 asm volatile("vcvtpd2udq %zmm29,%ymm6{%k7}"); 187 asm volatile("vcvtsd2usi %xmm6,%rax"); 188 asm volatile("vcvtss2usi %xmm6,%rax"); 189 asm volatile("vcvtps2uqq %ymm5,%zmm26{%k7}"); 190 asm volatile("vcvtpd2uqq %zmm29,%zmm30"); 191 192 /* AVX-512: Op code 0f 7a */ 193 194 asm volatile("vcvtudq2pd %ymm5,%zmm29{%k7}"); 195 asm volatile("vcvtuqq2pd %zmm25,%zmm26"); 196 asm volatile("vcvtudq2ps %zmm29,%zmm30"); 197 asm volatile("vcvtuqq2ps %zmm25,%ymm26{%k7}"); 198 asm volatile("vcvttps2qq %ymm25,%zmm26{%k7}"); 199 asm volatile("vcvttpd2qq %zmm29,%zmm30"); 200 201 /* AVX-512: Op code 0f 7b */ 202 203 asm volatile("vcvtusi2sd %eax,%xmm5,%xmm6"); 204 asm volatile("vcvtusi2ss %eax,%xmm5,%xmm6"); 205 asm volatile("vcvtps2qq %ymm5,%zmm26{%k7}"); 206 asm volatile("vcvtpd2qq %zmm29,%zmm30"); 207 208 /* AVX-512: Op code 0f 7f */ 209 210 asm volatile("movq.s %mm0,%mm4"); 211 asm volatile("vmovdqa %ymm8,%ymm6"); 212 asm volatile("vmovdqa32.s %zmm25,%zmm26"); 213 asm volatile("vmovdqa64.s %zmm25,%zmm26"); 214 asm volatile("vmovdqu %ymm8,%ymm6"); 215 asm volatile("vmovdqu32.s %zmm25,%zmm26"); 216 asm volatile("vmovdqu64.s %zmm25,%zmm26"); 217 asm volatile("vmovdqu8.s %zmm30,(%rcx)"); 218 asm volatile("vmovdqu16.s %zmm25,%zmm26"); 219 220 /* AVX-512: Op code 0f db */ 221 222 asm volatile("pand %mm1,%mm2"); 223 asm volatile("pand %xmm1,%xmm2"); 224 asm volatile("vpand %ymm4,%ymm6,%ymm2"); 225 asm volatile("vpandd %zmm24,%zmm25,%zmm26"); 226 asm volatile("vpandq %zmm24,%zmm25,%zmm26"); 227 228 /* AVX-512: Op code 0f df */ 229 230 asm volatile("pandn %mm1,%mm2"); 231 asm volatile("pandn %xmm1,%xmm2"); 232 asm volatile("vpandn %ymm4,%ymm6,%ymm2"); 233 asm volatile("vpandnd %zmm24,%zmm25,%zmm26"); 234 asm volatile("vpandnq %zmm24,%zmm25,%zmm26"); 235 236 /* AVX-512: Op code 0f e6 */ 237 238 asm volatile("vcvttpd2dq %xmm1,%xmm2"); 239 asm volatile("vcvtdq2pd 
%xmm5,%xmm6"); 240 asm volatile("vcvtdq2pd %ymm5,%zmm26{%k7}"); 241 asm volatile("vcvtqq2pd %zmm25,%zmm26"); 242 asm volatile("vcvtpd2dq %xmm1,%xmm2"); 243 244 /* AVX-512: Op code 0f eb */ 245 246 asm volatile("por %mm4,%mm6"); 247 asm volatile("vpor %ymm4,%ymm6,%ymm2"); 248 asm volatile("vpord %zmm24,%zmm25,%zmm26"); 249 asm volatile("vporq %zmm24,%zmm25,%zmm26"); 250 251 /* AVX-512: Op code 0f ef */ 252 253 asm volatile("pxor %mm4,%mm6"); 254 asm volatile("vpxor %ymm4,%ymm6,%ymm2"); 255 asm volatile("vpxord %zmm24,%zmm25,%zmm26"); 256 asm volatile("vpxorq %zmm24,%zmm25,%zmm26"); 257 258 /* AVX-512: Op code 0f 38 10 */ 259 260 asm volatile("pblendvb %xmm1,%xmm0"); 261 asm volatile("vpsrlvw %zmm27,%zmm28,%zmm29"); 262 asm volatile("vpmovuswb %zmm28,%ymm6{%k7}"); 263 264 /* AVX-512: Op code 0f 38 11 */ 265 266 asm volatile("vpmovusdb %zmm28,%xmm6{%k7}"); 267 asm volatile("vpsravw %zmm27,%zmm28,%zmm29"); 268 269 /* AVX-512: Op code 0f 38 12 */ 270 271 asm volatile("vpmovusqb %zmm27,%xmm6{%k7}"); 272 asm volatile("vpsllvw %zmm27,%zmm28,%zmm29"); 273 274 /* AVX-512: Op code 0f 38 13 */ 275 276 asm volatile("vcvtph2ps %xmm3,%ymm5"); 277 asm volatile("vcvtph2ps %ymm5,%zmm27{%k7}"); 278 asm volatile("vpmovusdw %zmm27,%ymm6{%k7}"); 279 280 /* AVX-512: Op code 0f 38 14 */ 281 282 asm volatile("blendvps %xmm1,%xmm0"); 283 asm volatile("vpmovusqw %zmm27,%xmm6{%k7}"); 284 asm volatile("vprorvd %zmm27,%zmm28,%zmm29"); 285 asm volatile("vprorvq %zmm27,%zmm28,%zmm29"); 286 287 /* AVX-512: Op code 0f 38 15 */ 288 289 asm volatile("blendvpd %xmm1,%xmm0"); 290 asm volatile("vpmovusqd %zmm27,%ymm6{%k7}"); 291 asm volatile("vprolvd %zmm27,%zmm28,%zmm29"); 292 asm volatile("vprolvq %zmm27,%zmm28,%zmm29"); 293 294 /* AVX-512: Op code 0f 38 16 */ 295 296 asm volatile("vpermps %ymm4,%ymm6,%ymm2"); 297 asm volatile("vpermps %ymm24,%ymm26,%ymm22{%k7}"); 298 asm volatile("vpermpd %ymm24,%ymm26,%ymm22{%k7}"); 299 300 /* AVX-512: Op code 0f 38 19 */ 301 302 asm volatile("vbroadcastsd 
%xmm4,%ymm6"); 303 asm volatile("vbroadcastf32x2 %xmm27,%zmm26"); 304 305 /* AVX-512: Op code 0f 38 1a */ 306 307 asm volatile("vbroadcastf128 (%rcx),%ymm4"); 308 asm volatile("vbroadcastf32x4 (%rcx),%zmm26"); 309 asm volatile("vbroadcastf64x2 (%rcx),%zmm26"); 310 311 /* AVX-512: Op code 0f 38 1b */ 312 313 asm volatile("vbroadcastf32x8 (%rcx),%zmm27"); 314 asm volatile("vbroadcastf64x4 (%rcx),%zmm26"); 315 316 /* AVX-512: Op code 0f 38 1f */ 317 318 asm volatile("vpabsq %zmm27,%zmm28"); 319 320 /* AVX-512: Op code 0f 38 20 */ 321 322 asm volatile("vpmovsxbw %xmm4,%xmm5"); 323 asm volatile("vpmovswb %zmm27,%ymm6{%k7}"); 324 325 /* AVX-512: Op code 0f 38 21 */ 326 327 asm volatile("vpmovsxbd %xmm4,%ymm6"); 328 asm volatile("vpmovsdb %zmm27,%xmm6{%k7}"); 329 330 /* AVX-512: Op code 0f 38 22 */ 331 332 asm volatile("vpmovsxbq %xmm4,%ymm4"); 333 asm volatile("vpmovsqb %zmm27,%xmm6{%k7}"); 334 335 /* AVX-512: Op code 0f 38 23 */ 336 337 asm volatile("vpmovsxwd %xmm4,%ymm4"); 338 asm volatile("vpmovsdw %zmm27,%ymm6{%k7}"); 339 340 /* AVX-512: Op code 0f 38 24 */ 341 342 asm volatile("vpmovsxwq %xmm4,%ymm6"); 343 asm volatile("vpmovsqw %zmm27,%xmm6{%k7}"); 344 345 /* AVX-512: Op code 0f 38 25 */ 346 347 asm volatile("vpmovsxdq %xmm4,%ymm4"); 348 asm volatile("vpmovsqd %zmm27,%ymm6{%k7}"); 349 350 /* AVX-512: Op code 0f 38 26 */ 351 352 asm volatile("vptestmb %zmm27,%zmm28,%k5"); 353 asm volatile("vptestmw %zmm27,%zmm28,%k5"); 354 asm volatile("vptestnmb %zmm26,%zmm27,%k5"); 355 asm volatile("vptestnmw %zmm26,%zmm27,%k5"); 356 357 /* AVX-512: Op code 0f 38 27 */ 358 359 asm volatile("vptestmd %zmm27,%zmm28,%k5"); 360 asm volatile("vptestmq %zmm27,%zmm28,%k5"); 361 asm volatile("vptestnmd %zmm26,%zmm27,%k5"); 362 asm volatile("vptestnmq %zmm26,%zmm27,%k5"); 363 364 /* AVX-512: Op code 0f 38 28 */ 365 366 asm volatile("vpmuldq %ymm4,%ymm6,%ymm2"); 367 asm volatile("vpmovm2b %k5,%zmm28"); 368 asm volatile("vpmovm2w %k5,%zmm28"); 369 370 /* AVX-512: Op code 0f 38 29 */ 371 372 
asm volatile("vpcmpeqq %ymm4,%ymm6,%ymm2"); 373 asm volatile("vpmovb2m %zmm28,%k5"); 374 asm volatile("vpmovw2m %zmm28,%k5"); 375 376 /* AVX-512: Op code 0f 38 2a */ 377 378 asm volatile("vmovntdqa (%rcx),%ymm4"); 379 asm volatile("vpbroadcastmb2q %k6,%zmm30"); 380 381 /* AVX-512: Op code 0f 38 2c */ 382 383 asm volatile("vmaskmovps (%rcx),%ymm4,%ymm6"); 384 asm volatile("vscalefps %zmm24,%zmm25,%zmm26"); 385 asm volatile("vscalefpd %zmm24,%zmm25,%zmm26"); 386 387 /* AVX-512: Op code 0f 38 2d */ 388 389 asm volatile("vmaskmovpd (%rcx),%ymm4,%ymm6"); 390 asm volatile("vscalefss %xmm24,%xmm25,%xmm26{%k7}"); 391 asm volatile("vscalefsd %xmm24,%xmm25,%xmm26{%k7}"); 392 393 /* AVX-512: Op code 0f 38 30 */ 394 395 asm volatile("vpmovzxbw %xmm4,%ymm4"); 396 asm volatile("vpmovwb %zmm27,%ymm6{%k7}"); 397 398 /* AVX-512: Op code 0f 38 31 */ 399 400 asm volatile("vpmovzxbd %xmm4,%ymm6"); 401 asm volatile("vpmovdb %zmm27,%xmm6{%k7}"); 402 403 /* AVX-512: Op code 0f 38 32 */ 404 405 asm volatile("vpmovzxbq %xmm4,%ymm4"); 406 asm volatile("vpmovqb %zmm27,%xmm6{%k7}"); 407 408 /* AVX-512: Op code 0f 38 33 */ 409 410 asm volatile("vpmovzxwd %xmm4,%ymm4"); 411 asm volatile("vpmovdw %zmm27,%ymm6{%k7}"); 412 413 /* AVX-512: Op code 0f 38 34 */ 414 415 asm volatile("vpmovzxwq %xmm4,%ymm6"); 416 asm volatile("vpmovqw %zmm27,%xmm6{%k7}"); 417 418 /* AVX-512: Op code 0f 38 35 */ 419 420 asm volatile("vpmovzxdq %xmm4,%ymm4"); 421 asm volatile("vpmovqd %zmm27,%ymm6{%k7}"); 422 423 /* AVX-512: Op code 0f 38 36 */ 424 425 asm volatile("vpermd %ymm4,%ymm6,%ymm2"); 426 asm volatile("vpermd %ymm24,%ymm26,%ymm22{%k7}"); 427 asm volatile("vpermq %ymm24,%ymm26,%ymm22{%k7}"); 428 429 /* AVX-512: Op code 0f 38 38 */ 430 431 asm volatile("vpminsb %ymm4,%ymm6,%ymm2"); 432 asm volatile("vpmovm2d %k5,%zmm28"); 433 asm volatile("vpmovm2q %k5,%zmm28"); 434 435 /* AVX-512: Op code 0f 38 39 */ 436 437 asm volatile("vpminsd %xmm1,%xmm2,%xmm3"); 438 asm volatile("vpminsd %zmm24,%zmm25,%zmm26"); 439 asm
volatile("vpminsq %zmm24,%zmm25,%zmm26"); 440 asm volatile("vpmovd2m %zmm28,%k5"); 441 asm volatile("vpmovq2m %zmm28,%k5"); 442 443 /* AVX-512: Op code 0f 38 3a */ 444 445 asm volatile("vpminuw %ymm4,%ymm6,%ymm2"); 446 asm volatile("vpbroadcastmw2d %k6,%zmm28"); 447 448 /* AVX-512: Op code 0f 38 3b */ 449 450 asm volatile("vpminud %ymm4,%ymm6,%ymm2"); 451 asm volatile("vpminud %zmm24,%zmm25,%zmm26"); 452 asm volatile("vpminuq %zmm24,%zmm25,%zmm26"); 453 454 /* AVX-512: Op code 0f 38 3d */ 455 456 asm volatile("vpmaxsd %ymm4,%ymm6,%ymm2"); 457 asm volatile("vpmaxsd %zmm24,%zmm25,%zmm26"); 458 asm volatile("vpmaxsq %zmm24,%zmm25,%zmm26"); 459 460 /* AVX-512: Op code 0f 38 3f */ 461 462 asm volatile("vpmaxud %ymm4,%ymm6,%ymm2"); 463 asm volatile("vpmaxud %zmm24,%zmm25,%zmm26"); 464 asm volatile("vpmaxuq %zmm24,%zmm25,%zmm26"); 465 466 /* AVX-512: Op code 0f 38 40 */ 467 468 asm volatile("vpmulld %ymm4,%ymm6,%ymm2"); 469 asm volatile("vpmulld %zmm24,%zmm25,%zmm26"); 470 asm volatile("vpmullq %zmm24,%zmm25,%zmm26"); 471 472 /* AVX-512: Op code 0f 38 42 */ 473 474 asm volatile("vgetexpps %zmm25,%zmm26"); 475 asm volatile("vgetexppd %zmm27,%zmm28"); 476 477 /* AVX-512: Op code 0f 38 43 */ 478 479 asm volatile("vgetexpss %xmm24,%xmm25,%xmm26{%k7}"); 480 asm volatile("vgetexpsd %xmm28,%xmm29,%xmm30{%k7}"); 481 482 /* AVX-512: Op code 0f 38 44 */ 483 484 asm volatile("vplzcntd %zmm27,%zmm28"); 485 asm volatile("vplzcntq %zmm27,%zmm28"); 486 487 /* AVX-512: Op code 0f 38 46 */ 488 489 asm volatile("vpsravd %ymm4,%ymm6,%ymm2"); 490 asm volatile("vpsravd %zmm24,%zmm25,%zmm26"); 491 asm volatile("vpsravq %zmm24,%zmm25,%zmm26"); 492 493 /* AVX-512: Op code 0f 38 4c */ 494 495 asm volatile("vrcp14ps %zmm25,%zmm26"); 496 asm volatile("vrcp14pd %zmm27,%zmm28"); 497 498 /* AVX-512: Op code 0f 38 4d */ 499 500 asm volatile("vrcp14ss %xmm24,%xmm25,%xmm26{%k7}"); 501 asm volatile("vrcp14sd %xmm24,%xmm25,%xmm26{%k7}"); 502 503 /* AVX-512: Op code 0f 38 4e */ 504 505 asm
volatile("vrsqrt14ps %zmm25,%zmm26"); 506 asm volatile("vrsqrt14pd %zmm27,%zmm28"); 507 508 /* AVX-512: Op code 0f 38 4f */ 509 510 asm volatile("vrsqrt14ss %xmm24,%xmm25,%xmm26{%k7}"); 511 asm volatile("vrsqrt14sd %xmm24,%xmm25,%xmm26{%k7}"); 512 513 /* AVX-512: Op code 0f 38 50 */ 514 515 asm volatile("vpdpbusd %xmm1, %xmm2, %xmm3"); 516 asm volatile("vpdpbusd %ymm1, %ymm2, %ymm3"); 517 asm volatile("vpdpbusd %zmm1, %zmm2, %zmm3"); 518 asm volatile("vpdpbusd 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 519 asm volatile("vpdpbusd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 520 521 /* AVX-512: Op code 0f 38 51 */ 522 523 asm volatile("vpdpbusds %xmm1, %xmm2, %xmm3"); 524 asm volatile("vpdpbusds %ymm1, %ymm2, %ymm3"); 525 asm volatile("vpdpbusds %zmm1, %zmm2, %zmm3"); 526 asm volatile("vpdpbusds 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 527 asm volatile("vpdpbusds 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 528 529 /* AVX-512: Op code 0f 38 52 */ 530 531 asm volatile("vdpbf16ps %xmm1, %xmm2, %xmm3"); 532 asm volatile("vdpbf16ps %ymm1, %ymm2, %ymm3"); 533 asm volatile("vdpbf16ps %zmm1, %zmm2, %zmm3"); 534 asm volatile("vdpbf16ps 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 535 asm volatile("vdpbf16ps 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 536 537 asm volatile("vpdpwssd %xmm1, %xmm2, %xmm3"); 538 asm volatile("vpdpwssd %ymm1, %ymm2, %ymm3"); 539 asm volatile("vpdpwssd %zmm1, %zmm2, %zmm3"); 540 asm volatile("vpdpwssd 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 541 asm volatile("vpdpwssd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 542 543 asm volatile("vp4dpwssd (%rax), %zmm0, %zmm4"); 544 asm volatile("vp4dpwssd (%eax), %zmm0, %zmm4"); 545 asm volatile("vp4dpwssd 0x12345678(%rax,%rcx,8),%zmm0,%zmm4"); 546 asm volatile("vp4dpwssd 0x12345678(%eax,%ecx,8),%zmm0,%zmm4"); 547 548 /* AVX-512: Op code 0f 38 53 */ 549 550 asm volatile("vpdpwssds %xmm1, %xmm2, %xmm3"); 551 asm volatile("vpdpwssds %ymm1, %ymm2, %ymm3"); 552 asm volatile("vpdpwssds %zmm1, %zmm2, %zmm3"); 553 asm volatile("vpdpwssds 
0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 554 asm volatile("vpdpwssds 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 555 556 asm volatile("vp4dpwssds (%rax), %zmm0, %zmm4"); 557 asm volatile("vp4dpwssds (%eax), %zmm0, %zmm4"); 558 asm volatile("vp4dpwssds 0x12345678(%rax,%rcx,8),%zmm0,%zmm4"); 559 asm volatile("vp4dpwssds 0x12345678(%eax,%ecx,8),%zmm0,%zmm4"); 560 561 /* AVX-512: Op code 0f 38 54 */ 562 563 asm volatile("vpopcntb %xmm1, %xmm2"); 564 asm volatile("vpopcntb %ymm1, %ymm2"); 565 asm volatile("vpopcntb %zmm1, %zmm2"); 566 asm volatile("vpopcntb 0x12345678(%rax,%rcx,8),%zmm2"); 567 asm volatile("vpopcntb 0x12345678(%eax,%ecx,8),%zmm2"); 568 569 asm volatile("vpopcntw %xmm1, %xmm2"); 570 asm volatile("vpopcntw %ymm1, %ymm2"); 571 asm volatile("vpopcntw %zmm1, %zmm2"); 572 asm volatile("vpopcntw 0x12345678(%rax,%rcx,8),%zmm2"); 573 asm volatile("vpopcntw 0x12345678(%eax,%ecx,8),%zmm2"); 574 575 /* AVX-512: Op code 0f 38 55 */ 576 577 asm volatile("vpopcntd %xmm1, %xmm2"); 578 asm volatile("vpopcntd %ymm1, %ymm2"); 579 asm volatile("vpopcntd %zmm1, %zmm2"); 580 asm volatile("vpopcntd 0x12345678(%rax,%rcx,8),%zmm2"); 581 asm volatile("vpopcntd 0x12345678(%eax,%ecx,8),%zmm2"); 582 583 asm volatile("vpopcntq %xmm1, %xmm2"); 584 asm volatile("vpopcntq %ymm1, %ymm2"); 585 asm volatile("vpopcntq %zmm1, %zmm2"); 586 asm volatile("vpopcntq 0x12345678(%rax,%rcx,8),%zmm2"); 587 asm volatile("vpopcntq 0x12345678(%eax,%ecx,8),%zmm2"); 588 589 /* AVX-512: Op code 0f 38 59 */ 590 591 asm volatile("vpbroadcastq %xmm4,%xmm6"); 592 asm volatile("vbroadcasti32x2 %xmm27,%zmm26"); 593 594 /* AVX-512: Op code 0f 38 5a */ 595 596 asm volatile("vbroadcasti128 (%rcx),%ymm4"); 597 asm volatile("vbroadcasti32x4 (%rcx),%zmm26"); 598 asm volatile("vbroadcasti64x2 (%rcx),%zmm26"); 599 600 /* AVX-512: Op code 0f 38 5b */ 601 602 asm volatile("vbroadcasti32x8 (%rcx),%zmm28"); 603 asm volatile("vbroadcasti64x4 (%rcx),%zmm26"); 604 605 /* AVX-512: Op code 0f 38 62 */ 606 607 asm volatile("vpexpandb 
%xmm1, %xmm2"); 608 asm volatile("vpexpandb %ymm1, %ymm2"); 609 asm volatile("vpexpandb %zmm1, %zmm2"); 610 asm volatile("vpexpandb 0x12345678(%rax,%rcx,8),%zmm2"); 611 asm volatile("vpexpandb 0x12345678(%eax,%ecx,8),%zmm2"); 612 613 asm volatile("vpexpandw %xmm1, %xmm2"); 614 asm volatile("vpexpandw %ymm1, %ymm2"); 615 asm volatile("vpexpandw %zmm1, %zmm2"); 616 asm volatile("vpexpandw 0x12345678(%rax,%rcx,8),%zmm2"); 617 asm volatile("vpexpandw 0x12345678(%eax,%ecx,8),%zmm2"); 618 619 /* AVX-512: Op code 0f 38 63 */ 620 621 asm volatile("vpcompressb %xmm1, %xmm2"); 622 asm volatile("vpcompressb %ymm1, %ymm2"); 623 asm volatile("vpcompressb %zmm1, %zmm2"); 624 asm volatile("vpcompressb %zmm2,0x12345678(%rax,%rcx,8)"); 625 asm volatile("vpcompressb %zmm2,0x12345678(%eax,%ecx,8)"); 626 627 asm volatile("vpcompressw %xmm1, %xmm2"); 628 asm volatile("vpcompressw %ymm1, %ymm2"); 629 asm volatile("vpcompressw %zmm1, %zmm2"); 630 asm volatile("vpcompressw %zmm2,0x12345678(%rax,%rcx,8)"); 631 asm volatile("vpcompressw %zmm2,0x12345678(%eax,%ecx,8)"); 632 633 /* AVX-512: Op code 0f 38 64 */ 634 635 asm volatile("vpblendmd %zmm26,%zmm27,%zmm28"); 636 asm volatile("vpblendmq %zmm26,%zmm27,%zmm28"); 637 638 /* AVX-512: Op code 0f 38 65 */ 639 640 asm volatile("vblendmps %zmm24,%zmm25,%zmm26"); 641 asm volatile("vblendmpd %zmm26,%zmm27,%zmm28"); 642 643 /* AVX-512: Op code 0f 38 66 */ 644 645 asm volatile("vpblendmb %zmm26,%zmm27,%zmm28"); 646 asm volatile("vpblendmw %zmm26,%zmm27,%zmm28"); 647 648 /* AVX-512: Op code 0f 38 68 */ 649 650 asm volatile("vp2intersectd %xmm1, %xmm2, %k3"); 651 asm volatile("vp2intersectd %ymm1, %ymm2, %k3"); 652 asm volatile("vp2intersectd %zmm1, %zmm2, %k3"); 653 asm volatile("vp2intersectd 0x12345678(%rax,%rcx,8),%zmm2,%k3"); 654 asm volatile("vp2intersectd 0x12345678(%eax,%ecx,8),%zmm2,%k3"); 655 656 asm volatile("vp2intersectq %xmm1, %xmm2, %k3"); 657 asm volatile("vp2intersectq %ymm1, %ymm2, %k3"); 658 asm volatile("vp2intersectq %zmm1, 
%zmm2, %k3"); 659 asm volatile("vp2intersectq 0x12345678(%rax,%rcx,8),%zmm2,%k3"); 660 asm volatile("vp2intersectq 0x12345678(%eax,%ecx,8),%zmm2,%k3"); 661 662 /* AVX-512: Op code 0f 38 70 */ 663 664 asm volatile("vpshldvw %xmm1, %xmm2, %xmm3"); 665 asm volatile("vpshldvw %ymm1, %ymm2, %ymm3"); 666 asm volatile("vpshldvw %zmm1, %zmm2, %zmm3"); 667 asm volatile("vpshldvw 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 668 asm volatile("vpshldvw 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 669 670 /* AVX-512: Op code 0f 38 71 */ 671 672 asm volatile("vpshldvd %xmm1, %xmm2, %xmm3"); 673 asm volatile("vpshldvd %ymm1, %ymm2, %ymm3"); 674 asm volatile("vpshldvd %zmm1, %zmm2, %zmm3"); 675 asm volatile("vpshldvd 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 676 asm volatile("vpshldvd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 677 678 asm volatile("vpshldvq %xmm1, %xmm2, %xmm3"); 679 asm volatile("vpshldvq %ymm1, %ymm2, %ymm3"); 680 asm volatile("vpshldvq %zmm1, %zmm2, %zmm3"); 681 asm volatile("vpshldvq 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 682 asm volatile("vpshldvq 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 683 684 /* AVX-512: Op code 0f 38 72 */ 685 686 asm volatile("vcvtne2ps2bf16 %xmm1, %xmm2, %xmm3"); 687 asm volatile("vcvtne2ps2bf16 %ymm1, %ymm2, %ymm3"); 688 asm volatile("vcvtne2ps2bf16 %zmm1, %zmm2, %zmm3"); 689 asm volatile("vcvtne2ps2bf16 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 690 asm volatile("vcvtne2ps2bf16 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 691 692 asm volatile("vcvtneps2bf16 %xmm1, %xmm2"); 693 asm volatile("vcvtneps2bf16 %ymm1, %xmm2"); 694 asm volatile("vcvtneps2bf16 %zmm1, %ymm2"); 695 asm volatile("vcvtneps2bf16 0x12345678(%rax,%rcx,8),%ymm2"); 696 asm volatile("vcvtneps2bf16 0x12345678(%eax,%ecx,8),%ymm2"); 697 698 asm volatile("vpshrdvw %xmm1, %xmm2, %xmm3"); 699 asm volatile("vpshrdvw %ymm1, %ymm2, %ymm3"); 700 asm volatile("vpshrdvw %zmm1, %zmm2, %zmm3"); 701 asm volatile("vpshrdvw 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 702 asm volatile("vpshrdvw 
0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 703 704 /* AVX-512: Op code 0f 38 73 */ 705 706 asm volatile("vpshrdvd %xmm1, %xmm2, %xmm3"); 707 asm volatile("vpshrdvd %ymm1, %ymm2, %ymm3"); 708 asm volatile("vpshrdvd %zmm1, %zmm2, %zmm3"); 709 asm volatile("vpshrdvd 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 710 asm volatile("vpshrdvd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 711 712 asm volatile("vpshrdvq %xmm1, %xmm2, %xmm3"); 713 asm volatile("vpshrdvq %ymm1, %ymm2, %ymm3"); 714 asm volatile("vpshrdvq %zmm1, %zmm2, %zmm3"); 715 asm volatile("vpshrdvq 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 716 asm volatile("vpshrdvq 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 717 718 /* AVX-512: Op code 0f 38 75 */ 719 720 asm volatile("vpermi2b %zmm24,%zmm25,%zmm26"); 721 asm volatile("vpermi2w %zmm26,%zmm27,%zmm28"); 722 723 /* AVX-512: Op code 0f 38 76 */ 724 725 asm volatile("vpermi2d %zmm26,%zmm27,%zmm28"); 726 asm volatile("vpermi2q %zmm26,%zmm27,%zmm28"); 727 728 /* AVX-512: Op code 0f 38 77 */ 729 730 asm volatile("vpermi2ps %zmm26,%zmm27,%zmm28"); 731 asm volatile("vpermi2pd %zmm26,%zmm27,%zmm28"); 732 733 /* AVX-512: Op code 0f 38 7a */ 734 735 asm volatile("vpbroadcastb %eax,%xmm30"); 736 737 /* AVX-512: Op code 0f 38 7b */ 738 739 asm volatile("vpbroadcastw %eax,%xmm30"); 740 741 /* AVX-512: Op code 0f 38 7c */ 742 743 asm volatile("vpbroadcastd %eax,%xmm30"); 744 asm volatile("vpbroadcastq %rax,%zmm30"); 745 746 /* AVX-512: Op code 0f 38 7d */ 747 748 asm volatile("vpermt2b %zmm26,%zmm27,%zmm28"); 749 asm volatile("vpermt2w %zmm26,%zmm27,%zmm28"); 750 751 /* AVX-512: Op code 0f 38 7e */ 752 753 asm volatile("vpermt2d %zmm26,%zmm27,%zmm28"); 754 asm volatile("vpermt2q %zmm26,%zmm27,%zmm28"); 755 756 /* AVX-512: Op code 0f 38 7f */ 757 758 asm volatile("vpermt2ps %zmm26,%zmm27,%zmm28"); 759 asm volatile("vpermt2pd %zmm26,%zmm27,%zmm28"); 760 761 /* AVX-512: Op code 0f 38 83 */ 762 763 asm volatile("vpmultishiftqb %zmm26,%zmm27,%zmm28"); 764 765 /* AVX-512: Op code 0f 38 88 */ 766 767 asm 
volatile("vexpandps (%rcx),%zmm26"); 768 asm volatile("vexpandpd (%rcx),%zmm28"); 769 770 /* AVX-512: Op code 0f 38 89 */ 771 772 asm volatile("vpexpandd (%rcx),%zmm28"); 773 asm volatile("vpexpandq (%rcx),%zmm26"); 774 775 /* AVX-512: Op code 0f 38 8a */ 776 777 asm volatile("vcompressps %zmm28,(%rcx)"); 778 asm volatile("vcompresspd %zmm28,(%rcx)"); 779 780 /* AVX-512: Op code 0f 38 8b */ 781 782 asm volatile("vpcompressd %zmm28,(%rcx)"); 783 asm volatile("vpcompressq %zmm26,(%rcx)"); 784 785 /* AVX-512: Op code 0f 38 8d */ 786 787 asm volatile("vpermb %zmm26,%zmm27,%zmm28"); 788 asm volatile("vpermw %zmm26,%zmm27,%zmm28"); 789 790 /* AVX-512: Op code 0f 38 8f */ 791 792 asm volatile("vpshufbitqmb %xmm1, %xmm2, %k3"); 793 asm volatile("vpshufbitqmb %ymm1, %ymm2, %k3"); 794 asm volatile("vpshufbitqmb %zmm1, %zmm2, %k3"); 795 asm volatile("vpshufbitqmb 0x12345678(%rax,%rcx,8),%zmm2,%k3"); 796 asm volatile("vpshufbitqmb 0x12345678(%eax,%ecx,8),%zmm2,%k3"); 797 798 /* AVX-512: Op code 0f 38 90 */ 799 800 asm volatile("vpgatherdd %xmm2,0x02(%rbp,%xmm7,2),%xmm1"); 801 asm volatile("vpgatherdq %xmm2,0x04(%rbp,%xmm7,2),%xmm1"); 802 asm volatile("vpgatherdd 0x7b(%rbp,%zmm27,8),%zmm26{%k1}"); 803 asm volatile("vpgatherdq 0x7b(%rbp,%ymm27,8),%zmm26{%k1}"); 804 805 /* AVX-512: Op code 0f 38 91 */ 806 807 asm volatile("vpgatherqd %xmm2,0x02(%rbp,%xmm7,2),%xmm1"); 808 asm volatile("vpgatherqq %xmm2,0x02(%rbp,%xmm7,2),%xmm1"); 809 asm volatile("vpgatherqd 0x7b(%rbp,%zmm27,8),%ymm26{%k1}"); 810 asm volatile("vpgatherqq 0x7b(%rbp,%zmm27,8),%zmm26{%k1}"); 811 812 /* AVX-512: Op code 0f 38 9a */ 813 814 asm volatile("vfmsub132ps %xmm1, %xmm2, %xmm3"); 815 asm volatile("vfmsub132ps %ymm1, %ymm2, %ymm3"); 816 asm volatile("vfmsub132ps %zmm1, %zmm2, %zmm3"); 817 asm volatile("vfmsub132ps 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 818 asm volatile("vfmsub132ps 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 819 820 asm volatile("vfmsub132pd %xmm1, %xmm2, %xmm3"); 821 asm volatile("vfmsub132pd 
%ymm1, %ymm2, %ymm3"); 822 asm volatile("vfmsub132pd %zmm1, %zmm2, %zmm3"); 823 asm volatile("vfmsub132pd 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 824 asm volatile("vfmsub132pd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 825 826 asm volatile("v4fmaddps (%rax), %zmm0, %zmm4"); 827 asm volatile("v4fmaddps (%eax), %zmm0, %zmm4"); 828 asm volatile("v4fmaddps 0x12345678(%rax,%rcx,8),%zmm0,%zmm4"); 829 asm volatile("v4fmaddps 0x12345678(%eax,%ecx,8),%zmm0,%zmm4"); 830 831 /* AVX-512: Op code 0f 38 9b */ 832 833 asm volatile("vfmsub132ss %xmm1, %xmm2, %xmm3"); 834 asm volatile("vfmsub132ss 0x12345678(%rax,%rcx,8),%xmm2,%xmm3"); 835 asm volatile("vfmsub132ss 0x12345678(%eax,%ecx,8),%xmm2,%xmm3"); 836 837 asm volatile("vfmsub132sd %xmm1, %xmm2, %xmm3"); 838 asm volatile("vfmsub132sd 0x12345678(%rax,%rcx,8),%xmm2,%xmm3"); 839 asm volatile("vfmsub132sd 0x12345678(%eax,%ecx,8),%xmm2,%xmm3"); 840 841 asm volatile("v4fmaddss (%rax), %xmm0, %xmm4"); 842 asm volatile("v4fmaddss (%eax), %xmm0, %xmm4"); 843 asm volatile("v4fmaddss 0x12345678(%rax,%rcx,8),%xmm0,%xmm4"); 844 asm volatile("v4fmaddss 0x12345678(%eax,%ecx,8),%xmm0,%xmm4"); 845 846 /* AVX-512: Op code 0f 38 a0 */ 847 848 asm volatile("vpscatterdd %zmm28,0x7b(%rbp,%zmm29,8){%k1}"); 849 asm volatile("vpscatterdq %zmm26,0x7b(%rbp,%ymm27,8){%k1}"); 850 851 /* AVX-512: Op code 0f 38 a1 */ 852 853 asm volatile("vpscatterqd %ymm6,0x7b(%rbp,%zmm29,8){%k1}"); 854 asm volatile("vpscatterqq %ymm6,0x7b(%rbp,%ymm27,8){%k1}"); 855 856 /* AVX-512: Op code 0f 38 a2 */ 857 858 asm volatile("vscatterdps %zmm28,0x7b(%rbp,%zmm29,8){%k1}"); 859 asm volatile("vscatterdpd %zmm28,0x7b(%rbp,%ymm27,8){%k1}"); 860 861 /* AVX-512: Op code 0f 38 a3 */ 862 863 asm volatile("vscatterqps %ymm6,0x7b(%rbp,%zmm29,8){%k1}"); 864 asm volatile("vscatterqpd %zmm28,0x7b(%rbp,%zmm29,8){%k1}"); 865 866 /* AVX-512: Op code 0f 38 aa */ 867 868 asm volatile("vfmsub213ps %xmm1, %xmm2, %xmm3"); 869 asm volatile("vfmsub213ps %ymm1, %ymm2, %ymm3"); 870 asm 
volatile("vfmsub213ps %zmm1, %zmm2, %zmm3"); 871 asm volatile("vfmsub213ps 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 872 asm volatile("vfmsub213ps 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 873 874 asm volatile("vfmsub213pd %xmm1, %xmm2, %xmm3"); 875 asm volatile("vfmsub213pd %ymm1, %ymm2, %ymm3"); 876 asm volatile("vfmsub213pd %zmm1, %zmm2, %zmm3"); 877 asm volatile("vfmsub213pd 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 878 asm volatile("vfmsub213pd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 879 880 asm volatile("v4fnmaddps (%rax), %zmm0, %zmm4"); 881 asm volatile("v4fnmaddps (%eax), %zmm0, %zmm4"); 882 asm volatile("v4fnmaddps 0x12345678(%rax,%rcx,8),%zmm0,%zmm4"); 883 asm volatile("v4fnmaddps 0x12345678(%eax,%ecx,8),%zmm0,%zmm4"); 884 885 /* AVX-512: Op code 0f 38 ab */ 886 887 asm volatile("vfmsub213ss %xmm1, %xmm2, %xmm3"); 888 asm volatile("vfmsub213ss 0x12345678(%rax,%rcx,8),%xmm2,%xmm3"); 889 asm volatile("vfmsub213ss 0x12345678(%eax,%ecx,8),%xmm2,%xmm3"); 890 891 asm volatile("vfmsub213sd %xmm1, %xmm2, %xmm3"); 892 asm volatile("vfmsub213sd 0x12345678(%rax,%rcx,8),%xmm2,%xmm3"); 893 asm volatile("vfmsub213sd 0x12345678(%eax,%ecx,8),%xmm2,%xmm3"); 894 895 asm volatile("v4fnmaddss (%rax), %xmm0, %xmm4"); 896 asm volatile("v4fnmaddss (%eax), %xmm0, %xmm4"); 897 asm volatile("v4fnmaddss 0x12345678(%rax,%rcx,8),%xmm0,%xmm4"); 898 asm volatile("v4fnmaddss 0x12345678(%eax,%ecx,8),%xmm0,%xmm4"); 899 900 /* AVX-512: Op code 0f 38 b4 */ 901 902 asm volatile("vpmadd52luq %zmm26,%zmm27,%zmm28"); 903 904 /* AVX-512: Op code 0f 38 b5 */ 905 906 asm volatile("vpmadd52huq %zmm26,%zmm27,%zmm28"); 907 908 /* AVX-512: Op code 0f 38 c4 */ 909 910 asm volatile("vpconflictd %zmm26,%zmm27"); 911 asm volatile("vpconflictq %zmm26,%zmm27"); 912 913 /* AVX-512: Op code 0f 38 c8 */ 914 915 asm volatile("vexp2ps %zmm29,%zmm30"); 916 asm volatile("vexp2pd %zmm26,%zmm27"); 917 918 /* AVX-512: Op code 0f 38 ca */ 919 920 asm volatile("vrcp28ps %zmm29,%zmm30"); 921 asm volatile("vrcp28pd 
%zmm26,%zmm27"); 922 923 /* AVX-512: Op code 0f 38 cb */ 924 925 asm volatile("vrcp28ss %xmm28,%xmm29,%xmm30{%k7}"); 926 asm volatile("vrcp28sd %xmm25,%xmm26,%xmm27{%k7}"); 927 928 /* AVX-512: Op code 0f 38 cc */ 929 930 asm volatile("vrsqrt28ps %zmm29,%zmm30"); 931 asm volatile("vrsqrt28pd %zmm26,%zmm27"); 932 933 /* AVX-512: Op code 0f 38 cd */ 934 935 asm volatile("vrsqrt28ss %xmm28,%xmm29,%xmm30{%k7}"); 936 asm volatile("vrsqrt28sd %xmm25,%xmm26,%xmm27{%k7}"); 937 938 /* AVX-512: Op code 0f 38 cf */ 939 940 asm volatile("gf2p8mulb %xmm1, %xmm3"); 941 asm volatile("gf2p8mulb 0x12345678(%rax,%rcx,8),%xmm3"); 942 asm volatile("gf2p8mulb 0x12345678(%eax,%ecx,8),%xmm3"); 943 944 asm volatile("vgf2p8mulb %xmm1, %xmm2, %xmm3"); 945 asm volatile("vgf2p8mulb %ymm1, %ymm2, %ymm3"); 946 asm volatile("vgf2p8mulb %zmm1, %zmm2, %zmm3"); 947 asm volatile("vgf2p8mulb 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 948 asm volatile("vgf2p8mulb 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 949 950 /* AVX-512: Op code 0f 38 dc */ 951 952 asm volatile("vaesenc %xmm1, %xmm2, %xmm3"); 953 asm volatile("vaesenc %ymm1, %ymm2, %ymm3"); 954 asm volatile("vaesenc %zmm1, %zmm2, %zmm3"); 955 asm volatile("vaesenc 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 956 asm volatile("vaesenc 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 957 958 /* AVX-512: Op code 0f 38 dd */ 959 960 asm volatile("vaesenclast %xmm1, %xmm2, %xmm3"); 961 asm volatile("vaesenclast %ymm1, %ymm2, %ymm3"); 962 asm volatile("vaesenclast %zmm1, %zmm2, %zmm3"); 963 asm volatile("vaesenclast 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 964 asm volatile("vaesenclast 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 965 966 /* AVX-512: Op code 0f 38 de */ 967 968 asm volatile("vaesdec %xmm1, %xmm2, %xmm3"); 969 asm volatile("vaesdec %ymm1, %ymm2, %ymm3"); 970 asm volatile("vaesdec %zmm1, %zmm2, %zmm3"); 971 asm volatile("vaesdec 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 972 asm volatile("vaesdec 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 973 974 /* AVX-512: Op code 0f 38 df */ 
975 976 asm volatile("vaesdeclast %xmm1, %xmm2, %xmm3"); 977 asm volatile("vaesdeclast %ymm1, %ymm2, %ymm3"); 978 asm volatile("vaesdeclast %zmm1, %zmm2, %zmm3"); 979 asm volatile("vaesdeclast 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 980 asm volatile("vaesdeclast 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 981 982 /* AVX-512: Op code 0f 3a 03 */ 983 984 asm volatile("valignd $0x12,%zmm28,%zmm29,%zmm30"); 985 asm volatile("valignq $0x12,%zmm25,%zmm26,%zmm27"); 986 987 /* AVX-512: Op code 0f 3a 08 */ 988 989 asm volatile("vroundps $0x5,%ymm6,%ymm2"); 990 asm volatile("vrndscaleps $0x12,%zmm25,%zmm26"); 991 992 /* AVX-512: Op code 0f 3a 09 */ 993 994 asm volatile("vroundpd $0x5,%ymm6,%ymm2"); 995 asm volatile("vrndscalepd $0x12,%zmm25,%zmm26"); 996 997 /* AVX-512: Op code 0f 3a 0a */ 998 999 asm volatile("vroundss $0x5,%xmm4,%xmm6,%xmm2"); 1000 asm volatile("vrndscaless $0x12,%xmm24,%xmm25,%xmm26{%k7}"); 1001 1002 /* AVX-512: Op code 0f 3a 0b */ 1003 1004 asm volatile("vroundsd $0x5,%xmm4,%xmm6,%xmm2"); 1005 asm volatile("vrndscalesd $0x12,%xmm24,%xmm25,%xmm26{%k7}"); 1006 1007 /* AVX-512: Op code 0f 3a 18 */ 1008 1009 asm volatile("vinsertf128 $0x5,%xmm4,%ymm4,%ymm6"); 1010 asm volatile("vinsertf32x4 $0x12,%xmm24,%zmm25,%zmm26{%k7}"); 1011 asm volatile("vinsertf64x2 $0x12,%xmm24,%zmm25,%zmm26{%k7}"); 1012 1013 /* AVX-512: Op code 0f 3a 19 */ 1014 1015 asm volatile("vextractf128 $0x5,%ymm4,%xmm4"); 1016 asm volatile("vextractf32x4 $0x12,%zmm25,%xmm26{%k7}"); 1017 asm volatile("vextractf64x2 $0x12,%zmm25,%xmm26{%k7}"); 1018 1019 /* AVX-512: Op code 0f 3a 1a */ 1020 1021 asm volatile("vinsertf32x8 $0x12,%ymm25,%zmm26,%zmm27{%k7}"); 1022 asm volatile("vinsertf64x4 $0x12,%ymm28,%zmm29,%zmm30{%k7}"); 1023 1024 /* AVX-512: Op code 0f 3a 1b */ 1025 1026 asm volatile("vextractf32x8 $0x12,%zmm29,%ymm30{%k7}"); 1027 asm volatile("vextractf64x4 $0x12,%zmm26,%ymm27{%k7}"); 1028 1029 /* AVX-512: Op code 0f 3a 1e */ 1030 1031 asm volatile("vpcmpud $0x12,%zmm29,%zmm30,%k5"); 1032 asm 
volatile("vpcmpuq $0x12,%zmm26,%zmm27,%k5"); 1033 1034 /* AVX-512: Op code 0f 3a 1f */ 1035 1036 asm volatile("vpcmpd $0x12,%zmm29,%zmm30,%k5"); 1037 asm volatile("vpcmpq $0x12,%zmm26,%zmm27,%k5"); 1038 1039 /* AVX-512: Op code 0f 3a 23 */ 1040 1041 asm volatile("vshuff32x4 $0x12,%zmm28,%zmm29,%zmm30"); 1042 asm volatile("vshuff64x2 $0x12,%zmm25,%zmm26,%zmm27"); 1043 1044 /* AVX-512: Op code 0f 3a 25 */ 1045 1046 asm volatile("vpternlogd $0x12,%zmm28,%zmm29,%zmm30"); 1047 asm volatile("vpternlogq $0x12,%zmm28,%zmm29,%zmm30"); 1048 1049 /* AVX-512: Op code 0f 3a 26 */ 1050 1051 asm volatile("vgetmantps $0x12,%zmm26,%zmm27"); 1052 asm volatile("vgetmantpd $0x12,%zmm29,%zmm30"); 1053 1054 /* AVX-512: Op code 0f 3a 27 */ 1055 1056 asm volatile("vgetmantss $0x12,%xmm25,%xmm26,%xmm27{%k7}"); 1057 asm volatile("vgetmantsd $0x12,%xmm28,%xmm29,%xmm30{%k7}"); 1058 1059 /* AVX-512: Op code 0f 3a 38 */ 1060 1061 asm volatile("vinserti128 $0x5,%xmm4,%ymm4,%ymm6"); 1062 asm volatile("vinserti32x4 $0x12,%xmm24,%zmm25,%zmm26{%k7}"); 1063 asm volatile("vinserti64x2 $0x12,%xmm24,%zmm25,%zmm26{%k7}"); 1064 1065 /* AVX-512: Op code 0f 3a 39 */ 1066 1067 asm volatile("vextracti128 $0x5,%ymm4,%xmm6"); 1068 asm volatile("vextracti32x4 $0x12,%zmm25,%xmm26{%k7}"); 1069 asm volatile("vextracti64x2 $0x12,%zmm25,%xmm26{%k7}"); 1070 1071 /* AVX-512: Op code 0f 3a 3a */ 1072 1073 asm volatile("vinserti32x8 $0x12,%ymm28,%zmm29,%zmm30{%k7}"); 1074 asm volatile("vinserti64x4 $0x12,%ymm25,%zmm26,%zmm27{%k7}"); 1075 1076 /* AVX-512: Op code 0f 3a 3b */ 1077 1078 asm volatile("vextracti32x8 $0x12,%zmm29,%ymm30{%k7}"); 1079 asm volatile("vextracti64x4 $0x12,%zmm26,%ymm27{%k7}"); 1080 1081 /* AVX-512: Op code 0f 3a 3e */ 1082 1083 asm volatile("vpcmpub $0x12,%zmm29,%zmm30,%k5"); 1084 asm volatile("vpcmpuw $0x12,%zmm26,%zmm27,%k5"); 1085 1086 /* AVX-512: Op code 0f 3a 3f */ 1087 1088 asm volatile("vpcmpb $0x12,%zmm29,%zmm30,%k5"); 1089 asm volatile("vpcmpw $0x12,%zmm26,%zmm27,%k5"); 1090 1091 /* 
AVX-512: Op code 0f 3a 42 */ 1092 1093 asm volatile("vmpsadbw $0x5,%ymm4,%ymm6,%ymm2"); 1094 asm volatile("vdbpsadbw $0x12,%zmm4,%zmm5,%zmm6"); 1095 1096 /* AVX-512: Op code 0f 3a 43 */ 1097 1098 asm volatile("vshufi32x4 $0x12,%zmm25,%zmm26,%zmm27"); 1099 asm volatile("vshufi64x2 $0x12,%zmm28,%zmm29,%zmm30"); 1100 1101 /* AVX-512: Op code 0f 3a 44 */ 1102 1103 asm volatile("vpclmulqdq $0x12,%xmm1,%xmm2,%xmm3"); 1104 asm volatile("vpclmulqdq $0x12,%ymm1,%ymm2,%ymm3"); 1105 asm volatile("vpclmulqdq $0x12,%zmm1,%zmm2,%zmm3"); 1106 asm volatile("vpclmulqdq $0x12,%zmm25,%zmm26,%zmm27"); 1107 1108 /* AVX-512: Op code 0f 3a 50 */ 1109 1110 asm volatile("vrangeps $0x12,%zmm25,%zmm26,%zmm27"); 1111 asm volatile("vrangepd $0x12,%zmm28,%zmm29,%zmm30"); 1112 1113 /* AVX-512: Op code 0f 3a 51 */ 1114 1115 asm volatile("vrangess $0x12,%xmm25,%xmm26,%xmm27"); 1116 asm volatile("vrangesd $0x12,%xmm28,%xmm29,%xmm30"); 1117 1118 /* AVX-512: Op code 0f 3a 54 */ 1119 1120 asm volatile("vfixupimmps $0x12,%zmm28,%zmm29,%zmm30"); 1121 asm volatile("vfixupimmpd $0x12,%zmm25,%zmm26,%zmm27"); 1122 1123 /* AVX-512: Op code 0f 3a 55 */ 1124 1125 asm volatile("vfixupimmss $0x12,%xmm28,%xmm29,%xmm30{%k7}"); 1126 asm volatile("vfixupimmsd $0x12,%xmm25,%xmm26,%xmm27{%k7}"); 1127 1128 /* AVX-512: Op code 0f 3a 56 */ 1129 1130 asm volatile("vreduceps $0x12,%zmm26,%zmm27"); 1131 asm volatile("vreducepd $0x12,%zmm29,%zmm30"); 1132 1133 /* AVX-512: Op code 0f 3a 57 */ 1134 1135 asm volatile("vreducess $0x12,%xmm25,%xmm26,%xmm27"); 1136 asm volatile("vreducesd $0x12,%xmm28,%xmm29,%xmm30"); 1137 1138 /* AVX-512: Op code 0f 3a 66 */ 1139 1140 asm volatile("vfpclassps $0x12,%zmm27,%k5"); 1141 asm volatile("vfpclasspd $0x12,%zmm30,%k5"); 1142 1143 /* AVX-512: Op code 0f 3a 67 */ 1144 1145 asm volatile("vfpclassss $0x12,%xmm27,%k5"); 1146 asm volatile("vfpclasssd $0x12,%xmm30,%k5"); 1147 1148 /* AVX-512: Op code 0f 3a 70 */ 1149 1150 asm volatile("vpshldw $0x12,%xmm1,%xmm2,%xmm3"); 1151 asm 
volatile("vpshldw $0x12,%ymm1,%ymm2,%ymm3"); 1152 asm volatile("vpshldw $0x12,%zmm1,%zmm2,%zmm3"); 1153 asm volatile("vpshldw $0x12,%zmm25,%zmm26,%zmm27"); 1154 1155 /* AVX-512: Op code 0f 3a 71 */ 1156 1157 asm volatile("vpshldd $0x12,%xmm1,%xmm2,%xmm3"); 1158 asm volatile("vpshldd $0x12,%ymm1,%ymm2,%ymm3"); 1159 asm volatile("vpshldd $0x12,%zmm1,%zmm2,%zmm3"); 1160 asm volatile("vpshldd $0x12,%zmm25,%zmm26,%zmm27"); 1161 1162 asm volatile("vpshldq $0x12,%xmm1,%xmm2,%xmm3"); 1163 asm volatile("vpshldq $0x12,%ymm1,%ymm2,%ymm3"); 1164 asm volatile("vpshldq $0x12,%zmm1,%zmm2,%zmm3"); 1165 asm volatile("vpshldq $0x12,%zmm25,%zmm26,%zmm27"); 1166 1167 /* AVX-512: Op code 0f 3a 72 */ 1168 1169 asm volatile("vpshrdw $0x12,%xmm1,%xmm2,%xmm3"); 1170 asm volatile("vpshrdw $0x12,%ymm1,%ymm2,%ymm3"); 1171 asm volatile("vpshrdw $0x12,%zmm1,%zmm2,%zmm3"); 1172 asm volatile("vpshrdw $0x12,%zmm25,%zmm26,%zmm27"); 1173 1174 /* AVX-512: Op code 0f 3a 73 */ 1175 1176 asm volatile("vpshrdd $0x12,%xmm1,%xmm2,%xmm3"); 1177 asm volatile("vpshrdd $0x12,%ymm1,%ymm2,%ymm3"); 1178 asm volatile("vpshrdd $0x12,%zmm1,%zmm2,%zmm3"); 1179 asm volatile("vpshrdd $0x12,%zmm25,%zmm26,%zmm27"); 1180 1181 asm volatile("vpshrdq $0x12,%xmm1,%xmm2,%xmm3"); 1182 asm volatile("vpshrdq $0x12,%ymm1,%ymm2,%ymm3"); 1183 asm volatile("vpshrdq $0x12,%zmm1,%zmm2,%zmm3"); 1184 asm volatile("vpshrdq $0x12,%zmm25,%zmm26,%zmm27"); 1185 1186 /* AVX-512: Op code 0f 3a ce */ 1187 1188 asm volatile("gf2p8affineqb $0x12,%xmm1,%xmm3"); 1189 1190 asm volatile("vgf2p8affineqb $0x12,%xmm1,%xmm2,%xmm3"); 1191 asm volatile("vgf2p8affineqb $0x12,%ymm1,%ymm2,%ymm3"); 1192 asm volatile("vgf2p8affineqb $0x12,%zmm1,%zmm2,%zmm3"); 1193 asm volatile("vgf2p8affineqb $0x12,%zmm25,%zmm26,%zmm27"); 1194 1195 /* AVX-512: Op code 0f 3a cf */ 1196 1197 asm volatile("gf2p8affineinvqb $0x12,%xmm1,%xmm3"); 1198 1199 asm volatile("vgf2p8affineinvqb $0x12,%xmm1,%xmm2,%xmm3"); 1200 asm volatile("vgf2p8affineinvqb $0x12,%ymm1,%ymm2,%ymm3"); 1201 
asm volatile("vgf2p8affineinvqb $0x12,%zmm1,%zmm2,%zmm3"); 1202 asm volatile("vgf2p8affineinvqb $0x12,%zmm25,%zmm26,%zmm27"); 1203 1204 /* AVX-512: Op code 0f 72 (Grp13) */ 1205 1206 asm volatile("vprord $0x12,%zmm25,%zmm26"); 1207 asm volatile("vprorq $0x12,%zmm25,%zmm26"); 1208 asm volatile("vprold $0x12,%zmm29,%zmm30"); 1209 asm volatile("vprolq $0x12,%zmm29,%zmm30"); 1210 asm volatile("psrad $0x2,%mm6"); 1211 asm volatile("vpsrad $0x5,%ymm6,%ymm2"); 1212 asm volatile("vpsrad $0x5,%zmm26,%zmm22"); 1213 asm volatile("vpsraq $0x5,%zmm26,%zmm22"); 1214 1215 /* AVX-512: Op code 0f 38 c6 (Grp18) */ 1216 1217 asm volatile("vgatherpf0dps 0x7b(%r14,%zmm31,8){%k1}"); 1218 asm volatile("vgatherpf0dpd 0x7b(%r14,%ymm31,8){%k1}"); 1219 asm volatile("vgatherpf1dps 0x7b(%r14,%zmm31,8){%k1}"); 1220 asm volatile("vgatherpf1dpd 0x7b(%r14,%ymm31,8){%k1}"); 1221 asm volatile("vscatterpf0dps 0x7b(%r14,%zmm31,8){%k1}"); 1222 asm volatile("vscatterpf0dpd 0x7b(%r14,%ymm31,8){%k1}"); 1223 asm volatile("vscatterpf1dps 0x7b(%r14,%zmm31,8){%k1}"); 1224 asm volatile("vscatterpf1dpd 0x7b(%r14,%ymm31,8){%k1}"); 1225 1226 /* AVX-512: Op code 0f 38 c7 (Grp19) */ 1227 1228 asm volatile("vgatherpf0qps 0x7b(%r14,%zmm31,8){%k1}"); 1229 asm volatile("vgatherpf0qpd 0x7b(%r14,%zmm31,8){%k1}"); 1230 asm volatile("vgatherpf1qps 0x7b(%r14,%zmm31,8){%k1}"); 1231 asm volatile("vgatherpf1qpd 0x7b(%r14,%zmm31,8){%k1}"); 1232 asm volatile("vscatterpf0qps 0x7b(%r14,%zmm31,8){%k1}"); 1233 asm volatile("vscatterpf0qpd 0x7b(%r14,%zmm31,8){%k1}"); 1234 asm volatile("vscatterpf1qps 0x7b(%r14,%zmm31,8){%k1}"); 1235 asm volatile("vscatterpf1qpd 0x7b(%r14,%zmm31,8){%k1}"); 1236 1237 /* AVX-512: Examples */ 1238 1239 asm volatile("vaddpd %zmm28,%zmm29,%zmm30"); 1240 asm volatile("vaddpd %zmm28,%zmm29,%zmm30{%k7}"); 1241 asm volatile("vaddpd %zmm28,%zmm29,%zmm30{%k7}{z}"); 1242 asm volatile("vaddpd {rn-sae},%zmm28,%zmm29,%zmm30"); 1243 asm volatile("vaddpd {ru-sae},%zmm28,%zmm29,%zmm30"); 1244 asm volatile("vaddpd 
{rd-sae},%zmm28,%zmm29,%zmm30"); 1245 asm volatile("vaddpd {rz-sae},%zmm28,%zmm29,%zmm30"); 1246 asm volatile("vaddpd (%rcx),%zmm29,%zmm30"); 1247 asm volatile("vaddpd 0x123(%rax,%r14,8),%zmm29,%zmm30"); 1248 asm volatile("vaddpd (%rcx){1to8},%zmm29,%zmm30"); 1249 asm volatile("vaddpd 0x1fc0(%rdx),%zmm29,%zmm30"); 1250 asm volatile("vaddpd 0x3f8(%rdx){1to8},%zmm29,%zmm30"); 1251 asm volatile("vcmpeq_uqps 0x1fc(%rdx){1to16},%zmm30,%k5"); 1252 asm volatile("vcmpltsd 0x123(%rax,%r14,8),%xmm29,%k5{%k7}"); 1253 asm volatile("vcmplesd {sae},%xmm28,%xmm29,%k5{%k7}"); 1254 asm volatile("vgetmantss $0x5b,0x123(%rax,%r14,8),%xmm29,%xmm30{%k7}"); 1255 1256 /* bndmk m64, bnd */ 1257 1258 asm volatile("bndmk (%rax), %bnd0"); 1259 asm volatile("bndmk (%r8), %bnd0"); 1260 asm volatile("bndmk (0x12345678), %bnd0"); 1261 asm volatile("bndmk (%rax), %bnd3"); 1262 asm volatile("bndmk (%rcx,%rax,1), %bnd0"); 1263 asm volatile("bndmk 0x12345678(,%rax,1), %bnd0"); 1264 asm volatile("bndmk (%rax,%rcx,1), %bnd0"); 1265 asm volatile("bndmk (%rax,%rcx,8), %bnd0"); 1266 asm volatile("bndmk 0x12(%rax), %bnd0"); 1267 asm volatile("bndmk 0x12(%rbp), %bnd0"); 1268 asm volatile("bndmk 0x12(%rcx,%rax,1), %bnd0"); 1269 asm volatile("bndmk 0x12(%rbp,%rax,1), %bnd0"); 1270 asm volatile("bndmk 0x12(%rax,%rcx,1), %bnd0"); 1271 asm volatile("bndmk 0x12(%rax,%rcx,8), %bnd0"); 1272 asm volatile("bndmk 0x12345678(%rax), %bnd0"); 1273 asm volatile("bndmk 0x12345678(%rbp), %bnd0"); 1274 asm volatile("bndmk 0x12345678(%rcx,%rax,1), %bnd0"); 1275 asm volatile("bndmk 0x12345678(%rbp,%rax,1), %bnd0"); 1276 asm volatile("bndmk 0x12345678(%rax,%rcx,1), %bnd0"); 1277 asm volatile("bndmk 0x12345678(%rax,%rcx,8), %bnd0"); 1278 1279 /* bndcl r/m64, bnd */ 1280 1281 asm volatile("bndcl (%rax), %bnd0"); 1282 asm volatile("bndcl (%r8), %bnd0"); 1283 asm volatile("bndcl (0x12345678), %bnd0"); 1284 asm volatile("bndcl (%rax), %bnd3"); 1285 asm volatile("bndcl (%rcx,%rax,1), %bnd0"); 1286 asm volatile("bndcl 
0x12345678(,%rax,1), %bnd0"); 1287 asm volatile("bndcl (%rax,%rcx,1), %bnd0"); 1288 asm volatile("bndcl (%rax,%rcx,8), %bnd0"); 1289 asm volatile("bndcl 0x12(%rax), %bnd0"); 1290 asm volatile("bndcl 0x12(%rbp), %bnd0"); 1291 asm volatile("bndcl 0x12(%rcx,%rax,1), %bnd0"); 1292 asm volatile("bndcl 0x12(%rbp,%rax,1), %bnd0"); 1293 asm volatile("bndcl 0x12(%rax,%rcx,1), %bnd0"); 1294 asm volatile("bndcl 0x12(%rax,%rcx,8), %bnd0"); 1295 asm volatile("bndcl 0x12345678(%rax), %bnd0"); 1296 asm volatile("bndcl 0x12345678(%rbp), %bnd0"); 1297 asm volatile("bndcl 0x12345678(%rcx,%rax,1), %bnd0"); 1298 asm volatile("bndcl 0x12345678(%rbp,%rax,1), %bnd0"); 1299 asm volatile("bndcl 0x12345678(%rax,%rcx,1), %bnd0"); 1300 asm volatile("bndcl 0x12345678(%rax,%rcx,8), %bnd0"); 1301 asm volatile("bndcl %rax, %bnd0"); 1302 1303 /* bndcu r/m64, bnd */ 1304 1305 asm volatile("bndcu (%rax), %bnd0"); 1306 asm volatile("bndcu (%r8), %bnd0"); 1307 asm volatile("bndcu (0x12345678), %bnd0"); 1308 asm volatile("bndcu (%rax), %bnd3"); 1309 asm volatile("bndcu (%rcx,%rax,1), %bnd0"); 1310 asm volatile("bndcu 0x12345678(,%rax,1), %bnd0"); 1311 asm volatile("bndcu (%rax,%rcx,1), %bnd0"); 1312 asm volatile("bndcu (%rax,%rcx,8), %bnd0"); 1313 asm volatile("bndcu 0x12(%rax), %bnd0"); 1314 asm volatile("bndcu 0x12(%rbp), %bnd0"); 1315 asm volatile("bndcu 0x12(%rcx,%rax,1), %bnd0"); 1316 asm volatile("bndcu 0x12(%rbp,%rax,1), %bnd0"); 1317 asm volatile("bndcu 0x12(%rax,%rcx,1), %bnd0"); 1318 asm volatile("bndcu 0x12(%rax,%rcx,8), %bnd0"); 1319 asm volatile("bndcu 0x12345678(%rax), %bnd0"); 1320 asm volatile("bndcu 0x12345678(%rbp), %bnd0"); 1321 asm volatile("bndcu 0x12345678(%rcx,%rax,1), %bnd0"); 1322 asm volatile("bndcu 0x12345678(%rbp,%rax,1), %bnd0"); 1323 asm volatile("bndcu 0x12345678(%rax,%rcx,1), %bnd0"); 1324 asm volatile("bndcu 0x12345678(%rax,%rcx,8), %bnd0"); 1325 asm volatile("bndcu %rax, %bnd0"); 1326 1327 /* bndcn r/m64, bnd */ 1328 1329 asm volatile("bndcn (%rax), %bnd0"); 1330 asm 
volatile("bndcn (%r8), %bnd0"); 1331 asm volatile("bndcn (0x12345678), %bnd0"); 1332 asm volatile("bndcn (%rax), %bnd3"); 1333 asm volatile("bndcn (%rcx,%rax,1), %bnd0"); 1334 asm volatile("bndcn 0x12345678(,%rax,1), %bnd0"); 1335 asm volatile("bndcn (%rax,%rcx,1), %bnd0"); 1336 asm volatile("bndcn (%rax,%rcx,8), %bnd0"); 1337 asm volatile("bndcn 0x12(%rax), %bnd0"); 1338 asm volatile("bndcn 0x12(%rbp), %bnd0"); 1339 asm volatile("bndcn 0x12(%rcx,%rax,1), %bnd0"); 1340 asm volatile("bndcn 0x12(%rbp,%rax,1), %bnd0"); 1341 asm volatile("bndcn 0x12(%rax,%rcx,1), %bnd0"); 1342 asm volatile("bndcn 0x12(%rax,%rcx,8), %bnd0"); 1343 asm volatile("bndcn 0x12345678(%rax), %bnd0"); 1344 asm volatile("bndcn 0x12345678(%rbp), %bnd0"); 1345 asm volatile("bndcn 0x12345678(%rcx,%rax,1), %bnd0"); 1346 asm volatile("bndcn 0x12345678(%rbp,%rax,1), %bnd0"); 1347 asm volatile("bndcn 0x12345678(%rax,%rcx,1), %bnd0"); 1348 asm volatile("bndcn 0x12345678(%rax,%rcx,8), %bnd0"); 1349 asm volatile("bndcn %rax, %bnd0"); 1350 1351 /* bndmov m128, bnd */ 1352 1353 asm volatile("bndmov (%rax), %bnd0"); 1354 asm volatile("bndmov (%r8), %bnd0"); 1355 asm volatile("bndmov (0x12345678), %bnd0"); 1356 asm volatile("bndmov (%rax), %bnd3"); 1357 asm volatile("bndmov (%rcx,%rax,1), %bnd0"); 1358 asm volatile("bndmov 0x12345678(,%rax,1), %bnd0"); 1359 asm volatile("bndmov (%rax,%rcx,1), %bnd0"); 1360 asm volatile("bndmov (%rax,%rcx,8), %bnd0"); 1361 asm volatile("bndmov 0x12(%rax), %bnd0"); 1362 asm volatile("bndmov 0x12(%rbp), %bnd0"); 1363 asm volatile("bndmov 0x12(%rcx,%rax,1), %bnd0"); 1364 asm volatile("bndmov 0x12(%rbp,%rax,1), %bnd0"); 1365 asm volatile("bndmov 0x12(%rax,%rcx,1), %bnd0"); 1366 asm volatile("bndmov 0x12(%rax,%rcx,8), %bnd0"); 1367 asm volatile("bndmov 0x12345678(%rax), %bnd0"); 1368 asm volatile("bndmov 0x12345678(%rbp), %bnd0"); 1369 asm volatile("bndmov 0x12345678(%rcx,%rax,1), %bnd0"); 1370 asm volatile("bndmov 0x12345678(%rbp,%rax,1), %bnd0"); 1371 asm volatile("bndmov 
0x12345678(%rax,%rcx,1), %bnd0"); 1372 asm volatile("bndmov 0x12345678(%rax,%rcx,8), %bnd0"); 1373 1374 /* bndmov bnd, m128 */ 1375 1376 asm volatile("bndmov %bnd0, (%rax)"); 1377 asm volatile("bndmov %bnd0, (%r8)"); 1378 asm volatile("bndmov %bnd0, (0x12345678)"); 1379 asm volatile("bndmov %bnd3, (%rax)"); 1380 asm volatile("bndmov %bnd0, (%rcx,%rax,1)"); 1381 asm volatile("bndmov %bnd0, 0x12345678(,%rax,1)"); 1382 asm volatile("bndmov %bnd0, (%rax,%rcx,1)"); 1383 asm volatile("bndmov %bnd0, (%rax,%rcx,8)"); 1384 asm volatile("bndmov %bnd0, 0x12(%rax)"); 1385 asm volatile("bndmov %bnd0, 0x12(%rbp)"); 1386 asm volatile("bndmov %bnd0, 0x12(%rcx,%rax,1)"); 1387 asm volatile("bndmov %bnd0, 0x12(%rbp,%rax,1)"); 1388 asm volatile("bndmov %bnd0, 0x12(%rax,%rcx,1)"); 1389 asm volatile("bndmov %bnd0, 0x12(%rax,%rcx,8)"); 1390 asm volatile("bndmov %bnd0, 0x12345678(%rax)"); 1391 asm volatile("bndmov %bnd0, 0x12345678(%rbp)"); 1392 asm volatile("bndmov %bnd0, 0x12345678(%rcx,%rax,1)"); 1393 asm volatile("bndmov %bnd0, 0x12345678(%rbp,%rax,1)"); 1394 asm volatile("bndmov %bnd0, 0x12345678(%rax,%rcx,1)"); 1395 asm volatile("bndmov %bnd0, 0x12345678(%rax,%rcx,8)"); 1396 1397 /* bndmov bnd2, bnd1 */ 1398 1399 asm volatile("bndmov %bnd0, %bnd1"); 1400 asm volatile("bndmov %bnd1, %bnd0"); 1401 1402 /* bndldx mib, bnd */ 1403 1404 asm volatile("bndldx (%rax), %bnd0"); 1405 asm volatile("bndldx (%r8), %bnd0"); 1406 asm volatile("bndldx (0x12345678), %bnd0"); 1407 asm volatile("bndldx (%rax), %bnd3"); 1408 asm volatile("bndldx (%rcx,%rax,1), %bnd0"); 1409 asm volatile("bndldx 0x12345678(,%rax,1), %bnd0"); 1410 asm volatile("bndldx (%rax,%rcx,1), %bnd0"); 1411 asm volatile("bndldx 0x12(%rax), %bnd0"); 1412 asm volatile("bndldx 0x12(%rbp), %bnd0"); 1413 asm volatile("bndldx 0x12(%rcx,%rax,1), %bnd0"); 1414 asm volatile("bndldx 0x12(%rbp,%rax,1), %bnd0"); 1415 asm volatile("bndldx 0x12(%rax,%rcx,1), %bnd0"); 1416 asm volatile("bndldx 0x12345678(%rax), %bnd0"); 1417 asm volatile("bndldx 
0x12345678(%rbp), %bnd0"); 1418 asm volatile("bndldx 0x12345678(%rcx,%rax,1), %bnd0"); 1419 asm volatile("bndldx 0x12345678(%rbp,%rax,1), %bnd0"); 1420 asm volatile("bndldx 0x12345678(%rax,%rcx,1), %bnd0"); 1421 1422 /* bndstx bnd, mib */ 1423 1424 asm volatile("bndstx %bnd0, (%rax)"); 1425 asm volatile("bndstx %bnd0, (%r8)"); 1426 asm volatile("bndstx %bnd0, (0x12345678)"); 1427 asm volatile("bndstx %bnd3, (%rax)"); 1428 asm volatile("bndstx %bnd0, (%rcx,%rax,1)"); 1429 asm volatile("bndstx %bnd0, 0x12345678(,%rax,1)"); 1430 asm volatile("bndstx %bnd0, (%rax,%rcx,1)"); 1431 asm volatile("bndstx %bnd0, 0x12(%rax)"); 1432 asm volatile("bndstx %bnd0, 0x12(%rbp)"); 1433 asm volatile("bndstx %bnd0, 0x12(%rcx,%rax,1)"); 1434 asm volatile("bndstx %bnd0, 0x12(%rbp,%rax,1)"); 1435 asm volatile("bndstx %bnd0, 0x12(%rax,%rcx,1)"); 1436 asm volatile("bndstx %bnd0, 0x12345678(%rax)"); 1437 asm volatile("bndstx %bnd0, 0x12345678(%rbp)"); 1438 asm volatile("bndstx %bnd0, 0x12345678(%rcx,%rax,1)"); 1439 asm volatile("bndstx %bnd0, 0x12345678(%rbp,%rax,1)"); 1440 asm volatile("bndstx %bnd0, 0x12345678(%rax,%rcx,1)"); 1441 1442 /* bnd prefix on call, ret, jmp and all jcc */ 1443 1444 asm volatile("bnd call label1"); /* Expecting: call unconditional 0 */ 1445 asm volatile("bnd call *(%eax)"); /* Expecting: call indirect 0 */ 1446 asm volatile("bnd ret"); /* Expecting: ret indirect 0 */ 1447 asm volatile("bnd jmp label1"); /* Expecting: jmp unconditional 0 */ 1448 asm volatile("bnd jmp label1"); /* Expecting: jmp unconditional 0 */ 1449 asm volatile("bnd jmp *(%ecx)"); /* Expecting: jmp indirect 0 */ 1450 asm volatile("bnd jne label1"); /* Expecting: jcc conditional 0 */ 1451 1452 /* sha1rnds4 imm8, xmm2/m128, xmm1 */ 1453 1454 asm volatile("sha1rnds4 $0x0, %xmm1, %xmm0"); 1455 asm volatile("sha1rnds4 $0x91, %xmm7, %xmm2"); 1456 asm volatile("sha1rnds4 $0x91, %xmm8, %xmm0"); 1457 asm volatile("sha1rnds4 $0x91, %xmm7, %xmm8"); 1458 asm volatile("sha1rnds4 $0x91, %xmm15, %xmm8"); 1459 
asm volatile("sha1rnds4 $0x91, (%rax), %xmm0"); 1460 asm volatile("sha1rnds4 $0x91, (%r8), %xmm0"); 1461 asm volatile("sha1rnds4 $0x91, (0x12345678), %xmm0"); 1462 asm volatile("sha1rnds4 $0x91, (%rax), %xmm3"); 1463 asm volatile("sha1rnds4 $0x91, (%rcx,%rax,1), %xmm0"); 1464 asm volatile("sha1rnds4 $0x91, 0x12345678(,%rax,1), %xmm0"); 1465 asm volatile("sha1rnds4 $0x91, (%rax,%rcx,1), %xmm0"); 1466 asm volatile("sha1rnds4 $0x91, (%rax,%rcx,8), %xmm0"); 1467 asm volatile("sha1rnds4 $0x91, 0x12(%rax), %xmm0"); 1468 asm volatile("sha1rnds4 $0x91, 0x12(%rbp), %xmm0"); 1469 asm volatile("sha1rnds4 $0x91, 0x12(%rcx,%rax,1), %xmm0"); 1470 asm volatile("sha1rnds4 $0x91, 0x12(%rbp,%rax,1), %xmm0"); 1471 asm volatile("sha1rnds4 $0x91, 0x12(%rax,%rcx,1), %xmm0"); 1472 asm volatile("sha1rnds4 $0x91, 0x12(%rax,%rcx,8), %xmm0"); 1473 asm volatile("sha1rnds4 $0x91, 0x12345678(%rax), %xmm0"); 1474 asm volatile("sha1rnds4 $0x91, 0x12345678(%rbp), %xmm0"); 1475 asm volatile("sha1rnds4 $0x91, 0x12345678(%rcx,%rax,1), %xmm0"); 1476 asm volatile("sha1rnds4 $0x91, 0x12345678(%rbp,%rax,1), %xmm0"); 1477 asm volatile("sha1rnds4 $0x91, 0x12345678(%rax,%rcx,1), %xmm0"); 1478 asm volatile("sha1rnds4 $0x91, 0x12345678(%rax,%rcx,8), %xmm0"); 1479 asm volatile("sha1rnds4 $0x91, 0x12345678(%rax,%rcx,8), %xmm15"); 1480 1481 /* sha1nexte xmm2/m128, xmm1 */ 1482 1483 asm volatile("sha1nexte %xmm1, %xmm0"); 1484 asm volatile("sha1nexte %xmm7, %xmm2"); 1485 asm volatile("sha1nexte %xmm8, %xmm0"); 1486 asm volatile("sha1nexte %xmm7, %xmm8"); 1487 asm volatile("sha1nexte %xmm15, %xmm8"); 1488 asm volatile("sha1nexte (%rax), %xmm0"); 1489 asm volatile("sha1nexte (%r8), %xmm0"); 1490 asm volatile("sha1nexte (0x12345678), %xmm0"); 1491 asm volatile("sha1nexte (%rax), %xmm3"); 1492 asm volatile("sha1nexte (%rcx,%rax,1), %xmm0"); 1493 asm volatile("sha1nexte 0x12345678(,%rax,1), %xmm0"); 1494 asm volatile("sha1nexte (%rax,%rcx,1), %xmm0"); 1495 asm volatile("sha1nexte (%rax,%rcx,8), %xmm0"); 1496 asm 
volatile("sha1nexte 0x12(%rax), %xmm0"); 1497 asm volatile("sha1nexte 0x12(%rbp), %xmm0"); 1498 asm volatile("sha1nexte 0x12(%rcx,%rax,1), %xmm0"); 1499 asm volatile("sha1nexte 0x12(%rbp,%rax,1), %xmm0"); 1500 asm volatile("sha1nexte 0x12(%rax,%rcx,1), %xmm0"); 1501 asm volatile("sha1nexte 0x12(%rax,%rcx,8), %xmm0"); 1502 asm volatile("sha1nexte 0x12345678(%rax), %xmm0"); 1503 asm volatile("sha1nexte 0x12345678(%rbp), %xmm0"); 1504 asm volatile("sha1nexte 0x12345678(%rcx,%rax,1), %xmm0"); 1505 asm volatile("sha1nexte 0x12345678(%rbp,%rax,1), %xmm0"); 1506 asm volatile("sha1nexte 0x12345678(%rax,%rcx,1), %xmm0"); 1507 asm volatile("sha1nexte 0x12345678(%rax,%rcx,8), %xmm0"); 1508 asm volatile("sha1nexte 0x12345678(%rax,%rcx,8), %xmm15"); 1509 1510 /* sha1msg1 xmm2/m128, xmm1 */ 1511 1512 asm volatile("sha1msg1 %xmm1, %xmm0"); 1513 asm volatile("sha1msg1 %xmm7, %xmm2"); 1514 asm volatile("sha1msg1 %xmm8, %xmm0"); 1515 asm volatile("sha1msg1 %xmm7, %xmm8"); 1516 asm volatile("sha1msg1 %xmm15, %xmm8"); 1517 asm volatile("sha1msg1 (%rax), %xmm0"); 1518 asm volatile("sha1msg1 (%r8), %xmm0"); 1519 asm volatile("sha1msg1 (0x12345678), %xmm0"); 1520 asm volatile("sha1msg1 (%rax), %xmm3"); 1521 asm volatile("sha1msg1 (%rcx,%rax,1), %xmm0"); 1522 asm volatile("sha1msg1 0x12345678(,%rax,1), %xmm0"); 1523 asm volatile("sha1msg1 (%rax,%rcx,1), %xmm0"); 1524 asm volatile("sha1msg1 (%rax,%rcx,8), %xmm0"); 1525 asm volatile("sha1msg1 0x12(%rax), %xmm0"); 1526 asm volatile("sha1msg1 0x12(%rbp), %xmm0"); 1527 asm volatile("sha1msg1 0x12(%rcx,%rax,1), %xmm0"); 1528 asm volatile("sha1msg1 0x12(%rbp,%rax,1), %xmm0"); 1529 asm volatile("sha1msg1 0x12(%rax,%rcx,1), %xmm0"); 1530 asm volatile("sha1msg1 0x12(%rax,%rcx,8), %xmm0"); 1531 asm volatile("sha1msg1 0x12345678(%rax), %xmm0"); 1532 asm volatile("sha1msg1 0x12345678(%rbp), %xmm0"); 1533 asm volatile("sha1msg1 0x12345678(%rcx,%rax,1), %xmm0"); 1534 asm volatile("sha1msg1 0x12345678(%rbp,%rax,1), %xmm0"); 1535 asm volatile("sha1msg1 
0x12345678(%rax,%rcx,1), %xmm0"); 1536 asm volatile("sha1msg1 0x12345678(%rax,%rcx,8), %xmm0"); 1537 asm volatile("sha1msg1 0x12345678(%rax,%rcx,8), %xmm15"); 1538 1539 /* sha1msg2 xmm2/m128, xmm1 */ 1540 1541 asm volatile("sha1msg2 %xmm1, %xmm0"); 1542 asm volatile("sha1msg2 %xmm7, %xmm2"); 1543 asm volatile("sha1msg2 %xmm8, %xmm0"); 1544 asm volatile("sha1msg2 %xmm7, %xmm8"); 1545 asm volatile("sha1msg2 %xmm15, %xmm8"); 1546 asm volatile("sha1msg2 (%rax), %xmm0"); 1547 asm volatile("sha1msg2 (%r8), %xmm0"); 1548 asm volatile("sha1msg2 (0x12345678), %xmm0"); 1549 asm volatile("sha1msg2 (%rax), %xmm3"); 1550 asm volatile("sha1msg2 (%rcx,%rax,1), %xmm0"); 1551 asm volatile("sha1msg2 0x12345678(,%rax,1), %xmm0"); 1552 asm volatile("sha1msg2 (%rax,%rcx,1), %xmm0"); 1553 asm volatile("sha1msg2 (%rax,%rcx,8), %xmm0"); 1554 asm volatile("sha1msg2 0x12(%rax), %xmm0"); 1555 asm volatile("sha1msg2 0x12(%rbp), %xmm0"); 1556 asm volatile("sha1msg2 0x12(%rcx,%rax,1), %xmm0"); 1557 asm volatile("sha1msg2 0x12(%rbp,%rax,1), %xmm0"); 1558 asm volatile("sha1msg2 0x12(%rax,%rcx,1), %xmm0"); 1559 asm volatile("sha1msg2 0x12(%rax,%rcx,8), %xmm0"); 1560 asm volatile("sha1msg2 0x12345678(%rax), %xmm0"); 1561 asm volatile("sha1msg2 0x12345678(%rbp), %xmm0"); 1562 asm volatile("sha1msg2 0x12345678(%rcx,%rax,1), %xmm0"); 1563 asm volatile("sha1msg2 0x12345678(%rbp,%rax,1), %xmm0"); 1564 asm volatile("sha1msg2 0x12345678(%rax,%rcx,1), %xmm0"); 1565 asm volatile("sha1msg2 0x12345678(%rax,%rcx,8), %xmm0"); 1566 asm volatile("sha1msg2 0x12345678(%rax,%rcx,8), %xmm15"); 1567 1568 /* sha256rnds2 <XMM0>, xmm2/m128, xmm1 */ 1569 /* Note sha256rnds2 has an implicit operand 'xmm0' */ 1570 1571 asm volatile("sha256rnds2 %xmm4, %xmm1"); 1572 asm volatile("sha256rnds2 %xmm7, %xmm2"); 1573 asm volatile("sha256rnds2 %xmm8, %xmm1"); 1574 asm volatile("sha256rnds2 %xmm7, %xmm8"); 1575 asm volatile("sha256rnds2 %xmm15, %xmm8"); 1576 asm volatile("sha256rnds2 (%rax), %xmm1"); 1577 asm volatile("sha256rnds2 
(%r8), %xmm1"); 1578 asm volatile("sha256rnds2 (0x12345678), %xmm1"); 1579 asm volatile("sha256rnds2 (%rax), %xmm3"); 1580 asm volatile("sha256rnds2 (%rcx,%rax,1), %xmm1"); 1581 asm volatile("sha256rnds2 0x12345678(,%rax,1), %xmm1"); 1582 asm volatile("sha256rnds2 (%rax,%rcx,1), %xmm1"); 1583 asm volatile("sha256rnds2 (%rax,%rcx,8), %xmm1"); 1584 asm volatile("sha256rnds2 0x12(%rax), %xmm1"); 1585 asm volatile("sha256rnds2 0x12(%rbp), %xmm1"); 1586 asm volatile("sha256rnds2 0x12(%rcx,%rax,1), %xmm1"); 1587 asm volatile("sha256rnds2 0x12(%rbp,%rax,1), %xmm1"); 1588 asm volatile("sha256rnds2 0x12(%rax,%rcx,1), %xmm1"); 1589 asm volatile("sha256rnds2 0x12(%rax,%rcx,8), %xmm1"); 1590 asm volatile("sha256rnds2 0x12345678(%rax), %xmm1"); 1591 asm volatile("sha256rnds2 0x12345678(%rbp), %xmm1"); 1592 asm volatile("sha256rnds2 0x12345678(%rcx,%rax,1), %xmm1"); 1593 asm volatile("sha256rnds2 0x12345678(%rbp,%rax,1), %xmm1"); 1594 asm volatile("sha256rnds2 0x12345678(%rax,%rcx,1), %xmm1"); 1595 asm volatile("sha256rnds2 0x12345678(%rax,%rcx,8), %xmm1"); 1596 asm volatile("sha256rnds2 0x12345678(%rax,%rcx,8), %xmm15"); 1597 1598 /* sha256msg1 xmm2/m128, xmm1 */ 1599 1600 asm volatile("sha256msg1 %xmm1, %xmm0"); 1601 asm volatile("sha256msg1 %xmm7, %xmm2"); 1602 asm volatile("sha256msg1 %xmm8, %xmm0"); 1603 asm volatile("sha256msg1 %xmm7, %xmm8"); 1604 asm volatile("sha256msg1 %xmm15, %xmm8"); 1605 asm volatile("sha256msg1 (%rax), %xmm0"); 1606 asm volatile("sha256msg1 (%r8), %xmm0"); 1607 asm volatile("sha256msg1 (0x12345678), %xmm0"); 1608 asm volatile("sha256msg1 (%rax), %xmm3"); 1609 asm volatile("sha256msg1 (%rcx,%rax,1), %xmm0"); 1610 asm volatile("sha256msg1 0x12345678(,%rax,1), %xmm0"); 1611 asm volatile("sha256msg1 (%rax,%rcx,1), %xmm0"); 1612 asm volatile("sha256msg1 (%rax,%rcx,8), %xmm0"); 1613 asm volatile("sha256msg1 0x12(%rax), %xmm0"); 1614 asm volatile("sha256msg1 0x12(%rbp), %xmm0"); 1615 asm volatile("sha256msg1 0x12(%rcx,%rax,1), %xmm0"); 1616 asm 
volatile("sha256msg1 0x12(%rbp,%rax,1), %xmm0"); 1617 asm volatile("sha256msg1 0x12(%rax,%rcx,1), %xmm0"); 1618 asm volatile("sha256msg1 0x12(%rax,%rcx,8), %xmm0"); 1619 asm volatile("sha256msg1 0x12345678(%rax), %xmm0"); 1620 asm volatile("sha256msg1 0x12345678(%rbp), %xmm0"); 1621 asm volatile("sha256msg1 0x12345678(%rcx,%rax,1), %xmm0"); 1622 asm volatile("sha256msg1 0x12345678(%rbp,%rax,1), %xmm0"); 1623 asm volatile("sha256msg1 0x12345678(%rax,%rcx,1), %xmm0"); 1624 asm volatile("sha256msg1 0x12345678(%rax,%rcx,8), %xmm0"); 1625 asm volatile("sha256msg1 0x12345678(%rax,%rcx,8), %xmm15"); 1626 1627 /* sha256msg2 xmm2/m128, xmm1 */ 1628 1629 asm volatile("sha256msg2 %xmm1, %xmm0"); 1630 asm volatile("sha256msg2 %xmm7, %xmm2"); 1631 asm volatile("sha256msg2 %xmm8, %xmm0"); 1632 asm volatile("sha256msg2 %xmm7, %xmm8"); 1633 asm volatile("sha256msg2 %xmm15, %xmm8"); 1634 asm volatile("sha256msg2 (%rax), %xmm0"); 1635 asm volatile("sha256msg2 (%r8), %xmm0"); 1636 asm volatile("sha256msg2 (0x12345678), %xmm0"); 1637 asm volatile("sha256msg2 (%rax), %xmm3"); 1638 asm volatile("sha256msg2 (%rcx,%rax,1), %xmm0"); 1639 asm volatile("sha256msg2 0x12345678(,%rax,1), %xmm0"); 1640 asm volatile("sha256msg2 (%rax,%rcx,1), %xmm0"); 1641 asm volatile("sha256msg2 (%rax,%rcx,8), %xmm0"); 1642 asm volatile("sha256msg2 0x12(%rax), %xmm0"); 1643 asm volatile("sha256msg2 0x12(%rbp), %xmm0"); 1644 asm volatile("sha256msg2 0x12(%rcx,%rax,1), %xmm0"); 1645 asm volatile("sha256msg2 0x12(%rbp,%rax,1), %xmm0"); 1646 asm volatile("sha256msg2 0x12(%rax,%rcx,1), %xmm0"); 1647 asm volatile("sha256msg2 0x12(%rax,%rcx,8), %xmm0"); 1648 asm volatile("sha256msg2 0x12345678(%rax), %xmm0"); 1649 asm volatile("sha256msg2 0x12345678(%rbp), %xmm0"); 1650 asm volatile("sha256msg2 0x12345678(%rcx,%rax,1), %xmm0"); 1651 asm volatile("sha256msg2 0x12345678(%rbp,%rax,1), %xmm0"); 1652 asm volatile("sha256msg2 0x12345678(%rax,%rcx,1), %xmm0"); 1653 asm volatile("sha256msg2 0x12345678(%rax,%rcx,8), %xmm0"); 
1654 asm volatile("sha256msg2 0x12345678(%rax,%rcx,8), %xmm15"); 1655 1656 /* clflushopt m8 */ 1657 1658 asm volatile("clflushopt (%rax)"); 1659 asm volatile("clflushopt (%r8)"); 1660 asm volatile("clflushopt (0x12345678)"); 1661 asm volatile("clflushopt 0x12345678(%rax,%rcx,8)"); 1662 asm volatile("clflushopt 0x12345678(%r8,%rcx,8)"); 1663 /* Also check instructions in the same group encoding as clflushopt */ 1664 asm volatile("clflush (%rax)"); 1665 asm volatile("clflush (%r8)"); 1666 asm volatile("sfence"); 1667 1668 /* clwb m8 */ 1669 1670 asm volatile("clwb (%rax)"); 1671 asm volatile("clwb (%r8)"); 1672 asm volatile("clwb (0x12345678)"); 1673 asm volatile("clwb 0x12345678(%rax,%rcx,8)"); 1674 asm volatile("clwb 0x12345678(%r8,%rcx,8)"); 1675 /* Also check instructions in the same group encoding as clwb */ 1676 asm volatile("xsaveopt (%rax)"); 1677 asm volatile("xsaveopt (%r8)"); 1678 asm volatile("mfence"); 1679 1680 /* cldemote m8 */ 1681 1682 asm volatile("cldemote (%rax)"); 1683 asm volatile("cldemote (%r8)"); 1684 asm volatile("cldemote (0x12345678)"); 1685 asm volatile("cldemote 0x12345678(%rax,%rcx,8)"); 1686 asm volatile("cldemote 0x12345678(%r8,%rcx,8)"); 1687 1688 /* xsavec mem */ 1689 1690 asm volatile("xsavec (%rax)"); 1691 asm volatile("xsavec (%r8)"); 1692 asm volatile("xsavec (0x12345678)"); 1693 asm volatile("xsavec 0x12345678(%rax,%rcx,8)"); 1694 asm volatile("xsavec 0x12345678(%r8,%rcx,8)"); 1695 1696 /* xsaves mem */ 1697 1698 asm volatile("xsaves (%rax)"); 1699 asm volatile("xsaves (%r8)"); 1700 asm volatile("xsaves (0x12345678)"); 1701 asm volatile("xsaves 0x12345678(%rax,%rcx,8)"); 1702 asm volatile("xsaves 0x12345678(%r8,%rcx,8)"); 1703 1704 /* xrstors mem */ 1705 1706 asm volatile("xrstors (%rax)"); 1707 asm volatile("xrstors (%r8)"); 1708 asm volatile("xrstors (0x12345678)"); 1709 asm volatile("xrstors 0x12345678(%rax,%rcx,8)"); 1710 asm volatile("xrstors 0x12345678(%r8,%rcx,8)"); 1711 1712 /* ptwrite */ 1713 1714 asm volatile("ptwrite 
(%rax)"); 1715 asm volatile("ptwrite (%r8)"); 1716 asm volatile("ptwrite (0x12345678)"); 1717 asm volatile("ptwrite 0x12345678(%rax,%rcx,8)"); 1718 asm volatile("ptwrite 0x12345678(%r8,%rcx,8)"); 1719 1720 asm volatile("ptwritel (%rax)"); 1721 asm volatile("ptwritel (%r8)"); 1722 asm volatile("ptwritel (0x12345678)"); 1723 asm volatile("ptwritel 0x12345678(%rax,%rcx,8)"); 1724 asm volatile("ptwritel 0x12345678(%r8,%rcx,8)"); 1725 1726 asm volatile("ptwriteq (%rax)"); 1727 asm volatile("ptwriteq (%r8)"); 1728 asm volatile("ptwriteq (0x12345678)"); 1729 asm volatile("ptwriteq 0x12345678(%rax,%rcx,8)"); 1730 asm volatile("ptwriteq 0x12345678(%r8,%rcx,8)"); 1731 1732 /* tpause */ 1733 1734 asm volatile("tpause %ebx"); 1735 asm volatile("tpause %r8d"); 1736 1737 /* umonitor */ 1738 1739 asm volatile("umonitor %eax"); 1740 asm volatile("umonitor %rax"); 1741 asm volatile("umonitor %r8d"); 1742 1743 /* umwait */ 1744 1745 asm volatile("umwait %eax"); 1746 asm volatile("umwait %r8d"); 1747 1748 /* movdiri */ 1749 1750 asm volatile("movdiri %rax,(%rbx)"); 1751 asm volatile("movdiri %rcx,0x12345678(%rax)"); 1752 1753 /* movdir64b */ 1754 1755 asm volatile("movdir64b (%rax),%rbx"); 1756 asm volatile("movdir64b 0x12345678(%rax),%rcx"); 1757 asm volatile("movdir64b (%eax),%ebx"); 1758 asm volatile("movdir64b 0x12345678(%eax),%ecx"); 1759 1760 /* enqcmd */ 1761 1762 asm volatile("enqcmd (%rax),%rbx"); 1763 asm volatile("enqcmd 0x12345678(%rax),%rcx"); 1764 asm volatile("enqcmd (%eax),%ebx"); 1765 asm volatile("enqcmd 0x12345678(%eax),%ecx"); 1766 1767 /* enqcmds */ 1768 1769 asm volatile("enqcmds (%rax),%rbx"); 1770 asm volatile("enqcmds 0x12345678(%rax),%rcx"); 1771 asm volatile("enqcmds (%eax),%ebx"); 1772 asm volatile("enqcmds 0x12345678(%eax),%ecx"); 1773 1774 #else /* #ifdef __x86_64__ */ 1775 1776 /* bound r32, mem (same op code as EVEX prefix) */ 1777 1778 asm volatile("bound %eax, 0x12345678(%ecx)"); 1779 asm volatile("bound %ecx, 0x12345678(%eax)"); 1780 asm 
volatile("bound %edx, 0x12345678(%eax)"); 1781 asm volatile("bound %ebx, 0x12345678(%eax)"); 1782 asm volatile("bound %esp, 0x12345678(%eax)"); 1783 asm volatile("bound %ebp, 0x12345678(%eax)"); 1784 asm volatile("bound %esi, 0x12345678(%eax)"); 1785 asm volatile("bound %edi, 0x12345678(%eax)"); 1786 asm volatile("bound %ecx, (%eax)"); 1787 asm volatile("bound %eax, (0x12345678)"); 1788 asm volatile("bound %edx, (%ecx,%eax,1)"); 1789 asm volatile("bound %edx, 0x12345678(,%eax,1)"); 1790 asm volatile("bound %edx, (%eax,%ecx,1)"); 1791 asm volatile("bound %edx, (%eax,%ecx,8)"); 1792 asm volatile("bound %edx, 0x12(%eax)"); 1793 asm volatile("bound %edx, 0x12(%ebp)"); 1794 asm volatile("bound %edx, 0x12(%ecx,%eax,1)"); 1795 asm volatile("bound %edx, 0x12(%ebp,%eax,1)"); 1796 asm volatile("bound %edx, 0x12(%eax,%ecx,1)"); 1797 asm volatile("bound %edx, 0x12(%eax,%ecx,8)"); 1798 asm volatile("bound %edx, 0x12345678(%eax)"); 1799 asm volatile("bound %edx, 0x12345678(%ebp)"); 1800 asm volatile("bound %edx, 0x12345678(%ecx,%eax,1)"); 1801 asm volatile("bound %edx, 0x12345678(%ebp,%eax,1)"); 1802 asm volatile("bound %edx, 0x12345678(%eax,%ecx,1)"); 1803 asm volatile("bound %edx, 0x12345678(%eax,%ecx,8)"); 1804 1805 /* bound r16, mem (same op code as EVEX prefix) */ 1806 1807 asm volatile("bound %ax, 0x12345678(%ecx)"); 1808 asm volatile("bound %cx, 0x12345678(%eax)"); 1809 asm volatile("bound %dx, 0x12345678(%eax)"); 1810 asm volatile("bound %bx, 0x12345678(%eax)"); 1811 asm volatile("bound %sp, 0x12345678(%eax)"); 1812 asm volatile("bound %bp, 0x12345678(%eax)"); 1813 asm volatile("bound %si, 0x12345678(%eax)"); 1814 asm volatile("bound %di, 0x12345678(%eax)"); 1815 asm volatile("bound %cx, (%eax)"); 1816 asm volatile("bound %ax, (0x12345678)"); 1817 asm volatile("bound %dx, (%ecx,%eax,1)"); 1818 asm volatile("bound %dx, 0x12345678(,%eax,1)"); 1819 asm volatile("bound %dx, (%eax,%ecx,1)"); 1820 asm volatile("bound %dx, (%eax,%ecx,8)"); 1821 asm volatile("bound %dx, 
0x12(%eax)"); 1822 asm volatile("bound %dx, 0x12(%ebp)"); 1823 asm volatile("bound %dx, 0x12(%ecx,%eax,1)"); 1824 asm volatile("bound %dx, 0x12(%ebp,%eax,1)"); 1825 asm volatile("bound %dx, 0x12(%eax,%ecx,1)"); 1826 asm volatile("bound %dx, 0x12(%eax,%ecx,8)"); 1827 asm volatile("bound %dx, 0x12345678(%eax)"); 1828 asm volatile("bound %dx, 0x12345678(%ebp)"); 1829 asm volatile("bound %dx, 0x12345678(%ecx,%eax,1)"); 1830 asm volatile("bound %dx, 0x12345678(%ebp,%eax,1)"); 1831 asm volatile("bound %dx, 0x12345678(%eax,%ecx,1)"); 1832 asm volatile("bound %dx, 0x12345678(%eax,%ecx,8)"); 1833 1834 /* AVX-512: Instructions with the same op codes as Mask Instructions */ 1835 1836 asm volatile("cmovno %eax,%ebx"); 1837 asm volatile("cmovno 0x12345678(%eax),%ecx"); 1838 asm volatile("cmovno 0x12345678(%eax),%cx"); 1839 1840 asm volatile("cmove %eax,%ebx"); 1841 asm volatile("cmove 0x12345678(%eax),%ecx"); 1842 asm volatile("cmove 0x12345678(%eax),%cx"); 1843 1844 asm volatile("seto 0x12345678(%eax)"); 1845 asm volatile("setno 0x12345678(%eax)"); 1846 asm volatile("setb 0x12345678(%eax)"); 1847 asm volatile("setc 0x12345678(%eax)"); 1848 asm volatile("setnae 0x12345678(%eax)"); 1849 asm volatile("setae 0x12345678(%eax)"); 1850 asm volatile("setnb 0x12345678(%eax)"); 1851 asm volatile("setnc 0x12345678(%eax)"); 1852 asm volatile("sets 0x12345678(%eax)"); 1853 asm volatile("setns 0x12345678(%eax)"); 1854 1855 /* AVX-512: Mask Instructions */ 1856 1857 asm volatile("kandw %k7,%k6,%k5"); 1858 asm volatile("kandq %k7,%k6,%k5"); 1859 asm volatile("kandb %k7,%k6,%k5"); 1860 asm volatile("kandd %k7,%k6,%k5"); 1861 1862 asm volatile("kandnw %k7,%k6,%k5"); 1863 asm volatile("kandnq %k7,%k6,%k5"); 1864 asm volatile("kandnb %k7,%k6,%k5"); 1865 asm volatile("kandnd %k7,%k6,%k5"); 1866 1867 asm volatile("knotw %k7,%k6"); 1868 asm volatile("knotq %k7,%k6"); 1869 asm volatile("knotb %k7,%k6"); 1870 asm volatile("knotd %k7,%k6"); 1871 1872 asm volatile("korw %k7,%k6,%k5"); 1873 asm 
volatile("korq %k7,%k6,%k5"); 1874 asm volatile("korb %k7,%k6,%k5"); 1875 asm volatile("kord %k7,%k6,%k5"); 1876 1877 asm volatile("kxnorw %k7,%k6,%k5"); 1878 asm volatile("kxnorq %k7,%k6,%k5"); 1879 asm volatile("kxnorb %k7,%k6,%k5"); 1880 asm volatile("kxnord %k7,%k6,%k5"); 1881 1882 asm volatile("kxorw %k7,%k6,%k5"); 1883 asm volatile("kxorq %k7,%k6,%k5"); 1884 asm volatile("kxorb %k7,%k6,%k5"); 1885 asm volatile("kxord %k7,%k6,%k5"); 1886 1887 asm volatile("kaddw %k7,%k6,%k5"); 1888 asm volatile("kaddq %k7,%k6,%k5"); 1889 asm volatile("kaddb %k7,%k6,%k5"); 1890 asm volatile("kaddd %k7,%k6,%k5"); 1891 1892 asm volatile("kunpckbw %k7,%k6,%k5"); 1893 asm volatile("kunpckwd %k7,%k6,%k5"); 1894 asm volatile("kunpckdq %k7,%k6,%k5"); 1895 1896 asm volatile("kmovw %k6,%k5"); 1897 asm volatile("kmovw (%ecx),%k5"); 1898 asm volatile("kmovw 0x123(%eax,%ecx,8),%k5"); 1899 asm volatile("kmovw %k5,(%ecx)"); 1900 asm volatile("kmovw %k5,0x123(%eax,%ecx,8)"); 1901 asm volatile("kmovw %eax,%k5"); 1902 asm volatile("kmovw %ebp,%k5"); 1903 asm volatile("kmovw %k5,%eax"); 1904 asm volatile("kmovw %k5,%ebp"); 1905 1906 asm volatile("kmovq %k6,%k5"); 1907 asm volatile("kmovq (%ecx),%k5"); 1908 asm volatile("kmovq 0x123(%eax,%ecx,8),%k5"); 1909 asm volatile("kmovq %k5,(%ecx)"); 1910 asm volatile("kmovq %k5,0x123(%eax,%ecx,8)"); 1911 1912 asm volatile("kmovb %k6,%k5"); 1913 asm volatile("kmovb (%ecx),%k5"); 1914 asm volatile("kmovb 0x123(%eax,%ecx,8),%k5"); 1915 asm volatile("kmovb %k5,(%ecx)"); 1916 asm volatile("kmovb %k5,0x123(%eax,%ecx,8)"); 1917 asm volatile("kmovb %eax,%k5"); 1918 asm volatile("kmovb %ebp,%k5"); 1919 asm volatile("kmovb %k5,%eax"); 1920 asm volatile("kmovb %k5,%ebp"); 1921 1922 asm volatile("kmovd %k6,%k5"); 1923 asm volatile("kmovd (%ecx),%k5"); 1924 asm volatile("kmovd 0x123(%eax,%ecx,8),%k5"); 1925 asm volatile("kmovd %k5,(%ecx)"); 1926 asm volatile("kmovd %k5,0x123(%eax,%ecx,8)"); 1927 asm volatile("kmovd %eax,%k5"); 1928 asm volatile("kmovd %ebp,%k5"); 1929 
asm volatile("kmovd %k5,%eax"); 1930 asm volatile("kmovd %k5,%ebp"); 1931 1932 asm volatile("kortestw %k6,%k5"); 1933 asm volatile("kortestq %k6,%k5"); 1934 asm volatile("kortestb %k6,%k5"); 1935 asm volatile("kortestd %k6,%k5"); 1936 1937 asm volatile("ktestw %k6,%k5"); 1938 asm volatile("ktestq %k6,%k5"); 1939 asm volatile("ktestb %k6,%k5"); 1940 asm volatile("ktestd %k6,%k5"); 1941 1942 asm volatile("kshiftrw $0x12,%k6,%k5"); 1943 asm volatile("kshiftrq $0x5b,%k6,%k5"); 1944 asm volatile("kshiftlw $0x12,%k6,%k5"); 1945 asm volatile("kshiftlq $0x5b,%k6,%k5"); 1946 1947 /* AVX-512: Op code 0f 5b */ 1948 asm volatile("vcvtdq2ps %xmm5,%xmm6"); 1949 asm volatile("vcvtqq2ps %zmm5,%ymm6{%k7}"); 1950 asm volatile("vcvtps2dq %xmm5,%xmm6"); 1951 asm volatile("vcvttps2dq %xmm5,%xmm6"); 1952 1953 /* AVX-512: Op code 0f 6f */ 1954 1955 asm volatile("movq %mm0,%mm4"); 1956 asm volatile("vmovdqa %ymm4,%ymm6"); 1957 asm volatile("vmovdqa32 %zmm5,%zmm6"); 1958 asm volatile("vmovdqa64 %zmm5,%zmm6"); 1959 asm volatile("vmovdqu %ymm4,%ymm6"); 1960 asm volatile("vmovdqu32 %zmm5,%zmm6"); 1961 asm volatile("vmovdqu64 %zmm5,%zmm6"); 1962 asm volatile("vmovdqu8 %zmm5,%zmm6"); 1963 asm volatile("vmovdqu16 %zmm5,%zmm6"); 1964 1965 /* AVX-512: Op code 0f 78 */ 1966 1967 asm volatile("vmread %eax,%ebx"); 1968 asm volatile("vcvttps2udq %zmm5,%zmm6"); 1969 asm volatile("vcvttpd2udq %zmm5,%ymm6{%k7}"); 1970 asm volatile("vcvttsd2usi %xmm6,%eax"); 1971 asm volatile("vcvttss2usi %xmm6,%eax"); 1972 asm volatile("vcvttps2uqq %ymm5,%zmm6{%k7}"); 1973 asm volatile("vcvttpd2uqq %zmm5,%zmm6"); 1974 1975 /* AVX-512: Op code 0f 79 */ 1976 1977 asm volatile("vmwrite %eax,%ebx"); 1978 asm volatile("vcvtps2udq %zmm5,%zmm6"); 1979 asm volatile("vcvtpd2udq %zmm5,%ymm6{%k7}"); 1980 asm volatile("vcvtsd2usi %xmm6,%eax"); 1981 asm volatile("vcvtss2usi %xmm6,%eax"); 1982 asm volatile("vcvtps2uqq %ymm5,%zmm6{%k7}"); 1983 asm volatile("vcvtpd2uqq %zmm5,%zmm6"); 1984 1985 /* AVX-512: Op code 0f 7a */ 1986 1987 asm 
volatile("vcvtudq2pd %ymm5,%zmm6{%k7}"); 1988 asm volatile("vcvtuqq2pd %zmm5,%zmm6"); 1989 asm volatile("vcvtudq2ps %zmm5,%zmm6"); 1990 asm volatile("vcvtuqq2ps %zmm5,%ymm6{%k7}"); 1991 asm volatile("vcvttps2qq %ymm5,%zmm6{%k7}"); 1992 asm volatile("vcvttpd2qq %zmm5,%zmm6"); 1993 1994 /* AVX-512: Op code 0f 7b */ 1995 1996 asm volatile("vcvtusi2sd %eax,%xmm5,%xmm6"); 1997 asm volatile("vcvtusi2ss %eax,%xmm5,%xmm6"); 1998 asm volatile("vcvtps2qq %ymm5,%zmm6{%k7}"); 1999 asm volatile("vcvtpd2qq %zmm5,%zmm6"); 2000 2001 /* AVX-512: Op code 0f 7f */ 2002 2003 asm volatile("movq.s %mm0,%mm4"); 2004 asm volatile("vmovdqa.s %ymm5,%ymm6"); 2005 asm volatile("vmovdqa32.s %zmm5,%zmm6"); 2006 asm volatile("vmovdqa64.s %zmm5,%zmm6"); 2007 asm volatile("vmovdqu.s %ymm5,%ymm6"); 2008 asm volatile("vmovdqu32.s %zmm5,%zmm6"); 2009 asm volatile("vmovdqu64.s %zmm5,%zmm6"); 2010 asm volatile("vmovdqu8.s %zmm5,%zmm6"); 2011 asm volatile("vmovdqu16.s %zmm5,%zmm6"); 2012 2013 /* AVX-512: Op code 0f db */ 2014 2015 asm volatile("pand %mm1,%mm2"); 2016 asm volatile("pand %xmm1,%xmm2"); 2017 asm volatile("vpand %ymm4,%ymm6,%ymm2"); 2018 asm volatile("vpandd %zmm4,%zmm5,%zmm6"); 2019 asm volatile("vpandq %zmm4,%zmm5,%zmm6"); 2020 2021 /* AVX-512: Op code 0f df */ 2022 2023 asm volatile("pandn %mm1,%mm2"); 2024 asm volatile("pandn %xmm1,%xmm2"); 2025 asm volatile("vpandn %ymm4,%ymm6,%ymm2"); 2026 asm volatile("vpandnd %zmm4,%zmm5,%zmm6"); 2027 asm volatile("vpandnq %zmm4,%zmm5,%zmm6"); 2028 2029 /* AVX-512: Op code 0f e6 */ 2030 2031 asm volatile("vcvttpd2dq %xmm1,%xmm2"); 2032 asm volatile("vcvtdq2pd %xmm5,%xmm6"); 2033 asm volatile("vcvtdq2pd %ymm5,%zmm6{%k7}"); 2034 asm volatile("vcvtqq2pd %zmm5,%zmm6"); 2035 asm volatile("vcvtpd2dq %xmm1,%xmm2"); 2036 2037 /* AVX-512: Op code 0f eb */ 2038 2039 asm volatile("por %mm4,%mm6"); 2040 asm volatile("vpor %ymm4,%ymm6,%ymm2"); 2041 asm volatile("vpord %zmm4,%zmm5,%zmm6"); 2042 asm volatile("vporq %zmm4,%zmm5,%zmm6"); 2043 2044 /* AVX-512: Op 
code 0f ef */ 2045 2046 asm volatile("pxor %mm4,%mm6"); 2047 asm volatile("vpxor %ymm4,%ymm6,%ymm2"); 2048 asm volatile("vpxord %zmm4,%zmm5,%zmm6"); 2049 asm volatile("vpxorq %zmm4,%zmm5,%zmm6"); 2050 2051 /* AVX-512: Op code 0f 38 10 */ 2052 2053 asm volatile("pblendvb %xmm1,%xmm0"); 2054 asm volatile("vpsrlvw %zmm4,%zmm5,%zmm6"); 2055 asm volatile("vpmovuswb %zmm5,%ymm6{%k7}"); 2056 2057 /* AVX-512: Op code 0f 38 11 */ 2058 2059 asm volatile("vpmovusdb %zmm5,%xmm6{%k7}"); 2060 asm volatile("vpsravw %zmm4,%zmm5,%zmm6"); 2061 2062 /* AVX-512: Op code 0f 38 12 */ 2063 2064 asm volatile("vpmovusqb %zmm5,%xmm6{%k7}"); 2065 asm volatile("vpsllvw %zmm4,%zmm5,%zmm6"); 2066 2067 /* AVX-512: Op code 0f 38 13 */ 2068 2069 asm volatile("vcvtph2ps %xmm3,%ymm5"); 2070 asm volatile("vcvtph2ps %ymm5,%zmm6{%k7}"); 2071 asm volatile("vpmovusdw %zmm5,%ymm6{%k7}"); 2072 2073 /* AVX-512: Op code 0f 38 14 */ 2074 2075 asm volatile("blendvps %xmm1,%xmm0"); 2076 asm volatile("vpmovusqw %zmm5,%xmm6{%k7}"); 2077 asm volatile("vprorvd %zmm4,%zmm5,%zmm6"); 2078 asm volatile("vprorvq %zmm4,%zmm5,%zmm6"); 2079 2080 /* AVX-512: Op code 0f 38 15 */ 2081 2082 asm volatile("blendvpd %xmm1,%xmm0"); 2083 asm volatile("vpmovusqd %zmm5,%ymm6{%k7}"); 2084 asm volatile("vprolvd %zmm4,%zmm5,%zmm6"); 2085 asm volatile("vprolvq %zmm4,%zmm5,%zmm6"); 2086 2087 /* AVX-512: Op code 0f 38 16 */ 2088 2089 asm volatile("vpermps %ymm4,%ymm6,%ymm2"); 2090 asm volatile("vpermps %ymm4,%ymm6,%ymm2{%k7}"); 2091 asm volatile("vpermpd %ymm4,%ymm6,%ymm2{%k7}"); 2092 2093 /* AVX-512: Op code 0f 38 19 */ 2094 2095 asm volatile("vbroadcastsd %xmm4,%ymm6"); 2096 asm volatile("vbroadcastf32x2 %xmm7,%zmm6"); 2097 2098 /* AVX-512: Op code 0f 38 1a */ 2099 2100 asm volatile("vbroadcastf128 (%ecx),%ymm4"); 2101 asm volatile("vbroadcastf32x4 (%ecx),%zmm6"); 2102 asm volatile("vbroadcastf64x2 (%ecx),%zmm6"); 2103 2104 /* AVX-512: Op code 0f 38 1b */ 2105 2106 asm volatile("vbroadcastf32x8 (%ecx),%zmm6"); 2107 asm 
volatile("vbroadcastf64x4 (%ecx),%zmm6"); 2108 2109 /* AVX-512: Op code 0f 38 1f */ 2110 2111 asm volatile("vpabsq %zmm4,%zmm6"); 2112 2113 /* AVX-512: Op code 0f 38 20 */ 2114 2115 asm volatile("vpmovsxbw %xmm4,%xmm5"); 2116 asm volatile("vpmovswb %zmm5,%ymm6{%k7}"); 2117 2118 /* AVX-512: Op code 0f 38 21 */ 2119 2120 asm volatile("vpmovsxbd %xmm4,%ymm6"); 2121 asm volatile("vpmovsdb %zmm5,%xmm6{%k7}"); 2122 2123 /* AVX-512: Op code 0f 38 22 */ 2124 2125 asm volatile("vpmovsxbq %xmm4,%ymm4"); 2126 asm volatile("vpmovsqb %zmm5,%xmm6{%k7}"); 2127 2128 /* AVX-512: Op code 0f 38 23 */ 2129 2130 asm volatile("vpmovsxwd %xmm4,%ymm4"); 2131 asm volatile("vpmovsdw %zmm5,%ymm6{%k7}"); 2132 2133 /* AVX-512: Op code 0f 38 24 */ 2134 2135 asm volatile("vpmovsxwq %xmm4,%ymm6"); 2136 asm volatile("vpmovsqw %zmm5,%xmm6{%k7}"); 2137 2138 /* AVX-512: Op code 0f 38 25 */ 2139 2140 asm volatile("vpmovsxdq %xmm4,%ymm4"); 2141 asm volatile("vpmovsqd %zmm5,%ymm6{%k7}"); 2142 2143 /* AVX-512: Op code 0f 38 26 */ 2144 2145 asm volatile("vptestmb %zmm5,%zmm6,%k5"); 2146 asm volatile("vptestmw %zmm5,%zmm6,%k5"); 2147 asm volatile("vptestnmb %zmm4,%zmm5,%k5"); 2148 asm volatile("vptestnmw %zmm4,%zmm5,%k5"); 2149 2150 /* AVX-512: Op code 0f 38 27 */ 2151 2152 asm volatile("vptestmd %zmm5,%zmm6,%k5"); 2153 asm volatile("vptestmq %zmm5,%zmm6,%k5"); 2154 asm volatile("vptestnmd %zmm4,%zmm5,%k5"); 2155 asm volatile("vptestnmq %zmm4,%zmm5,%k5"); 2156 2157 /* AVX-512: Op code 0f 38 28 */ 2158 2159 asm volatile("vpmuldq %ymm4,%ymm6,%ymm2"); 2160 asm volatile("vpmovm2b %k5,%zmm6"); 2161 asm volatile("vpmovm2w %k5,%zmm6"); 2162 2163 /* AVX-512: Op code 0f 38 29 */ 2164 2165 asm volatile("vpcmpeqq %ymm4,%ymm6,%ymm2"); 2166 asm volatile("vpmovb2m %zmm6,%k5"); 2167 asm volatile("vpmovw2m %zmm6,%k5"); 2168 2169 /* AVX-512: Op code 0f 38 2a */ 2170 2171 asm volatile("vmovntdqa (%ecx),%ymm4"); 2172 asm volatile("vpbroadcastmb2q %k6,%zmm1"); 2173 2174 /* AVX-512: Op code 0f 38 2c */ 2175 2176 asm 
volatile("vmaskmovps (%ecx),%ymm4,%ymm6"); 2177 asm volatile("vscalefps %zmm4,%zmm5,%zmm6"); 2178 asm volatile("vscalefpd %zmm4,%zmm5,%zmm6"); 2179 2180 /* AVX-512: Op code 0f 38 2d */ 2181 2182 asm volatile("vmaskmovpd (%ecx),%ymm4,%ymm6"); 2183 asm volatile("vscalefss %xmm4,%xmm5,%xmm6{%k7}"); 2184 asm volatile("vscalefsd %xmm4,%xmm5,%xmm6{%k7}"); 2185 2186 /* AVX-512: Op code 0f 38 30 */ 2187 2188 asm volatile("vpmovzxbw %xmm4,%ymm4"); 2189 asm volatile("vpmovwb %zmm5,%ymm6{%k7}"); 2190 2191 /* AVX-512: Op code 0f 38 31 */ 2192 2193 asm volatile("vpmovzxbd %xmm4,%ymm6"); 2194 asm volatile("vpmovdb %zmm5,%xmm6{%k7}"); 2195 2196 /* AVX-512: Op code 0f 38 32 */ 2197 2198 asm volatile("vpmovzxbq %xmm4,%ymm4"); 2199 asm volatile("vpmovqb %zmm5,%xmm6{%k7}"); 2200 2201 /* AVX-512: Op code 0f 38 33 */ 2202 2203 asm volatile("vpmovzxwd %xmm4,%ymm4"); 2204 asm volatile("vpmovdw %zmm5,%ymm6{%k7}"); 2205 2206 /* AVX-512: Op code 0f 38 34 */ 2207 2208 asm volatile("vpmovzxwq %xmm4,%ymm6"); 2209 asm volatile("vpmovqw %zmm5,%xmm6{%k7}"); 2210 2211 /* AVX-512: Op code 0f 38 35 */ 2212 2213 asm volatile("vpmovzxdq %xmm4,%ymm4"); 2214 asm volatile("vpmovqd %zmm5,%ymm6{%k7}"); 2215 2216 /* AVX-512: Op code 0f 38 36 */ 2217 2218 asm volatile("vpermd %ymm4,%ymm6,%ymm2"); 2219 asm volatile("vpermd %ymm4,%ymm6,%ymm2{%k7}"); 2220 asm volatile("vpermq %ymm4,%ymm6,%ymm2{%k7}"); 2221 2222 /* AVX-512: Op code 0f 38 38 */ 2223 2224 asm volatile("vpminsb %ymm4,%ymm6,%ymm2"); 2225 asm volatile("vpmovm2d %k5,%zmm6"); 2226 asm volatile("vpmovm2q %k5,%zmm6"); 2227 2228 /* AVX-512: Op code 0f 38 39 */ 2229 2230 asm volatile("vpminsd %xmm1,%xmm2,%xmm3"); 2231 asm volatile("vpminsd %zmm4,%zmm5,%zmm6"); 2232 asm volatile("vpminsq %zmm4,%zmm5,%zmm6"); 2233 asm volatile("vpmovd2m %zmm6,%k5"); 2234 asm volatile("vpmovq2m %zmm6,%k5"); 2235 2236 /* AVX-512: Op code 0f 38 3a */ 2237 2238 asm volatile("vpminuw %ymm4,%ymm6,%ymm2"); 2239 asm volatile("vpbroadcastmw2d %k6,%zmm6"); 2240 2241 /* AVX-512: Op 
code 0f 38 3b */ 2242 2243 asm volatile("vpminud %ymm4,%ymm6,%ymm2"); 2244 asm volatile("vpminud %zmm4,%zmm5,%zmm6"); 2245 asm volatile("vpminuq %zmm4,%zmm5,%zmm6"); 2246 2247 /* AVX-512: Op code 0f 38 3d */ 2248 2249 asm volatile("vpmaxsd %ymm4,%ymm6,%ymm2"); 2250 asm volatile("vpmaxsd %zmm4,%zmm5,%zmm6"); 2251 asm volatile("vpmaxsq %zmm4,%zmm5,%zmm6"); 2252 2253 /* AVX-512: Op code 0f 38 3f */ 2254 2255 asm volatile("vpmaxud %ymm4,%ymm6,%ymm2"); 2256 asm volatile("vpmaxud %zmm4,%zmm5,%zmm6"); 2257 asm volatile("vpmaxuq %zmm4,%zmm5,%zmm6"); 2258 2259 /* AVX-512: Op code 0f 38 40 */ 2260 2261 asm volatile("vpmulld %ymm4,%ymm6,%ymm2"); 2262 asm volatile("vpmulld %zmm4,%zmm5,%zmm6"); 2263 asm volatile("vpmullq %zmm4,%zmm5,%zmm6"); 2264 2265 /* AVX-512: Op code 0f 38 42 */ 2266 2267 asm volatile("vgetexpps %zmm5,%zmm6"); 2268 asm volatile("vgetexppd %zmm5,%zmm6"); 2269 2270 /* AVX-512: Op code 0f 38 43 */ 2271 2272 asm volatile("vgetexpss %xmm4,%xmm5,%xmm6{%k7}"); 2273 asm volatile("vgetexpsd %xmm2,%xmm3,%xmm4{%k7}"); 2274 2275 /* AVX-512: Op code 0f 38 44 */ 2276 2277 asm volatile("vplzcntd %zmm5,%zmm6"); 2278 asm volatile("vplzcntq %zmm5,%zmm6"); 2279 2280 /* AVX-512: Op code 0f 38 46 */ 2281 2282 asm volatile("vpsravd %ymm4,%ymm6,%ymm2"); 2283 asm volatile("vpsravd %zmm4,%zmm5,%zmm6"); 2284 asm volatile("vpsravq %zmm4,%zmm5,%zmm6"); 2285 2286 /* AVX-512: Op code 0f 38 4c */ 2287 2288 asm volatile("vrcp14ps %zmm5,%zmm6"); 2289 asm volatile("vrcp14pd %zmm5,%zmm6"); 2290 2291 /* AVX-512: Op code 0f 38 4d */ 2292 2293 asm volatile("vrcp14ss %xmm4,%xmm5,%xmm6{%k7}"); 2294 asm volatile("vrcp14sd %xmm4,%xmm5,%xmm6{%k7}"); 2295 2296 /* AVX-512: Op code 0f 38 4e */ 2297 2298 asm volatile("vrsqrt14ps %zmm5,%zmm6"); 2299 asm volatile("vrsqrt14pd %zmm5,%zmm6"); 2300 2301 /* AVX-512: Op code 0f 38 4f */ 2302 2303 asm volatile("vrsqrt14ss %xmm4,%xmm5,%xmm6{%k7}"); 2304 asm volatile("vrsqrt14sd %xmm4,%xmm5,%xmm6{%k7}"); 2305 2306 /* AVX-512: Op code 0f 38 50 */ 2307 2308 asm 
volatile("vpdpbusd %xmm1, %xmm2, %xmm3"); 2309 asm volatile("vpdpbusd %ymm1, %ymm2, %ymm3"); 2310 asm volatile("vpdpbusd %zmm1, %zmm2, %zmm3"); 2311 asm volatile("vpdpbusd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2312 2313 /* AVX-512: Op code 0f 38 51 */ 2314 2315 asm volatile("vpdpbusds %xmm1, %xmm2, %xmm3"); 2316 asm volatile("vpdpbusds %ymm1, %ymm2, %ymm3"); 2317 asm volatile("vpdpbusds %zmm1, %zmm2, %zmm3"); 2318 asm volatile("vpdpbusds 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2319 2320 /* AVX-512: Op code 0f 38 52 */ 2321 2322 asm volatile("vdpbf16ps %xmm1, %xmm2, %xmm3"); 2323 asm volatile("vdpbf16ps %ymm1, %ymm2, %ymm3"); 2324 asm volatile("vdpbf16ps %zmm1, %zmm2, %zmm3"); 2325 asm volatile("vdpbf16ps 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2326 2327 asm volatile("vpdpwssd %xmm1, %xmm2, %xmm3"); 2328 asm volatile("vpdpwssd %ymm1, %ymm2, %ymm3"); 2329 asm volatile("vpdpwssd %zmm1, %zmm2, %zmm3"); 2330 asm volatile("vpdpwssd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2331 2332 asm volatile("vp4dpwssd (%eax), %zmm0, %zmm4"); 2333 asm volatile("vp4dpwssd 0x12345678(%eax,%ecx,8),%zmm0,%zmm4"); 2334 2335 /* AVX-512: Op code 0f 38 53 */ 2336 2337 asm volatile("vpdpwssds %xmm1, %xmm2, %xmm3"); 2338 asm volatile("vpdpwssds %ymm1, %ymm2, %ymm3"); 2339 asm volatile("vpdpwssds %zmm1, %zmm2, %zmm3"); 2340 asm volatile("vpdpwssds 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2341 2342 asm volatile("vp4dpwssds (%eax), %zmm0, %zmm4"); 2343 asm volatile("vp4dpwssds 0x12345678(%eax,%ecx,8),%zmm0,%zmm4"); 2344 2345 /* AVX-512: Op code 0f 38 54 */ 2346 2347 asm volatile("vpopcntb %xmm1, %xmm2"); 2348 asm volatile("vpopcntb %ymm1, %ymm2"); 2349 asm volatile("vpopcntb %zmm1, %zmm2"); 2350 asm volatile("vpopcntb 0x12345678(%eax,%ecx,8),%zmm2"); 2351 2352 asm volatile("vpopcntw %xmm1, %xmm2"); 2353 asm volatile("vpopcntw %ymm1, %ymm2"); 2354 asm volatile("vpopcntw %zmm1, %zmm2"); 2355 asm volatile("vpopcntw 0x12345678(%eax,%ecx,8),%zmm2"); 2356 2357 /* AVX-512: Op code 0f 38 55 */ 2358 2359 asm 
volatile("vpopcntd %xmm1, %xmm2"); 2360 asm volatile("vpopcntd %ymm1, %ymm2"); 2361 asm volatile("vpopcntd %zmm1, %zmm2"); 2362 asm volatile("vpopcntd 0x12345678(%eax,%ecx,8),%zmm2"); 2363 2364 asm volatile("vpopcntq %xmm1, %xmm2"); 2365 asm volatile("vpopcntq %ymm1, %ymm2"); 2366 asm volatile("vpopcntq %zmm1, %zmm2"); 2367 asm volatile("vpopcntq 0x12345678(%eax,%ecx,8),%zmm2"); 2368 2369 /* AVX-512: Op code 0f 38 59 */ 2370 2371 asm volatile("vpbroadcastq %xmm4,%xmm6"); 2372 asm volatile("vbroadcasti32x2 %xmm7,%zmm6"); 2373 2374 /* AVX-512: Op code 0f 38 5a */ 2375 2376 asm volatile("vbroadcasti128 (%ecx),%ymm4"); 2377 asm volatile("vbroadcasti32x4 (%ecx),%zmm6"); 2378 asm volatile("vbroadcasti64x2 (%ecx),%zmm6"); 2379 2380 /* AVX-512: Op code 0f 38 5b */ 2381 2382 asm volatile("vbroadcasti32x8 (%ecx),%zmm6"); 2383 asm volatile("vbroadcasti64x4 (%ecx),%zmm6"); 2384 2385 /* AVX-512: Op code 0f 38 62 */ 2386 2387 asm volatile("vpexpandb %xmm1, %xmm2"); 2388 asm volatile("vpexpandb %ymm1, %ymm2"); 2389 asm volatile("vpexpandb %zmm1, %zmm2"); 2390 asm volatile("vpexpandb 0x12345678(%eax,%ecx,8),%zmm2"); 2391 2392 asm volatile("vpexpandw %xmm1, %xmm2"); 2393 asm volatile("vpexpandw %ymm1, %ymm2"); 2394 asm volatile("vpexpandw %zmm1, %zmm2"); 2395 asm volatile("vpexpandw 0x12345678(%eax,%ecx,8),%zmm2"); 2396 2397 /* AVX-512: Op code 0f 38 63 */ 2398 2399 asm volatile("vpcompressb %xmm1, %xmm2"); 2400 asm volatile("vpcompressb %ymm1, %ymm2"); 2401 asm volatile("vpcompressb %zmm1, %zmm2"); 2402 asm volatile("vpcompressb %zmm2,0x12345678(%eax,%ecx,8)"); 2403 2404 asm volatile("vpcompressw %xmm1, %xmm2"); 2405 asm volatile("vpcompressw %ymm1, %ymm2"); 2406 asm volatile("vpcompressw %zmm1, %zmm2"); 2407 asm volatile("vpcompressw %zmm2,0x12345678(%eax,%ecx,8)"); 2408 2409 /* AVX-512: Op code 0f 38 64 */ 2410 2411 asm volatile("vpblendmd %zmm4,%zmm5,%zmm6"); 2412 asm volatile("vpblendmq %zmm4,%zmm5,%zmm6"); 2413 2414 /* AVX-512: Op code 0f 38 65 */ 2415 2416 asm 
volatile("vblendmps %zmm4,%zmm5,%zmm6"); 2417 asm volatile("vblendmpd %zmm4,%zmm5,%zmm6"); 2418 2419 /* AVX-512: Op code 0f 38 66 */ 2420 2421 asm volatile("vpblendmb %zmm4,%zmm5,%zmm6"); 2422 asm volatile("vpblendmw %zmm4,%zmm5,%zmm6"); 2423 2424 /* AVX-512: Op code 0f 38 68 */ 2425 2426 asm volatile("vp2intersectd %xmm1, %xmm2, %k3"); 2427 asm volatile("vp2intersectd %ymm1, %ymm2, %k3"); 2428 asm volatile("vp2intersectd %zmm1, %zmm2, %k3"); 2429 asm volatile("vp2intersectd 0x12345678(%eax,%ecx,8),%zmm2,%k3"); 2430 2431 asm volatile("vp2intersectq %xmm1, %xmm2, %k3"); 2432 asm volatile("vp2intersectq %ymm1, %ymm2, %k3"); 2433 asm volatile("vp2intersectq %zmm1, %zmm2, %k3"); 2434 asm volatile("vp2intersectq 0x12345678(%eax,%ecx,8),%zmm2,%k3"); 2435 2436 /* AVX-512: Op code 0f 38 70 */ 2437 2438 asm volatile("vpshldvw %xmm1, %xmm2, %xmm3"); 2439 asm volatile("vpshldvw %ymm1, %ymm2, %ymm3"); 2440 asm volatile("vpshldvw %zmm1, %zmm2, %zmm3"); 2441 asm volatile("vpshldvw 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2442 2443 /* AVX-512: Op code 0f 38 71 */ 2444 2445 asm volatile("vpshldvd %xmm1, %xmm2, %xmm3"); 2446 asm volatile("vpshldvd %ymm1, %ymm2, %ymm3"); 2447 asm volatile("vpshldvd %zmm1, %zmm2, %zmm3"); 2448 asm volatile("vpshldvd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2449 2450 asm volatile("vpshldvq %xmm1, %xmm2, %xmm3"); 2451 asm volatile("vpshldvq %ymm1, %ymm2, %ymm3"); 2452 asm volatile("vpshldvq %zmm1, %zmm2, %zmm3"); 2453 asm volatile("vpshldvq 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2454 2455 /* AVX-512: Op code 0f 38 72 */ 2456 2457 asm volatile("vcvtne2ps2bf16 %xmm1, %xmm2, %xmm3"); 2458 asm volatile("vcvtne2ps2bf16 %ymm1, %ymm2, %ymm3"); 2459 asm volatile("vcvtne2ps2bf16 %zmm1, %zmm2, %zmm3"); 2460 asm volatile("vcvtne2ps2bf16 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2461 2462 asm volatile("vcvtneps2bf16 %xmm1, %xmm2"); 2463 asm volatile("vcvtneps2bf16 %ymm1, %xmm2"); 2464 asm volatile("vcvtneps2bf16 %zmm1, %ymm2"); 2465 asm volatile("vcvtneps2bf16 
0x12345678(%eax,%ecx,8),%ymm2"); 2466 2467 asm volatile("vpshrdvw %xmm1, %xmm2, %xmm3"); 2468 asm volatile("vpshrdvw %ymm1, %ymm2, %ymm3"); 2469 asm volatile("vpshrdvw %zmm1, %zmm2, %zmm3"); 2470 asm volatile("vpshrdvw 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2471 2472 /* AVX-512: Op code 0f 38 73 */ 2473 2474 asm volatile("vpshrdvd %xmm1, %xmm2, %xmm3"); 2475 asm volatile("vpshrdvd %ymm1, %ymm2, %ymm3"); 2476 asm volatile("vpshrdvd %zmm1, %zmm2, %zmm3"); 2477 asm volatile("vpshrdvd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2478 2479 asm volatile("vpshrdvq %xmm1, %xmm2, %xmm3"); 2480 asm volatile("vpshrdvq %ymm1, %ymm2, %ymm3"); 2481 asm volatile("vpshrdvq %zmm1, %zmm2, %zmm3"); 2482 asm volatile("vpshrdvq 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2483 2484 /* AVX-512: Op code 0f 38 75 */ 2485 2486 asm volatile("vpermi2b %zmm4,%zmm5,%zmm6"); 2487 asm volatile("vpermi2w %zmm4,%zmm5,%zmm6"); 2488 2489 /* AVX-512: Op code 0f 38 76 */ 2490 2491 asm volatile("vpermi2d %zmm4,%zmm5,%zmm6"); 2492 asm volatile("vpermi2q %zmm4,%zmm5,%zmm6"); 2493 2494 /* AVX-512: Op code 0f 38 77 */ 2495 2496 asm volatile("vpermi2ps %zmm4,%zmm5,%zmm6"); 2497 asm volatile("vpermi2pd %zmm4,%zmm5,%zmm6"); 2498 2499 /* AVX-512: Op code 0f 38 7a */ 2500 2501 asm volatile("vpbroadcastb %eax,%xmm3"); 2502 2503 /* AVX-512: Op code 0f 38 7b */ 2504 2505 asm volatile("vpbroadcastw %eax,%xmm3"); 2506 2507 /* AVX-512: Op code 0f 38 7c */ 2508 2509 asm volatile("vpbroadcastd %eax,%xmm3"); 2510 2511 /* AVX-512: Op code 0f 38 7d */ 2512 2513 asm volatile("vpermt2b %zmm4,%zmm5,%zmm6"); 2514 asm volatile("vpermt2w %zmm4,%zmm5,%zmm6"); 2515 2516 /* AVX-512: Op code 0f 38 7e */ 2517 2518 asm volatile("vpermt2d %zmm4,%zmm5,%zmm6"); 2519 asm volatile("vpermt2q %zmm4,%zmm5,%zmm6"); 2520 2521 /* AVX-512: Op code 0f 38 7f */ 2522 2523 asm volatile("vpermt2ps %zmm4,%zmm5,%zmm6"); 2524 asm volatile("vpermt2pd %zmm4,%zmm5,%zmm6"); 2525 2526 /* AVX-512: Op code 0f 38 83 */ 2527 2528 asm volatile("vpmultishiftqb 
%zmm4,%zmm5,%zmm6"); 2529 2530 /* AVX-512: Op code 0f 38 88 */ 2531 2532 asm volatile("vexpandps (%ecx),%zmm6"); 2533 asm volatile("vexpandpd (%ecx),%zmm6"); 2534 2535 /* AVX-512: Op code 0f 38 89 */ 2536 2537 asm volatile("vpexpandd (%ecx),%zmm6"); 2538 asm volatile("vpexpandq (%ecx),%zmm6"); 2539 2540 /* AVX-512: Op code 0f 38 8a */ 2541 2542 asm volatile("vcompressps %zmm6,(%ecx)"); 2543 asm volatile("vcompresspd %zmm6,(%ecx)"); 2544 2545 /* AVX-512: Op code 0f 38 8b */ 2546 2547 asm volatile("vpcompressd %zmm6,(%ecx)"); 2548 asm volatile("vpcompressq %zmm6,(%ecx)"); 2549 2550 /* AVX-512: Op code 0f 38 8d */ 2551 2552 asm volatile("vpermb %zmm4,%zmm5,%zmm6"); 2553 asm volatile("vpermw %zmm4,%zmm5,%zmm6"); 2554 2555 /* AVX-512: Op code 0f 38 8f */ 2556 2557 asm volatile("vpshufbitqmb %xmm1, %xmm2, %k3"); 2558 asm volatile("vpshufbitqmb %ymm1, %ymm2, %k3"); 2559 asm volatile("vpshufbitqmb %zmm1, %zmm2, %k3"); 2560 asm volatile("vpshufbitqmb 0x12345678(%eax,%ecx,8),%zmm2,%k3"); 2561 2562 /* AVX-512: Op code 0f 38 90 */ 2563 2564 asm volatile("vpgatherdd %xmm2,0x02(%ebp,%xmm7,2),%xmm1"); 2565 asm volatile("vpgatherdq %xmm2,0x04(%ebp,%xmm7,2),%xmm1"); 2566 asm volatile("vpgatherdd 0x7b(%ebp,%zmm7,8),%zmm6{%k1}"); 2567 asm volatile("vpgatherdq 0x7b(%ebp,%ymm7,8),%zmm6{%k1}"); 2568 2569 /* AVX-512: Op code 0f 38 91 */ 2570 2571 asm volatile("vpgatherqd %xmm2,0x02(%ebp,%xmm7,2),%xmm1"); 2572 asm volatile("vpgatherqq %xmm2,0x02(%ebp,%xmm7,2),%xmm1"); 2573 asm volatile("vpgatherqd 0x7b(%ebp,%zmm7,8),%ymm6{%k1}"); 2574 asm volatile("vpgatherqq 0x7b(%ebp,%zmm7,8),%zmm6{%k1}"); 2575 2576 /* AVX-512: Op code 0f 38 9a */ 2577 2578 asm volatile("vfmsub132ps %xmm1, %xmm2, %xmm3"); 2579 asm volatile("vfmsub132ps %ymm1, %ymm2, %ymm3"); 2580 asm volatile("vfmsub132ps %zmm1, %zmm2, %zmm3"); 2581 asm volatile("vfmsub132ps 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2582 2583 asm volatile("vfmsub132pd %xmm1, %xmm2, %xmm3"); 2584 asm volatile("vfmsub132pd %ymm1, %ymm2, %ymm3"); 2585 asm 
volatile("vfmsub132pd %zmm1, %zmm2, %zmm3"); 2586 asm volatile("vfmsub132pd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2587 2588 asm volatile("v4fmaddps (%eax), %zmm0, %zmm4"); 2589 asm volatile("v4fmaddps 0x12345678(%eax,%ecx,8),%zmm0,%zmm4"); 2590 2591 /* AVX-512: Op code 0f 38 9b */ 2592 2593 asm volatile("vfmsub132ss %xmm1, %xmm2, %xmm3"); 2594 asm volatile("vfmsub132ss 0x12345678(%eax,%ecx,8),%xmm2,%xmm3"); 2595 2596 asm volatile("vfmsub132sd %xmm1, %xmm2, %xmm3"); 2597 asm volatile("vfmsub132sd 0x12345678(%eax,%ecx,8),%xmm2,%xmm3"); 2598 2599 asm volatile("v4fmaddss (%eax), %xmm0, %xmm4"); 2600 asm volatile("v4fmaddss 0x12345678(%eax,%ecx,8),%xmm0,%xmm4"); 2601 2602 /* AVX-512: Op code 0f 38 a0 */ 2603 2604 asm volatile("vpscatterdd %zmm6,0x7b(%ebp,%zmm7,8){%k1}"); 2605 asm volatile("vpscatterdq %zmm6,0x7b(%ebp,%ymm7,8){%k1}"); 2606 2607 /* AVX-512: Op code 0f 38 a1 */ 2608 2609 asm volatile("vpscatterqd %ymm6,0x7b(%ebp,%zmm7,8){%k1}"); 2610 asm volatile("vpscatterqq %ymm6,0x7b(%ebp,%ymm7,8){%k1}"); 2611 2612 /* AVX-512: Op code 0f 38 a2 */ 2613 2614 asm volatile("vscatterdps %zmm6,0x7b(%ebp,%zmm7,8){%k1}"); 2615 asm volatile("vscatterdpd %zmm6,0x7b(%ebp,%ymm7,8){%k1}"); 2616 2617 /* AVX-512: Op code 0f 38 a3 */ 2618 2619 asm volatile("vscatterqps %ymm6,0x7b(%ebp,%zmm7,8){%k1}"); 2620 asm volatile("vscatterqpd %zmm6,0x7b(%ebp,%zmm7,8){%k1}"); 2621 2622 /* AVX-512: Op code 0f 38 aa */ 2623 2624 asm volatile("vfmsub213ps %xmm1, %xmm2, %xmm3"); 2625 asm volatile("vfmsub213ps %ymm1, %ymm2, %ymm3"); 2626 asm volatile("vfmsub213ps %zmm1, %zmm2, %zmm3"); 2627 asm volatile("vfmsub213ps 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2628 2629 asm volatile("vfmsub213pd %xmm1, %xmm2, %xmm3"); 2630 asm volatile("vfmsub213pd %ymm1, %ymm2, %ymm3"); 2631 asm volatile("vfmsub213pd %zmm1, %zmm2, %zmm3"); 2632 asm volatile("vfmsub213pd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2633 2634 asm volatile("v4fnmaddps (%eax), %zmm0, %zmm4"); 2635 asm volatile("v4fnmaddps 
0x12345678(%eax,%ecx,8),%zmm0,%zmm4"); 2636 2637 /* AVX-512: Op code 0f 38 ab */ 2638 2639 asm volatile("vfmsub213ss %xmm1, %xmm2, %xmm3"); 2640 asm volatile("vfmsub213ss 0x12345678(%eax,%ecx,8),%xmm2,%xmm3"); 2641 2642 asm volatile("vfmsub213sd %xmm1, %xmm2, %xmm3"); 2643 asm volatile("vfmsub213sd 0x12345678(%eax,%ecx,8),%xmm2,%xmm3"); 2644 2645 asm volatile("v4fnmaddss (%eax), %xmm0, %xmm4"); 2646 asm volatile("v4fnmaddss 0x12345678(%eax,%ecx,8),%xmm0,%xmm4"); 2647 2648 /* AVX-512: Op code 0f 38 b4 */ 2649 2650 asm volatile("vpmadd52luq %zmm4,%zmm5,%zmm6"); 2651 2652 /* AVX-512: Op code 0f 38 b5 */ 2653 2654 asm volatile("vpmadd52huq %zmm4,%zmm5,%zmm6"); 2655 2656 /* AVX-512: Op code 0f 38 c4 */ 2657 2658 asm volatile("vpconflictd %zmm5,%zmm6"); 2659 asm volatile("vpconflictq %zmm5,%zmm6"); 2660 2661 /* AVX-512: Op code 0f 38 c8 */ 2662 2663 asm volatile("vexp2ps %zmm6,%zmm7"); 2664 asm volatile("vexp2pd %zmm6,%zmm7"); 2665 2666 /* AVX-512: Op code 0f 38 ca */ 2667 2668 asm volatile("vrcp28ps %zmm6,%zmm7"); 2669 asm volatile("vrcp28pd %zmm6,%zmm7"); 2670 2671 /* AVX-512: Op code 0f 38 cb */ 2672 2673 asm volatile("vrcp28ss %xmm5,%xmm6,%xmm7{%k7}"); 2674 asm volatile("vrcp28sd %xmm5,%xmm6,%xmm7{%k7}"); 2675 2676 /* AVX-512: Op code 0f 38 cc */ 2677 2678 asm volatile("vrsqrt28ps %zmm6,%zmm7"); 2679 asm volatile("vrsqrt28pd %zmm6,%zmm7"); 2680 2681 /* AVX-512: Op code 0f 38 cd */ 2682 2683 asm volatile("vrsqrt28ss %xmm5,%xmm6,%xmm7{%k7}"); 2684 asm volatile("vrsqrt28sd %xmm5,%xmm6,%xmm7{%k7}"); 2685 2686 /* AVX-512: Op code 0f 38 cf */ 2687 2688 asm volatile("gf2p8mulb %xmm1, %xmm3"); 2689 asm volatile("gf2p8mulb 0x12345678(%eax,%ecx,8),%xmm3"); 2690 2691 asm volatile("vgf2p8mulb %xmm1, %xmm2, %xmm3"); 2692 asm volatile("vgf2p8mulb %ymm1, %ymm2, %ymm3"); 2693 asm volatile("vgf2p8mulb %zmm1, %zmm2, %zmm3"); 2694 asm volatile("vgf2p8mulb 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2695 2696 /* AVX-512: Op code 0f 38 dc */ 2697 2698 asm volatile("vaesenc %xmm1, %xmm2, 
%xmm3"); 2699 asm volatile("vaesenc %ymm1, %ymm2, %ymm3"); 2700 asm volatile("vaesenc %zmm1, %zmm2, %zmm3"); 2701 asm volatile("vaesenc 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2702 2703 /* AVX-512: Op code 0f 38 dd */ 2704 2705 asm volatile("vaesenclast %xmm1, %xmm2, %xmm3"); 2706 asm volatile("vaesenclast %ymm1, %ymm2, %ymm3"); 2707 asm volatile("vaesenclast %zmm1, %zmm2, %zmm3"); 2708 asm volatile("vaesenclast 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2709 2710 /* AVX-512: Op code 0f 38 de */ 2711 2712 asm volatile("vaesdec %xmm1, %xmm2, %xmm3"); 2713 asm volatile("vaesdec %ymm1, %ymm2, %ymm3"); 2714 asm volatile("vaesdec %zmm1, %zmm2, %zmm3"); 2715 asm volatile("vaesdec 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2716 2717 /* AVX-512: Op code 0f 38 df */ 2718 2719 asm volatile("vaesdeclast %xmm1, %xmm2, %xmm3"); 2720 asm volatile("vaesdeclast %ymm1, %ymm2, %ymm3"); 2721 asm volatile("vaesdeclast %zmm1, %zmm2, %zmm3"); 2722 asm volatile("vaesdeclast 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 2723 2724 /* AVX-512: Op code 0f 3a 03 */ 2725 2726 asm volatile("valignd $0x12,%zmm5,%zmm6,%zmm7"); 2727 asm volatile("valignq $0x12,%zmm5,%zmm6,%zmm7"); 2728 2729 /* AVX-512: Op code 0f 3a 08 */ 2730 2731 asm volatile("vroundps $0x5,%ymm6,%ymm2"); 2732 asm volatile("vrndscaleps $0x12,%zmm5,%zmm6"); 2733 2734 /* AVX-512: Op code 0f 3a 09 */ 2735 2736 asm volatile("vroundpd $0x5,%ymm6,%ymm2"); 2737 asm volatile("vrndscalepd $0x12,%zmm5,%zmm6"); 2738 2739 /* AVX-512: Op code 0f 3a 0a */ 2740 2741 asm volatile("vroundss $0x5,%xmm4,%xmm6,%xmm2"); 2742 asm volatile("vrndscaless $0x12,%xmm4,%xmm5,%xmm6{%k7}"); 2743 2744 /* AVX-512: Op code 0f 3a 0b */ 2745 2746 asm volatile("vroundsd $0x5,%xmm4,%xmm6,%xmm2"); 2747 asm volatile("vrndscalesd $0x12,%xmm4,%xmm5,%xmm6{%k7}"); 2748 2749 /* AVX-512: Op code 0f 3a 18 */ 2750 2751 asm volatile("vinsertf128 $0x5,%xmm4,%ymm4,%ymm6"); 2752 asm volatile("vinsertf32x4 $0x12,%xmm4,%zmm5,%zmm6{%k7}"); 2753 asm volatile("vinsertf64x2 
$0x12,%xmm4,%zmm5,%zmm6{%k7}"); 2754 2755 /* AVX-512: Op code 0f 3a 19 */ 2756 2757 asm volatile("vextractf128 $0x5,%ymm4,%xmm4"); 2758 asm volatile("vextractf32x4 $0x12,%zmm5,%xmm6{%k7}"); 2759 asm volatile("vextractf64x2 $0x12,%zmm5,%xmm6{%k7}"); 2760 2761 /* AVX-512: Op code 0f 3a 1a */ 2762 2763 asm volatile("vinsertf32x8 $0x12,%ymm5,%zmm6,%zmm7{%k7}"); 2764 asm volatile("vinsertf64x4 $0x12,%ymm5,%zmm6,%zmm7{%k7}"); 2765 2766 /* AVX-512: Op code 0f 3a 1b */ 2767 2768 asm volatile("vextractf32x8 $0x12,%zmm6,%ymm7{%k7}"); 2769 asm volatile("vextractf64x4 $0x12,%zmm6,%ymm7{%k7}"); 2770 2771 /* AVX-512: Op code 0f 3a 1e */ 2772 2773 asm volatile("vpcmpud $0x12,%zmm6,%zmm7,%k5"); 2774 asm volatile("vpcmpuq $0x12,%zmm6,%zmm7,%k5"); 2775 2776 /* AVX-512: Op code 0f 3a 1f */ 2777 2778 asm volatile("vpcmpd $0x12,%zmm6,%zmm7,%k5"); 2779 asm volatile("vpcmpq $0x12,%zmm6,%zmm7,%k5"); 2780 2781 /* AVX-512: Op code 0f 3a 23 */ 2782 2783 asm volatile("vshuff32x4 $0x12,%zmm5,%zmm6,%zmm7"); 2784 asm volatile("vshuff64x2 $0x12,%zmm5,%zmm6,%zmm7"); 2785 2786 /* AVX-512: Op code 0f 3a 25 */ 2787 2788 asm volatile("vpternlogd $0x12,%zmm5,%zmm6,%zmm7"); 2789 asm volatile("vpternlogq $0x12,%zmm5,%zmm6,%zmm7"); 2790 2791 /* AVX-512: Op code 0f 3a 26 */ 2792 2793 asm volatile("vgetmantps $0x12,%zmm6,%zmm7"); 2794 asm volatile("vgetmantpd $0x12,%zmm6,%zmm7"); 2795 2796 /* AVX-512: Op code 0f 3a 27 */ 2797 2798 asm volatile("vgetmantss $0x12,%xmm5,%xmm6,%xmm7{%k7}"); 2799 asm volatile("vgetmantsd $0x12,%xmm5,%xmm6,%xmm7{%k7}"); 2800 2801 /* AVX-512: Op code 0f 3a 38 */ 2802 2803 asm volatile("vinserti128 $0x5,%xmm4,%ymm4,%ymm6"); 2804 asm volatile("vinserti32x4 $0x12,%xmm4,%zmm5,%zmm6{%k7}"); 2805 asm volatile("vinserti64x2 $0x12,%xmm4,%zmm5,%zmm6{%k7}"); 2806 2807 /* AVX-512: Op code 0f 3a 39 */ 2808 2809 asm volatile("vextracti128 $0x5,%ymm4,%xmm6"); 2810 asm volatile("vextracti32x4 $0x12,%zmm5,%xmm6{%k7}"); 2811 asm volatile("vextracti64x2 $0x12,%zmm5,%xmm6{%k7}"); 2812 2813 /* 
AVX-512: Op code 0f 3a 3a */ 2814 2815 asm volatile("vinserti32x8 $0x12,%ymm5,%zmm6,%zmm7{%k7}"); 2816 asm volatile("vinserti64x4 $0x12,%ymm5,%zmm6,%zmm7{%k7}"); 2817 2818 /* AVX-512: Op code 0f 3a 3b */ 2819 2820 asm volatile("vextracti32x8 $0x12,%zmm6,%ymm7{%k7}"); 2821 asm volatile("vextracti64x4 $0x12,%zmm6,%ymm7{%k7}"); 2822 2823 /* AVX-512: Op code 0f 3a 3e */ 2824 2825 asm volatile("vpcmpub $0x12,%zmm6,%zmm7,%k5"); 2826 asm volatile("vpcmpuw $0x12,%zmm6,%zmm7,%k5"); 2827 2828 /* AVX-512: Op code 0f 3a 3f */ 2829 2830 asm volatile("vpcmpb $0x12,%zmm6,%zmm7,%k5"); 2831 asm volatile("vpcmpw $0x12,%zmm6,%zmm7,%k5"); 2832 2833 /* AVX-512: Op code 0f 3a 42 */ 2834 2835 asm volatile("vmpsadbw $0x5,%ymm4,%ymm6,%ymm2"); 2836 asm volatile("vdbpsadbw $0x12,%zmm4,%zmm5,%zmm6"); 2837 2838 /* AVX-512: Op code 0f 3a 43 */ 2839 2840 asm volatile("vshufi32x4 $0x12,%zmm5,%zmm6,%zmm7"); 2841 asm volatile("vshufi64x2 $0x12,%zmm5,%zmm6,%zmm7"); 2842 2843 /* AVX-512: Op code 0f 3a 44 */ 2844 2845 asm volatile("vpclmulqdq $0x12,%xmm1,%xmm2,%xmm3"); 2846 asm volatile("vpclmulqdq $0x12,%ymm1,%ymm2,%ymm3"); 2847 asm volatile("vpclmulqdq $0x12,%zmm1,%zmm2,%zmm3"); 2848 2849 /* AVX-512: Op code 0f 3a 50 */ 2850 2851 asm volatile("vrangeps $0x12,%zmm5,%zmm6,%zmm7"); 2852 asm volatile("vrangepd $0x12,%zmm5,%zmm6,%zmm7"); 2853 2854 /* AVX-512: Op code 0f 3a 51 */ 2855 2856 asm volatile("vrangess $0x12,%xmm5,%xmm6,%xmm7"); 2857 asm volatile("vrangesd $0x12,%xmm5,%xmm6,%xmm7"); 2858 2859 /* AVX-512: Op code 0f 3a 54 */ 2860 2861 asm volatile("vfixupimmps $0x12,%zmm5,%zmm6,%zmm7"); 2862 asm volatile("vfixupimmpd $0x12,%zmm5,%zmm6,%zmm7"); 2863 2864 /* AVX-512: Op code 0f 3a 55 */ 2865 2866 asm volatile("vfixupimmss $0x12,%xmm5,%xmm6,%xmm7{%k7}"); 2867 asm volatile("vfixupimmsd $0x12,%xmm5,%xmm6,%xmm7{%k7}"); 2868 2869 /* AVX-512: Op code 0f 3a 56 */ 2870 2871 asm volatile("vreduceps $0x12,%zmm6,%zmm7"); 2872 asm volatile("vreducepd $0x12,%zmm6,%zmm7"); 2873 2874 /* AVX-512: Op code 0f 3a 57 
*/ 2875 2876 asm volatile("vreducess $0x12,%xmm5,%xmm6,%xmm7"); 2877 asm volatile("vreducesd $0x12,%xmm5,%xmm6,%xmm7"); 2878 2879 /* AVX-512: Op code 0f 3a 66 */ 2880 2881 asm volatile("vfpclassps $0x12,%zmm7,%k5"); 2882 asm volatile("vfpclasspd $0x12,%zmm7,%k5"); 2883 2884 /* AVX-512: Op code 0f 3a 67 */ 2885 2886 asm volatile("vfpclassss $0x12,%xmm7,%k5"); 2887 asm volatile("vfpclasssd $0x12,%xmm7,%k5"); 2888 2889 /* AVX-512: Op code 0f 3a 70 */ 2890 2891 asm volatile("vpshldw $0x12,%xmm1,%xmm2,%xmm3"); 2892 asm volatile("vpshldw $0x12,%ymm1,%ymm2,%ymm3"); 2893 asm volatile("vpshldw $0x12,%zmm1,%zmm2,%zmm3"); 2894 2895 /* AVX-512: Op code 0f 3a 71 */ 2896 2897 asm volatile("vpshldd $0x12,%xmm1,%xmm2,%xmm3"); 2898 asm volatile("vpshldd $0x12,%ymm1,%ymm2,%ymm3"); 2899 asm volatile("vpshldd $0x12,%zmm1,%zmm2,%zmm3"); 2900 2901 asm volatile("vpshldq $0x12,%xmm1,%xmm2,%xmm3"); 2902 asm volatile("vpshldq $0x12,%ymm1,%ymm2,%ymm3"); 2903 asm volatile("vpshldq $0x12,%zmm1,%zmm2,%zmm3"); 2904 2905 /* AVX-512: Op code 0f 3a 72 */ 2906 2907 asm volatile("vpshrdw $0x12,%xmm1,%xmm2,%xmm3"); 2908 asm volatile("vpshrdw $0x12,%ymm1,%ymm2,%ymm3"); 2909 asm volatile("vpshrdw $0x12,%zmm1,%zmm2,%zmm3"); 2910 2911 /* AVX-512: Op code 0f 3a 73 */ 2912 2913 asm volatile("vpshrdd $0x12,%xmm1,%xmm2,%xmm3"); 2914 asm volatile("vpshrdd $0x12,%ymm1,%ymm2,%ymm3"); 2915 asm volatile("vpshrdd $0x12,%zmm1,%zmm2,%zmm3"); 2916 2917 asm volatile("vpshrdq $0x12,%xmm1,%xmm2,%xmm3"); 2918 asm volatile("vpshrdq $0x12,%ymm1,%ymm2,%ymm3"); 2919 asm volatile("vpshrdq $0x12,%zmm1,%zmm2,%zmm3"); 2920 2921 /* AVX-512: Op code 0f 3a ce */ 2922 2923 asm volatile("gf2p8affineqb $0x12,%xmm1,%xmm3"); 2924 2925 asm volatile("vgf2p8affineqb $0x12,%xmm1,%xmm2,%xmm3"); 2926 asm volatile("vgf2p8affineqb $0x12,%ymm1,%ymm2,%ymm3"); 2927 asm volatile("vgf2p8affineqb $0x12,%zmm1,%zmm2,%zmm3"); 2928 2929 /* AVX-512: Op code 0f 3a cf */ 2930 2931 asm volatile("gf2p8affineinvqb $0x12,%xmm1,%xmm3"); 2932 2933 asm 
volatile("vgf2p8affineinvqb $0x12,%xmm1,%xmm2,%xmm3"); 2934 asm volatile("vgf2p8affineinvqb $0x12,%ymm1,%ymm2,%ymm3"); 2935 asm volatile("vgf2p8affineinvqb $0x12,%zmm1,%zmm2,%zmm3"); 2936 2937 /* AVX-512: Op code 0f 72 (Grp13) */ 2938 2939 asm volatile("vprord $0x12,%zmm5,%zmm6"); 2940 asm volatile("vprorq $0x12,%zmm5,%zmm6"); 2941 asm volatile("vprold $0x12,%zmm5,%zmm6"); 2942 asm volatile("vprolq $0x12,%zmm5,%zmm6"); 2943 asm volatile("psrad $0x2,%mm6"); 2944 asm volatile("vpsrad $0x5,%ymm6,%ymm2"); 2945 asm volatile("vpsrad $0x5,%zmm6,%zmm2"); 2946 asm volatile("vpsraq $0x5,%zmm6,%zmm2"); 2947 2948 /* AVX-512: Op code 0f 38 c6 (Grp18) */ 2949 2950 asm volatile("vgatherpf0dps 0x7b(%ebp,%zmm7,8){%k1}"); 2951 asm volatile("vgatherpf0dpd 0x7b(%ebp,%ymm7,8){%k1}"); 2952 asm volatile("vgatherpf1dps 0x7b(%ebp,%zmm7,8){%k1}"); 2953 asm volatile("vgatherpf1dpd 0x7b(%ebp,%ymm7,8){%k1}"); 2954 asm volatile("vscatterpf0dps 0x7b(%ebp,%zmm7,8){%k1}"); 2955 asm volatile("vscatterpf0dpd 0x7b(%ebp,%ymm7,8){%k1}"); 2956 asm volatile("vscatterpf1dps 0x7b(%ebp,%zmm7,8){%k1}"); 2957 asm volatile("vscatterpf1dpd 0x7b(%ebp,%ymm7,8){%k1}"); 2958 2959 /* AVX-512: Op code 0f 38 c7 (Grp19) */ 2960 2961 asm volatile("vgatherpf0qps 0x7b(%ebp,%zmm7,8){%k1}"); 2962 asm volatile("vgatherpf0qpd 0x7b(%ebp,%zmm7,8){%k1}"); 2963 asm volatile("vgatherpf1qps 0x7b(%ebp,%zmm7,8){%k1}"); 2964 asm volatile("vgatherpf1qpd 0x7b(%ebp,%zmm7,8){%k1}"); 2965 asm volatile("vscatterpf0qps 0x7b(%ebp,%zmm7,8){%k1}"); 2966 asm volatile("vscatterpf0qpd 0x7b(%ebp,%zmm7,8){%k1}"); 2967 asm volatile("vscatterpf1qps 0x7b(%ebp,%zmm7,8){%k1}"); 2968 asm volatile("vscatterpf1qpd 0x7b(%ebp,%zmm7,8){%k1}"); 2969 2970 /* AVX-512: Examples */ 2971 2972 asm volatile("vaddpd %zmm4,%zmm5,%zmm6"); 2973 asm volatile("vaddpd %zmm4,%zmm5,%zmm6{%k7}"); 2974 asm volatile("vaddpd %zmm4,%zmm5,%zmm6{%k7}{z}"); 2975 asm volatile("vaddpd {rn-sae},%zmm4,%zmm5,%zmm6"); 2976 asm volatile("vaddpd {ru-sae},%zmm4,%zmm5,%zmm6"); 2977 asm 
volatile("vaddpd {rd-sae},%zmm4,%zmm5,%zmm6"); 2978 asm volatile("vaddpd {rz-sae},%zmm4,%zmm5,%zmm6"); 2979 asm volatile("vaddpd (%ecx),%zmm5,%zmm6"); 2980 asm volatile("vaddpd 0x123(%eax,%ecx,8),%zmm5,%zmm6"); 2981 asm volatile("vaddpd (%ecx){1to8},%zmm5,%zmm6"); 2982 asm volatile("vaddpd 0x1fc0(%edx),%zmm5,%zmm6"); 2983 asm volatile("vaddpd 0x3f8(%edx){1to8},%zmm5,%zmm6"); 2984 asm volatile("vcmpeq_uqps 0x1fc(%edx){1to16},%zmm6,%k5"); 2985 asm volatile("vcmpltsd 0x123(%eax,%ecx,8),%xmm3,%k5{%k7}"); 2986 asm volatile("vcmplesd {sae},%xmm4,%xmm5,%k5{%k7}"); 2987 asm volatile("vgetmantss $0x5b,0x123(%eax,%ecx,8),%xmm4,%xmm5{%k7}"); 2988 2989 /* bndmk m32, bnd */ 2990 2991 asm volatile("bndmk (%eax), %bnd0"); 2992 asm volatile("bndmk (0x12345678), %bnd0"); 2993 asm volatile("bndmk (%eax), %bnd3"); 2994 asm volatile("bndmk (%ecx,%eax,1), %bnd0"); 2995 asm volatile("bndmk 0x12345678(,%eax,1), %bnd0"); 2996 asm volatile("bndmk (%eax,%ecx,1), %bnd0"); 2997 asm volatile("bndmk (%eax,%ecx,8), %bnd0"); 2998 asm volatile("bndmk 0x12(%eax), %bnd0"); 2999 asm volatile("bndmk 0x12(%ebp), %bnd0"); 3000 asm volatile("bndmk 0x12(%ecx,%eax,1), %bnd0"); 3001 asm volatile("bndmk 0x12(%ebp,%eax,1), %bnd0"); 3002 asm volatile("bndmk 0x12(%eax,%ecx,1), %bnd0"); 3003 asm volatile("bndmk 0x12(%eax,%ecx,8), %bnd0"); 3004 asm volatile("bndmk 0x12345678(%eax), %bnd0"); 3005 asm volatile("bndmk 0x12345678(%ebp), %bnd0"); 3006 asm volatile("bndmk 0x12345678(%ecx,%eax,1), %bnd0"); 3007 asm volatile("bndmk 0x12345678(%ebp,%eax,1), %bnd0"); 3008 asm volatile("bndmk 0x12345678(%eax,%ecx,1), %bnd0"); 3009 asm volatile("bndmk 0x12345678(%eax,%ecx,8), %bnd0"); 3010 3011 /* bndcl r/m32, bnd */ 3012 3013 asm volatile("bndcl (%eax), %bnd0"); 3014 asm volatile("bndcl (0x12345678), %bnd0"); 3015 asm volatile("bndcl (%eax), %bnd3"); 3016 asm volatile("bndcl (%ecx,%eax,1), %bnd0"); 3017 asm volatile("bndcl 0x12345678(,%eax,1), %bnd0"); 3018 asm volatile("bndcl (%eax,%ecx,1), %bnd0"); 3019 asm 
volatile("bndcl (%eax,%ecx,8), %bnd0"); 3020 asm volatile("bndcl 0x12(%eax), %bnd0"); 3021 asm volatile("bndcl 0x12(%ebp), %bnd0"); 3022 asm volatile("bndcl 0x12(%ecx,%eax,1), %bnd0"); 3023 asm volatile("bndcl 0x12(%ebp,%eax,1), %bnd0"); 3024 asm volatile("bndcl 0x12(%eax,%ecx,1), %bnd0"); 3025 asm volatile("bndcl 0x12(%eax,%ecx,8), %bnd0"); 3026 asm volatile("bndcl 0x12345678(%eax), %bnd0"); 3027 asm volatile("bndcl 0x12345678(%ebp), %bnd0"); 3028 asm volatile("bndcl 0x12345678(%ecx,%eax,1), %bnd0"); 3029 asm volatile("bndcl 0x12345678(%ebp,%eax,1), %bnd0"); 3030 asm volatile("bndcl 0x12345678(%eax,%ecx,1), %bnd0"); 3031 asm volatile("bndcl 0x12345678(%eax,%ecx,8), %bnd0"); 3032 asm volatile("bndcl %eax, %bnd0"); 3033 3034 /* bndcu r/m32, bnd */ 3035 3036 asm volatile("bndcu (%eax), %bnd0"); 3037 asm volatile("bndcu (0x12345678), %bnd0"); 3038 asm volatile("bndcu (%eax), %bnd3"); 3039 asm volatile("bndcu (%ecx,%eax,1), %bnd0"); 3040 asm volatile("bndcu 0x12345678(,%eax,1), %bnd0"); 3041 asm volatile("bndcu (%eax,%ecx,1), %bnd0"); 3042 asm volatile("bndcu (%eax,%ecx,8), %bnd0"); 3043 asm volatile("bndcu 0x12(%eax), %bnd0"); 3044 asm volatile("bndcu 0x12(%ebp), %bnd0"); 3045 asm volatile("bndcu 0x12(%ecx,%eax,1), %bnd0"); 3046 asm volatile("bndcu 0x12(%ebp,%eax,1), %bnd0"); 3047 asm volatile("bndcu 0x12(%eax,%ecx,1), %bnd0"); 3048 asm volatile("bndcu 0x12(%eax,%ecx,8), %bnd0"); 3049 asm volatile("bndcu 0x12345678(%eax), %bnd0"); 3050 asm volatile("bndcu 0x12345678(%ebp), %bnd0"); 3051 asm volatile("bndcu 0x12345678(%ecx,%eax,1), %bnd0"); 3052 asm volatile("bndcu 0x12345678(%ebp,%eax,1), %bnd0"); 3053 asm volatile("bndcu 0x12345678(%eax,%ecx,1), %bnd0"); 3054 asm volatile("bndcu 0x12345678(%eax,%ecx,8), %bnd0"); 3055 asm volatile("bndcu %eax, %bnd0"); 3056 3057 /* bndcn r/m32, bnd */ 3058 3059 asm volatile("bndcn (%eax), %bnd0"); 3060 asm volatile("bndcn (0x12345678), %bnd0"); 3061 asm volatile("bndcn (%eax), %bnd3"); 3062 asm volatile("bndcn (%ecx,%eax,1), %bnd0"); 
3063 asm volatile("bndcn 0x12345678(,%eax,1), %bnd0"); 3064 asm volatile("bndcn (%eax,%ecx,1), %bnd0"); 3065 asm volatile("bndcn (%eax,%ecx,8), %bnd0"); 3066 asm volatile("bndcn 0x12(%eax), %bnd0"); 3067 asm volatile("bndcn 0x12(%ebp), %bnd0"); 3068 asm volatile("bndcn 0x12(%ecx,%eax,1), %bnd0"); 3069 asm volatile("bndcn 0x12(%ebp,%eax,1), %bnd0"); 3070 asm volatile("bndcn 0x12(%eax,%ecx,1), %bnd0"); 3071 asm volatile("bndcn 0x12(%eax,%ecx,8), %bnd0"); 3072 asm volatile("bndcn 0x12345678(%eax), %bnd0"); 3073 asm volatile("bndcn 0x12345678(%ebp), %bnd0"); 3074 asm volatile("bndcn 0x12345678(%ecx,%eax,1), %bnd0"); 3075 asm volatile("bndcn 0x12345678(%ebp,%eax,1), %bnd0"); 3076 asm volatile("bndcn 0x12345678(%eax,%ecx,1), %bnd0"); 3077 asm volatile("bndcn 0x12345678(%eax,%ecx,8), %bnd0"); 3078 asm volatile("bndcn %eax, %bnd0"); 3079 3080 /* bndmov m64, bnd */ 3081 3082 asm volatile("bndmov (%eax), %bnd0"); 3083 asm volatile("bndmov (0x12345678), %bnd0"); 3084 asm volatile("bndmov (%eax), %bnd3"); 3085 asm volatile("bndmov (%ecx,%eax,1), %bnd0"); 3086 asm volatile("bndmov 0x12345678(,%eax,1), %bnd0"); 3087 asm volatile("bndmov (%eax,%ecx,1), %bnd0"); 3088 asm volatile("bndmov (%eax,%ecx,8), %bnd0"); 3089 asm volatile("bndmov 0x12(%eax), %bnd0"); 3090 asm volatile("bndmov 0x12(%ebp), %bnd0"); 3091 asm volatile("bndmov 0x12(%ecx,%eax,1), %bnd0"); 3092 asm volatile("bndmov 0x12(%ebp,%eax,1), %bnd0"); 3093 asm volatile("bndmov 0x12(%eax,%ecx,1), %bnd0"); 3094 asm volatile("bndmov 0x12(%eax,%ecx,8), %bnd0"); 3095 asm volatile("bndmov 0x12345678(%eax), %bnd0"); 3096 asm volatile("bndmov 0x12345678(%ebp), %bnd0"); 3097 asm volatile("bndmov 0x12345678(%ecx,%eax,1), %bnd0"); 3098 asm volatile("bndmov 0x12345678(%ebp,%eax,1), %bnd0"); 3099 asm volatile("bndmov 0x12345678(%eax,%ecx,1), %bnd0"); 3100 asm volatile("bndmov 0x12345678(%eax,%ecx,8), %bnd0"); 3101 3102 /* bndmov bnd, m64 */ 3103 3104 asm volatile("bndmov %bnd0, (%eax)"); 3105 asm volatile("bndmov %bnd0, (0x12345678)"); 
3106 asm volatile("bndmov %bnd3, (%eax)"); 3107 asm volatile("bndmov %bnd0, (%ecx,%eax,1)"); 3108 asm volatile("bndmov %bnd0, 0x12345678(,%eax,1)"); 3109 asm volatile("bndmov %bnd0, (%eax,%ecx,1)"); 3110 asm volatile("bndmov %bnd0, (%eax,%ecx,8)"); 3111 asm volatile("bndmov %bnd0, 0x12(%eax)"); 3112 asm volatile("bndmov %bnd0, 0x12(%ebp)"); 3113 asm volatile("bndmov %bnd0, 0x12(%ecx,%eax,1)"); 3114 asm volatile("bndmov %bnd0, 0x12(%ebp,%eax,1)"); 3115 asm volatile("bndmov %bnd0, 0x12(%eax,%ecx,1)"); 3116 asm volatile("bndmov %bnd0, 0x12(%eax,%ecx,8)"); 3117 asm volatile("bndmov %bnd0, 0x12345678(%eax)"); 3118 asm volatile("bndmov %bnd0, 0x12345678(%ebp)"); 3119 asm volatile("bndmov %bnd0, 0x12345678(%ecx,%eax,1)"); 3120 asm volatile("bndmov %bnd0, 0x12345678(%ebp,%eax,1)"); 3121 asm volatile("bndmov %bnd0, 0x12345678(%eax,%ecx,1)"); 3122 asm volatile("bndmov %bnd0, 0x12345678(%eax,%ecx,8)"); 3123 3124 /* bndmov bnd2, bnd1 */ 3125 3126 asm volatile("bndmov %bnd0, %bnd1"); 3127 asm volatile("bndmov %bnd1, %bnd0"); 3128 3129 /* bndldx mib, bnd */ 3130 3131 asm volatile("bndldx (%eax), %bnd0"); 3132 asm volatile("bndldx (0x12345678), %bnd0"); 3133 asm volatile("bndldx (%eax), %bnd3"); 3134 asm volatile("bndldx (%ecx,%eax,1), %bnd0"); 3135 asm volatile("bndldx 0x12345678(,%eax,1), %bnd0"); 3136 asm volatile("bndldx (%eax,%ecx,1), %bnd0"); 3137 asm volatile("bndldx 0x12(%eax), %bnd0"); 3138 asm volatile("bndldx 0x12(%ebp), %bnd0"); 3139 asm volatile("bndldx 0x12(%ecx,%eax,1), %bnd0"); 3140 asm volatile("bndldx 0x12(%ebp,%eax,1), %bnd0"); 3141 asm volatile("bndldx 0x12(%eax,%ecx,1), %bnd0"); 3142 asm volatile("bndldx 0x12345678(%eax), %bnd0"); 3143 asm volatile("bndldx 0x12345678(%ebp), %bnd0"); 3144 asm volatile("bndldx 0x12345678(%ecx,%eax,1), %bnd0"); 3145 asm volatile("bndldx 0x12345678(%ebp,%eax,1), %bnd0"); 3146 asm volatile("bndldx 0x12345678(%eax,%ecx,1), %bnd0"); 3147 3148 /* bndstx bnd, mib */ 3149 3150 asm volatile("bndstx %bnd0, (%eax)"); 3151 asm 
volatile("bndstx %bnd0, (0x12345678)"); 3152 asm volatile("bndstx %bnd3, (%eax)"); 3153 asm volatile("bndstx %bnd0, (%ecx,%eax,1)"); 3154 asm volatile("bndstx %bnd0, 0x12345678(,%eax,1)"); 3155 asm volatile("bndstx %bnd0, (%eax,%ecx,1)"); 3156 asm volatile("bndstx %bnd0, 0x12(%eax)"); 3157 asm volatile("bndstx %bnd0, 0x12(%ebp)"); 3158 asm volatile("bndstx %bnd0, 0x12(%ecx,%eax,1)"); 3159 asm volatile("bndstx %bnd0, 0x12(%ebp,%eax,1)"); 3160 asm volatile("bndstx %bnd0, 0x12(%eax,%ecx,1)"); 3161 asm volatile("bndstx %bnd0, 0x12345678(%eax)"); 3162 asm volatile("bndstx %bnd0, 0x12345678(%ebp)"); 3163 asm volatile("bndstx %bnd0, 0x12345678(%ecx,%eax,1)"); 3164 asm volatile("bndstx %bnd0, 0x12345678(%ebp,%eax,1)"); 3165 asm volatile("bndstx %bnd0, 0x12345678(%eax,%ecx,1)"); 3166 3167 /* bnd prefix on call, ret, jmp and all jcc */ 3168 3169 asm volatile("bnd call label1"); /* Expecting: call unconditional 0xfffffffc */ 3170 asm volatile("bnd call *(%eax)"); /* Expecting: call indirect 0 */ 3171 asm volatile("bnd ret"); /* Expecting: ret indirect 0 */ 3172 asm volatile("bnd jmp label1"); /* Expecting: jmp unconditional 0xfffffffc */ 3173 asm volatile("bnd jmp label1"); /* Expecting: jmp unconditional 0xfffffffc */ 3174 asm volatile("bnd jmp *(%ecx)"); /* Expecting: jmp indirect 0 */ 3175 asm volatile("bnd jne label1"); /* Expecting: jcc conditional 0xfffffffc */ 3176 3177 /* sha1rnds4 imm8, xmm2/m128, xmm1 */ 3178 3179 asm volatile("sha1rnds4 $0x0, %xmm1, %xmm0"); 3180 asm volatile("sha1rnds4 $0x91, %xmm7, %xmm2"); 3181 asm volatile("sha1rnds4 $0x91, (%eax), %xmm0"); 3182 asm volatile("sha1rnds4 $0x91, (0x12345678), %xmm0"); 3183 asm volatile("sha1rnds4 $0x91, (%eax), %xmm3"); 3184 asm volatile("sha1rnds4 $0x91, (%ecx,%eax,1), %xmm0"); 3185 asm volatile("sha1rnds4 $0x91, 0x12345678(,%eax,1), %xmm0"); 3186 asm volatile("sha1rnds4 $0x91, (%eax,%ecx,1), %xmm0"); 3187 asm volatile("sha1rnds4 $0x91, (%eax,%ecx,8), %xmm0"); 3188 asm volatile("sha1rnds4 $0x91, 0x12(%eax), 
%xmm0"); 3189 asm volatile("sha1rnds4 $0x91, 0x12(%ebp), %xmm0"); 3190 asm volatile("sha1rnds4 $0x91, 0x12(%ecx,%eax,1), %xmm0"); 3191 asm volatile("sha1rnds4 $0x91, 0x12(%ebp,%eax,1), %xmm0"); 3192 asm volatile("sha1rnds4 $0x91, 0x12(%eax,%ecx,1), %xmm0"); 3193 asm volatile("sha1rnds4 $0x91, 0x12(%eax,%ecx,8), %xmm0"); 3194 asm volatile("sha1rnds4 $0x91, 0x12345678(%eax), %xmm0"); 3195 asm volatile("sha1rnds4 $0x91, 0x12345678(%ebp), %xmm0"); 3196 asm volatile("sha1rnds4 $0x91, 0x12345678(%ecx,%eax,1), %xmm0"); 3197 asm volatile("sha1rnds4 $0x91, 0x12345678(%ebp,%eax,1), %xmm0"); 3198 asm volatile("sha1rnds4 $0x91, 0x12345678(%eax,%ecx,1), %xmm0"); 3199 asm volatile("sha1rnds4 $0x91, 0x12345678(%eax,%ecx,8), %xmm0"); 3200 3201 /* sha1nexte xmm2/m128, xmm1 */ 3202 3203 asm volatile("sha1nexte %xmm1, %xmm0"); 3204 asm volatile("sha1nexte %xmm7, %xmm2"); 3205 asm volatile("sha1nexte (%eax), %xmm0"); 3206 asm volatile("sha1nexte (0x12345678), %xmm0"); 3207 asm volatile("sha1nexte (%eax), %xmm3"); 3208 asm volatile("sha1nexte (%ecx,%eax,1), %xmm0"); 3209 asm volatile("sha1nexte 0x12345678(,%eax,1), %xmm0"); 3210 asm volatile("sha1nexte (%eax,%ecx,1), %xmm0"); 3211 asm volatile("sha1nexte (%eax,%ecx,8), %xmm0"); 3212 asm volatile("sha1nexte 0x12(%eax), %xmm0"); 3213 asm volatile("sha1nexte 0x12(%ebp), %xmm0"); 3214 asm volatile("sha1nexte 0x12(%ecx,%eax,1), %xmm0"); 3215 asm volatile("sha1nexte 0x12(%ebp,%eax,1), %xmm0"); 3216 asm volatile("sha1nexte 0x12(%eax,%ecx,1), %xmm0"); 3217 asm volatile("sha1nexte 0x12(%eax,%ecx,8), %xmm0"); 3218 asm volatile("sha1nexte 0x12345678(%eax), %xmm0"); 3219 asm volatile("sha1nexte 0x12345678(%ebp), %xmm0"); 3220 asm volatile("sha1nexte 0x12345678(%ecx,%eax,1), %xmm0"); 3221 asm volatile("sha1nexte 0x12345678(%ebp,%eax,1), %xmm0"); 3222 asm volatile("sha1nexte 0x12345678(%eax,%ecx,1), %xmm0"); 3223 asm volatile("sha1nexte 0x12345678(%eax,%ecx,8), %xmm0"); 3224 3225 /* sha1msg1 xmm2/m128, xmm1 */ 3226 3227 asm volatile("sha1msg1 %xmm1, 
%xmm0"); 3228 asm volatile("sha1msg1 %xmm7, %xmm2"); 3229 asm volatile("sha1msg1 (%eax), %xmm0"); 3230 asm volatile("sha1msg1 (0x12345678), %xmm0"); 3231 asm volatile("sha1msg1 (%eax), %xmm3"); 3232 asm volatile("sha1msg1 (%ecx,%eax,1), %xmm0"); 3233 asm volatile("sha1msg1 0x12345678(,%eax,1), %xmm0"); 3234 asm volatile("sha1msg1 (%eax,%ecx,1), %xmm0"); 3235 asm volatile("sha1msg1 (%eax,%ecx,8), %xmm0"); 3236 asm volatile("sha1msg1 0x12(%eax), %xmm0"); 3237 asm volatile("sha1msg1 0x12(%ebp), %xmm0"); 3238 asm volatile("sha1msg1 0x12(%ecx,%eax,1), %xmm0"); 3239 asm volatile("sha1msg1 0x12(%ebp,%eax,1), %xmm0"); 3240 asm volatile("sha1msg1 0x12(%eax,%ecx,1), %xmm0"); 3241 asm volatile("sha1msg1 0x12(%eax,%ecx,8), %xmm0"); 3242 asm volatile("sha1msg1 0x12345678(%eax), %xmm0"); 3243 asm volatile("sha1msg1 0x12345678(%ebp), %xmm0"); 3244 asm volatile("sha1msg1 0x12345678(%ecx,%eax,1), %xmm0"); 3245 asm volatile("sha1msg1 0x12345678(%ebp,%eax,1), %xmm0"); 3246 asm volatile("sha1msg1 0x12345678(%eax,%ecx,1), %xmm0"); 3247 asm volatile("sha1msg1 0x12345678(%eax,%ecx,8), %xmm0"); 3248 3249 /* sha1msg2 xmm2/m128, xmm1 */ 3250 3251 asm volatile("sha1msg2 %xmm1, %xmm0"); 3252 asm volatile("sha1msg2 %xmm7, %xmm2"); 3253 asm volatile("sha1msg2 (%eax), %xmm0"); 3254 asm volatile("sha1msg2 (0x12345678), %xmm0"); 3255 asm volatile("sha1msg2 (%eax), %xmm3"); 3256 asm volatile("sha1msg2 (%ecx,%eax,1), %xmm0"); 3257 asm volatile("sha1msg2 0x12345678(,%eax,1), %xmm0"); 3258 asm volatile("sha1msg2 (%eax,%ecx,1), %xmm0"); 3259 asm volatile("sha1msg2 (%eax,%ecx,8), %xmm0"); 3260 asm volatile("sha1msg2 0x12(%eax), %xmm0"); 3261 asm volatile("sha1msg2 0x12(%ebp), %xmm0"); 3262 asm volatile("sha1msg2 0x12(%ecx,%eax,1), %xmm0"); 3263 asm volatile("sha1msg2 0x12(%ebp,%eax,1), %xmm0"); 3264 asm volatile("sha1msg2 0x12(%eax,%ecx,1), %xmm0"); 3265 asm volatile("sha1msg2 0x12(%eax,%ecx,8), %xmm0"); 3266 asm volatile("sha1msg2 0x12345678(%eax), %xmm0"); 3267 asm volatile("sha1msg2 0x12345678(%ebp), 
%xmm0"); 3268 asm volatile("sha1msg2 0x12345678(%ecx,%eax,1), %xmm0"); 3269 asm volatile("sha1msg2 0x12345678(%ebp,%eax,1), %xmm0"); 3270 asm volatile("sha1msg2 0x12345678(%eax,%ecx,1), %xmm0"); 3271 asm volatile("sha1msg2 0x12345678(%eax,%ecx,8), %xmm0"); 3272 3273 /* sha256rnds2 <XMM0>, xmm2/m128, xmm1 */ 3274 /* Note sha256rnds2 has an implicit operand 'xmm0' */ 3275 3276 asm volatile("sha256rnds2 %xmm4, %xmm1"); 3277 asm volatile("sha256rnds2 %xmm7, %xmm2"); 3278 asm volatile("sha256rnds2 (%eax), %xmm1"); 3279 asm volatile("sha256rnds2 (0x12345678), %xmm1"); 3280 asm volatile("sha256rnds2 (%eax), %xmm3"); 3281 asm volatile("sha256rnds2 (%ecx,%eax,1), %xmm1"); 3282 asm volatile("sha256rnds2 0x12345678(,%eax,1), %xmm1"); 3283 asm volatile("sha256rnds2 (%eax,%ecx,1), %xmm1"); 3284 asm volatile("sha256rnds2 (%eax,%ecx,8), %xmm1"); 3285 asm volatile("sha256rnds2 0x12(%eax), %xmm1"); 3286 asm volatile("sha256rnds2 0x12(%ebp), %xmm1"); 3287 asm volatile("sha256rnds2 0x12(%ecx,%eax,1), %xmm1"); 3288 asm volatile("sha256rnds2 0x12(%ebp,%eax,1), %xmm1"); 3289 asm volatile("sha256rnds2 0x12(%eax,%ecx,1), %xmm1"); 3290 asm volatile("sha256rnds2 0x12(%eax,%ecx,8), %xmm1"); 3291 asm volatile("sha256rnds2 0x12345678(%eax), %xmm1"); 3292 asm volatile("sha256rnds2 0x12345678(%ebp), %xmm1"); 3293 asm volatile("sha256rnds2 0x12345678(%ecx,%eax,1), %xmm1"); 3294 asm volatile("sha256rnds2 0x12345678(%ebp,%eax,1), %xmm1"); 3295 asm volatile("sha256rnds2 0x12345678(%eax,%ecx,1), %xmm1"); 3296 asm volatile("sha256rnds2 0x12345678(%eax,%ecx,8), %xmm1"); 3297 3298 /* sha256msg1 xmm2/m128, xmm1 */ 3299 3300 asm volatile("sha256msg1 %xmm1, %xmm0"); 3301 asm volatile("sha256msg1 %xmm7, %xmm2"); 3302 asm volatile("sha256msg1 (%eax), %xmm0"); 3303 asm volatile("sha256msg1 (0x12345678), %xmm0"); 3304 asm volatile("sha256msg1 (%eax), %xmm3"); 3305 asm volatile("sha256msg1 (%ecx,%eax,1), %xmm0"); 3306 asm volatile("sha256msg1 0x12345678(,%eax,1), %xmm0"); 3307 asm volatile("sha256msg1 
(%eax,%ecx,1), %xmm0"); 3308 asm volatile("sha256msg1 (%eax,%ecx,8), %xmm0"); 3309 asm volatile("sha256msg1 0x12(%eax), %xmm0"); 3310 asm volatile("sha256msg1 0x12(%ebp), %xmm0"); 3311 asm volatile("sha256msg1 0x12(%ecx,%eax,1), %xmm0"); 3312 asm volatile("sha256msg1 0x12(%ebp,%eax,1), %xmm0"); 3313 asm volatile("sha256msg1 0x12(%eax,%ecx,1), %xmm0"); 3314 asm volatile("sha256msg1 0x12(%eax,%ecx,8), %xmm0"); 3315 asm volatile("sha256msg1 0x12345678(%eax), %xmm0"); 3316 asm volatile("sha256msg1 0x12345678(%ebp), %xmm0"); 3317 asm volatile("sha256msg1 0x12345678(%ecx,%eax,1), %xmm0"); 3318 asm volatile("sha256msg1 0x12345678(%ebp,%eax,1), %xmm0"); 3319 asm volatile("sha256msg1 0x12345678(%eax,%ecx,1), %xmm0"); 3320 asm volatile("sha256msg1 0x12345678(%eax,%ecx,8), %xmm0"); 3321 3322 /* sha256msg2 xmm2/m128, xmm1 */ 3323 3324 asm volatile("sha256msg2 %xmm1, %xmm0"); 3325 asm volatile("sha256msg2 %xmm7, %xmm2"); 3326 asm volatile("sha256msg2 (%eax), %xmm0"); 3327 asm volatile("sha256msg2 (0x12345678), %xmm0"); 3328 asm volatile("sha256msg2 (%eax), %xmm3"); 3329 asm volatile("sha256msg2 (%ecx,%eax,1), %xmm0"); 3330 asm volatile("sha256msg2 0x12345678(,%eax,1), %xmm0"); 3331 asm volatile("sha256msg2 (%eax,%ecx,1), %xmm0"); 3332 asm volatile("sha256msg2 (%eax,%ecx,8), %xmm0"); 3333 asm volatile("sha256msg2 0x12(%eax), %xmm0"); 3334 asm volatile("sha256msg2 0x12(%ebp), %xmm0"); 3335 asm volatile("sha256msg2 0x12(%ecx,%eax,1), %xmm0"); 3336 asm volatile("sha256msg2 0x12(%ebp,%eax,1), %xmm0"); 3337 asm volatile("sha256msg2 0x12(%eax,%ecx,1), %xmm0"); 3338 asm volatile("sha256msg2 0x12(%eax,%ecx,8), %xmm0"); 3339 asm volatile("sha256msg2 0x12345678(%eax), %xmm0"); 3340 asm volatile("sha256msg2 0x12345678(%ebp), %xmm0"); 3341 asm volatile("sha256msg2 0x12345678(%ecx,%eax,1), %xmm0"); 3342 asm volatile("sha256msg2 0x12345678(%ebp,%eax,1), %xmm0"); 3343 asm volatile("sha256msg2 0x12345678(%eax,%ecx,1), %xmm0"); 3344 asm volatile("sha256msg2 0x12345678(%eax,%ecx,8), %xmm0"); 3345 
3346 /* clflushopt m8 */ 3347 3348 asm volatile("clflushopt (%eax)"); 3349 asm volatile("clflushopt (0x12345678)"); 3350 asm volatile("clflushopt 0x12345678(%eax,%ecx,8)"); 3351 /* Also check instructions in the same group encoding as clflushopt */ 3352 asm volatile("clflush (%eax)"); 3353 asm volatile("sfence"); 3354 3355 /* clwb m8 */ 3356 3357 asm volatile("clwb (%eax)"); 3358 asm volatile("clwb (0x12345678)"); 3359 asm volatile("clwb 0x12345678(%eax,%ecx,8)"); 3360 /* Also check instructions in the same group encoding as clwb */ 3361 asm volatile("xsaveopt (%eax)"); 3362 asm volatile("mfence"); 3363 3364 /* cldemote m8 */ 3365 3366 asm volatile("cldemote (%eax)"); 3367 asm volatile("cldemote (0x12345678)"); 3368 asm volatile("cldemote 0x12345678(%eax,%ecx,8)"); 3369 3370 /* xsavec mem */ 3371 3372 asm volatile("xsavec (%eax)"); 3373 asm volatile("xsavec (0x12345678)"); 3374 asm volatile("xsavec 0x12345678(%eax,%ecx,8)"); 3375 3376 /* xsaves mem */ 3377 3378 asm volatile("xsaves (%eax)"); 3379 asm volatile("xsaves (0x12345678)"); 3380 asm volatile("xsaves 0x12345678(%eax,%ecx,8)"); 3381 3382 /* xrstors mem */ 3383 3384 asm volatile("xrstors (%eax)"); 3385 asm volatile("xrstors (0x12345678)"); 3386 asm volatile("xrstors 0x12345678(%eax,%ecx,8)"); 3387 3388 /* ptwrite */ 3389 3390 asm volatile("ptwrite (%eax)"); 3391 asm volatile("ptwrite (0x12345678)"); 3392 asm volatile("ptwrite 0x12345678(%eax,%ecx,8)"); 3393 3394 asm volatile("ptwritel (%eax)"); 3395 asm volatile("ptwritel (0x12345678)"); 3396 asm volatile("ptwritel 0x12345678(%eax,%ecx,8)"); 3397 3398 /* tpause */ 3399 3400 asm volatile("tpause %ebx"); 3401 3402 /* umonitor */ 3403 3404 asm volatile("umonitor %ax"); 3405 asm volatile("umonitor %eax"); 3406 3407 /* umwait */ 3408 3409 asm volatile("umwait %eax"); 3410 3411 /* movdiri */ 3412 3413 asm volatile("movdiri %eax,(%ebx)"); 3414 asm volatile("movdiri %ecx,0x12345678(%eax)"); 3415 3416 /* movdir64b */ 3417 3418 asm volatile("movdir64b (%eax),%ebx"); 
3419 asm volatile("movdir64b 0x12345678(%eax),%ecx"); 3420 asm volatile("movdir64b (%si),%bx"); 3421 asm volatile("movdir64b 0x1234(%si),%cx"); 3422 3423 /* enqcmd */ 3424 3425 asm volatile("enqcmd (%eax),%ebx"); 3426 asm volatile("enqcmd 0x12345678(%eax),%ecx"); 3427 asm volatile("enqcmd (%si),%bx"); 3428 asm volatile("enqcmd 0x1234(%si),%cx"); 3429 3430 /* enqcmds */ 3431 3432 asm volatile("enqcmds (%eax),%ebx"); 3433 asm volatile("enqcmds 0x12345678(%eax),%ecx"); 3434 asm volatile("enqcmds (%si),%bx"); 3435 asm volatile("enqcmds 0x1234(%si),%cx"); 3436 3437 #endif /* #ifndef __x86_64__ */ 3438 3439 /* SGX */ 3440 3441 asm volatile("encls"); 3442 asm volatile("enclu"); 3443 asm volatile("enclv"); 3444 3445 /* pconfig */ 3446 3447 asm volatile("pconfig"); 3448 3449 /* wbnoinvd */ 3450 3451 asm volatile("wbnoinvd"); 3452 3453 /* Following line is a marker for the awk script - do not change */ 3454 asm volatile("rdtsc"); /* Stop here */ 3455 3456 return 0; 3457 } 3458