1 /* 2 * This file contains instructions for testing by the test titled: 3 * 4 * "Test x86 instruction decoder - new instructions" 5 * 6 * Note that the 'Expecting' comment lines are consumed by the 7 * gen-insn-x86-dat.awk script and have the format: 8 * 9 * Expecting: <op> <branch> <rel> 10 * 11 * If this file is changed, remember to run the gen-insn-x86-dat.sh 12 * script and commit the result. 13 * 14 * Refer to insn-x86.c for more details. 15 */ 16 17 int main(void) 18 { 19 /* Following line is a marker for the awk script - do not change */ 20 asm volatile("rdtsc"); /* Start here */ 21 22 /* Test fix for vcvtph2ps in x86-opcode-map.txt */ 23 24 asm volatile("vcvtph2ps %xmm3,%ymm5"); 25 26 #ifdef __x86_64__ 27 28 /* AVX-512: Instructions with the same op codes as Mask Instructions */ 29 30 asm volatile("cmovno %rax,%rbx"); 31 asm volatile("cmovno 0x12345678(%rax),%rcx"); 32 asm volatile("cmovno 0x12345678(%rax),%cx"); 33 34 asm volatile("cmove %rax,%rbx"); 35 asm volatile("cmove 0x12345678(%rax),%rcx"); 36 asm volatile("cmove 0x12345678(%rax),%cx"); 37 38 asm volatile("seto 0x12345678(%rax)"); 39 asm volatile("setno 0x12345678(%rax)"); 40 asm volatile("setb 0x12345678(%rax)"); 41 asm volatile("setc 0x12345678(%rax)"); 42 asm volatile("setnae 0x12345678(%rax)"); 43 asm volatile("setae 0x12345678(%rax)"); 44 asm volatile("setnb 0x12345678(%rax)"); 45 asm volatile("setnc 0x12345678(%rax)"); 46 asm volatile("sets 0x12345678(%rax)"); 47 asm volatile("setns 0x12345678(%rax)"); 48 49 /* AVX-512: Mask Instructions */ 50 51 asm volatile("kandw %k7,%k6,%k5"); 52 asm volatile("kandq %k7,%k6,%k5"); 53 asm volatile("kandb %k7,%k6,%k5"); 54 asm volatile("kandd %k7,%k6,%k5"); 55 56 asm volatile("kandnw %k7,%k6,%k5"); 57 asm volatile("kandnq %k7,%k6,%k5"); 58 asm volatile("kandnb %k7,%k6,%k5"); 59 asm volatile("kandnd %k7,%k6,%k5"); 60 61 asm volatile("knotw %k7,%k6"); 62 asm volatile("knotq %k7,%k6"); 63 asm volatile("knotb %k7,%k6"); 64 asm volatile("knotd %k7,%k6"); 65 66 
asm volatile("korw %k7,%k6,%k5"); 67 asm volatile("korq %k7,%k6,%k5"); 68 asm volatile("korb %k7,%k6,%k5"); 69 asm volatile("kord %k7,%k6,%k5"); 70 71 asm volatile("kxnorw %k7,%k6,%k5"); 72 asm volatile("kxnorq %k7,%k6,%k5"); 73 asm volatile("kxnorb %k7,%k6,%k5"); 74 asm volatile("kxnord %k7,%k6,%k5"); 75 76 asm volatile("kxorw %k7,%k6,%k5"); 77 asm volatile("kxorq %k7,%k6,%k5"); 78 asm volatile("kxorb %k7,%k6,%k5"); 79 asm volatile("kxord %k7,%k6,%k5"); 80 81 asm volatile("kaddw %k7,%k6,%k5"); 82 asm volatile("kaddq %k7,%k6,%k5"); 83 asm volatile("kaddb %k7,%k6,%k5"); 84 asm volatile("kaddd %k7,%k6,%k5"); 85 86 asm volatile("kunpckbw %k7,%k6,%k5"); 87 asm volatile("kunpckwd %k7,%k6,%k5"); 88 asm volatile("kunpckdq %k7,%k6,%k5"); 89 90 asm volatile("kmovw %k6,%k5"); 91 asm volatile("kmovw (%rcx),%k5"); 92 asm volatile("kmovw 0x123(%rax,%r14,8),%k5"); 93 asm volatile("kmovw %k5,(%rcx)"); 94 asm volatile("kmovw %k5,0x123(%rax,%r14,8)"); 95 asm volatile("kmovw %eax,%k5"); 96 asm volatile("kmovw %ebp,%k5"); 97 asm volatile("kmovw %r13d,%k5"); 98 asm volatile("kmovw %k5,%eax"); 99 asm volatile("kmovw %k5,%ebp"); 100 asm volatile("kmovw %k5,%r13d"); 101 102 asm volatile("kmovq %k6,%k5"); 103 asm volatile("kmovq (%rcx),%k5"); 104 asm volatile("kmovq 0x123(%rax,%r14,8),%k5"); 105 asm volatile("kmovq %k5,(%rcx)"); 106 asm volatile("kmovq %k5,0x123(%rax,%r14,8)"); 107 asm volatile("kmovq %rax,%k5"); 108 asm volatile("kmovq %rbp,%k5"); 109 asm volatile("kmovq %r13,%k5"); 110 asm volatile("kmovq %k5,%rax"); 111 asm volatile("kmovq %k5,%rbp"); 112 asm volatile("kmovq %k5,%r13"); 113 114 asm volatile("kmovb %k6,%k5"); 115 asm volatile("kmovb (%rcx),%k5"); 116 asm volatile("kmovb 0x123(%rax,%r14,8),%k5"); 117 asm volatile("kmovb %k5,(%rcx)"); 118 asm volatile("kmovb %k5,0x123(%rax,%r14,8)"); 119 asm volatile("kmovb %eax,%k5"); 120 asm volatile("kmovb %ebp,%k5"); 121 asm volatile("kmovb %r13d,%k5"); 122 asm volatile("kmovb %k5,%eax"); 123 asm volatile("kmovb %k5,%ebp"); 124 asm 
volatile("kmovb %k5,%r13d"); 125 126 asm volatile("kmovd %k6,%k5"); 127 asm volatile("kmovd (%rcx),%k5"); 128 asm volatile("kmovd 0x123(%rax,%r14,8),%k5"); 129 asm volatile("kmovd %k5,(%rcx)"); 130 asm volatile("kmovd %k5,0x123(%rax,%r14,8)"); 131 asm volatile("kmovd %eax,%k5"); 132 asm volatile("kmovd %ebp,%k5"); 133 asm volatile("kmovd %r13d,%k5"); 134 asm volatile("kmovd %k5,%eax"); 135 asm volatile("kmovd %k5,%ebp"); 136 asm volatile("kmovd %k5,%r13d"); 137 138 asm volatile("kortestw %k6,%k5"); 139 asm volatile("kortestq %k6,%k5"); 140 asm volatile("kortestb %k6,%k5"); 141 asm volatile("kortestd %k6,%k5"); 142 143 asm volatile("ktestw %k6,%k5"); 144 asm volatile("ktestq %k6,%k5"); 145 asm volatile("ktestb %k6,%k5"); 146 asm volatile("ktestd %k6,%k5"); 147 148 asm volatile("kshiftrw $0x12,%k6,%k5"); 149 asm volatile("kshiftrq $0x5b,%k6,%k5"); 150 asm volatile("kshiftlw $0x12,%k6,%k5"); 151 asm volatile("kshiftlq $0x5b,%k6,%k5"); 152 153 /* AVX-512: Op code 0f 5b */ 154 asm volatile("vcvtdq2ps %xmm5,%xmm6"); 155 asm volatile("vcvtqq2ps %zmm29,%ymm6{%k7}"); 156 asm volatile("vcvtps2dq %xmm5,%xmm6"); 157 asm volatile("vcvttps2dq %xmm5,%xmm6"); 158 159 /* AVX-512: Op code 0f 6f */ 160 161 asm volatile("movq %mm0,%mm4"); 162 asm volatile("vmovdqa %ymm4,%ymm6"); 163 asm volatile("vmovdqa32 %zmm25,%zmm26"); 164 asm volatile("vmovdqa64 %zmm25,%zmm26"); 165 asm volatile("vmovdqu %ymm4,%ymm6"); 166 asm volatile("vmovdqu32 %zmm29,%zmm30"); 167 asm volatile("vmovdqu64 %zmm25,%zmm26"); 168 asm volatile("vmovdqu8 %zmm29,%zmm30"); 169 asm volatile("vmovdqu16 %zmm25,%zmm26"); 170 171 /* AVX-512: Op code 0f 78 */ 172 173 asm volatile("vmread %rax,%rbx"); 174 asm volatile("vcvttps2udq %zmm25,%zmm26"); 175 asm volatile("vcvttpd2udq %zmm29,%ymm6{%k7}"); 176 asm volatile("vcvttsd2usi %xmm6,%rax"); 177 asm volatile("vcvttss2usi %xmm6,%rax"); 178 asm volatile("vcvttps2uqq %ymm5,%zmm26{%k7}"); 179 asm volatile("vcvttpd2uqq %zmm29,%zmm30"); 180 181 /* AVX-512: Op code 0f 79 */ 182 183 
asm volatile("vmwrite %rax,%rbx"); 184 asm volatile("vcvtps2udq %zmm25,%zmm26"); 185 asm volatile("vcvtpd2udq %zmm29,%ymm6{%k7}"); 186 asm volatile("vcvtsd2usi %xmm6,%rax"); 187 asm volatile("vcvtss2usi %xmm6,%rax"); 188 asm volatile("vcvtps2uqq %ymm5,%zmm26{%k7}"); 189 asm volatile("vcvtpd2uqq %zmm29,%zmm30"); 190 191 /* AVX-512: Op code 0f 7a */ 192 193 asm volatile("vcvtudq2pd %ymm5,%zmm29{%k7}"); 194 asm volatile("vcvtuqq2pd %zmm25,%zmm26"); 195 asm volatile("vcvtudq2ps %zmm29,%zmm30"); 196 asm volatile("vcvtuqq2ps %zmm25,%ymm26{%k7}"); 197 asm volatile("vcvttps2qq %ymm25,%zmm26{%k7}"); 198 asm volatile("vcvttpd2qq %zmm29,%zmm30"); 199 200 /* AVX-512: Op code 0f 7b */ 201 202 asm volatile("vcvtusi2sd %eax,%xmm5,%xmm6"); 203 asm volatile("vcvtusi2ss %eax,%xmm5,%xmm6"); 204 asm volatile("vcvtps2qq %ymm5,%zmm26{%k7}"); 205 asm volatile("vcvtpd2qq %zmm29,%zmm30"); 206 207 /* AVX-512: Op code 0f 7f */ 208 209 asm volatile("movq.s %mm0,%mm4"); 210 asm volatile("vmovdqa %ymm8,%ymm6"); 211 asm volatile("vmovdqa32.s %zmm25,%zmm26"); 212 asm volatile("vmovdqa64.s %zmm25,%zmm26"); 213 asm volatile("vmovdqu %ymm8,%ymm6"); 214 asm volatile("vmovdqu32.s %zmm25,%zmm26"); 215 asm volatile("vmovdqu64.s %zmm25,%zmm26"); 216 asm volatile("vmovdqu8.s %zmm30,(%rcx)"); 217 asm volatile("vmovdqu16.s %zmm25,%zmm26"); 218 219 /* AVX-512: Op code 0f db */ 220 221 asm volatile("pand %mm1,%mm2"); 222 asm volatile("pand %xmm1,%xmm2"); 223 asm volatile("vpand %ymm4,%ymm6,%ymm2"); 224 asm volatile("vpandd %zmm24,%zmm25,%zmm26"); 225 asm volatile("vpandq %zmm24,%zmm25,%zmm26"); 226 227 /* AVX-512: Op code 0f df */ 228 229 asm volatile("pandn %mm1,%mm2"); 230 asm volatile("pandn %xmm1,%xmm2"); 231 asm volatile("vpandn %ymm4,%ymm6,%ymm2"); 232 asm volatile("vpandnd %zmm24,%zmm25,%zmm26"); 233 asm volatile("vpandnq %zmm24,%zmm25,%zmm26"); 234 235 /* AVX-512: Op code 0f e6 */ 236 237 asm volatile("vcvttpd2dq %xmm1,%xmm2"); 238 asm volatile("vcvtdq2pd %xmm5,%xmm6"); 239 asm volatile("vcvtdq2pd 
%ymm5,%zmm26{%k7}"); 240 asm volatile("vcvtqq2pd %zmm25,%zmm26"); 241 asm volatile("vcvtpd2dq %xmm1,%xmm2"); 242 243 /* AVX-512: Op code 0f eb */ 244 245 asm volatile("por %mm4,%mm6"); 246 asm volatile("vpor %ymm4,%ymm6,%ymm2"); 247 asm volatile("vpord %zmm24,%zmm25,%zmm26"); 248 asm volatile("vporq %zmm24,%zmm25,%zmm26"); 249 250 /* AVX-512: Op code 0f ef */ 251 252 asm volatile("pxor %mm4,%mm6"); 253 asm volatile("vpxor %ymm4,%ymm6,%ymm2"); 254 asm volatile("vpxord %zmm24,%zmm25,%zmm26"); 255 asm volatile("vpxorq %zmm24,%zmm25,%zmm26"); 256 257 /* AVX-512: Op code 0f 38 10 */ 258 259 asm volatile("pblendvb %xmm1,%xmm0"); 260 asm volatile("vpsrlvw %zmm27,%zmm28,%zmm29"); 261 asm volatile("vpmovuswb %zmm28,%ymm6{%k7}"); 262 263 /* AVX-512: Op code 0f 38 11 */ 264 265 asm volatile("vpmovusdb %zmm28,%xmm6{%k7}"); 266 asm volatile("vpsravw %zmm27,%zmm28,%zmm29"); 267 268 /* AVX-512: Op code 0f 38 12 */ 269 270 asm volatile("vpmovusqb %zmm27,%xmm6{%k7}"); 271 asm volatile("vpsllvw %zmm27,%zmm28,%zmm29"); 272 273 /* AVX-512: Op code 0f 38 13 */ 274 275 asm volatile("vcvtph2ps %xmm3,%ymm5"); 276 asm volatile("vcvtph2ps %ymm5,%zmm27{%k7}"); 277 asm volatile("vpmovusdw %zmm27,%ymm6{%k7}"); 278 279 /* AVX-512: Op code 0f 38 14 */ 280 281 asm volatile("blendvps %xmm1,%xmm0"); 282 asm volatile("vpmovusqw %zmm27,%xmm6{%k7}"); 283 asm volatile("vprorvd %zmm27,%zmm28,%zmm29"); 284 asm volatile("vprorvq %zmm27,%zmm28,%zmm29"); 285 286 /* AVX-512: Op code 0f 38 15 */ 287 288 asm volatile("blendvpd %xmm1,%xmm0"); 289 asm volatile("vpmovusqd %zmm27,%ymm6{%k7}"); 290 asm volatile("vprolvd %zmm27,%zmm28,%zmm29"); 291 asm volatile("vprolvq %zmm27,%zmm28,%zmm29"); 292 293 /* AVX-512: Op code 0f 38 16 */ 294 295 asm volatile("vpermps %ymm4,%ymm6,%ymm2"); 296 asm volatile("vpermps %ymm24,%ymm26,%ymm22{%k7}"); 297 asm volatile("vpermpd %ymm24,%ymm26,%ymm22{%k7}"); 298 299 /* AVX-512: Op code 0f 38 19 */ 300 301 asm volatile("vbroadcastsd %xmm4,%ymm6"); 302 asm volatile("vbroadcastf32x2 
%xmm27,%zmm26"); 303 304 /* AVX-512: Op code 0f 38 1a */ 305 306 asm volatile("vbroadcastf128 (%rcx),%ymm4"); 307 asm volatile("vbroadcastf32x4 (%rcx),%zmm26"); 308 asm volatile("vbroadcastf64x2 (%rcx),%zmm26"); 309 310 /* AVX-512: Op code 0f 38 1b */ 311 312 asm volatile("vbroadcastf32x8 (%rcx),%zmm27"); 313 asm volatile("vbroadcastf64x4 (%rcx),%zmm26"); 314 315 /* AVX-512: Op code 0f 38 1f */ 316 317 asm volatile("vpabsq %zmm27,%zmm28"); 318 319 /* AVX-512: Op code 0f 38 20 */ 320 321 asm volatile("vpmovsxbw %xmm4,%xmm5"); 322 asm volatile("vpmovswb %zmm27,%ymm6{%k7}"); 323 324 /* AVX-512: Op code 0f 38 21 */ 325 326 asm volatile("vpmovsxbd %xmm4,%ymm6"); 327 asm volatile("vpmovsdb %zmm27,%xmm6{%k7}"); 328 329 /* AVX-512: Op code 0f 38 22 */ 330 331 asm volatile("vpmovsxbq %xmm4,%ymm4"); 332 asm volatile("vpmovsqb %zmm27,%xmm6{%k7}"); 333 334 /* AVX-512: Op code 0f 38 23 */ 335 336 asm volatile("vpmovsxwd %xmm4,%ymm4"); 337 asm volatile("vpmovsdw %zmm27,%ymm6{%k7}"); 338 339 /* AVX-512: Op code 0f 38 24 */ 340 341 asm volatile("vpmovsxwq %xmm4,%ymm6"); 342 asm volatile("vpmovsqw %zmm27,%xmm6{%k7}"); 343 344 /* AVX-512: Op code 0f 38 25 */ 345 346 asm volatile("vpmovsxdq %xmm4,%ymm4"); 347 asm volatile("vpmovsqd %zmm27,%ymm6{%k7}"); 348 349 /* AVX-512: Op code 0f 38 26 */ 350 351 asm volatile("vptestmb %zmm27,%zmm28,%k5"); 352 asm volatile("vptestmw %zmm27,%zmm28,%k5"); 353 asm volatile("vptestnmb %zmm26,%zmm27,%k5"); 354 asm volatile("vptestnmw %zmm26,%zmm27,%k5"); 355 356 /* AVX-512: Op code 0f 38 27 */ 357 358 asm volatile("vptestmd %zmm27,%zmm28,%k5"); 359 asm volatile("vptestmq %zmm27,%zmm28,%k5"); 360 asm volatile("vptestnmd %zmm26,%zmm27,%k5"); 361 asm volatile("vptestnmq %zmm26,%zmm27,%k5"); 362 363 /* AVX-512: Op code 0f 38 28 */ 364 365 asm volatile("vpmuldq %ymm4,%ymm6,%ymm2"); 366 asm volatile("vpmovm2b %k5,%zmm28"); 367 asm volatile("vpmovm2w %k5,%zmm28"); 368 369 /* AVX-512: Op code 0f 38 29 */ 370 371 asm volatile("vpcmpeqq %ymm4,%ymm6,%ymm2"); 372 
asm volatile("vpmovb2m %zmm28,%k5"); 373 asm volatile("vpmovw2m %zmm28,%k5"); 374 375 /* AVX-512: Op code 0f 38 2a */ 376 377 asm volatile("vmovntdqa (%rcx),%ymm4"); 378 asm volatile("vpbroadcastmb2q %k6,%zmm30"); 379 380 /* AVX-512: Op code 0f 38 2c */ 381 382 asm volatile("vmaskmovps (%rcx),%ymm4,%ymm6"); 383 asm volatile("vscalefps %zmm24,%zmm25,%zmm26"); 384 asm volatile("vscalefpd %zmm24,%zmm25,%zmm26"); 385 386 /* AVX-512: Op code 0f 38 2d */ 387 388 asm volatile("vmaskmovpd (%rcx),%ymm4,%ymm6"); 389 asm volatile("vscalefss %xmm24,%xmm25,%xmm26{%k7}"); 390 asm volatile("vscalefsd %xmm24,%xmm25,%xmm26{%k7}"); 391 392 /* AVX-512: Op code 0f 38 30 */ 393 394 asm volatile("vpmovzxbw %xmm4,%ymm4"); 395 asm volatile("vpmovwb %zmm27,%ymm6{%k7}"); 396 397 /* AVX-512: Op code 0f 38 31 */ 398 399 asm volatile("vpmovzxbd %xmm4,%ymm6"); 400 asm volatile("vpmovdb %zmm27,%xmm6{%k7}"); 401 402 /* AVX-512: Op code 0f 38 32 */ 403 404 asm volatile("vpmovzxbq %xmm4,%ymm4"); 405 asm volatile("vpmovqb %zmm27,%xmm6{%k7}"); 406 407 /* AVX-512: Op code 0f 38 33 */ 408 409 asm volatile("vpmovzxwd %xmm4,%ymm4"); 410 asm volatile("vpmovdw %zmm27,%ymm6{%k7}"); 411 412 /* AVX-512: Op code 0f 38 34 */ 413 414 asm volatile("vpmovzxwq %xmm4,%ymm6"); 415 asm volatile("vpmovqw %zmm27,%xmm6{%k7}"); 416 417 /* AVX-512: Op code 0f 38 35 */ 418 419 asm volatile("vpmovzxdq %xmm4,%ymm4"); 420 asm volatile("vpmovqd %zmm27,%ymm6{%k7}"); 421 422 /* AVX-512: Op code 0f 38 36 */ 423 424 asm volatile("vpermd %ymm4,%ymm6,%ymm2"); 425 asm volatile("vpermd %ymm24,%ymm26,%ymm22{%k7}"); 426 asm volatile("vpermq %ymm24,%ymm26,%ymm22{%k7}"); 427 428 /* AVX-512: Op code 0f 38 38 */ 429 430 asm volatile("vpminsb %ymm4,%ymm6,%ymm2"); 431 asm volatile("vpmovm2d %k5,%zmm28"); 432 asm volatile("vpmovm2q %k5,%zmm28"); 433 434 /* AVX-512: Op code 0f 38 39 */ 435 436 asm volatile("vpminsd %xmm1,%xmm2,%xmm3"); 437 asm volatile("vpminsd %zmm24,%zmm25,%zmm26"); 438 asm volatile("vpminsq %zmm24,%zmm25,%zmm26"); 439 asm 
volatile("vpmovd2m %zmm28,%k5"); 440 asm volatile("vpmovq2m %zmm28,%k5"); 441 442 /* AVX-512: Op code 0f 38 3a */ 443 444 asm volatile("vpminuw %ymm4,%ymm6,%ymm2"); 445 asm volatile("vpbroadcastmw2d %k6,%zmm28"); 446 447 /* AVX-512: Op code 0f 38 3b */ 448 449 asm volatile("vpminud %ymm4,%ymm6,%ymm2"); 450 asm volatile("vpminud %zmm24,%zmm25,%zmm26"); 451 asm volatile("vpminuq %zmm24,%zmm25,%zmm26"); 452 453 /* AVX-512: Op code 0f 38 3d */ 454 455 asm volatile("vpmaxsd %ymm4,%ymm6,%ymm2"); 456 asm volatile("vpmaxsd %zmm24,%zmm25,%zmm26"); 457 asm volatile("vpmaxsq %zmm24,%zmm25,%zmm26"); 458 459 /* AVX-512: Op code 0f 38 3f */ 460 461 asm volatile("vpmaxud %ymm4,%ymm6,%ymm2"); 462 asm volatile("vpmaxud %zmm24,%zmm25,%zmm26"); 463 asm volatile("vpmaxuq %zmm24,%zmm25,%zmm26"); 464 465 /* AVX-512: Op code 0f 38 40 */ 466 467 asm volatile("vpmulld %ymm4,%ymm6,%ymm2"); 468 asm volatile("vpmulld %zmm24,%zmm25,%zmm26"); 469 asm volatile("vpmullq %zmm24,%zmm25,%zmm26"); 470 471 /* AVX-512: Op code 0f 38 42 */ 472 473 asm volatile("vgetexpps %zmm25,%zmm26"); 474 asm volatile("vgetexppd %zmm27,%zmm28"); 475 476 /* AVX-512: Op code 0f 38 43 */ 477 478 asm volatile("vgetexpss %xmm24,%xmm25,%xmm26{%k7}"); 479 asm volatile("vgetexpsd %xmm28,%xmm29,%xmm30{%k7}"); 480 481 /* AVX-512: Op code 0f 38 44 */ 482 483 asm volatile("vplzcntd %zmm27,%zmm28"); 484 asm volatile("vplzcntq %zmm27,%zmm28"); 485 486 /* AVX-512: Op code 0f 38 46 */ 487 488 asm volatile("vpsravd %ymm4,%ymm6,%ymm2"); 489 asm volatile("vpsravd %zmm24,%zmm25,%zmm26"); 490 asm volatile("vpsravq %zmm24,%zmm25,%zmm26"); 491 492 /* AVX-512: Op code 0f 38 4c */ 493 494 asm volatile("vrcp14ps %zmm25,%zmm26"); 495 asm volatile("vrcp14pd %zmm27,%zmm28"); 496 497 /* AVX-512: Op code 0f 38 4d */ 498 499 asm volatile("vrcp14ss %xmm24,%xmm25,%xmm26{%k7}"); 500 asm volatile("vrcp14sd %xmm24,%xmm25,%xmm26{%k7}"); 501 502 /* AVX-512: Op code 0f 38 4e */ 503 504 asm volatile("vrsqrt14ps %zmm25,%zmm26"); 505 asm volatile("vrsqrt14pd 
%zmm27,%zmm28"); 506 507 /* AVX-512: Op code 0f 38 4f */ 508 509 asm volatile("vrsqrt14ss %xmm24,%xmm25,%xmm26{%k7}"); 510 asm volatile("vrsqrt14sd %xmm24,%xmm25,%xmm26{%k7}"); 511 512 /* AVX-512: Op code 0f 38 59 */ 513 514 asm volatile("vpbroadcastq %xmm4,%xmm6"); 515 asm volatile("vbroadcasti32x2 %xmm27,%zmm26"); 516 517 /* AVX-512: Op code 0f 38 5a */ 518 519 asm volatile("vbroadcasti128 (%rcx),%ymm4"); 520 asm volatile("vbroadcasti32x4 (%rcx),%zmm26"); 521 asm volatile("vbroadcasti64x2 (%rcx),%zmm26"); 522 523 /* AVX-512: Op code 0f 38 5b */ 524 525 asm volatile("vbroadcasti32x8 (%rcx),%zmm28"); 526 asm volatile("vbroadcasti64x4 (%rcx),%zmm26"); 527 528 /* AVX-512: Op code 0f 38 64 */ 529 530 asm volatile("vpblendmd %zmm26,%zmm27,%zmm28"); 531 asm volatile("vpblendmq %zmm26,%zmm27,%zmm28"); 532 533 /* AVX-512: Op code 0f 38 65 */ 534 535 asm volatile("vblendmps %zmm24,%zmm25,%zmm26"); 536 asm volatile("vblendmpd %zmm26,%zmm27,%zmm28"); 537 538 /* AVX-512: Op code 0f 38 66 */ 539 540 asm volatile("vpblendmb %zmm26,%zmm27,%zmm28"); 541 asm volatile("vpblendmw %zmm26,%zmm27,%zmm28"); 542 543 /* AVX-512: Op code 0f 38 75 */ 544 545 asm volatile("vpermi2b %zmm24,%zmm25,%zmm26"); 546 asm volatile("vpermi2w %zmm26,%zmm27,%zmm28"); 547 548 /* AVX-512: Op code 0f 38 76 */ 549 550 asm volatile("vpermi2d %zmm26,%zmm27,%zmm28"); 551 asm volatile("vpermi2q %zmm26,%zmm27,%zmm28"); 552 553 /* AVX-512: Op code 0f 38 77 */ 554 555 asm volatile("vpermi2ps %zmm26,%zmm27,%zmm28"); 556 asm volatile("vpermi2pd %zmm26,%zmm27,%zmm28"); 557 558 /* AVX-512: Op code 0f 38 7a */ 559 560 asm volatile("vpbroadcastb %eax,%xmm30"); 561 562 /* AVX-512: Op code 0f 38 7b */ 563 564 asm volatile("vpbroadcastw %eax,%xmm30"); 565 566 /* AVX-512: Op code 0f 38 7c */ 567 568 asm volatile("vpbroadcastd %eax,%xmm30"); 569 asm volatile("vpbroadcastq %rax,%zmm30"); 570 571 /* AVX-512: Op code 0f 38 7d */ 572 573 asm volatile("vpermt2b %zmm26,%zmm27,%zmm28"); 574 asm volatile("vpermt2w 
%zmm26,%zmm27,%zmm28"); 575 576 /* AVX-512: Op code 0f 38 7e */ 577 578 asm volatile("vpermt2d %zmm26,%zmm27,%zmm28"); 579 asm volatile("vpermt2q %zmm26,%zmm27,%zmm28"); 580 581 /* AVX-512: Op code 0f 38 7f */ 582 583 asm volatile("vpermt2ps %zmm26,%zmm27,%zmm28"); 584 asm volatile("vpermt2pd %zmm26,%zmm27,%zmm28"); 585 586 /* AVX-512: Op code 0f 38 83 */ 587 588 asm volatile("vpmultishiftqb %zmm26,%zmm27,%zmm28"); 589 590 /* AVX-512: Op code 0f 38 88 */ 591 592 asm volatile("vexpandps (%rcx),%zmm26"); 593 asm volatile("vexpandpd (%rcx),%zmm28"); 594 595 /* AVX-512: Op code 0f 38 89 */ 596 597 asm volatile("vpexpandd (%rcx),%zmm28"); 598 asm volatile("vpexpandq (%rcx),%zmm26"); 599 600 /* AVX-512: Op code 0f 38 8a */ 601 602 asm volatile("vcompressps %zmm28,(%rcx)"); 603 asm volatile("vcompresspd %zmm28,(%rcx)"); 604 605 /* AVX-512: Op code 0f 38 8b */ 606 607 asm volatile("vpcompressd %zmm28,(%rcx)"); 608 asm volatile("vpcompressq %zmm26,(%rcx)"); 609 610 /* AVX-512: Op code 0f 38 8d */ 611 612 asm volatile("vpermb %zmm26,%zmm27,%zmm28"); 613 asm volatile("vpermw %zmm26,%zmm27,%zmm28"); 614 615 /* AVX-512: Op code 0f 38 90 */ 616 617 asm volatile("vpgatherdd %xmm2,0x02(%rbp,%xmm7,2),%xmm1"); 618 asm volatile("vpgatherdq %xmm2,0x04(%rbp,%xmm7,2),%xmm1"); 619 asm volatile("vpgatherdd 0x7b(%rbp,%zmm27,8),%zmm26{%k1}"); 620 asm volatile("vpgatherdq 0x7b(%rbp,%ymm27,8),%zmm26{%k1}"); 621 622 /* AVX-512: Op code 0f 38 91 */ 623 624 asm volatile("vpgatherqd %xmm2,0x02(%rbp,%xmm7,2),%xmm1"); 625 asm volatile("vpgatherqq %xmm2,0x02(%rbp,%xmm7,2),%xmm1"); 626 asm volatile("vpgatherqd 0x7b(%rbp,%zmm27,8),%ymm26{%k1}"); 627 asm volatile("vpgatherqq 0x7b(%rbp,%zmm27,8),%zmm26{%k1}"); 628 629 /* AVX-512: Op code 0f 38 a0 */ 630 631 asm volatile("vpscatterdd %zmm28,0x7b(%rbp,%zmm29,8){%k1}"); 632 asm volatile("vpscatterdq %zmm26,0x7b(%rbp,%ymm27,8){%k1}"); 633 634 /* AVX-512: Op code 0f 38 a1 */ 635 636 asm volatile("vpscatterqd %ymm6,0x7b(%rbp,%zmm29,8){%k1}"); 637 asm 
volatile("vpscatterqq %ymm6,0x7b(%rbp,%ymm27,8){%k1}"); 638 639 /* AVX-512: Op code 0f 38 a2 */ 640 641 asm volatile("vscatterdps %zmm28,0x7b(%rbp,%zmm29,8){%k1}"); 642 asm volatile("vscatterdpd %zmm28,0x7b(%rbp,%ymm27,8){%k1}"); 643 644 /* AVX-512: Op code 0f 38 a3 */ 645 646 asm volatile("vscatterqps %ymm6,0x7b(%rbp,%zmm29,8){%k1}"); 647 asm volatile("vscatterqpd %zmm28,0x7b(%rbp,%zmm29,8){%k1}"); 648 649 /* AVX-512: Op code 0f 38 b4 */ 650 651 asm volatile("vpmadd52luq %zmm26,%zmm27,%zmm28"); 652 653 /* AVX-512: Op code 0f 38 b5 */ 654 655 asm volatile("vpmadd52huq %zmm26,%zmm27,%zmm28"); 656 657 /* AVX-512: Op code 0f 38 c4 */ 658 659 asm volatile("vpconflictd %zmm26,%zmm27"); 660 asm volatile("vpconflictq %zmm26,%zmm27"); 661 662 /* AVX-512: Op code 0f 38 c8 */ 663 664 asm volatile("vexp2ps %zmm29,%zmm30"); 665 asm volatile("vexp2pd %zmm26,%zmm27"); 666 667 /* AVX-512: Op code 0f 38 ca */ 668 669 asm volatile("vrcp28ps %zmm29,%zmm30"); 670 asm volatile("vrcp28pd %zmm26,%zmm27"); 671 672 /* AVX-512: Op code 0f 38 cb */ 673 674 asm volatile("vrcp28ss %xmm28,%xmm29,%xmm30{%k7}"); 675 asm volatile("vrcp28sd %xmm25,%xmm26,%xmm27{%k7}"); 676 677 /* AVX-512: Op code 0f 38 cc */ 678 679 asm volatile("vrsqrt28ps %zmm29,%zmm30"); 680 asm volatile("vrsqrt28pd %zmm26,%zmm27"); 681 682 /* AVX-512: Op code 0f 38 cd */ 683 684 asm volatile("vrsqrt28ss %xmm28,%xmm29,%xmm30{%k7}"); 685 asm volatile("vrsqrt28sd %xmm25,%xmm26,%xmm27{%k7}"); 686 687 /* AVX-512: Op code 0f 3a 03 */ 688 689 asm volatile("valignd $0x12,%zmm28,%zmm29,%zmm30"); 690 asm volatile("valignq $0x12,%zmm25,%zmm26,%zmm27"); 691 692 /* AVX-512: Op code 0f 3a 08 */ 693 694 asm volatile("vroundps $0x5,%ymm6,%ymm2"); 695 asm volatile("vrndscaleps $0x12,%zmm25,%zmm26"); 696 697 /* AVX-512: Op code 0f 3a 09 */ 698 699 asm volatile("vroundpd $0x5,%ymm6,%ymm2"); 700 asm volatile("vrndscalepd $0x12,%zmm25,%zmm26"); 701 702 /* AVX-512: Op code 0f 3a 0a */ 703 704 asm volatile("vroundss $0x5,%xmm4,%xmm6,%xmm2"); 705 asm 
volatile("vrndscaless $0x12,%xmm24,%xmm25,%xmm26{%k7}"); 706 707 /* AVX-512: Op code 0f 3a 0b */ 708 709 asm volatile("vroundsd $0x5,%xmm4,%xmm6,%xmm2"); 710 asm volatile("vrndscalesd $0x12,%xmm24,%xmm25,%xmm26{%k7}"); 711 712 /* AVX-512: Op code 0f 3a 18 */ 713 714 asm volatile("vinsertf128 $0x5,%xmm4,%ymm4,%ymm6"); 715 asm volatile("vinsertf32x4 $0x12,%xmm24,%zmm25,%zmm26{%k7}"); 716 asm volatile("vinsertf64x2 $0x12,%xmm24,%zmm25,%zmm26{%k7}"); 717 718 /* AVX-512: Op code 0f 3a 19 */ 719 720 asm volatile("vextractf128 $0x5,%ymm4,%xmm4"); 721 asm volatile("vextractf32x4 $0x12,%zmm25,%xmm26{%k7}"); 722 asm volatile("vextractf64x2 $0x12,%zmm25,%xmm26{%k7}"); 723 724 /* AVX-512: Op code 0f 3a 1a */ 725 726 asm volatile("vinsertf32x8 $0x12,%ymm25,%zmm26,%zmm27{%k7}"); 727 asm volatile("vinsertf64x4 $0x12,%ymm28,%zmm29,%zmm30{%k7}"); 728 729 /* AVX-512: Op code 0f 3a 1b */ 730 731 asm volatile("vextractf32x8 $0x12,%zmm29,%ymm30{%k7}"); 732 asm volatile("vextractf64x4 $0x12,%zmm26,%ymm27{%k7}"); 733 734 /* AVX-512: Op code 0f 3a 1e */ 735 736 asm volatile("vpcmpud $0x12,%zmm29,%zmm30,%k5"); 737 asm volatile("vpcmpuq $0x12,%zmm26,%zmm27,%k5"); 738 739 /* AVX-512: Op code 0f 3a 1f */ 740 741 asm volatile("vpcmpd $0x12,%zmm29,%zmm30,%k5"); 742 asm volatile("vpcmpq $0x12,%zmm26,%zmm27,%k5"); 743 744 /* AVX-512: Op code 0f 3a 23 */ 745 746 asm volatile("vshuff32x4 $0x12,%zmm28,%zmm29,%zmm30"); 747 asm volatile("vshuff64x2 $0x12,%zmm25,%zmm26,%zmm27"); 748 749 /* AVX-512: Op code 0f 3a 25 */ 750 751 asm volatile("vpternlogd $0x12,%zmm28,%zmm29,%zmm30"); 752 asm volatile("vpternlogq $0x12,%zmm28,%zmm29,%zmm30"); 753 754 /* AVX-512: Op code 0f 3a 26 */ 755 756 asm volatile("vgetmantps $0x12,%zmm26,%zmm27"); 757 asm volatile("vgetmantpd $0x12,%zmm29,%zmm30"); 758 759 /* AVX-512: Op code 0f 3a 27 */ 760 761 asm volatile("vgetmantss $0x12,%xmm25,%xmm26,%xmm27{%k7}"); 762 asm volatile("vgetmantsd $0x12,%xmm28,%xmm29,%xmm30{%k7}"); 763 764 /* AVX-512: Op code 0f 3a 38 */ 765 766 asm 
volatile("vinserti128 $0x5,%xmm4,%ymm4,%ymm6"); 767 asm volatile("vinserti32x4 $0x12,%xmm24,%zmm25,%zmm26{%k7}"); 768 asm volatile("vinserti64x2 $0x12,%xmm24,%zmm25,%zmm26{%k7}"); 769 770 /* AVX-512: Op code 0f 3a 39 */ 771 772 asm volatile("vextracti128 $0x5,%ymm4,%xmm6"); 773 asm volatile("vextracti32x4 $0x12,%zmm25,%xmm26{%k7}"); 774 asm volatile("vextracti64x2 $0x12,%zmm25,%xmm26{%k7}"); 775 776 /* AVX-512: Op code 0f 3a 3a */ 777 778 asm volatile("vinserti32x8 $0x12,%ymm28,%zmm29,%zmm30{%k7}"); 779 asm volatile("vinserti64x4 $0x12,%ymm25,%zmm26,%zmm27{%k7}"); 780 781 /* AVX-512: Op code 0f 3a 3b */ 782 783 asm volatile("vextracti32x8 $0x12,%zmm29,%ymm30{%k7}"); 784 asm volatile("vextracti64x4 $0x12,%zmm26,%ymm27{%k7}"); 785 786 /* AVX-512: Op code 0f 3a 3e */ 787 788 asm volatile("vpcmpub $0x12,%zmm29,%zmm30,%k5"); 789 asm volatile("vpcmpuw $0x12,%zmm26,%zmm27,%k5"); 790 791 /* AVX-512: Op code 0f 3a 3f */ 792 793 asm volatile("vpcmpb $0x12,%zmm29,%zmm30,%k5"); 794 asm volatile("vpcmpw $0x12,%zmm26,%zmm27,%k5"); 795 796 /* AVX-512: Op code 0f 3a 42 */ 797 798 asm volatile("vmpsadbw $0x5,%ymm4,%ymm6,%ymm2"); 799 asm volatile("vdbpsadbw $0x12,%zmm4,%zmm5,%zmm6"); 800 801 /* AVX-512: Op code 0f 3a 43 */ 802 803 asm volatile("vshufi32x4 $0x12,%zmm25,%zmm26,%zmm27"); 804 asm volatile("vshufi64x2 $0x12,%zmm28,%zmm29,%zmm30"); 805 806 /* AVX-512: Op code 0f 3a 50 */ 807 808 asm volatile("vrangeps $0x12,%zmm25,%zmm26,%zmm27"); 809 asm volatile("vrangepd $0x12,%zmm28,%zmm29,%zmm30"); 810 811 /* AVX-512: Op code 0f 3a 51 */ 812 813 asm volatile("vrangess $0x12,%xmm25,%xmm26,%xmm27"); 814 asm volatile("vrangesd $0x12,%xmm28,%xmm29,%xmm30"); 815 816 /* AVX-512: Op code 0f 3a 54 */ 817 818 asm volatile("vfixupimmps $0x12,%zmm28,%zmm29,%zmm30"); 819 asm volatile("vfixupimmpd $0x12,%zmm25,%zmm26,%zmm27"); 820 821 /* AVX-512: Op code 0f 3a 55 */ 822 823 asm volatile("vfixupimmss $0x12,%xmm28,%xmm29,%xmm30{%k7}"); 824 asm volatile("vfixupimmsd 
$0x12,%xmm25,%xmm26,%xmm27{%k7}"); 825 826 /* AVX-512: Op code 0f 3a 56 */ 827 828 asm volatile("vreduceps $0x12,%zmm26,%zmm27"); 829 asm volatile("vreducepd $0x12,%zmm29,%zmm30"); 830 831 /* AVX-512: Op code 0f 3a 57 */ 832 833 asm volatile("vreducess $0x12,%xmm25,%xmm26,%xmm27"); 834 asm volatile("vreducesd $0x12,%xmm28,%xmm29,%xmm30"); 835 836 /* AVX-512: Op code 0f 3a 66 */ 837 838 asm volatile("vfpclassps $0x12,%zmm27,%k5"); 839 asm volatile("vfpclasspd $0x12,%zmm30,%k5"); 840 841 /* AVX-512: Op code 0f 3a 67 */ 842 843 asm volatile("vfpclassss $0x12,%xmm27,%k5"); 844 asm volatile("vfpclasssd $0x12,%xmm30,%k5"); 845 846 /* AVX-512: Op code 0f 72 (Grp13) */ 847 848 asm volatile("vprord $0x12,%zmm25,%zmm26"); 849 asm volatile("vprorq $0x12,%zmm25,%zmm26"); 850 asm volatile("vprold $0x12,%zmm29,%zmm30"); 851 asm volatile("vprolq $0x12,%zmm29,%zmm30"); 852 asm volatile("psrad $0x2,%mm6"); 853 asm volatile("vpsrad $0x5,%ymm6,%ymm2"); 854 asm volatile("vpsrad $0x5,%zmm26,%zmm22"); 855 asm volatile("vpsraq $0x5,%zmm26,%zmm22"); 856 857 /* AVX-512: Op code 0f 38 c6 (Grp18) */ 858 859 asm volatile("vgatherpf0dps 0x7b(%r14,%zmm31,8){%k1}"); 860 asm volatile("vgatherpf0dpd 0x7b(%r14,%ymm31,8){%k1}"); 861 asm volatile("vgatherpf1dps 0x7b(%r14,%zmm31,8){%k1}"); 862 asm volatile("vgatherpf1dpd 0x7b(%r14,%ymm31,8){%k1}"); 863 asm volatile("vscatterpf0dps 0x7b(%r14,%zmm31,8){%k1}"); 864 asm volatile("vscatterpf0dpd 0x7b(%r14,%ymm31,8){%k1}"); 865 asm volatile("vscatterpf1dps 0x7b(%r14,%zmm31,8){%k1}"); 866 asm volatile("vscatterpf1dpd 0x7b(%r14,%ymm31,8){%k1}"); 867 868 /* AVX-512: Op code 0f 38 c7 (Grp19) */ 869 870 asm volatile("vgatherpf0qps 0x7b(%r14,%zmm31,8){%k1}"); 871 asm volatile("vgatherpf0qpd 0x7b(%r14,%zmm31,8){%k1}"); 872 asm volatile("vgatherpf1qps 0x7b(%r14,%zmm31,8){%k1}"); 873 asm volatile("vgatherpf1qpd 0x7b(%r14,%zmm31,8){%k1}"); 874 asm volatile("vscatterpf0qps 0x7b(%r14,%zmm31,8){%k1}"); 875 asm volatile("vscatterpf0qpd 0x7b(%r14,%zmm31,8){%k1}"); 876 asm 
volatile("vscatterpf1qps 0x7b(%r14,%zmm31,8){%k1}"); 877 asm volatile("vscatterpf1qpd 0x7b(%r14,%zmm31,8){%k1}"); 878 879 /* AVX-512: Examples */ 880 881 asm volatile("vaddpd %zmm28,%zmm29,%zmm30"); 882 asm volatile("vaddpd %zmm28,%zmm29,%zmm30{%k7}"); 883 asm volatile("vaddpd %zmm28,%zmm29,%zmm30{%k7}{z}"); 884 asm volatile("vaddpd {rn-sae},%zmm28,%zmm29,%zmm30"); 885 asm volatile("vaddpd {ru-sae},%zmm28,%zmm29,%zmm30"); 886 asm volatile("vaddpd {rd-sae},%zmm28,%zmm29,%zmm30"); 887 asm volatile("vaddpd {rz-sae},%zmm28,%zmm29,%zmm30"); 888 asm volatile("vaddpd (%rcx),%zmm29,%zmm30"); 889 asm volatile("vaddpd 0x123(%rax,%r14,8),%zmm29,%zmm30"); 890 asm volatile("vaddpd (%rcx){1to8},%zmm29,%zmm30"); 891 asm volatile("vaddpd 0x1fc0(%rdx),%zmm29,%zmm30"); 892 asm volatile("vaddpd 0x3f8(%rdx){1to8},%zmm29,%zmm30"); 893 asm volatile("vcmpeq_uqps 0x1fc(%rdx){1to16},%zmm30,%k5"); 894 asm volatile("vcmpltsd 0x123(%rax,%r14,8),%xmm29,%k5{%k7}"); 895 asm volatile("vcmplesd {sae},%xmm28,%xmm29,%k5{%k7}"); 896 asm volatile("vgetmantss $0x5b,0x123(%rax,%r14,8),%xmm29,%xmm30{%k7}"); 897 898 /* bndmk m64, bnd */ 899 900 asm volatile("bndmk (%rax), %bnd0"); 901 asm volatile("bndmk (%r8), %bnd0"); 902 asm volatile("bndmk (0x12345678), %bnd0"); 903 asm volatile("bndmk (%rax), %bnd3"); 904 asm volatile("bndmk (%rcx,%rax,1), %bnd0"); 905 asm volatile("bndmk 0x12345678(,%rax,1), %bnd0"); 906 asm volatile("bndmk (%rax,%rcx,1), %bnd0"); 907 asm volatile("bndmk (%rax,%rcx,8), %bnd0"); 908 asm volatile("bndmk 0x12(%rax), %bnd0"); 909 asm volatile("bndmk 0x12(%rbp), %bnd0"); 910 asm volatile("bndmk 0x12(%rcx,%rax,1), %bnd0"); 911 asm volatile("bndmk 0x12(%rbp,%rax,1), %bnd0"); 912 asm volatile("bndmk 0x12(%rax,%rcx,1), %bnd0"); 913 asm volatile("bndmk 0x12(%rax,%rcx,8), %bnd0"); 914 asm volatile("bndmk 0x12345678(%rax), %bnd0"); 915 asm volatile("bndmk 0x12345678(%rbp), %bnd0"); 916 asm volatile("bndmk 0x12345678(%rcx,%rax,1), %bnd0"); 917 asm volatile("bndmk 0x12345678(%rbp,%rax,1), 
%bnd0"); 918 asm volatile("bndmk 0x12345678(%rax,%rcx,1), %bnd0"); 919 asm volatile("bndmk 0x12345678(%rax,%rcx,8), %bnd0"); 920 921 /* bndcl r/m64, bnd */ 922 923 asm volatile("bndcl (%rax), %bnd0"); 924 asm volatile("bndcl (%r8), %bnd0"); 925 asm volatile("bndcl (0x12345678), %bnd0"); 926 asm volatile("bndcl (%rax), %bnd3"); 927 asm volatile("bndcl (%rcx,%rax,1), %bnd0"); 928 asm volatile("bndcl 0x12345678(,%rax,1), %bnd0"); 929 asm volatile("bndcl (%rax,%rcx,1), %bnd0"); 930 asm volatile("bndcl (%rax,%rcx,8), %bnd0"); 931 asm volatile("bndcl 0x12(%rax), %bnd0"); 932 asm volatile("bndcl 0x12(%rbp), %bnd0"); 933 asm volatile("bndcl 0x12(%rcx,%rax,1), %bnd0"); 934 asm volatile("bndcl 0x12(%rbp,%rax,1), %bnd0"); 935 asm volatile("bndcl 0x12(%rax,%rcx,1), %bnd0"); 936 asm volatile("bndcl 0x12(%rax,%rcx,8), %bnd0"); 937 asm volatile("bndcl 0x12345678(%rax), %bnd0"); 938 asm volatile("bndcl 0x12345678(%rbp), %bnd0"); 939 asm volatile("bndcl 0x12345678(%rcx,%rax,1), %bnd0"); 940 asm volatile("bndcl 0x12345678(%rbp,%rax,1), %bnd0"); 941 asm volatile("bndcl 0x12345678(%rax,%rcx,1), %bnd0"); 942 asm volatile("bndcl 0x12345678(%rax,%rcx,8), %bnd0"); 943 asm volatile("bndcl %rax, %bnd0"); 944 945 /* bndcu r/m64, bnd */ 946 947 asm volatile("bndcu (%rax), %bnd0"); 948 asm volatile("bndcu (%r8), %bnd0"); 949 asm volatile("bndcu (0x12345678), %bnd0"); 950 asm volatile("bndcu (%rax), %bnd3"); 951 asm volatile("bndcu (%rcx,%rax,1), %bnd0"); 952 asm volatile("bndcu 0x12345678(,%rax,1), %bnd0"); 953 asm volatile("bndcu (%rax,%rcx,1), %bnd0"); 954 asm volatile("bndcu (%rax,%rcx,8), %bnd0"); 955 asm volatile("bndcu 0x12(%rax), %bnd0"); 956 asm volatile("bndcu 0x12(%rbp), %bnd0"); 957 asm volatile("bndcu 0x12(%rcx,%rax,1), %bnd0"); 958 asm volatile("bndcu 0x12(%rbp,%rax,1), %bnd0"); 959 asm volatile("bndcu 0x12(%rax,%rcx,1), %bnd0"); 960 asm volatile("bndcu 0x12(%rax,%rcx,8), %bnd0"); 961 asm volatile("bndcu 0x12345678(%rax), %bnd0"); 962 asm volatile("bndcu 0x12345678(%rbp), %bnd0"); 
963 asm volatile("bndcu 0x12345678(%rcx,%rax,1), %bnd0"); 964 asm volatile("bndcu 0x12345678(%rbp,%rax,1), %bnd0"); 965 asm volatile("bndcu 0x12345678(%rax,%rcx,1), %bnd0"); 966 asm volatile("bndcu 0x12345678(%rax,%rcx,8), %bnd0"); 967 asm volatile("bndcu %rax, %bnd0"); 968 969 /* bndcn r/m64, bnd */ 970 971 asm volatile("bndcn (%rax), %bnd0"); 972 asm volatile("bndcn (%r8), %bnd0"); 973 asm volatile("bndcn (0x12345678), %bnd0"); 974 asm volatile("bndcn (%rax), %bnd3"); 975 asm volatile("bndcn (%rcx,%rax,1), %bnd0"); 976 asm volatile("bndcn 0x12345678(,%rax,1), %bnd0"); 977 asm volatile("bndcn (%rax,%rcx,1), %bnd0"); 978 asm volatile("bndcn (%rax,%rcx,8), %bnd0"); 979 asm volatile("bndcn 0x12(%rax), %bnd0"); 980 asm volatile("bndcn 0x12(%rbp), %bnd0"); 981 asm volatile("bndcn 0x12(%rcx,%rax,1), %bnd0"); 982 asm volatile("bndcn 0x12(%rbp,%rax,1), %bnd0"); 983 asm volatile("bndcn 0x12(%rax,%rcx,1), %bnd0"); 984 asm volatile("bndcn 0x12(%rax,%rcx,8), %bnd0"); 985 asm volatile("bndcn 0x12345678(%rax), %bnd0"); 986 asm volatile("bndcn 0x12345678(%rbp), %bnd0"); 987 asm volatile("bndcn 0x12345678(%rcx,%rax,1), %bnd0"); 988 asm volatile("bndcn 0x12345678(%rbp,%rax,1), %bnd0"); 989 asm volatile("bndcn 0x12345678(%rax,%rcx,1), %bnd0"); 990 asm volatile("bndcn 0x12345678(%rax,%rcx,8), %bnd0"); 991 asm volatile("bndcn %rax, %bnd0"); 992 993 /* bndmov m128, bnd */ 994 995 asm volatile("bndmov (%rax), %bnd0"); 996 asm volatile("bndmov (%r8), %bnd0"); 997 asm volatile("bndmov (0x12345678), %bnd0"); 998 asm volatile("bndmov (%rax), %bnd3"); 999 asm volatile("bndmov (%rcx,%rax,1), %bnd0"); 1000 asm volatile("bndmov 0x12345678(,%rax,1), %bnd0"); 1001 asm volatile("bndmov (%rax,%rcx,1), %bnd0"); 1002 asm volatile("bndmov (%rax,%rcx,8), %bnd0"); 1003 asm volatile("bndmov 0x12(%rax), %bnd0"); 1004 asm volatile("bndmov 0x12(%rbp), %bnd0"); 1005 asm volatile("bndmov 0x12(%rcx,%rax,1), %bnd0"); 1006 asm volatile("bndmov 0x12(%rbp,%rax,1), %bnd0"); 1007 asm volatile("bndmov 
0x12(%rax,%rcx,1), %bnd0"); 1008 asm volatile("bndmov 0x12(%rax,%rcx,8), %bnd0"); 1009 asm volatile("bndmov 0x12345678(%rax), %bnd0"); 1010 asm volatile("bndmov 0x12345678(%rbp), %bnd0"); 1011 asm volatile("bndmov 0x12345678(%rcx,%rax,1), %bnd0"); 1012 asm volatile("bndmov 0x12345678(%rbp,%rax,1), %bnd0"); 1013 asm volatile("bndmov 0x12345678(%rax,%rcx,1), %bnd0"); 1014 asm volatile("bndmov 0x12345678(%rax,%rcx,8), %bnd0"); 1015 1016 /* bndmov bnd, m128 */ 1017 1018 asm volatile("bndmov %bnd0, (%rax)"); 1019 asm volatile("bndmov %bnd0, (%r8)"); 1020 asm volatile("bndmov %bnd0, (0x12345678)"); 1021 asm volatile("bndmov %bnd3, (%rax)"); 1022 asm volatile("bndmov %bnd0, (%rcx,%rax,1)"); 1023 asm volatile("bndmov %bnd0, 0x12345678(,%rax,1)"); 1024 asm volatile("bndmov %bnd0, (%rax,%rcx,1)"); 1025 asm volatile("bndmov %bnd0, (%rax,%rcx,8)"); 1026 asm volatile("bndmov %bnd0, 0x12(%rax)"); 1027 asm volatile("bndmov %bnd0, 0x12(%rbp)"); 1028 asm volatile("bndmov %bnd0, 0x12(%rcx,%rax,1)"); 1029 asm volatile("bndmov %bnd0, 0x12(%rbp,%rax,1)"); 1030 asm volatile("bndmov %bnd0, 0x12(%rax,%rcx,1)"); 1031 asm volatile("bndmov %bnd0, 0x12(%rax,%rcx,8)"); 1032 asm volatile("bndmov %bnd0, 0x12345678(%rax)"); 1033 asm volatile("bndmov %bnd0, 0x12345678(%rbp)"); 1034 asm volatile("bndmov %bnd0, 0x12345678(%rcx,%rax,1)"); 1035 asm volatile("bndmov %bnd0, 0x12345678(%rbp,%rax,1)"); 1036 asm volatile("bndmov %bnd0, 0x12345678(%rax,%rcx,1)"); 1037 asm volatile("bndmov %bnd0, 0x12345678(%rax,%rcx,8)"); 1038 1039 /* bndmov bnd2, bnd1 */ 1040 1041 asm volatile("bndmov %bnd0, %bnd1"); 1042 asm volatile("bndmov %bnd1, %bnd0"); 1043 1044 /* bndldx mib, bnd */ 1045 1046 asm volatile("bndldx (%rax), %bnd0"); 1047 asm volatile("bndldx (%r8), %bnd0"); 1048 asm volatile("bndldx (0x12345678), %bnd0"); 1049 asm volatile("bndldx (%rax), %bnd3"); 1050 asm volatile("bndldx (%rcx,%rax,1), %bnd0"); 1051 asm volatile("bndldx 0x12345678(,%rax,1), %bnd0"); 1052 asm volatile("bndldx (%rax,%rcx,1), %bnd0"); 
1053 asm volatile("bndldx 0x12(%rax), %bnd0"); 1054 asm volatile("bndldx 0x12(%rbp), %bnd0"); 1055 asm volatile("bndldx 0x12(%rcx,%rax,1), %bnd0"); 1056 asm volatile("bndldx 0x12(%rbp,%rax,1), %bnd0"); 1057 asm volatile("bndldx 0x12(%rax,%rcx,1), %bnd0"); 1058 asm volatile("bndldx 0x12345678(%rax), %bnd0"); 1059 asm volatile("bndldx 0x12345678(%rbp), %bnd0"); 1060 asm volatile("bndldx 0x12345678(%rcx,%rax,1), %bnd0"); 1061 asm volatile("bndldx 0x12345678(%rbp,%rax,1), %bnd0"); 1062 asm volatile("bndldx 0x12345678(%rax,%rcx,1), %bnd0"); 1063 1064 /* bndstx bnd, mib */ 1065 1066 asm volatile("bndstx %bnd0, (%rax)"); 1067 asm volatile("bndstx %bnd0, (%r8)"); 1068 asm volatile("bndstx %bnd0, (0x12345678)"); 1069 asm volatile("bndstx %bnd3, (%rax)"); 1070 asm volatile("bndstx %bnd0, (%rcx,%rax,1)"); 1071 asm volatile("bndstx %bnd0, 0x12345678(,%rax,1)"); 1072 asm volatile("bndstx %bnd0, (%rax,%rcx,1)"); 1073 asm volatile("bndstx %bnd0, 0x12(%rax)"); 1074 asm volatile("bndstx %bnd0, 0x12(%rbp)"); 1075 asm volatile("bndstx %bnd0, 0x12(%rcx,%rax,1)"); 1076 asm volatile("bndstx %bnd0, 0x12(%rbp,%rax,1)"); 1077 asm volatile("bndstx %bnd0, 0x12(%rax,%rcx,1)"); 1078 asm volatile("bndstx %bnd0, 0x12345678(%rax)"); 1079 asm volatile("bndstx %bnd0, 0x12345678(%rbp)"); 1080 asm volatile("bndstx %bnd0, 0x12345678(%rcx,%rax,1)"); 1081 asm volatile("bndstx %bnd0, 0x12345678(%rbp,%rax,1)"); 1082 asm volatile("bndstx %bnd0, 0x12345678(%rax,%rcx,1)"); 1083 1084 /* bnd prefix on call, ret, jmp and all jcc */ 1085 1086 asm volatile("bnd call label1"); /* Expecting: call unconditional 0 */ 1087 asm volatile("bnd call *(%eax)"); /* Expecting: call indirect 0 */ 1088 asm volatile("bnd ret"); /* Expecting: ret indirect 0 */ 1089 asm volatile("bnd jmp label1"); /* Expecting: jmp unconditional 0 */ 1090 asm volatile("bnd jmp label1"); /* Expecting: jmp unconditional 0 */ 1091 asm volatile("bnd jmp *(%ecx)"); /* Expecting: jmp indirect 0 */ 1092 asm volatile("bnd jne label1"); /* Expecting: jcc 
conditional 0 */ 1093 1094 /* sha1rnds4 imm8, xmm2/m128, xmm1 */ 1095 1096 asm volatile("sha1rnds4 $0x0, %xmm1, %xmm0"); 1097 asm volatile("sha1rnds4 $0x91, %xmm7, %xmm2"); 1098 asm volatile("sha1rnds4 $0x91, %xmm8, %xmm0"); 1099 asm volatile("sha1rnds4 $0x91, %xmm7, %xmm8"); 1100 asm volatile("sha1rnds4 $0x91, %xmm15, %xmm8"); 1101 asm volatile("sha1rnds4 $0x91, (%rax), %xmm0"); 1102 asm volatile("sha1rnds4 $0x91, (%r8), %xmm0"); 1103 asm volatile("sha1rnds4 $0x91, (0x12345678), %xmm0"); 1104 asm volatile("sha1rnds4 $0x91, (%rax), %xmm3"); 1105 asm volatile("sha1rnds4 $0x91, (%rcx,%rax,1), %xmm0"); 1106 asm volatile("sha1rnds4 $0x91, 0x12345678(,%rax,1), %xmm0"); 1107 asm volatile("sha1rnds4 $0x91, (%rax,%rcx,1), %xmm0"); 1108 asm volatile("sha1rnds4 $0x91, (%rax,%rcx,8), %xmm0"); 1109 asm volatile("sha1rnds4 $0x91, 0x12(%rax), %xmm0"); 1110 asm volatile("sha1rnds4 $0x91, 0x12(%rbp), %xmm0"); 1111 asm volatile("sha1rnds4 $0x91, 0x12(%rcx,%rax,1), %xmm0"); 1112 asm volatile("sha1rnds4 $0x91, 0x12(%rbp,%rax,1), %xmm0"); 1113 asm volatile("sha1rnds4 $0x91, 0x12(%rax,%rcx,1), %xmm0"); 1114 asm volatile("sha1rnds4 $0x91, 0x12(%rax,%rcx,8), %xmm0"); 1115 asm volatile("sha1rnds4 $0x91, 0x12345678(%rax), %xmm0"); 1116 asm volatile("sha1rnds4 $0x91, 0x12345678(%rbp), %xmm0"); 1117 asm volatile("sha1rnds4 $0x91, 0x12345678(%rcx,%rax,1), %xmm0"); 1118 asm volatile("sha1rnds4 $0x91, 0x12345678(%rbp,%rax,1), %xmm0"); 1119 asm volatile("sha1rnds4 $0x91, 0x12345678(%rax,%rcx,1), %xmm0"); 1120 asm volatile("sha1rnds4 $0x91, 0x12345678(%rax,%rcx,8), %xmm0"); 1121 asm volatile("sha1rnds4 $0x91, 0x12345678(%rax,%rcx,8), %xmm15"); 1122 1123 /* sha1nexte xmm2/m128, xmm1 */ 1124 1125 asm volatile("sha1nexte %xmm1, %xmm0"); 1126 asm volatile("sha1nexte %xmm7, %xmm2"); 1127 asm volatile("sha1nexte %xmm8, %xmm0"); 1128 asm volatile("sha1nexte %xmm7, %xmm8"); 1129 asm volatile("sha1nexte %xmm15, %xmm8"); 1130 asm volatile("sha1nexte (%rax), %xmm0"); 1131 asm volatile("sha1nexte (%r8), 
%xmm0"); 1132 asm volatile("sha1nexte (0x12345678), %xmm0"); 1133 asm volatile("sha1nexte (%rax), %xmm3"); 1134 asm volatile("sha1nexte (%rcx,%rax,1), %xmm0"); 1135 asm volatile("sha1nexte 0x12345678(,%rax,1), %xmm0"); 1136 asm volatile("sha1nexte (%rax,%rcx,1), %xmm0"); 1137 asm volatile("sha1nexte (%rax,%rcx,8), %xmm0"); 1138 asm volatile("sha1nexte 0x12(%rax), %xmm0"); 1139 asm volatile("sha1nexte 0x12(%rbp), %xmm0"); 1140 asm volatile("sha1nexte 0x12(%rcx,%rax,1), %xmm0"); 1141 asm volatile("sha1nexte 0x12(%rbp,%rax,1), %xmm0"); 1142 asm volatile("sha1nexte 0x12(%rax,%rcx,1), %xmm0"); 1143 asm volatile("sha1nexte 0x12(%rax,%rcx,8), %xmm0"); 1144 asm volatile("sha1nexte 0x12345678(%rax), %xmm0"); 1145 asm volatile("sha1nexte 0x12345678(%rbp), %xmm0"); 1146 asm volatile("sha1nexte 0x12345678(%rcx,%rax,1), %xmm0"); 1147 asm volatile("sha1nexte 0x12345678(%rbp,%rax,1), %xmm0"); 1148 asm volatile("sha1nexte 0x12345678(%rax,%rcx,1), %xmm0"); 1149 asm volatile("sha1nexte 0x12345678(%rax,%rcx,8), %xmm0"); 1150 asm volatile("sha1nexte 0x12345678(%rax,%rcx,8), %xmm15"); 1151 1152 /* sha1msg1 xmm2/m128, xmm1 */ 1153 1154 asm volatile("sha1msg1 %xmm1, %xmm0"); 1155 asm volatile("sha1msg1 %xmm7, %xmm2"); 1156 asm volatile("sha1msg1 %xmm8, %xmm0"); 1157 asm volatile("sha1msg1 %xmm7, %xmm8"); 1158 asm volatile("sha1msg1 %xmm15, %xmm8"); 1159 asm volatile("sha1msg1 (%rax), %xmm0"); 1160 asm volatile("sha1msg1 (%r8), %xmm0"); 1161 asm volatile("sha1msg1 (0x12345678), %xmm0"); 1162 asm volatile("sha1msg1 (%rax), %xmm3"); 1163 asm volatile("sha1msg1 (%rcx,%rax,1), %xmm0"); 1164 asm volatile("sha1msg1 0x12345678(,%rax,1), %xmm0"); 1165 asm volatile("sha1msg1 (%rax,%rcx,1), %xmm0"); 1166 asm volatile("sha1msg1 (%rax,%rcx,8), %xmm0"); 1167 asm volatile("sha1msg1 0x12(%rax), %xmm0"); 1168 asm volatile("sha1msg1 0x12(%rbp), %xmm0"); 1169 asm volatile("sha1msg1 0x12(%rcx,%rax,1), %xmm0"); 1170 asm volatile("sha1msg1 0x12(%rbp,%rax,1), %xmm0"); 1171 asm volatile("sha1msg1 
0x12(%rax,%rcx,1), %xmm0"); 1172 asm volatile("sha1msg1 0x12(%rax,%rcx,8), %xmm0"); 1173 asm volatile("sha1msg1 0x12345678(%rax), %xmm0"); 1174 asm volatile("sha1msg1 0x12345678(%rbp), %xmm0"); 1175 asm volatile("sha1msg1 0x12345678(%rcx,%rax,1), %xmm0"); 1176 asm volatile("sha1msg1 0x12345678(%rbp,%rax,1), %xmm0"); 1177 asm volatile("sha1msg1 0x12345678(%rax,%rcx,1), %xmm0"); 1178 asm volatile("sha1msg1 0x12345678(%rax,%rcx,8), %xmm0"); 1179 asm volatile("sha1msg1 0x12345678(%rax,%rcx,8), %xmm15"); 1180 1181 /* sha1msg2 xmm2/m128, xmm1 */ 1182 1183 asm volatile("sha1msg2 %xmm1, %xmm0"); 1184 asm volatile("sha1msg2 %xmm7, %xmm2"); 1185 asm volatile("sha1msg2 %xmm8, %xmm0"); 1186 asm volatile("sha1msg2 %xmm7, %xmm8"); 1187 asm volatile("sha1msg2 %xmm15, %xmm8"); 1188 asm volatile("sha1msg2 (%rax), %xmm0"); 1189 asm volatile("sha1msg2 (%r8), %xmm0"); 1190 asm volatile("sha1msg2 (0x12345678), %xmm0"); 1191 asm volatile("sha1msg2 (%rax), %xmm3"); 1192 asm volatile("sha1msg2 (%rcx,%rax,1), %xmm0"); 1193 asm volatile("sha1msg2 0x12345678(,%rax,1), %xmm0"); 1194 asm volatile("sha1msg2 (%rax,%rcx,1), %xmm0"); 1195 asm volatile("sha1msg2 (%rax,%rcx,8), %xmm0"); 1196 asm volatile("sha1msg2 0x12(%rax), %xmm0"); 1197 asm volatile("sha1msg2 0x12(%rbp), %xmm0"); 1198 asm volatile("sha1msg2 0x12(%rcx,%rax,1), %xmm0"); 1199 asm volatile("sha1msg2 0x12(%rbp,%rax,1), %xmm0"); 1200 asm volatile("sha1msg2 0x12(%rax,%rcx,1), %xmm0"); 1201 asm volatile("sha1msg2 0x12(%rax,%rcx,8), %xmm0"); 1202 asm volatile("sha1msg2 0x12345678(%rax), %xmm0"); 1203 asm volatile("sha1msg2 0x12345678(%rbp), %xmm0"); 1204 asm volatile("sha1msg2 0x12345678(%rcx,%rax,1), %xmm0"); 1205 asm volatile("sha1msg2 0x12345678(%rbp,%rax,1), %xmm0"); 1206 asm volatile("sha1msg2 0x12345678(%rax,%rcx,1), %xmm0"); 1207 asm volatile("sha1msg2 0x12345678(%rax,%rcx,8), %xmm0"); 1208 asm volatile("sha1msg2 0x12345678(%rax,%rcx,8), %xmm15"); 1209 1210 /* sha256rnds2 <XMM0>, xmm2/m128, xmm1 */ 1211 /* Note sha256rnds2 has an 
implicit operand 'xmm0' */ 1212 1213 asm volatile("sha256rnds2 %xmm4, %xmm1"); 1214 asm volatile("sha256rnds2 %xmm7, %xmm2"); 1215 asm volatile("sha256rnds2 %xmm8, %xmm1"); 1216 asm volatile("sha256rnds2 %xmm7, %xmm8"); 1217 asm volatile("sha256rnds2 %xmm15, %xmm8"); 1218 asm volatile("sha256rnds2 (%rax), %xmm1"); 1219 asm volatile("sha256rnds2 (%r8), %xmm1"); 1220 asm volatile("sha256rnds2 (0x12345678), %xmm1"); 1221 asm volatile("sha256rnds2 (%rax), %xmm3"); 1222 asm volatile("sha256rnds2 (%rcx,%rax,1), %xmm1"); 1223 asm volatile("sha256rnds2 0x12345678(,%rax,1), %xmm1"); 1224 asm volatile("sha256rnds2 (%rax,%rcx,1), %xmm1"); 1225 asm volatile("sha256rnds2 (%rax,%rcx,8), %xmm1"); 1226 asm volatile("sha256rnds2 0x12(%rax), %xmm1"); 1227 asm volatile("sha256rnds2 0x12(%rbp), %xmm1"); 1228 asm volatile("sha256rnds2 0x12(%rcx,%rax,1), %xmm1"); 1229 asm volatile("sha256rnds2 0x12(%rbp,%rax,1), %xmm1"); 1230 asm volatile("sha256rnds2 0x12(%rax,%rcx,1), %xmm1"); 1231 asm volatile("sha256rnds2 0x12(%rax,%rcx,8), %xmm1"); 1232 asm volatile("sha256rnds2 0x12345678(%rax), %xmm1"); 1233 asm volatile("sha256rnds2 0x12345678(%rbp), %xmm1"); 1234 asm volatile("sha256rnds2 0x12345678(%rcx,%rax,1), %xmm1"); 1235 asm volatile("sha256rnds2 0x12345678(%rbp,%rax,1), %xmm1"); 1236 asm volatile("sha256rnds2 0x12345678(%rax,%rcx,1), %xmm1"); 1237 asm volatile("sha256rnds2 0x12345678(%rax,%rcx,8), %xmm1"); 1238 asm volatile("sha256rnds2 0x12345678(%rax,%rcx,8), %xmm15"); 1239 1240 /* sha256msg1 xmm2/m128, xmm1 */ 1241 1242 asm volatile("sha256msg1 %xmm1, %xmm0"); 1243 asm volatile("sha256msg1 %xmm7, %xmm2"); 1244 asm volatile("sha256msg1 %xmm8, %xmm0"); 1245 asm volatile("sha256msg1 %xmm7, %xmm8"); 1246 asm volatile("sha256msg1 %xmm15, %xmm8"); 1247 asm volatile("sha256msg1 (%rax), %xmm0"); 1248 asm volatile("sha256msg1 (%r8), %xmm0"); 1249 asm volatile("sha256msg1 (0x12345678), %xmm0"); 1250 asm volatile("sha256msg1 (%rax), %xmm3"); 1251 asm volatile("sha256msg1 (%rcx,%rax,1), %xmm0"); 
1252 asm volatile("sha256msg1 0x12345678(,%rax,1), %xmm0"); 1253 asm volatile("sha256msg1 (%rax,%rcx,1), %xmm0"); 1254 asm volatile("sha256msg1 (%rax,%rcx,8), %xmm0"); 1255 asm volatile("sha256msg1 0x12(%rax), %xmm0"); 1256 asm volatile("sha256msg1 0x12(%rbp), %xmm0"); 1257 asm volatile("sha256msg1 0x12(%rcx,%rax,1), %xmm0"); 1258 asm volatile("sha256msg1 0x12(%rbp,%rax,1), %xmm0"); 1259 asm volatile("sha256msg1 0x12(%rax,%rcx,1), %xmm0"); 1260 asm volatile("sha256msg1 0x12(%rax,%rcx,8), %xmm0"); 1261 asm volatile("sha256msg1 0x12345678(%rax), %xmm0"); 1262 asm volatile("sha256msg1 0x12345678(%rbp), %xmm0"); 1263 asm volatile("sha256msg1 0x12345678(%rcx,%rax,1), %xmm0"); 1264 asm volatile("sha256msg1 0x12345678(%rbp,%rax,1), %xmm0"); 1265 asm volatile("sha256msg1 0x12345678(%rax,%rcx,1), %xmm0"); 1266 asm volatile("sha256msg1 0x12345678(%rax,%rcx,8), %xmm0"); 1267 asm volatile("sha256msg1 0x12345678(%rax,%rcx,8), %xmm15"); 1268 1269 /* sha256msg2 xmm2/m128, xmm1 */ 1270 1271 asm volatile("sha256msg2 %xmm1, %xmm0"); 1272 asm volatile("sha256msg2 %xmm7, %xmm2"); 1273 asm volatile("sha256msg2 %xmm8, %xmm0"); 1274 asm volatile("sha256msg2 %xmm7, %xmm8"); 1275 asm volatile("sha256msg2 %xmm15, %xmm8"); 1276 asm volatile("sha256msg2 (%rax), %xmm0"); 1277 asm volatile("sha256msg2 (%r8), %xmm0"); 1278 asm volatile("sha256msg2 (0x12345678), %xmm0"); 1279 asm volatile("sha256msg2 (%rax), %xmm3"); 1280 asm volatile("sha256msg2 (%rcx,%rax,1), %xmm0"); 1281 asm volatile("sha256msg2 0x12345678(,%rax,1), %xmm0"); 1282 asm volatile("sha256msg2 (%rax,%rcx,1), %xmm0"); 1283 asm volatile("sha256msg2 (%rax,%rcx,8), %xmm0"); 1284 asm volatile("sha256msg2 0x12(%rax), %xmm0"); 1285 asm volatile("sha256msg2 0x12(%rbp), %xmm0"); 1286 asm volatile("sha256msg2 0x12(%rcx,%rax,1), %xmm0"); 1287 asm volatile("sha256msg2 0x12(%rbp,%rax,1), %xmm0"); 1288 asm volatile("sha256msg2 0x12(%rax,%rcx,1), %xmm0"); 1289 asm volatile("sha256msg2 0x12(%rax,%rcx,8), %xmm0"); 1290 asm volatile("sha256msg2 
0x12345678(%rax), %xmm0"); 1291 asm volatile("sha256msg2 0x12345678(%rbp), %xmm0"); 1292 asm volatile("sha256msg2 0x12345678(%rcx,%rax,1), %xmm0"); 1293 asm volatile("sha256msg2 0x12345678(%rbp,%rax,1), %xmm0"); 1294 asm volatile("sha256msg2 0x12345678(%rax,%rcx,1), %xmm0"); 1295 asm volatile("sha256msg2 0x12345678(%rax,%rcx,8), %xmm0"); 1296 asm volatile("sha256msg2 0x12345678(%rax,%rcx,8), %xmm15"); 1297 1298 /* clflushopt m8 */ 1299 1300 asm volatile("clflushopt (%rax)"); 1301 asm volatile("clflushopt (%r8)"); 1302 asm volatile("clflushopt (0x12345678)"); 1303 asm volatile("clflushopt 0x12345678(%rax,%rcx,8)"); 1304 asm volatile("clflushopt 0x12345678(%r8,%rcx,8)"); 1305 /* Also check instructions in the same group encoding as clflushopt */ 1306 asm volatile("clflush (%rax)"); 1307 asm volatile("clflush (%r8)"); 1308 asm volatile("sfence"); 1309 1310 /* clwb m8 */ 1311 1312 asm volatile("clwb (%rax)"); 1313 asm volatile("clwb (%r8)"); 1314 asm volatile("clwb (0x12345678)"); 1315 asm volatile("clwb 0x12345678(%rax,%rcx,8)"); 1316 asm volatile("clwb 0x12345678(%r8,%rcx,8)"); 1317 /* Also check instructions in the same group encoding as clwb */ 1318 asm volatile("xsaveopt (%rax)"); 1319 asm volatile("xsaveopt (%r8)"); 1320 asm volatile("mfence"); 1321 1322 /* xsavec mem */ 1323 1324 asm volatile("xsavec (%rax)"); 1325 asm volatile("xsavec (%r8)"); 1326 asm volatile("xsavec (0x12345678)"); 1327 asm volatile("xsavec 0x12345678(%rax,%rcx,8)"); 1328 asm volatile("xsavec 0x12345678(%r8,%rcx,8)"); 1329 1330 /* xsaves mem */ 1331 1332 asm volatile("xsaves (%rax)"); 1333 asm volatile("xsaves (%r8)"); 1334 asm volatile("xsaves (0x12345678)"); 1335 asm volatile("xsaves 0x12345678(%rax,%rcx,8)"); 1336 asm volatile("xsaves 0x12345678(%r8,%rcx,8)"); 1337 1338 /* xrstors mem */ 1339 1340 asm volatile("xrstors (%rax)"); 1341 asm volatile("xrstors (%r8)"); 1342 asm volatile("xrstors (0x12345678)"); 1343 asm volatile("xrstors 0x12345678(%rax,%rcx,8)"); 1344 asm volatile("xrstors 
0x12345678(%r8,%rcx,8)"); 1345 1346 #else /* #ifdef __x86_64__ */ 1347 1348 /* bound r32, mem (same op code as EVEX prefix) */ 1349 1350 asm volatile("bound %eax, 0x12345678(%ecx)"); 1351 asm volatile("bound %ecx, 0x12345678(%eax)"); 1352 asm volatile("bound %edx, 0x12345678(%eax)"); 1353 asm volatile("bound %ebx, 0x12345678(%eax)"); 1354 asm volatile("bound %esp, 0x12345678(%eax)"); 1355 asm volatile("bound %ebp, 0x12345678(%eax)"); 1356 asm volatile("bound %esi, 0x12345678(%eax)"); 1357 asm volatile("bound %edi, 0x12345678(%eax)"); 1358 asm volatile("bound %ecx, (%eax)"); 1359 asm volatile("bound %eax, (0x12345678)"); 1360 asm volatile("bound %edx, (%ecx,%eax,1)"); 1361 asm volatile("bound %edx, 0x12345678(,%eax,1)"); 1362 asm volatile("bound %edx, (%eax,%ecx,1)"); 1363 asm volatile("bound %edx, (%eax,%ecx,8)"); 1364 asm volatile("bound %edx, 0x12(%eax)"); 1365 asm volatile("bound %edx, 0x12(%ebp)"); 1366 asm volatile("bound %edx, 0x12(%ecx,%eax,1)"); 1367 asm volatile("bound %edx, 0x12(%ebp,%eax,1)"); 1368 asm volatile("bound %edx, 0x12(%eax,%ecx,1)"); 1369 asm volatile("bound %edx, 0x12(%eax,%ecx,8)"); 1370 asm volatile("bound %edx, 0x12345678(%eax)"); 1371 asm volatile("bound %edx, 0x12345678(%ebp)"); 1372 asm volatile("bound %edx, 0x12345678(%ecx,%eax,1)"); 1373 asm volatile("bound %edx, 0x12345678(%ebp,%eax,1)"); 1374 asm volatile("bound %edx, 0x12345678(%eax,%ecx,1)"); 1375 asm volatile("bound %edx, 0x12345678(%eax,%ecx,8)"); 1376 1377 /* bound r16, mem (same op code as EVEX prefix) */ 1378 1379 asm volatile("bound %ax, 0x12345678(%ecx)"); 1380 asm volatile("bound %cx, 0x12345678(%eax)"); 1381 asm volatile("bound %dx, 0x12345678(%eax)"); 1382 asm volatile("bound %bx, 0x12345678(%eax)"); 1383 asm volatile("bound %sp, 0x12345678(%eax)"); 1384 asm volatile("bound %bp, 0x12345678(%eax)"); 1385 asm volatile("bound %si, 0x12345678(%eax)"); 1386 asm volatile("bound %di, 0x12345678(%eax)"); 1387 asm volatile("bound %cx, (%eax)"); 1388 asm volatile("bound %ax, 
(0x12345678)"); 1389 asm volatile("bound %dx, (%ecx,%eax,1)"); 1390 asm volatile("bound %dx, 0x12345678(,%eax,1)"); 1391 asm volatile("bound %dx, (%eax,%ecx,1)"); 1392 asm volatile("bound %dx, (%eax,%ecx,8)"); 1393 asm volatile("bound %dx, 0x12(%eax)"); 1394 asm volatile("bound %dx, 0x12(%ebp)"); 1395 asm volatile("bound %dx, 0x12(%ecx,%eax,1)"); 1396 asm volatile("bound %dx, 0x12(%ebp,%eax,1)"); 1397 asm volatile("bound %dx, 0x12(%eax,%ecx,1)"); 1398 asm volatile("bound %dx, 0x12(%eax,%ecx,8)"); 1399 asm volatile("bound %dx, 0x12345678(%eax)"); 1400 asm volatile("bound %dx, 0x12345678(%ebp)"); 1401 asm volatile("bound %dx, 0x12345678(%ecx,%eax,1)"); 1402 asm volatile("bound %dx, 0x12345678(%ebp,%eax,1)"); 1403 asm volatile("bound %dx, 0x12345678(%eax,%ecx,1)"); 1404 asm volatile("bound %dx, 0x12345678(%eax,%ecx,8)"); 1405 1406 /* AVX-512: Instructions with the same op codes as Mask Instructions */ 1407 1408 asm volatile("cmovno %eax,%ebx"); 1409 asm volatile("cmovno 0x12345678(%eax),%ecx"); 1410 asm volatile("cmovno 0x12345678(%eax),%cx"); 1411 1412 asm volatile("cmove %eax,%ebx"); 1413 asm volatile("cmove 0x12345678(%eax),%ecx"); 1414 asm volatile("cmove 0x12345678(%eax),%cx"); 1415 1416 asm volatile("seto 0x12345678(%eax)"); 1417 asm volatile("setno 0x12345678(%eax)"); 1418 asm volatile("setb 0x12345678(%eax)"); 1419 asm volatile("setc 0x12345678(%eax)"); 1420 asm volatile("setnae 0x12345678(%eax)"); 1421 asm volatile("setae 0x12345678(%eax)"); 1422 asm volatile("setnb 0x12345678(%eax)"); 1423 asm volatile("setnc 0x12345678(%eax)"); 1424 asm volatile("sets 0x12345678(%eax)"); 1425 asm volatile("setns 0x12345678(%eax)"); 1426 1427 /* AVX-512: Mask Instructions */ 1428 1429 asm volatile("kandw %k7,%k6,%k5"); 1430 asm volatile("kandq %k7,%k6,%k5"); 1431 asm volatile("kandb %k7,%k6,%k5"); 1432 asm volatile("kandd %k7,%k6,%k5"); 1433 1434 asm volatile("kandnw %k7,%k6,%k5"); 1435 asm volatile("kandnq %k7,%k6,%k5"); 1436 asm volatile("kandnb %k7,%k6,%k5"); 1437 asm 
volatile("kandnd %k7,%k6,%k5"); 1438 1439 asm volatile("knotw %k7,%k6"); 1440 asm volatile("knotq %k7,%k6"); 1441 asm volatile("knotb %k7,%k6"); 1442 asm volatile("knotd %k7,%k6"); 1443 1444 asm volatile("korw %k7,%k6,%k5"); 1445 asm volatile("korq %k7,%k6,%k5"); 1446 asm volatile("korb %k7,%k6,%k5"); 1447 asm volatile("kord %k7,%k6,%k5"); 1448 1449 asm volatile("kxnorw %k7,%k6,%k5"); 1450 asm volatile("kxnorq %k7,%k6,%k5"); 1451 asm volatile("kxnorb %k7,%k6,%k5"); 1452 asm volatile("kxnord %k7,%k6,%k5"); 1453 1454 asm volatile("kxorw %k7,%k6,%k5"); 1455 asm volatile("kxorq %k7,%k6,%k5"); 1456 asm volatile("kxorb %k7,%k6,%k5"); 1457 asm volatile("kxord %k7,%k6,%k5"); 1458 1459 asm volatile("kaddw %k7,%k6,%k5"); 1460 asm volatile("kaddq %k7,%k6,%k5"); 1461 asm volatile("kaddb %k7,%k6,%k5"); 1462 asm volatile("kaddd %k7,%k6,%k5"); 1463 1464 asm volatile("kunpckbw %k7,%k6,%k5"); 1465 asm volatile("kunpckwd %k7,%k6,%k5"); 1466 asm volatile("kunpckdq %k7,%k6,%k5"); 1467 1468 asm volatile("kmovw %k6,%k5"); 1469 asm volatile("kmovw (%ecx),%k5"); 1470 asm volatile("kmovw 0x123(%eax,%ecx,8),%k5"); 1471 asm volatile("kmovw %k5,(%ecx)"); 1472 asm volatile("kmovw %k5,0x123(%eax,%ecx,8)"); 1473 asm volatile("kmovw %eax,%k5"); 1474 asm volatile("kmovw %ebp,%k5"); 1475 asm volatile("kmovw %k5,%eax"); 1476 asm volatile("kmovw %k5,%ebp"); 1477 1478 asm volatile("kmovq %k6,%k5"); 1479 asm volatile("kmovq (%ecx),%k5"); 1480 asm volatile("kmovq 0x123(%eax,%ecx,8),%k5"); 1481 asm volatile("kmovq %k5,(%ecx)"); 1482 asm volatile("kmovq %k5,0x123(%eax,%ecx,8)"); 1483 1484 asm volatile("kmovb %k6,%k5"); 1485 asm volatile("kmovb (%ecx),%k5"); 1486 asm volatile("kmovb 0x123(%eax,%ecx,8),%k5"); 1487 asm volatile("kmovb %k5,(%ecx)"); 1488 asm volatile("kmovb %k5,0x123(%eax,%ecx,8)"); 1489 asm volatile("kmovb %eax,%k5"); 1490 asm volatile("kmovb %ebp,%k5"); 1491 asm volatile("kmovb %k5,%eax"); 1492 asm volatile("kmovb %k5,%ebp"); 1493 1494 asm volatile("kmovd %k6,%k5"); 1495 asm volatile("kmovd 
(%ecx),%k5"); 1496 asm volatile("kmovd 0x123(%eax,%ecx,8),%k5"); 1497 asm volatile("kmovd %k5,(%ecx)"); 1498 asm volatile("kmovd %k5,0x123(%eax,%ecx,8)"); 1499 asm volatile("kmovd %eax,%k5"); 1500 asm volatile("kmovd %ebp,%k5"); 1501 asm volatile("kmovd %k5,%eax"); 1502 asm volatile("kmovd %k5,%ebp"); 1503 1504 asm volatile("kortestw %k6,%k5"); 1505 asm volatile("kortestq %k6,%k5"); 1506 asm volatile("kortestb %k6,%k5"); 1507 asm volatile("kortestd %k6,%k5"); 1508 1509 asm volatile("ktestw %k6,%k5"); 1510 asm volatile("ktestq %k6,%k5"); 1511 asm volatile("ktestb %k6,%k5"); 1512 asm volatile("ktestd %k6,%k5"); 1513 1514 asm volatile("kshiftrw $0x12,%k6,%k5"); 1515 asm volatile("kshiftrq $0x5b,%k6,%k5"); 1516 asm volatile("kshiftlw $0x12,%k6,%k5"); 1517 asm volatile("kshiftlq $0x5b,%k6,%k5"); 1518 1519 /* AVX-512: Op code 0f 5b */ 1520 asm volatile("vcvtdq2ps %xmm5,%xmm6"); 1521 asm volatile("vcvtqq2ps %zmm5,%ymm6{%k7}"); 1522 asm volatile("vcvtps2dq %xmm5,%xmm6"); 1523 asm volatile("vcvttps2dq %xmm5,%xmm6"); 1524 1525 /* AVX-512: Op code 0f 6f */ 1526 1527 asm volatile("movq %mm0,%mm4"); 1528 asm volatile("vmovdqa %ymm4,%ymm6"); 1529 asm volatile("vmovdqa32 %zmm5,%zmm6"); 1530 asm volatile("vmovdqa64 %zmm5,%zmm6"); 1531 asm volatile("vmovdqu %ymm4,%ymm6"); 1532 asm volatile("vmovdqu32 %zmm5,%zmm6"); 1533 asm volatile("vmovdqu64 %zmm5,%zmm6"); 1534 asm volatile("vmovdqu8 %zmm5,%zmm6"); 1535 asm volatile("vmovdqu16 %zmm5,%zmm6"); 1536 1537 /* AVX-512: Op code 0f 78 */ 1538 1539 asm volatile("vmread %eax,%ebx"); 1540 asm volatile("vcvttps2udq %zmm5,%zmm6"); 1541 asm volatile("vcvttpd2udq %zmm5,%ymm6{%k7}"); 1542 asm volatile("vcvttsd2usi %xmm6,%eax"); 1543 asm volatile("vcvttss2usi %xmm6,%eax"); 1544 asm volatile("vcvttps2uqq %ymm5,%zmm6{%k7}"); 1545 asm volatile("vcvttpd2uqq %zmm5,%zmm6"); 1546 1547 /* AVX-512: Op code 0f 79 */ 1548 1549 asm volatile("vmwrite %eax,%ebx"); 1550 asm volatile("vcvtps2udq %zmm5,%zmm6"); 1551 asm volatile("vcvtpd2udq %zmm5,%ymm6{%k7}"); 
1552 asm volatile("vcvtsd2usi %xmm6,%eax"); 1553 asm volatile("vcvtss2usi %xmm6,%eax"); 1554 asm volatile("vcvtps2uqq %ymm5,%zmm6{%k7}"); 1555 asm volatile("vcvtpd2uqq %zmm5,%zmm6"); 1556 1557 /* AVX-512: Op code 0f 7a */ 1558 1559 asm volatile("vcvtudq2pd %ymm5,%zmm6{%k7}"); 1560 asm volatile("vcvtuqq2pd %zmm5,%zmm6"); 1561 asm volatile("vcvtudq2ps %zmm5,%zmm6"); 1562 asm volatile("vcvtuqq2ps %zmm5,%ymm6{%k7}"); 1563 asm volatile("vcvttps2qq %ymm5,%zmm6{%k7}"); 1564 asm volatile("vcvttpd2qq %zmm5,%zmm6"); 1565 1566 /* AVX-512: Op code 0f 7b */ 1567 1568 asm volatile("vcvtusi2sd %eax,%xmm5,%xmm6"); 1569 asm volatile("vcvtusi2ss %eax,%xmm5,%xmm6"); 1570 asm volatile("vcvtps2qq %ymm5,%zmm6{%k7}"); 1571 asm volatile("vcvtpd2qq %zmm5,%zmm6"); 1572 1573 /* AVX-512: Op code 0f 7f */ 1574 1575 asm volatile("movq.s %mm0,%mm4"); 1576 asm volatile("vmovdqa.s %ymm5,%ymm6"); 1577 asm volatile("vmovdqa32.s %zmm5,%zmm6"); 1578 asm volatile("vmovdqa64.s %zmm5,%zmm6"); 1579 asm volatile("vmovdqu.s %ymm5,%ymm6"); 1580 asm volatile("vmovdqu32.s %zmm5,%zmm6"); 1581 asm volatile("vmovdqu64.s %zmm5,%zmm6"); 1582 asm volatile("vmovdqu8.s %zmm5,%zmm6"); 1583 asm volatile("vmovdqu16.s %zmm5,%zmm6"); 1584 1585 /* AVX-512: Op code 0f db */ 1586 1587 asm volatile("pand %mm1,%mm2"); 1588 asm volatile("pand %xmm1,%xmm2"); 1589 asm volatile("vpand %ymm4,%ymm6,%ymm2"); 1590 asm volatile("vpandd %zmm4,%zmm5,%zmm6"); 1591 asm volatile("vpandq %zmm4,%zmm5,%zmm6"); 1592 1593 /* AVX-512: Op code 0f df */ 1594 1595 asm volatile("pandn %mm1,%mm2"); 1596 asm volatile("pandn %xmm1,%xmm2"); 1597 asm volatile("vpandn %ymm4,%ymm6,%ymm2"); 1598 asm volatile("vpandnd %zmm4,%zmm5,%zmm6"); 1599 asm volatile("vpandnq %zmm4,%zmm5,%zmm6"); 1600 1601 /* AVX-512: Op code 0f e6 */ 1602 1603 asm volatile("vcvttpd2dq %xmm1,%xmm2"); 1604 asm volatile("vcvtdq2pd %xmm5,%xmm6"); 1605 asm volatile("vcvtdq2pd %ymm5,%zmm6{%k7}"); 1606 asm volatile("vcvtqq2pd %zmm5,%zmm6"); 1607 asm volatile("vcvtpd2dq %xmm1,%xmm2"); 1608 1609 
/* AVX-512: Op code 0f eb */ 1610 1611 asm volatile("por %mm4,%mm6"); 1612 asm volatile("vpor %ymm4,%ymm6,%ymm2"); 1613 asm volatile("vpord %zmm4,%zmm5,%zmm6"); 1614 asm volatile("vporq %zmm4,%zmm5,%zmm6"); 1615 1616 /* AVX-512: Op code 0f ef */ 1617 1618 asm volatile("pxor %mm4,%mm6"); 1619 asm volatile("vpxor %ymm4,%ymm6,%ymm2"); 1620 asm volatile("vpxord %zmm4,%zmm5,%zmm6"); 1621 asm volatile("vpxorq %zmm4,%zmm5,%zmm6"); 1622 1623 /* AVX-512: Op code 0f 38 10 */ 1624 1625 asm volatile("pblendvb %xmm1,%xmm0"); 1626 asm volatile("vpsrlvw %zmm4,%zmm5,%zmm6"); 1627 asm volatile("vpmovuswb %zmm5,%ymm6{%k7}"); 1628 1629 /* AVX-512: Op code 0f 38 11 */ 1630 1631 asm volatile("vpmovusdb %zmm5,%xmm6{%k7}"); 1632 asm volatile("vpsravw %zmm4,%zmm5,%zmm6"); 1633 1634 /* AVX-512: Op code 0f 38 12 */ 1635 1636 asm volatile("vpmovusqb %zmm5,%xmm6{%k7}"); 1637 asm volatile("vpsllvw %zmm4,%zmm5,%zmm6"); 1638 1639 /* AVX-512: Op code 0f 38 13 */ 1640 1641 asm volatile("vcvtph2ps %xmm3,%ymm5"); 1642 asm volatile("vcvtph2ps %ymm5,%zmm6{%k7}"); 1643 asm volatile("vpmovusdw %zmm5,%ymm6{%k7}"); 1644 1645 /* AVX-512: Op code 0f 38 14 */ 1646 1647 asm volatile("blendvps %xmm1,%xmm0"); 1648 asm volatile("vpmovusqw %zmm5,%xmm6{%k7}"); 1649 asm volatile("vprorvd %zmm4,%zmm5,%zmm6"); 1650 asm volatile("vprorvq %zmm4,%zmm5,%zmm6"); 1651 1652 /* AVX-512: Op code 0f 38 15 */ 1653 1654 asm volatile("blendvpd %xmm1,%xmm0"); 1655 asm volatile("vpmovusqd %zmm5,%ymm6{%k7}"); 1656 asm volatile("vprolvd %zmm4,%zmm5,%zmm6"); 1657 asm volatile("vprolvq %zmm4,%zmm5,%zmm6"); 1658 1659 /* AVX-512: Op code 0f 38 16 */ 1660 1661 asm volatile("vpermps %ymm4,%ymm6,%ymm2"); 1662 asm volatile("vpermps %ymm4,%ymm6,%ymm2{%k7}"); 1663 asm volatile("vpermpd %ymm4,%ymm6,%ymm2{%k7}"); 1664 1665 /* AVX-512: Op code 0f 38 19 */ 1666 1667 asm volatile("vbroadcastsd %xmm4,%ymm6"); 1668 asm volatile("vbroadcastf32x2 %xmm7,%zmm6"); 1669 1670 /* AVX-512: Op code 0f 38 1a */ 1671 1672 asm volatile("vbroadcastf128 
(%ecx),%ymm4"); 1673 asm volatile("vbroadcastf32x4 (%ecx),%zmm6"); 1674 asm volatile("vbroadcastf64x2 (%ecx),%zmm6"); 1675 1676 /* AVX-512: Op code 0f 38 1b */ 1677 1678 asm volatile("vbroadcastf32x8 (%ecx),%zmm6"); 1679 asm volatile("vbroadcastf64x4 (%ecx),%zmm6"); 1680 1681 /* AVX-512: Op code 0f 38 1f */ 1682 1683 asm volatile("vpabsq %zmm4,%zmm6"); 1684 1685 /* AVX-512: Op code 0f 38 20 */ 1686 1687 asm volatile("vpmovsxbw %xmm4,%xmm5"); 1688 asm volatile("vpmovswb %zmm5,%ymm6{%k7}"); 1689 1690 /* AVX-512: Op code 0f 38 21 */ 1691 1692 asm volatile("vpmovsxbd %xmm4,%ymm6"); 1693 asm volatile("vpmovsdb %zmm5,%xmm6{%k7}"); 1694 1695 /* AVX-512: Op code 0f 38 22 */ 1696 1697 asm volatile("vpmovsxbq %xmm4,%ymm4"); 1698 asm volatile("vpmovsqb %zmm5,%xmm6{%k7}"); 1699 1700 /* AVX-512: Op code 0f 38 23 */ 1701 1702 asm volatile("vpmovsxwd %xmm4,%ymm4"); 1703 asm volatile("vpmovsdw %zmm5,%ymm6{%k7}"); 1704 1705 /* AVX-512: Op code 0f 38 24 */ 1706 1707 asm volatile("vpmovsxwq %xmm4,%ymm6"); 1708 asm volatile("vpmovsqw %zmm5,%xmm6{%k7}"); 1709 1710 /* AVX-512: Op code 0f 38 25 */ 1711 1712 asm volatile("vpmovsxdq %xmm4,%ymm4"); 1713 asm volatile("vpmovsqd %zmm5,%ymm6{%k7}"); 1714 1715 /* AVX-512: Op code 0f 38 26 */ 1716 1717 asm volatile("vptestmb %zmm5,%zmm6,%k5"); 1718 asm volatile("vptestmw %zmm5,%zmm6,%k5"); 1719 asm volatile("vptestnmb %zmm4,%zmm5,%k5"); 1720 asm volatile("vptestnmw %zmm4,%zmm5,%k5"); 1721 1722 /* AVX-512: Op code 0f 38 27 */ 1723 1724 asm volatile("vptestmd %zmm5,%zmm6,%k5"); 1725 asm volatile("vptestmq %zmm5,%zmm6,%k5"); 1726 asm volatile("vptestnmd %zmm4,%zmm5,%k5"); 1727 asm volatile("vptestnmq %zmm4,%zmm5,%k5"); 1728 1729 /* AVX-512: Op code 0f 38 28 */ 1730 1731 asm volatile("vpmuldq %ymm4,%ymm6,%ymm2"); 1732 asm volatile("vpmovm2b %k5,%zmm6"); 1733 asm volatile("vpmovm2w %k5,%zmm6"); 1734 1735 /* AVX-512: Op code 0f 38 29 */ 1736 1737 asm volatile("vpcmpeqq %ymm4,%ymm6,%ymm2"); 1738 asm volatile("vpmovb2m %zmm6,%k5"); 1739 asm 
volatile("vpmovw2m %zmm6,%k5"); 1740 1741 /* AVX-512: Op code 0f 38 2a */ 1742 1743 asm volatile("vmovntdqa (%ecx),%ymm4"); 1744 asm volatile("vpbroadcastmb2q %k6,%zmm1"); 1745 1746 /* AVX-512: Op code 0f 38 2c */ 1747 1748 asm volatile("vmaskmovps (%ecx),%ymm4,%ymm6"); 1749 asm volatile("vscalefps %zmm4,%zmm5,%zmm6"); 1750 asm volatile("vscalefpd %zmm4,%zmm5,%zmm6"); 1751 1752 /* AVX-512: Op code 0f 38 2d */ 1753 1754 asm volatile("vmaskmovpd (%ecx),%ymm4,%ymm6"); 1755 asm volatile("vscalefss %xmm4,%xmm5,%xmm6{%k7}"); 1756 asm volatile("vscalefsd %xmm4,%xmm5,%xmm6{%k7}"); 1757 1758 /* AVX-512: Op code 0f 38 30 */ 1759 1760 asm volatile("vpmovzxbw %xmm4,%ymm4"); 1761 asm volatile("vpmovwb %zmm5,%ymm6{%k7}"); 1762 1763 /* AVX-512: Op code 0f 38 31 */ 1764 1765 asm volatile("vpmovzxbd %xmm4,%ymm6"); 1766 asm volatile("vpmovdb %zmm5,%xmm6{%k7}"); 1767 1768 /* AVX-512: Op code 0f 38 32 */ 1769 1770 asm volatile("vpmovzxbq %xmm4,%ymm4"); 1771 asm volatile("vpmovqb %zmm5,%xmm6{%k7}"); 1772 1773 /* AVX-512: Op code 0f 38 33 */ 1774 1775 asm volatile("vpmovzxwd %xmm4,%ymm4"); 1776 asm volatile("vpmovdw %zmm5,%ymm6{%k7}"); 1777 1778 /* AVX-512: Op code 0f 38 34 */ 1779 1780 asm volatile("vpmovzxwq %xmm4,%ymm6"); 1781 asm volatile("vpmovqw %zmm5,%xmm6{%k7}"); 1782 1783 /* AVX-512: Op code 0f 38 35 */ 1784 1785 asm volatile("vpmovzxdq %xmm4,%ymm4"); 1786 asm volatile("vpmovqd %zmm5,%ymm6{%k7}"); 1787 1788 /* AVX-512: Op code 0f 38 36 */ 1789 1790 asm volatile("vpermd %ymm4,%ymm6,%ymm2"); 1791 asm volatile("vpermd %ymm4,%ymm6,%ymm2{%k7}"); 1792 asm volatile("vpermq %ymm4,%ymm6,%ymm2{%k7}"); 1793 1794 /* AVX-512: Op code 0f 38 38 */ 1795 1796 asm volatile("vpminsb %ymm4,%ymm6,%ymm2"); 1797 asm volatile("vpmovm2d %k5,%zmm6"); 1798 asm volatile("vpmovm2q %k5,%zmm6"); 1799 1800 /* AVX-512: Op code 0f 38 39 */ 1801 1802 asm volatile("vpminsd %xmm1,%xmm2,%xmm3"); 1803 asm volatile("vpminsd %zmm4,%zmm5,%zmm6"); 1804 asm volatile("vpminsq %zmm4,%zmm5,%zmm6"); 1805 asm 
volatile("vpmovd2m %zmm6,%k5"); 1806 asm volatile("vpmovq2m %zmm6,%k5"); 1807 1808 /* AVX-512: Op code 0f 38 3a */ 1809 1810 asm volatile("vpminuw %ymm4,%ymm6,%ymm2"); 1811 asm volatile("vpbroadcastmw2d %k6,%zmm6"); 1812 1813 /* AVX-512: Op code 0f 38 3b */ 1814 1815 asm volatile("vpminud %ymm4,%ymm6,%ymm2"); 1816 asm volatile("vpminud %zmm4,%zmm5,%zmm6"); 1817 asm volatile("vpminuq %zmm4,%zmm5,%zmm6"); 1818 1819 /* AVX-512: Op code 0f 38 3d */ 1820 1821 asm volatile("vpmaxsd %ymm4,%ymm6,%ymm2"); 1822 asm volatile("vpmaxsd %zmm4,%zmm5,%zmm6"); 1823 asm volatile("vpmaxsq %zmm4,%zmm5,%zmm6"); 1824 1825 /* AVX-512: Op code 0f 38 3f */ 1826 1827 asm volatile("vpmaxud %ymm4,%ymm6,%ymm2"); 1828 asm volatile("vpmaxud %zmm4,%zmm5,%zmm6"); 1829 asm volatile("vpmaxuq %zmm4,%zmm5,%zmm6"); 1830 1831 /* AVX-512: Op code 0f 38 40 */ 1832 1833 asm volatile("vpmulld %ymm4,%ymm6,%ymm2"); 1834 asm volatile("vpmulld %zmm4,%zmm5,%zmm6"); 1835 asm volatile("vpmullq %zmm4,%zmm5,%zmm6"); 1836 1837 /* AVX-512: Op code 0f 38 42 */ 1838 1839 asm volatile("vgetexpps %zmm5,%zmm6"); 1840 asm volatile("vgetexppd %zmm5,%zmm6"); 1841 1842 /* AVX-512: Op code 0f 38 43 */ 1843 1844 asm volatile("vgetexpss %xmm4,%xmm5,%xmm6{%k7}"); 1845 asm volatile("vgetexpsd %xmm2,%xmm3,%xmm4{%k7}"); 1846 1847 /* AVX-512: Op code 0f 38 44 */ 1848 1849 asm volatile("vplzcntd %zmm5,%zmm6"); 1850 asm volatile("vplzcntq %zmm5,%zmm6"); 1851 1852 /* AVX-512: Op code 0f 38 46 */ 1853 1854 asm volatile("vpsravd %ymm4,%ymm6,%ymm2"); 1855 asm volatile("vpsravd %zmm4,%zmm5,%zmm6"); 1856 asm volatile("vpsravq %zmm4,%zmm5,%zmm6"); 1857 1858 /* AVX-512: Op code 0f 38 4c */ 1859 1860 asm volatile("vrcp14ps %zmm5,%zmm6"); 1861 asm volatile("vrcp14pd %zmm5,%zmm6"); 1862 1863 /* AVX-512: Op code 0f 38 4d */ 1864 1865 asm volatile("vrcp14ss %xmm4,%xmm5,%xmm6{%k7}"); 1866 asm volatile("vrcp14sd %xmm4,%xmm5,%xmm6{%k7}"); 1867 1868 /* AVX-512: Op code 0f 38 4e */ 1869 1870 asm volatile("vrsqrt14ps %zmm5,%zmm6"); 1871 asm 
volatile("vrsqrt14pd %zmm5,%zmm6"); 1872 1873 /* AVX-512: Op code 0f 38 4f */ 1874 1875 asm volatile("vrsqrt14ss %xmm4,%xmm5,%xmm6{%k7}"); 1876 asm volatile("vrsqrt14sd %xmm4,%xmm5,%xmm6{%k7}"); 1877 1878 /* AVX-512: Op code 0f 38 59 */ 1879 1880 asm volatile("vpbroadcastq %xmm4,%xmm6"); 1881 asm volatile("vbroadcasti32x2 %xmm7,%zmm6"); 1882 1883 /* AVX-512: Op code 0f 38 5a */ 1884 1885 asm volatile("vbroadcasti128 (%ecx),%ymm4"); 1886 asm volatile("vbroadcasti32x4 (%ecx),%zmm6"); 1887 asm volatile("vbroadcasti64x2 (%ecx),%zmm6"); 1888 1889 /* AVX-512: Op code 0f 38 5b */ 1890 1891 asm volatile("vbroadcasti32x8 (%ecx),%zmm6"); 1892 asm volatile("vbroadcasti64x4 (%ecx),%zmm6"); 1893 1894 /* AVX-512: Op code 0f 38 64 */ 1895 1896 asm volatile("vpblendmd %zmm4,%zmm5,%zmm6"); 1897 asm volatile("vpblendmq %zmm4,%zmm5,%zmm6"); 1898 1899 /* AVX-512: Op code 0f 38 65 */ 1900 1901 asm volatile("vblendmps %zmm4,%zmm5,%zmm6"); 1902 asm volatile("vblendmpd %zmm4,%zmm5,%zmm6"); 1903 1904 /* AVX-512: Op code 0f 38 66 */ 1905 1906 asm volatile("vpblendmb %zmm4,%zmm5,%zmm6"); 1907 asm volatile("vpblendmw %zmm4,%zmm5,%zmm6"); 1908 1909 /* AVX-512: Op code 0f 38 75 */ 1910 1911 asm volatile("vpermi2b %zmm4,%zmm5,%zmm6"); 1912 asm volatile("vpermi2w %zmm4,%zmm5,%zmm6"); 1913 1914 /* AVX-512: Op code 0f 38 76 */ 1915 1916 asm volatile("vpermi2d %zmm4,%zmm5,%zmm6"); 1917 asm volatile("vpermi2q %zmm4,%zmm5,%zmm6"); 1918 1919 /* AVX-512: Op code 0f 38 77 */ 1920 1921 asm volatile("vpermi2ps %zmm4,%zmm5,%zmm6"); 1922 asm volatile("vpermi2pd %zmm4,%zmm5,%zmm6"); 1923 1924 /* AVX-512: Op code 0f 38 7a */ 1925 1926 asm volatile("vpbroadcastb %eax,%xmm3"); 1927 1928 /* AVX-512: Op code 0f 38 7b */ 1929 1930 asm volatile("vpbroadcastw %eax,%xmm3"); 1931 1932 /* AVX-512: Op code 0f 38 7c */ 1933 1934 asm volatile("vpbroadcastd %eax,%xmm3"); 1935 1936 /* AVX-512: Op code 0f 38 7d */ 1937 1938 asm volatile("vpermt2b %zmm4,%zmm5,%zmm6"); 1939 asm volatile("vpermt2w %zmm4,%zmm5,%zmm6"); 1940 1941 
/* AVX-512: Op code 0f 38 7e */ 1942 1943 asm volatile("vpermt2d %zmm4,%zmm5,%zmm6"); 1944 asm volatile("vpermt2q %zmm4,%zmm5,%zmm6"); 1945 1946 /* AVX-512: Op code 0f 38 7f */ 1947 1948 asm volatile("vpermt2ps %zmm4,%zmm5,%zmm6"); 1949 asm volatile("vpermt2pd %zmm4,%zmm5,%zmm6"); 1950 1951 /* AVX-512: Op code 0f 38 83 */ 1952 1953 asm volatile("vpmultishiftqb %zmm4,%zmm5,%zmm6"); 1954 1955 /* AVX-512: Op code 0f 38 88 */ 1956 1957 asm volatile("vexpandps (%ecx),%zmm6"); 1958 asm volatile("vexpandpd (%ecx),%zmm6"); 1959 1960 /* AVX-512: Op code 0f 38 89 */ 1961 1962 asm volatile("vpexpandd (%ecx),%zmm6"); 1963 asm volatile("vpexpandq (%ecx),%zmm6"); 1964 1965 /* AVX-512: Op code 0f 38 8a */ 1966 1967 asm volatile("vcompressps %zmm6,(%ecx)"); 1968 asm volatile("vcompresspd %zmm6,(%ecx)"); 1969 1970 /* AVX-512: Op code 0f 38 8b */ 1971 1972 asm volatile("vpcompressd %zmm6,(%ecx)"); 1973 asm volatile("vpcompressq %zmm6,(%ecx)"); 1974 1975 /* AVX-512: Op code 0f 38 8d */ 1976 1977 asm volatile("vpermb %zmm4,%zmm5,%zmm6"); 1978 asm volatile("vpermw %zmm4,%zmm5,%zmm6"); 1979 1980 /* AVX-512: Op code 0f 38 90 */ 1981 1982 asm volatile("vpgatherdd %xmm2,0x02(%ebp,%xmm7,2),%xmm1"); 1983 asm volatile("vpgatherdq %xmm2,0x04(%ebp,%xmm7,2),%xmm1"); 1984 asm volatile("vpgatherdd 0x7b(%ebp,%zmm7,8),%zmm6{%k1}"); 1985 asm volatile("vpgatherdq 0x7b(%ebp,%ymm7,8),%zmm6{%k1}"); 1986 1987 /* AVX-512: Op code 0f 38 91 */ 1988 1989 asm volatile("vpgatherqd %xmm2,0x02(%ebp,%xmm7,2),%xmm1"); 1990 asm volatile("vpgatherqq %xmm2,0x02(%ebp,%xmm7,2),%xmm1"); 1991 asm volatile("vpgatherqd 0x7b(%ebp,%zmm7,8),%ymm6{%k1}"); 1992 asm volatile("vpgatherqq 0x7b(%ebp,%zmm7,8),%zmm6{%k1}"); 1993 1994 /* AVX-512: Op code 0f 38 a0 */ 1995 1996 asm volatile("vpscatterdd %zmm6,0x7b(%ebp,%zmm7,8){%k1}"); 1997 asm volatile("vpscatterdq %zmm6,0x7b(%ebp,%ymm7,8){%k1}"); 1998 1999 /* AVX-512: Op code 0f 38 a1 */ 2000 2001 asm volatile("vpscatterqd %ymm6,0x7b(%ebp,%zmm7,8){%k1}"); 2002 asm volatile("vpscatterqq 
%ymm6,0x7b(%ebp,%ymm7,8){%k1}"); 2003 2004 /* AVX-512: Op code 0f 38 a2 */ 2005 2006 asm volatile("vscatterdps %zmm6,0x7b(%ebp,%zmm7,8){%k1}"); 2007 asm volatile("vscatterdpd %zmm6,0x7b(%ebp,%ymm7,8){%k1}"); 2008 2009 /* AVX-512: Op code 0f 38 a3 */ 2010 2011 asm volatile("vscatterqps %ymm6,0x7b(%ebp,%zmm7,8){%k1}"); 2012 asm volatile("vscatterqpd %zmm6,0x7b(%ebp,%zmm7,8){%k1}"); 2013 2014 /* AVX-512: Op code 0f 38 b4 */ 2015 2016 asm volatile("vpmadd52luq %zmm4,%zmm5,%zmm6"); 2017 2018 /* AVX-512: Op code 0f 38 b5 */ 2019 2020 asm volatile("vpmadd52huq %zmm4,%zmm5,%zmm6"); 2021 2022 /* AVX-512: Op code 0f 38 c4 */ 2023 2024 asm volatile("vpconflictd %zmm5,%zmm6"); 2025 asm volatile("vpconflictq %zmm5,%zmm6"); 2026 2027 /* AVX-512: Op code 0f 38 c8 */ 2028 2029 asm volatile("vexp2ps %zmm6,%zmm7"); 2030 asm volatile("vexp2pd %zmm6,%zmm7"); 2031 2032 /* AVX-512: Op code 0f 38 ca */ 2033 2034 asm volatile("vrcp28ps %zmm6,%zmm7"); 2035 asm volatile("vrcp28pd %zmm6,%zmm7"); 2036 2037 /* AVX-512: Op code 0f 38 cb */ 2038 2039 asm volatile("vrcp28ss %xmm5,%xmm6,%xmm7{%k7}"); 2040 asm volatile("vrcp28sd %xmm5,%xmm6,%xmm7{%k7}"); 2041 2042 /* AVX-512: Op code 0f 38 cc */ 2043 2044 asm volatile("vrsqrt28ps %zmm6,%zmm7"); 2045 asm volatile("vrsqrt28pd %zmm6,%zmm7"); 2046 2047 /* AVX-512: Op code 0f 38 cd */ 2048 2049 asm volatile("vrsqrt28ss %xmm5,%xmm6,%xmm7{%k7}"); 2050 asm volatile("vrsqrt28sd %xmm5,%xmm6,%xmm7{%k7}"); 2051 2052 /* AVX-512: Op code 0f 3a 03 */ 2053 2054 asm volatile("valignd $0x12,%zmm5,%zmm6,%zmm7"); 2055 asm volatile("valignq $0x12,%zmm5,%zmm6,%zmm7"); 2056 2057 /* AVX-512: Op code 0f 3a 08 */ 2058 2059 asm volatile("vroundps $0x5,%ymm6,%ymm2"); 2060 asm volatile("vrndscaleps $0x12,%zmm5,%zmm6"); 2061 2062 /* AVX-512: Op code 0f 3a 09 */ 2063 2064 asm volatile("vroundpd $0x5,%ymm6,%ymm2"); 2065 asm volatile("vrndscalepd $0x12,%zmm5,%zmm6"); 2066 2067 /* AVX-512: Op code 0f 3a 0a */ 2068 2069 asm volatile("vroundss $0x5,%xmm4,%xmm6,%xmm2"); 2070 asm 
volatile("vrndscaless $0x12,%xmm4,%xmm5,%xmm6{%k7}"); 2071 2072 /* AVX-512: Op code 0f 3a 0b */ 2073 2074 asm volatile("vroundsd $0x5,%xmm4,%xmm6,%xmm2"); 2075 asm volatile("vrndscalesd $0x12,%xmm4,%xmm5,%xmm6{%k7}"); 2076 2077 /* AVX-512: Op code 0f 3a 18 */ 2078 2079 asm volatile("vinsertf128 $0x5,%xmm4,%ymm4,%ymm6"); 2080 asm volatile("vinsertf32x4 $0x12,%xmm4,%zmm5,%zmm6{%k7}"); 2081 asm volatile("vinsertf64x2 $0x12,%xmm4,%zmm5,%zmm6{%k7}"); 2082 2083 /* AVX-512: Op code 0f 3a 19 */ 2084 2085 asm volatile("vextractf128 $0x5,%ymm4,%xmm4"); 2086 asm volatile("vextractf32x4 $0x12,%zmm5,%xmm6{%k7}"); 2087 asm volatile("vextractf64x2 $0x12,%zmm5,%xmm6{%k7}"); 2088 2089 /* AVX-512: Op code 0f 3a 1a */ 2090 2091 asm volatile("vinsertf32x8 $0x12,%ymm5,%zmm6,%zmm7{%k7}"); 2092 asm volatile("vinsertf64x4 $0x12,%ymm5,%zmm6,%zmm7{%k7}"); 2093 2094 /* AVX-512: Op code 0f 3a 1b */ 2095 2096 asm volatile("vextractf32x8 $0x12,%zmm6,%ymm7{%k7}"); 2097 asm volatile("vextractf64x4 $0x12,%zmm6,%ymm7{%k7}"); 2098 2099 /* AVX-512: Op code 0f 3a 1e */ 2100 2101 asm volatile("vpcmpud $0x12,%zmm6,%zmm7,%k5"); 2102 asm volatile("vpcmpuq $0x12,%zmm6,%zmm7,%k5"); 2103 2104 /* AVX-512: Op code 0f 3a 1f */ 2105 2106 asm volatile("vpcmpd $0x12,%zmm6,%zmm7,%k5"); 2107 asm volatile("vpcmpq $0x12,%zmm6,%zmm7,%k5"); 2108 2109 /* AVX-512: Op code 0f 3a 23 */ 2110 2111 asm volatile("vshuff32x4 $0x12,%zmm5,%zmm6,%zmm7"); 2112 asm volatile("vshuff64x2 $0x12,%zmm5,%zmm6,%zmm7"); 2113 2114 /* AVX-512: Op code 0f 3a 25 */ 2115 2116 asm volatile("vpternlogd $0x12,%zmm5,%zmm6,%zmm7"); 2117 asm volatile("vpternlogq $0x12,%zmm5,%zmm6,%zmm7"); 2118 2119 /* AVX-512: Op code 0f 3a 26 */ 2120 2121 asm volatile("vgetmantps $0x12,%zmm6,%zmm7"); 2122 asm volatile("vgetmantpd $0x12,%zmm6,%zmm7"); 2123 2124 /* AVX-512: Op code 0f 3a 27 */ 2125 2126 asm volatile("vgetmantss $0x12,%xmm5,%xmm6,%xmm7{%k7}"); 2127 asm volatile("vgetmantsd $0x12,%xmm5,%xmm6,%xmm7{%k7}"); 2128 2129 /* AVX-512: Op code 0f 3a 38 */ 2130 
2131 asm volatile("vinserti128 $0x5,%xmm4,%ymm4,%ymm6"); 2132 asm volatile("vinserti32x4 $0x12,%xmm4,%zmm5,%zmm6{%k7}"); 2133 asm volatile("vinserti64x2 $0x12,%xmm4,%zmm5,%zmm6{%k7}"); 2134 2135 /* AVX-512: Op code 0f 3a 39 */ 2136 2137 asm volatile("vextracti128 $0x5,%ymm4,%xmm6"); 2138 asm volatile("vextracti32x4 $0x12,%zmm5,%xmm6{%k7}"); 2139 asm volatile("vextracti64x2 $0x12,%zmm5,%xmm6{%k7}"); 2140 2141 /* AVX-512: Op code 0f 3a 3a */ 2142 2143 asm volatile("vinserti32x8 $0x12,%ymm5,%zmm6,%zmm7{%k7}"); 2144 asm volatile("vinserti64x4 $0x12,%ymm5,%zmm6,%zmm7{%k7}"); 2145 2146 /* AVX-512: Op code 0f 3a 3b */ 2147 2148 asm volatile("vextracti32x8 $0x12,%zmm6,%ymm7{%k7}"); 2149 asm volatile("vextracti64x4 $0x12,%zmm6,%ymm7{%k7}"); 2150 2151 /* AVX-512: Op code 0f 3a 3e */ 2152 2153 asm volatile("vpcmpub $0x12,%zmm6,%zmm7,%k5"); 2154 asm volatile("vpcmpuw $0x12,%zmm6,%zmm7,%k5"); 2155 2156 /* AVX-512: Op code 0f 3a 3f */ 2157 2158 asm volatile("vpcmpb $0x12,%zmm6,%zmm7,%k5"); 2159 asm volatile("vpcmpw $0x12,%zmm6,%zmm7,%k5"); 2160 2161 /* AVX-512: Op code 0f 3a 42 */ 2162 2163 asm volatile("vmpsadbw $0x5,%ymm4,%ymm6,%ymm2"); 2164 asm volatile("vdbpsadbw $0x12,%zmm4,%zmm5,%zmm6"); 2165 2166 /* AVX-512: Op code 0f 3a 43 */ 2167 2168 asm volatile("vshufi32x4 $0x12,%zmm5,%zmm6,%zmm7"); 2169 asm volatile("vshufi64x2 $0x12,%zmm5,%zmm6,%zmm7"); 2170 2171 /* AVX-512: Op code 0f 3a 50 */ 2172 2173 asm volatile("vrangeps $0x12,%zmm5,%zmm6,%zmm7"); 2174 asm volatile("vrangepd $0x12,%zmm5,%zmm6,%zmm7"); 2175 2176 /* AVX-512: Op code 0f 3a 51 */ 2177 2178 asm volatile("vrangess $0x12,%xmm5,%xmm6,%xmm7"); 2179 asm volatile("vrangesd $0x12,%xmm5,%xmm6,%xmm7"); 2180 2181 /* AVX-512: Op code 0f 3a 54 */ 2182 2183 asm volatile("vfixupimmps $0x12,%zmm5,%zmm6,%zmm7"); 2184 asm volatile("vfixupimmpd $0x12,%zmm5,%zmm6,%zmm7"); 2185 2186 /* AVX-512: Op code 0f 3a 55 */ 2187 2188 asm volatile("vfixupimmss $0x12,%xmm5,%xmm6,%xmm7{%k7}"); 2189 asm volatile("vfixupimmsd 
$0x12,%xmm5,%xmm6,%xmm7{%k7}"); 2190 2191 /* AVX-512: Op code 0f 3a 56 */ 2192 2193 asm volatile("vreduceps $0x12,%zmm6,%zmm7"); 2194 asm volatile("vreducepd $0x12,%zmm6,%zmm7"); 2195 2196 /* AVX-512: Op code 0f 3a 57 */ 2197 2198 asm volatile("vreducess $0x12,%xmm5,%xmm6,%xmm7"); 2199 asm volatile("vreducesd $0x12,%xmm5,%xmm6,%xmm7"); 2200 2201 /* AVX-512: Op code 0f 3a 66 */ 2202 2203 asm volatile("vfpclassps $0x12,%zmm7,%k5"); 2204 asm volatile("vfpclasspd $0x12,%zmm7,%k5"); 2205 2206 /* AVX-512: Op code 0f 3a 67 */ 2207 2208 asm volatile("vfpclassss $0x12,%xmm7,%k5"); 2209 asm volatile("vfpclasssd $0x12,%xmm7,%k5"); 2210 2211 /* AVX-512: Op code 0f 72 (Grp13) */ 2212 2213 asm volatile("vprord $0x12,%zmm5,%zmm6"); 2214 asm volatile("vprorq $0x12,%zmm5,%zmm6"); 2215 asm volatile("vprold $0x12,%zmm5,%zmm6"); 2216 asm volatile("vprolq $0x12,%zmm5,%zmm6"); 2217 asm volatile("psrad $0x2,%mm6"); 2218 asm volatile("vpsrad $0x5,%ymm6,%ymm2"); 2219 asm volatile("vpsrad $0x5,%zmm6,%zmm2"); 2220 asm volatile("vpsraq $0x5,%zmm6,%zmm2"); 2221 2222 /* AVX-512: Op code 0f 38 c6 (Grp18) */ 2223 2224 asm volatile("vgatherpf0dps 0x7b(%ebp,%zmm7,8){%k1}"); 2225 asm volatile("vgatherpf0dpd 0x7b(%ebp,%ymm7,8){%k1}"); 2226 asm volatile("vgatherpf1dps 0x7b(%ebp,%zmm7,8){%k1}"); 2227 asm volatile("vgatherpf1dpd 0x7b(%ebp,%ymm7,8){%k1}"); 2228 asm volatile("vscatterpf0dps 0x7b(%ebp,%zmm7,8){%k1}"); 2229 asm volatile("vscatterpf0dpd 0x7b(%ebp,%ymm7,8){%k1}"); 2230 asm volatile("vscatterpf1dps 0x7b(%ebp,%zmm7,8){%k1}"); 2231 asm volatile("vscatterpf1dpd 0x7b(%ebp,%ymm7,8){%k1}"); 2232 2233 /* AVX-512: Op code 0f 38 c7 (Grp19) */ 2234 2235 asm volatile("vgatherpf0qps 0x7b(%ebp,%zmm7,8){%k1}"); 2236 asm volatile("vgatherpf0qpd 0x7b(%ebp,%zmm7,8){%k1}"); 2237 asm volatile("vgatherpf1qps 0x7b(%ebp,%zmm7,8){%k1}"); 2238 asm volatile("vgatherpf1qpd 0x7b(%ebp,%zmm7,8){%k1}"); 2239 asm volatile("vscatterpf0qps 0x7b(%ebp,%zmm7,8){%k1}"); 2240 asm volatile("vscatterpf0qpd 0x7b(%ebp,%zmm7,8){%k1}"); 
2241 asm volatile("vscatterpf1qps 0x7b(%ebp,%zmm7,8){%k1}"); 2242 asm volatile("vscatterpf1qpd 0x7b(%ebp,%zmm7,8){%k1}"); 2243 2244 /* AVX-512: Examples */ 2245 2246 asm volatile("vaddpd %zmm4,%zmm5,%zmm6"); 2247 asm volatile("vaddpd %zmm4,%zmm5,%zmm6{%k7}"); 2248 asm volatile("vaddpd %zmm4,%zmm5,%zmm6{%k7}{z}"); 2249 asm volatile("vaddpd {rn-sae},%zmm4,%zmm5,%zmm6"); 2250 asm volatile("vaddpd {ru-sae},%zmm4,%zmm5,%zmm6"); 2251 asm volatile("vaddpd {rd-sae},%zmm4,%zmm5,%zmm6"); 2252 asm volatile("vaddpd {rz-sae},%zmm4,%zmm5,%zmm6"); 2253 asm volatile("vaddpd (%ecx),%zmm5,%zmm6"); 2254 asm volatile("vaddpd 0x123(%eax,%ecx,8),%zmm5,%zmm6"); 2255 asm volatile("vaddpd (%ecx){1to8},%zmm5,%zmm6"); 2256 asm volatile("vaddpd 0x1fc0(%edx),%zmm5,%zmm6"); 2257 asm volatile("vaddpd 0x3f8(%edx){1to8},%zmm5,%zmm6"); 2258 asm volatile("vcmpeq_uqps 0x1fc(%edx){1to16},%zmm6,%k5"); 2259 asm volatile("vcmpltsd 0x123(%eax,%ecx,8),%xmm3,%k5{%k7}"); 2260 asm volatile("vcmplesd {sae},%xmm4,%xmm5,%k5{%k7}"); 2261 asm volatile("vgetmantss $0x5b,0x123(%eax,%ecx,8),%xmm4,%xmm5{%k7}"); 2262 2263 /* bndmk m32, bnd */ 2264 2265 asm volatile("bndmk (%eax), %bnd0"); 2266 asm volatile("bndmk (0x12345678), %bnd0"); 2267 asm volatile("bndmk (%eax), %bnd3"); 2268 asm volatile("bndmk (%ecx,%eax,1), %bnd0"); 2269 asm volatile("bndmk 0x12345678(,%eax,1), %bnd0"); 2270 asm volatile("bndmk (%eax,%ecx,1), %bnd0"); 2271 asm volatile("bndmk (%eax,%ecx,8), %bnd0"); 2272 asm volatile("bndmk 0x12(%eax), %bnd0"); 2273 asm volatile("bndmk 0x12(%ebp), %bnd0"); 2274 asm volatile("bndmk 0x12(%ecx,%eax,1), %bnd0"); 2275 asm volatile("bndmk 0x12(%ebp,%eax,1), %bnd0"); 2276 asm volatile("bndmk 0x12(%eax,%ecx,1), %bnd0"); 2277 asm volatile("bndmk 0x12(%eax,%ecx,8), %bnd0"); 2278 asm volatile("bndmk 0x12345678(%eax), %bnd0"); 2279 asm volatile("bndmk 0x12345678(%ebp), %bnd0"); 2280 asm volatile("bndmk 0x12345678(%ecx,%eax,1), %bnd0"); 2281 asm volatile("bndmk 0x12345678(%ebp,%eax,1), %bnd0"); 2282 asm volatile("bndmk 
0x12345678(%eax,%ecx,1), %bnd0"); 2283 asm volatile("bndmk 0x12345678(%eax,%ecx,8), %bnd0"); 2284 2285 /* bndcl r/m32, bnd */ 2286 2287 asm volatile("bndcl (%eax), %bnd0"); 2288 asm volatile("bndcl (0x12345678), %bnd0"); 2289 asm volatile("bndcl (%eax), %bnd3"); 2290 asm volatile("bndcl (%ecx,%eax,1), %bnd0"); 2291 asm volatile("bndcl 0x12345678(,%eax,1), %bnd0"); 2292 asm volatile("bndcl (%eax,%ecx,1), %bnd0"); 2293 asm volatile("bndcl (%eax,%ecx,8), %bnd0"); 2294 asm volatile("bndcl 0x12(%eax), %bnd0"); 2295 asm volatile("bndcl 0x12(%ebp), %bnd0"); 2296 asm volatile("bndcl 0x12(%ecx,%eax,1), %bnd0"); 2297 asm volatile("bndcl 0x12(%ebp,%eax,1), %bnd0"); 2298 asm volatile("bndcl 0x12(%eax,%ecx,1), %bnd0"); 2299 asm volatile("bndcl 0x12(%eax,%ecx,8), %bnd0"); 2300 asm volatile("bndcl 0x12345678(%eax), %bnd0"); 2301 asm volatile("bndcl 0x12345678(%ebp), %bnd0"); 2302 asm volatile("bndcl 0x12345678(%ecx,%eax,1), %bnd0"); 2303 asm volatile("bndcl 0x12345678(%ebp,%eax,1), %bnd0"); 2304 asm volatile("bndcl 0x12345678(%eax,%ecx,1), %bnd0"); 2305 asm volatile("bndcl 0x12345678(%eax,%ecx,8), %bnd0"); 2306 asm volatile("bndcl %eax, %bnd0"); 2307 2308 /* bndcu r/m32, bnd */ 2309 2310 asm volatile("bndcu (%eax), %bnd0"); 2311 asm volatile("bndcu (0x12345678), %bnd0"); 2312 asm volatile("bndcu (%eax), %bnd3"); 2313 asm volatile("bndcu (%ecx,%eax,1), %bnd0"); 2314 asm volatile("bndcu 0x12345678(,%eax,1), %bnd0"); 2315 asm volatile("bndcu (%eax,%ecx,1), %bnd0"); 2316 asm volatile("bndcu (%eax,%ecx,8), %bnd0"); 2317 asm volatile("bndcu 0x12(%eax), %bnd0"); 2318 asm volatile("bndcu 0x12(%ebp), %bnd0"); 2319 asm volatile("bndcu 0x12(%ecx,%eax,1), %bnd0"); 2320 asm volatile("bndcu 0x12(%ebp,%eax,1), %bnd0"); 2321 asm volatile("bndcu 0x12(%eax,%ecx,1), %bnd0"); 2322 asm volatile("bndcu 0x12(%eax,%ecx,8), %bnd0"); 2323 asm volatile("bndcu 0x12345678(%eax), %bnd0"); 2324 asm volatile("bndcu 0x12345678(%ebp), %bnd0"); 2325 asm volatile("bndcu 0x12345678(%ecx,%eax,1), %bnd0"); 2326 asm 
volatile("bndcu 0x12345678(%ebp,%eax,1), %bnd0"); 2327 asm volatile("bndcu 0x12345678(%eax,%ecx,1), %bnd0"); 2328 asm volatile("bndcu 0x12345678(%eax,%ecx,8), %bnd0"); 2329 asm volatile("bndcu %eax, %bnd0"); 2330 2331 /* bndcn r/m32, bnd */ 2332 2333 asm volatile("bndcn (%eax), %bnd0"); 2334 asm volatile("bndcn (0x12345678), %bnd0"); 2335 asm volatile("bndcn (%eax), %bnd3"); 2336 asm volatile("bndcn (%ecx,%eax,1), %bnd0"); 2337 asm volatile("bndcn 0x12345678(,%eax,1), %bnd0"); 2338 asm volatile("bndcn (%eax,%ecx,1), %bnd0"); 2339 asm volatile("bndcn (%eax,%ecx,8), %bnd0"); 2340 asm volatile("bndcn 0x12(%eax), %bnd0"); 2341 asm volatile("bndcn 0x12(%ebp), %bnd0"); 2342 asm volatile("bndcn 0x12(%ecx,%eax,1), %bnd0"); 2343 asm volatile("bndcn 0x12(%ebp,%eax,1), %bnd0"); 2344 asm volatile("bndcn 0x12(%eax,%ecx,1), %bnd0"); 2345 asm volatile("bndcn 0x12(%eax,%ecx,8), %bnd0"); 2346 asm volatile("bndcn 0x12345678(%eax), %bnd0"); 2347 asm volatile("bndcn 0x12345678(%ebp), %bnd0"); 2348 asm volatile("bndcn 0x12345678(%ecx,%eax,1), %bnd0"); 2349 asm volatile("bndcn 0x12345678(%ebp,%eax,1), %bnd0"); 2350 asm volatile("bndcn 0x12345678(%eax,%ecx,1), %bnd0"); 2351 asm volatile("bndcn 0x12345678(%eax,%ecx,8), %bnd0"); 2352 asm volatile("bndcn %eax, %bnd0"); 2353 2354 /* bndmov m64, bnd */ 2355 2356 asm volatile("bndmov (%eax), %bnd0"); 2357 asm volatile("bndmov (0x12345678), %bnd0"); 2358 asm volatile("bndmov (%eax), %bnd3"); 2359 asm volatile("bndmov (%ecx,%eax,1), %bnd0"); 2360 asm volatile("bndmov 0x12345678(,%eax,1), %bnd0"); 2361 asm volatile("bndmov (%eax,%ecx,1), %bnd0"); 2362 asm volatile("bndmov (%eax,%ecx,8), %bnd0"); 2363 asm volatile("bndmov 0x12(%eax), %bnd0"); 2364 asm volatile("bndmov 0x12(%ebp), %bnd0"); 2365 asm volatile("bndmov 0x12(%ecx,%eax,1), %bnd0"); 2366 asm volatile("bndmov 0x12(%ebp,%eax,1), %bnd0"); 2367 asm volatile("bndmov 0x12(%eax,%ecx,1), %bnd0"); 2368 asm volatile("bndmov 0x12(%eax,%ecx,8), %bnd0"); 2369 asm volatile("bndmov 0x12345678(%eax), 
%bnd0"); 2370 asm volatile("bndmov 0x12345678(%ebp), %bnd0"); 2371 asm volatile("bndmov 0x12345678(%ecx,%eax,1), %bnd0"); 2372 asm volatile("bndmov 0x12345678(%ebp,%eax,1), %bnd0"); 2373 asm volatile("bndmov 0x12345678(%eax,%ecx,1), %bnd0"); 2374 asm volatile("bndmov 0x12345678(%eax,%ecx,8), %bnd0"); 2375 2376 /* bndmov bnd, m64 */ 2377 2378 asm volatile("bndmov %bnd0, (%eax)"); 2379 asm volatile("bndmov %bnd0, (0x12345678)"); 2380 asm volatile("bndmov %bnd3, (%eax)"); 2381 asm volatile("bndmov %bnd0, (%ecx,%eax,1)"); 2382 asm volatile("bndmov %bnd0, 0x12345678(,%eax,1)"); 2383 asm volatile("bndmov %bnd0, (%eax,%ecx,1)"); 2384 asm volatile("bndmov %bnd0, (%eax,%ecx,8)"); 2385 asm volatile("bndmov %bnd0, 0x12(%eax)"); 2386 asm volatile("bndmov %bnd0, 0x12(%ebp)"); 2387 asm volatile("bndmov %bnd0, 0x12(%ecx,%eax,1)"); 2388 asm volatile("bndmov %bnd0, 0x12(%ebp,%eax,1)"); 2389 asm volatile("bndmov %bnd0, 0x12(%eax,%ecx,1)"); 2390 asm volatile("bndmov %bnd0, 0x12(%eax,%ecx,8)"); 2391 asm volatile("bndmov %bnd0, 0x12345678(%eax)"); 2392 asm volatile("bndmov %bnd0, 0x12345678(%ebp)"); 2393 asm volatile("bndmov %bnd0, 0x12345678(%ecx,%eax,1)"); 2394 asm volatile("bndmov %bnd0, 0x12345678(%ebp,%eax,1)"); 2395 asm volatile("bndmov %bnd0, 0x12345678(%eax,%ecx,1)"); 2396 asm volatile("bndmov %bnd0, 0x12345678(%eax,%ecx,8)"); 2397 2398 /* bndmov bnd2, bnd1 */ 2399 2400 asm volatile("bndmov %bnd0, %bnd1"); 2401 asm volatile("bndmov %bnd1, %bnd0"); 2402 2403 /* bndldx mib, bnd */ 2404 2405 asm volatile("bndldx (%eax), %bnd0"); 2406 asm volatile("bndldx (0x12345678), %bnd0"); 2407 asm volatile("bndldx (%eax), %bnd3"); 2408 asm volatile("bndldx (%ecx,%eax,1), %bnd0"); 2409 asm volatile("bndldx 0x12345678(,%eax,1), %bnd0"); 2410 asm volatile("bndldx (%eax,%ecx,1), %bnd0"); 2411 asm volatile("bndldx 0x12(%eax), %bnd0"); 2412 asm volatile("bndldx 0x12(%ebp), %bnd0"); 2413 asm volatile("bndldx 0x12(%ecx,%eax,1), %bnd0"); 2414 asm volatile("bndldx 0x12(%ebp,%eax,1), %bnd0"); 2415 asm 
volatile("bndldx 0x12(%eax,%ecx,1), %bnd0"); 2416 asm volatile("bndldx 0x12345678(%eax), %bnd0"); 2417 asm volatile("bndldx 0x12345678(%ebp), %bnd0"); 2418 asm volatile("bndldx 0x12345678(%ecx,%eax,1), %bnd0"); 2419 asm volatile("bndldx 0x12345678(%ebp,%eax,1), %bnd0"); 2420 asm volatile("bndldx 0x12345678(%eax,%ecx,1), %bnd0"); 2421 2422 /* bndstx bnd, mib */ 2423 2424 asm volatile("bndstx %bnd0, (%eax)"); 2425 asm volatile("bndstx %bnd0, (0x12345678)"); 2426 asm volatile("bndstx %bnd3, (%eax)"); 2427 asm volatile("bndstx %bnd0, (%ecx,%eax,1)"); 2428 asm volatile("bndstx %bnd0, 0x12345678(,%eax,1)"); 2429 asm volatile("bndstx %bnd0, (%eax,%ecx,1)"); 2430 asm volatile("bndstx %bnd0, 0x12(%eax)"); 2431 asm volatile("bndstx %bnd0, 0x12(%ebp)"); 2432 asm volatile("bndstx %bnd0, 0x12(%ecx,%eax,1)"); 2433 asm volatile("bndstx %bnd0, 0x12(%ebp,%eax,1)"); 2434 asm volatile("bndstx %bnd0, 0x12(%eax,%ecx,1)"); 2435 asm volatile("bndstx %bnd0, 0x12345678(%eax)"); 2436 asm volatile("bndstx %bnd0, 0x12345678(%ebp)"); 2437 asm volatile("bndstx %bnd0, 0x12345678(%ecx,%eax,1)"); 2438 asm volatile("bndstx %bnd0, 0x12345678(%ebp,%eax,1)"); 2439 asm volatile("bndstx %bnd0, 0x12345678(%eax,%ecx,1)"); 2440 2441 /* bnd prefix on call, ret, jmp and all jcc */ 2442 2443 asm volatile("bnd call label1"); /* Expecting: call unconditional 0xfffffffc */ 2444 asm volatile("bnd call *(%eax)"); /* Expecting: call indirect 0 */ 2445 asm volatile("bnd ret"); /* Expecting: ret indirect 0 */ 2446 asm volatile("bnd jmp label1"); /* Expecting: jmp unconditional 0xfffffffc */ 2447 asm volatile("bnd jmp label1"); /* Expecting: jmp unconditional 0xfffffffc */ 2448 asm volatile("bnd jmp *(%ecx)"); /* Expecting: jmp indirect 0 */ 2449 asm volatile("bnd jne label1"); /* Expecting: jcc conditional 0xfffffffc */ 2450 2451 /* sha1rnds4 imm8, xmm2/m128, xmm1 */ 2452 2453 asm volatile("sha1rnds4 $0x0, %xmm1, %xmm0"); 2454 asm volatile("sha1rnds4 $0x91, %xmm7, %xmm2"); 2455 asm volatile("sha1rnds4 $0x91, (%eax), 
%xmm0"); 2456 asm volatile("sha1rnds4 $0x91, (0x12345678), %xmm0"); 2457 asm volatile("sha1rnds4 $0x91, (%eax), %xmm3"); 2458 asm volatile("sha1rnds4 $0x91, (%ecx,%eax,1), %xmm0"); 2459 asm volatile("sha1rnds4 $0x91, 0x12345678(,%eax,1), %xmm0"); 2460 asm volatile("sha1rnds4 $0x91, (%eax,%ecx,1), %xmm0"); 2461 asm volatile("sha1rnds4 $0x91, (%eax,%ecx,8), %xmm0"); 2462 asm volatile("sha1rnds4 $0x91, 0x12(%eax), %xmm0"); 2463 asm volatile("sha1rnds4 $0x91, 0x12(%ebp), %xmm0"); 2464 asm volatile("sha1rnds4 $0x91, 0x12(%ecx,%eax,1), %xmm0"); 2465 asm volatile("sha1rnds4 $0x91, 0x12(%ebp,%eax,1), %xmm0"); 2466 asm volatile("sha1rnds4 $0x91, 0x12(%eax,%ecx,1), %xmm0"); 2467 asm volatile("sha1rnds4 $0x91, 0x12(%eax,%ecx,8), %xmm0"); 2468 asm volatile("sha1rnds4 $0x91, 0x12345678(%eax), %xmm0"); 2469 asm volatile("sha1rnds4 $0x91, 0x12345678(%ebp), %xmm0"); 2470 asm volatile("sha1rnds4 $0x91, 0x12345678(%ecx,%eax,1), %xmm0"); 2471 asm volatile("sha1rnds4 $0x91, 0x12345678(%ebp,%eax,1), %xmm0"); 2472 asm volatile("sha1rnds4 $0x91, 0x12345678(%eax,%ecx,1), %xmm0"); 2473 asm volatile("sha1rnds4 $0x91, 0x12345678(%eax,%ecx,8), %xmm0"); 2474 2475 /* sha1nexte xmm2/m128, xmm1 */ 2476 2477 asm volatile("sha1nexte %xmm1, %xmm0"); 2478 asm volatile("sha1nexte %xmm7, %xmm2"); 2479 asm volatile("sha1nexte (%eax), %xmm0"); 2480 asm volatile("sha1nexte (0x12345678), %xmm0"); 2481 asm volatile("sha1nexte (%eax), %xmm3"); 2482 asm volatile("sha1nexte (%ecx,%eax,1), %xmm0"); 2483 asm volatile("sha1nexte 0x12345678(,%eax,1), %xmm0"); 2484 asm volatile("sha1nexte (%eax,%ecx,1), %xmm0"); 2485 asm volatile("sha1nexte (%eax,%ecx,8), %xmm0"); 2486 asm volatile("sha1nexte 0x12(%eax), %xmm0"); 2487 asm volatile("sha1nexte 0x12(%ebp), %xmm0"); 2488 asm volatile("sha1nexte 0x12(%ecx,%eax,1), %xmm0"); 2489 asm volatile("sha1nexte 0x12(%ebp,%eax,1), %xmm0"); 2490 asm volatile("sha1nexte 0x12(%eax,%ecx,1), %xmm0"); 2491 asm volatile("sha1nexte 0x12(%eax,%ecx,8), %xmm0"); 2492 asm volatile("sha1nexte 
0x12345678(%eax), %xmm0"); 2493 asm volatile("sha1nexte 0x12345678(%ebp), %xmm0"); 2494 asm volatile("sha1nexte 0x12345678(%ecx,%eax,1), %xmm0"); 2495 asm volatile("sha1nexte 0x12345678(%ebp,%eax,1), %xmm0"); 2496 asm volatile("sha1nexte 0x12345678(%eax,%ecx,1), %xmm0"); 2497 asm volatile("sha1nexte 0x12345678(%eax,%ecx,8), %xmm0"); 2498 2499 /* sha1msg1 xmm2/m128, xmm1 */ 2500 2501 asm volatile("sha1msg1 %xmm1, %xmm0"); 2502 asm volatile("sha1msg1 %xmm7, %xmm2"); 2503 asm volatile("sha1msg1 (%eax), %xmm0"); 2504 asm volatile("sha1msg1 (0x12345678), %xmm0"); 2505 asm volatile("sha1msg1 (%eax), %xmm3"); 2506 asm volatile("sha1msg1 (%ecx,%eax,1), %xmm0"); 2507 asm volatile("sha1msg1 0x12345678(,%eax,1), %xmm0"); 2508 asm volatile("sha1msg1 (%eax,%ecx,1), %xmm0"); 2509 asm volatile("sha1msg1 (%eax,%ecx,8), %xmm0"); 2510 asm volatile("sha1msg1 0x12(%eax), %xmm0"); 2511 asm volatile("sha1msg1 0x12(%ebp), %xmm0"); 2512 asm volatile("sha1msg1 0x12(%ecx,%eax,1), %xmm0"); 2513 asm volatile("sha1msg1 0x12(%ebp,%eax,1), %xmm0"); 2514 asm volatile("sha1msg1 0x12(%eax,%ecx,1), %xmm0"); 2515 asm volatile("sha1msg1 0x12(%eax,%ecx,8), %xmm0"); 2516 asm volatile("sha1msg1 0x12345678(%eax), %xmm0"); 2517 asm volatile("sha1msg1 0x12345678(%ebp), %xmm0"); 2518 asm volatile("sha1msg1 0x12345678(%ecx,%eax,1), %xmm0"); 2519 asm volatile("sha1msg1 0x12345678(%ebp,%eax,1), %xmm0"); 2520 asm volatile("sha1msg1 0x12345678(%eax,%ecx,1), %xmm0"); 2521 asm volatile("sha1msg1 0x12345678(%eax,%ecx,8), %xmm0"); 2522 2523 /* sha1msg2 xmm2/m128, xmm1 */ 2524 2525 asm volatile("sha1msg2 %xmm1, %xmm0"); 2526 asm volatile("sha1msg2 %xmm7, %xmm2"); 2527 asm volatile("sha1msg2 (%eax), %xmm0"); 2528 asm volatile("sha1msg2 (0x12345678), %xmm0"); 2529 asm volatile("sha1msg2 (%eax), %xmm3"); 2530 asm volatile("sha1msg2 (%ecx,%eax,1), %xmm0"); 2531 asm volatile("sha1msg2 0x12345678(,%eax,1), %xmm0"); 2532 asm volatile("sha1msg2 (%eax,%ecx,1), %xmm0"); 2533 asm volatile("sha1msg2 (%eax,%ecx,8), %xmm0"); 2534 
asm volatile("sha1msg2 0x12(%eax), %xmm0"); 2535 asm volatile("sha1msg2 0x12(%ebp), %xmm0"); 2536 asm volatile("sha1msg2 0x12(%ecx,%eax,1), %xmm0"); 2537 asm volatile("sha1msg2 0x12(%ebp,%eax,1), %xmm0"); 2538 asm volatile("sha1msg2 0x12(%eax,%ecx,1), %xmm0"); 2539 asm volatile("sha1msg2 0x12(%eax,%ecx,8), %xmm0"); 2540 asm volatile("sha1msg2 0x12345678(%eax), %xmm0"); 2541 asm volatile("sha1msg2 0x12345678(%ebp), %xmm0"); 2542 asm volatile("sha1msg2 0x12345678(%ecx,%eax,1), %xmm0"); 2543 asm volatile("sha1msg2 0x12345678(%ebp,%eax,1), %xmm0"); 2544 asm volatile("sha1msg2 0x12345678(%eax,%ecx,1), %xmm0"); 2545 asm volatile("sha1msg2 0x12345678(%eax,%ecx,8), %xmm0"); 2546 2547 /* sha256rnds2 <XMM0>, xmm2/m128, xmm1 */ 2548 /* Note sha256rnds2 has an implicit operand 'xmm0' */ 2549 2550 asm volatile("sha256rnds2 %xmm4, %xmm1"); 2551 asm volatile("sha256rnds2 %xmm7, %xmm2"); 2552 asm volatile("sha256rnds2 (%eax), %xmm1"); 2553 asm volatile("sha256rnds2 (0x12345678), %xmm1"); 2554 asm volatile("sha256rnds2 (%eax), %xmm3"); 2555 asm volatile("sha256rnds2 (%ecx,%eax,1), %xmm1"); 2556 asm volatile("sha256rnds2 0x12345678(,%eax,1), %xmm1"); 2557 asm volatile("sha256rnds2 (%eax,%ecx,1), %xmm1"); 2558 asm volatile("sha256rnds2 (%eax,%ecx,8), %xmm1"); 2559 asm volatile("sha256rnds2 0x12(%eax), %xmm1"); 2560 asm volatile("sha256rnds2 0x12(%ebp), %xmm1"); 2561 asm volatile("sha256rnds2 0x12(%ecx,%eax,1), %xmm1"); 2562 asm volatile("sha256rnds2 0x12(%ebp,%eax,1), %xmm1"); 2563 asm volatile("sha256rnds2 0x12(%eax,%ecx,1), %xmm1"); 2564 asm volatile("sha256rnds2 0x12(%eax,%ecx,8), %xmm1"); 2565 asm volatile("sha256rnds2 0x12345678(%eax), %xmm1"); 2566 asm volatile("sha256rnds2 0x12345678(%ebp), %xmm1"); 2567 asm volatile("sha256rnds2 0x12345678(%ecx,%eax,1), %xmm1"); 2568 asm volatile("sha256rnds2 0x12345678(%ebp,%eax,1), %xmm1"); 2569 asm volatile("sha256rnds2 0x12345678(%eax,%ecx,1), %xmm1"); 2570 asm volatile("sha256rnds2 0x12345678(%eax,%ecx,8), %xmm1"); 2571 2572 /* 
sha256msg1 xmm2/m128, xmm1 */ 2573 2574 asm volatile("sha256msg1 %xmm1, %xmm0"); 2575 asm volatile("sha256msg1 %xmm7, %xmm2"); 2576 asm volatile("sha256msg1 (%eax), %xmm0"); 2577 asm volatile("sha256msg1 (0x12345678), %xmm0"); 2578 asm volatile("sha256msg1 (%eax), %xmm3"); 2579 asm volatile("sha256msg1 (%ecx,%eax,1), %xmm0"); 2580 asm volatile("sha256msg1 0x12345678(,%eax,1), %xmm0"); 2581 asm volatile("sha256msg1 (%eax,%ecx,1), %xmm0"); 2582 asm volatile("sha256msg1 (%eax,%ecx,8), %xmm0"); 2583 asm volatile("sha256msg1 0x12(%eax), %xmm0"); 2584 asm volatile("sha256msg1 0x12(%ebp), %xmm0"); 2585 asm volatile("sha256msg1 0x12(%ecx,%eax,1), %xmm0"); 2586 asm volatile("sha256msg1 0x12(%ebp,%eax,1), %xmm0"); 2587 asm volatile("sha256msg1 0x12(%eax,%ecx,1), %xmm0"); 2588 asm volatile("sha256msg1 0x12(%eax,%ecx,8), %xmm0"); 2589 asm volatile("sha256msg1 0x12345678(%eax), %xmm0"); 2590 asm volatile("sha256msg1 0x12345678(%ebp), %xmm0"); 2591 asm volatile("sha256msg1 0x12345678(%ecx,%eax,1), %xmm0"); 2592 asm volatile("sha256msg1 0x12345678(%ebp,%eax,1), %xmm0"); 2593 asm volatile("sha256msg1 0x12345678(%eax,%ecx,1), %xmm0"); 2594 asm volatile("sha256msg1 0x12345678(%eax,%ecx,8), %xmm0"); 2595 2596 /* sha256msg2 xmm2/m128, xmm1 */ 2597 2598 asm volatile("sha256msg2 %xmm1, %xmm0"); 2599 asm volatile("sha256msg2 %xmm7, %xmm2"); 2600 asm volatile("sha256msg2 (%eax), %xmm0"); 2601 asm volatile("sha256msg2 (0x12345678), %xmm0"); 2602 asm volatile("sha256msg2 (%eax), %xmm3"); 2603 asm volatile("sha256msg2 (%ecx,%eax,1), %xmm0"); 2604 asm volatile("sha256msg2 0x12345678(,%eax,1), %xmm0"); 2605 asm volatile("sha256msg2 (%eax,%ecx,1), %xmm0"); 2606 asm volatile("sha256msg2 (%eax,%ecx,8), %xmm0"); 2607 asm volatile("sha256msg2 0x12(%eax), %xmm0"); 2608 asm volatile("sha256msg2 0x12(%ebp), %xmm0"); 2609 asm volatile("sha256msg2 0x12(%ecx,%eax,1), %xmm0"); 2610 asm volatile("sha256msg2 0x12(%ebp,%eax,1), %xmm0"); 2611 asm volatile("sha256msg2 0x12(%eax,%ecx,1), %xmm0"); 2612 asm 
volatile("sha256msg2 0x12(%eax,%ecx,8), %xmm0"); 2613 asm volatile("sha256msg2 0x12345678(%eax), %xmm0"); 2614 asm volatile("sha256msg2 0x12345678(%ebp), %xmm0"); 2615 asm volatile("sha256msg2 0x12345678(%ecx,%eax,1), %xmm0"); 2616 asm volatile("sha256msg2 0x12345678(%ebp,%eax,1), %xmm0"); 2617 asm volatile("sha256msg2 0x12345678(%eax,%ecx,1), %xmm0"); 2618 asm volatile("sha256msg2 0x12345678(%eax,%ecx,8), %xmm0"); 2619 2620 /* clflushopt m8 */ 2621 2622 asm volatile("clflushopt (%eax)"); 2623 asm volatile("clflushopt (0x12345678)"); 2624 asm volatile("clflushopt 0x12345678(%eax,%ecx,8)"); 2625 /* Also check instructions in the same group encoding as clflushopt */ 2626 asm volatile("clflush (%eax)"); 2627 asm volatile("sfence"); 2628 2629 /* clwb m8 */ 2630 2631 asm volatile("clwb (%eax)"); 2632 asm volatile("clwb (0x12345678)"); 2633 asm volatile("clwb 0x12345678(%eax,%ecx,8)"); 2634 /* Also check instructions in the same group encoding as clwb */ 2635 asm volatile("xsaveopt (%eax)"); 2636 asm volatile("mfence"); 2637 2638 /* xsavec mem */ 2639 2640 asm volatile("xsavec (%eax)"); 2641 asm volatile("xsavec (0x12345678)"); 2642 asm volatile("xsavec 0x12345678(%eax,%ecx,8)"); 2643 2644 /* xsaves mem */ 2645 2646 asm volatile("xsaves (%eax)"); 2647 asm volatile("xsaves (0x12345678)"); 2648 asm volatile("xsaves 0x12345678(%eax,%ecx,8)"); 2649 2650 /* xrstors mem */ 2651 2652 asm volatile("xrstors (%eax)"); 2653 asm volatile("xrstors (0x12345678)"); 2654 asm volatile("xrstors 0x12345678(%eax,%ecx,8)"); 2655 2656 #endif /* #ifndef __x86_64__ */ 2657 2658 /* Following line is a marker for the awk script - do not change */ 2659 asm volatile("rdtsc"); /* Stop here */ 2660 2661 return 0; 2662 } 2663