# RUN: llvm-mc --disassemble %s -triple=i386 | FileCheck %s --check-prefixes=ATT
# RUN: llvm-mc --disassemble %s -triple=i386 --output-asm-variant=1 | FileCheck %s --check-prefixes=INTEL
#
# Layout of this file: each test case is one AT&T-syntax expectation, one
# Intel-syntax expectation, and then the comma-separated instruction bytes
# that are fed to the disassembler. The first invocation above checks the
# AT&T expectations; the second adds --output-asm-variant=1 and checks the
# Intel expectations against the same bytes.

# vaddbf16 test vectors. Every encoding in this group begins 0x62,0xf5,0x65
# and has 0x58 as its fifth byte; the fourth byte varies with the vector
# width, the {%k7} / {z} decorations and the {1toN} broadcast forms.
#
# Register-source forms: ymm, zmm, then xmm, each unmasked, masked and
# zero-masked.
# ATT:   vaddbf16 %ymm4, %ymm3, %ymm2
# INTEL: vaddbf16 ymm2, ymm3, ymm4
0x62,0xf5,0x65,0x28,0x58,0xd4

# ATT:   vaddbf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vaddbf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf5,0x65,0x2f,0x58,0xd4

# ATT:   vaddbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vaddbf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf5,0x65,0xaf,0x58,0xd4

# ATT:   vaddbf16 %zmm4, %zmm3, %zmm2
# INTEL: vaddbf16 zmm2, zmm3, zmm4
0x62,0xf5,0x65,0x48,0x58,0xd4

# ATT:   vaddbf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vaddbf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf5,0x65,0x4f,0x58,0xd4

# ATT:   vaddbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vaddbf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf5,0x65,0xcf,0x58,0xd4

# ATT:   vaddbf16 %xmm4, %xmm3, %xmm2
# INTEL: vaddbf16 xmm2, xmm3, xmm4
0x62,0xf5,0x65,0x08,0x58,0xd4

# ATT:   vaddbf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vaddbf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf5,0x65,0x0f,0x58,0xd4

# ATT:   vaddbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vaddbf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf5,0x65,0x8f,0x58,0xd4

# zmm forms with a memory source. The one-byte displacement 0x7f is expected
# to print as 8128, and 0x80 on the {1to32} form as -256.
# ATT:   vaddbf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vaddbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x48,0x58,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vaddbf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vaddbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x4f,0x58,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vaddbf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vaddbf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf5,0x65,0x58,0x58,0x10

# ATT:   vaddbf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vaddbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf5,0x65,0x48,0x58,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vaddbf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vaddbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf5,0x65,0xcf,0x58,0x51,0x7f

# ATT:   vaddbf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vaddbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf5,0x65,0xdf,0x58,0x52,0x80

# ymm forms with a memory source. Here the displacement byte 0x7f is expected
# to print as 4064, and 0x80 on the {1to16} form as -256.
# ATT:   vaddbf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vaddbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x28,0x58,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vaddbf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vaddbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x2f,0x58,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vaddbf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vaddbf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf5,0x65,0x38,0x58,0x10

# ATT:   vaddbf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vaddbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf5,0x65,0x28,0x58,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vaddbf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vaddbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf5,0x65,0xaf,0x58,0x51,0x7f

# ATT:   vaddbf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vaddbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf5,0x65,0xbf,0x58,0x52,0x80

# xmm forms with a memory source. Here the displacement byte 0x7f is expected
# to print as 2032, and 0x80 on the {1to8} form as -256.
# ATT:   vaddbf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vaddbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x08,0x58,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vaddbf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vaddbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x0f,0x58,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vaddbf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vaddbf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf5,0x65,0x18,0x58,0x10

# ATT:   vaddbf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vaddbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf5,0x65,0x08,0x58,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vaddbf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vaddbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf5,0x65,0x8f,0x58,0x51,0x7f

# ATT:   vaddbf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vaddbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf5,0x65,0x9f,0x58,0x52,0x80

# vcmpbf16 test vectors. Every encoding in this group begins 0x62,0xf3,0x67,
# has 0xc2 as its fifth byte, and ends with the immediate byte 0x7b, which is
# expected to print as 123. The destination is always k5, and only the
# unmasked and {%k7} forms appear in this group (there are no {z} cases).
#
# Register-source forms: ymm, xmm, then zmm.
# ATT:   vcmpbf16 $123, %ymm4, %ymm3, %k5
# INTEL: vcmpbf16 k5, ymm3, ymm4, 123
0x62,0xf3,0x67,0x28,0xc2,0xec,0x7b

# ATT:   vcmpbf16 $123, %ymm4, %ymm3, %k5 {%k7}
# INTEL: vcmpbf16 k5 {k7}, ymm3, ymm4, 123
0x62,0xf3,0x67,0x2f,0xc2,0xec,0x7b

# ATT:   vcmpbf16 $123, %xmm4, %xmm3, %k5
# INTEL: vcmpbf16 k5, xmm3, xmm4, 123
0x62,0xf3,0x67,0x08,0xc2,0xec,0x7b

# ATT:   vcmpbf16 $123, %xmm4, %xmm3, %k5 {%k7}
# INTEL: vcmpbf16 k5 {k7}, xmm3, xmm4, 123
0x62,0xf3,0x67,0x0f,0xc2,0xec,0x7b

# ATT:   vcmpbf16 $123, %zmm4, %zmm3, %k5
# INTEL: vcmpbf16 k5, zmm3, zmm4, 123
0x62,0xf3,0x67,0x48,0xc2,0xec,0x7b

# ATT:   vcmpbf16 $123, %zmm4, %zmm3, %k5 {%k7}
# INTEL: vcmpbf16 k5 {k7}, zmm3, zmm4, 123
0x62,0xf3,0x67,0x4f,0xc2,0xec,0x7b

# zmm forms with a memory source. The one-byte displacement 0x7f is expected
# to print as 8128, and 0x80 on the {1to32} form as -256.
# ATT:   vcmpbf16  $123, 268435456(%esp,%esi,8), %zmm3, %k5
# INTEL: vcmpbf16 k5, zmm3, zmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x67,0x48,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b

# ATT:   vcmpbf16  $123, 291(%edi,%eax,4), %zmm3, %k5 {%k7}
# INTEL: vcmpbf16 k5 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x67,0x4f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b

# ATT:   vcmpbf16  $123, (%eax){1to32}, %zmm3, %k5
# INTEL: vcmpbf16 k5, zmm3, word ptr [eax]{1to32}, 123
0x62,0xf3,0x67,0x58,0xc2,0x28,0x7b

# ATT:   vcmpbf16  $123, -2048(,%ebp,2), %zmm3, %k5
# INTEL: vcmpbf16 k5, zmm3, zmmword ptr [2*ebp - 2048], 123
0x62,0xf3,0x67,0x48,0xc2,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b

# ATT:   vcmpbf16  $123, 8128(%ecx), %zmm3, %k5 {%k7}
# INTEL: vcmpbf16 k5 {k7}, zmm3, zmmword ptr [ecx + 8128], 123
0x62,0xf3,0x67,0x4f,0xc2,0x69,0x7f,0x7b

# ATT:   vcmpbf16  $123, -256(%edx){1to32}, %zmm3, %k5 {%k7}
# INTEL: vcmpbf16 k5 {k7}, zmm3, word ptr [edx - 256]{1to32}, 123
0x62,0xf3,0x67,0x5f,0xc2,0x6a,0x80,0x7b

# xmm forms with a memory source. Here the displacement byte 0x7f is expected
# to print as 2032, and 0x80 on the {1to8} form as -256.
# ATT:   vcmpbf16  $123, 268435456(%esp,%esi,8), %xmm3, %k5
# INTEL: vcmpbf16 k5, xmm3, xmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x67,0x08,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b

# ATT:   vcmpbf16  $123, 291(%edi,%eax,4), %xmm3, %k5 {%k7}
# INTEL: vcmpbf16 k5 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x67,0x0f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b

# ATT:   vcmpbf16  $123, (%eax){1to8}, %xmm3, %k5
# INTEL: vcmpbf16 k5, xmm3, word ptr [eax]{1to8}, 123
0x62,0xf3,0x67,0x18,0xc2,0x28,0x7b

# ATT:   vcmpbf16  $123, -512(,%ebp,2), %xmm3, %k5
# INTEL: vcmpbf16 k5, xmm3, xmmword ptr [2*ebp - 512], 123
0x62,0xf3,0x67,0x08,0xc2,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b

# ATT:   vcmpbf16  $123, 2032(%ecx), %xmm3, %k5 {%k7}
# INTEL: vcmpbf16 k5 {k7}, xmm3, xmmword ptr [ecx + 2032], 123
0x62,0xf3,0x67,0x0f,0xc2,0x69,0x7f,0x7b

# ATT:   vcmpbf16  $123, -256(%edx){1to8}, %xmm3, %k5 {%k7}
# INTEL: vcmpbf16 k5 {k7}, xmm3, word ptr [edx - 256]{1to8}, 123
0x62,0xf3,0x67,0x1f,0xc2,0x6a,0x80,0x7b

# ymm forms with a memory source. Here the displacement byte 0x7f is expected
# to print as 4064, and 0x80 on the {1to16} form as -256.
# ATT:   vcmpbf16  $123, 268435456(%esp,%esi,8), %ymm3, %k5
# INTEL: vcmpbf16 k5, ymm3, ymmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x67,0x28,0xc2,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b

# ATT:   vcmpbf16  $123, 291(%edi,%eax,4), %ymm3, %k5 {%k7}
# INTEL: vcmpbf16 k5 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x67,0x2f,0xc2,0xac,0x87,0x23,0x01,0x00,0x00,0x7b

# ATT:   vcmpbf16  $123, (%eax){1to16}, %ymm3, %k5
# INTEL: vcmpbf16 k5, ymm3, word ptr [eax]{1to16}, 123
0x62,0xf3,0x67,0x38,0xc2,0x28,0x7b

# ATT:   vcmpbf16  $123, -1024(,%ebp,2), %ymm3, %k5
# INTEL: vcmpbf16 k5, ymm3, ymmword ptr [2*ebp - 1024], 123
0x62,0xf3,0x67,0x28,0xc2,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b

# ATT:   vcmpbf16  $123, 4064(%ecx), %ymm3, %k5 {%k7}
# INTEL: vcmpbf16 k5 {k7}, ymm3, ymmword ptr [ecx + 4064], 123
0x62,0xf3,0x67,0x2f,0xc2,0x69,0x7f,0x7b

# ATT:   vcmpbf16  $123, -256(%edx){1to16}, %ymm3, %k5 {%k7}
# INTEL: vcmpbf16 k5 {k7}, ymm3, word ptr [edx - 256]{1to16}, 123
0x62,0xf3,0x67,0x3f,0xc2,0x6a,0x80,0x7b

# vcomisbf16 test vectors. All encodings share the first five bytes
# 0x62,0xf5,0x7d,0x08,0x2f; the first operand is always xmm2 and the other
# is xmm3 or a word-sized memory operand. There are no masked or broadcast
# cases in this group. The one-byte displacements 0x7f and 0x80 are expected
# to print as 254 and -256.
# ATT:   vcomisbf16 %xmm3, %xmm2
# INTEL: vcomisbf16 xmm2, xmm3
0x62,0xf5,0x7d,0x08,0x2f,0xd3

# ATT:   vcomisbf16  268435456(%esp,%esi,8), %xmm2
# INTEL: vcomisbf16 xmm2, word ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x7d,0x08,0x2f,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vcomisbf16  291(%edi,%eax,4), %xmm2
# INTEL: vcomisbf16 xmm2, word ptr [edi + 4*eax + 291]
0x62,0xf5,0x7d,0x08,0x2f,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vcomisbf16  (%eax), %xmm2
# INTEL: vcomisbf16 xmm2, word ptr [eax]
0x62,0xf5,0x7d,0x08,0x2f,0x10

# ATT:   vcomisbf16  -64(,%ebp,2), %xmm2
# INTEL: vcomisbf16 xmm2, word ptr [2*ebp - 64]
0x62,0xf5,0x7d,0x08,0x2f,0x14,0x6d,0xc0,0xff,0xff,0xff

# ATT:   vcomisbf16  254(%ecx), %xmm2
# INTEL: vcomisbf16 xmm2, word ptr [ecx + 254]
0x62,0xf5,0x7d,0x08,0x2f,0x51,0x7f

# ATT:   vcomisbf16  -256(%edx), %xmm2
# INTEL: vcomisbf16 xmm2, word ptr [edx - 256]
0x62,0xf5,0x7d,0x08,0x2f,0x52,0x80

# vdivbf16 test vectors. Every encoding in this group begins 0x62,0xf5,0x65
# and has 0x5e as its fifth byte; the fourth byte varies with the vector
# width, the {%k7} / {z} decorations and the {1toN} broadcast forms.
#
# Register-source forms: ymm, zmm, then xmm, each unmasked, masked and
# zero-masked.
# ATT:   vdivbf16 %ymm4, %ymm3, %ymm2
# INTEL: vdivbf16 ymm2, ymm3, ymm4
0x62,0xf5,0x65,0x28,0x5e,0xd4

# ATT:   vdivbf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vdivbf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf5,0x65,0x2f,0x5e,0xd4

# ATT:   vdivbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vdivbf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf5,0x65,0xaf,0x5e,0xd4

# ATT:   vdivbf16 %zmm4, %zmm3, %zmm2
# INTEL: vdivbf16 zmm2, zmm3, zmm4
0x62,0xf5,0x65,0x48,0x5e,0xd4

# ATT:   vdivbf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vdivbf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf5,0x65,0x4f,0x5e,0xd4

# ATT:   vdivbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vdivbf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf5,0x65,0xcf,0x5e,0xd4

# ATT:   vdivbf16 %xmm4, %xmm3, %xmm2
# INTEL: vdivbf16 xmm2, xmm3, xmm4
0x62,0xf5,0x65,0x08,0x5e,0xd4

# ATT:   vdivbf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vdivbf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf5,0x65,0x0f,0x5e,0xd4

# ATT:   vdivbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vdivbf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf5,0x65,0x8f,0x5e,0xd4

# zmm forms with a memory source. The one-byte displacement 0x7f is expected
# to print as 8128, and 0x80 on the {1to32} form as -256.
# ATT:   vdivbf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vdivbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x48,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vdivbf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vdivbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x4f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vdivbf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vdivbf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf5,0x65,0x58,0x5e,0x10

# ATT:   vdivbf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vdivbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf5,0x65,0x48,0x5e,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vdivbf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vdivbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf5,0x65,0xcf,0x5e,0x51,0x7f

# ATT:   vdivbf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vdivbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf5,0x65,0xdf,0x5e,0x52,0x80

# ymm forms with a memory source. Here the displacement byte 0x7f is expected
# to print as 4064, and 0x80 on the {1to16} form as -256.
# ATT:   vdivbf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vdivbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x28,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vdivbf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vdivbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x2f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vdivbf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vdivbf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf5,0x65,0x38,0x5e,0x10

# ATT:   vdivbf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vdivbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf5,0x65,0x28,0x5e,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vdivbf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vdivbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf5,0x65,0xaf,0x5e,0x51,0x7f

# ATT:   vdivbf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vdivbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf5,0x65,0xbf,0x5e,0x52,0x80

# xmm forms with a memory source. Here the displacement byte 0x7f is expected
# to print as 2032, and 0x80 on the {1to8} form as -256.
# ATT:   vdivbf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vdivbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x08,0x5e,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vdivbf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vdivbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x0f,0x5e,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vdivbf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vdivbf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf5,0x65,0x18,0x5e,0x10

# ATT:   vdivbf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vdivbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf5,0x65,0x08,0x5e,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vdivbf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vdivbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf5,0x65,0x8f,0x5e,0x51,0x7f

# ATT:   vdivbf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vdivbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf5,0x65,0x9f,0x5e,0x52,0x80

# vfmadd132bf16 test vectors. Every encoding in this group begins
# 0x62,0xf6,0x64 and has 0x98 as its fifth byte; the fourth byte varies with
# the vector width, the {%k7} / {z} decorations and the {1toN} broadcast
# forms.
#
# Register-source forms: ymm, zmm, then xmm, each unmasked, masked and
# zero-masked.
# ATT:   vfmadd132bf16 %ymm4, %ymm3, %ymm2
# INTEL: vfmadd132bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0x98,0xd4

# ATT:   vfmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vfmadd132bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0x98,0xd4

# ATT:   vfmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmadd132bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0x98,0xd4

# ATT:   vfmadd132bf16 %zmm4, %zmm3, %zmm2
# INTEL: vfmadd132bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0x98,0xd4

# ATT:   vfmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vfmadd132bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0x98,0xd4

# ATT:   vfmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmadd132bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0x98,0xd4

# ATT:   vfmadd132bf16 %xmm4, %xmm3, %xmm2
# INTEL: vfmadd132bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0x98,0xd4

# ATT:   vfmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vfmadd132bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0x98,0xd4

# ATT:   vfmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmadd132bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0x98,0xd4

# zmm forms with a memory source. The one-byte displacement 0x7f is expected
# to print as 8128, and 0x80 on the {1to32} form as -256.
# ATT:   vfmadd132bf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vfmadd132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0x98,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmadd132bf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vfmadd132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0x98,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmadd132bf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vfmadd132bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0x98,0x10

# ATT:   vfmadd132bf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vfmadd132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0x98,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vfmadd132bf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmadd132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0x98,0x51,0x7f

# ATT:   vfmadd132bf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmadd132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0x98,0x52,0x80

# ymm forms with a memory source. Here the displacement byte 0x7f is expected
# to print as 4064, and 0x80 on the {1to16} form as -256.
# ATT:   vfmadd132bf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vfmadd132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0x98,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmadd132bf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vfmadd132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0x98,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmadd132bf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vfmadd132bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0x98,0x10

# ATT:   vfmadd132bf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vfmadd132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0x98,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vfmadd132bf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmadd132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0x98,0x51,0x7f

# ATT:   vfmadd132bf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmadd132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0x98,0x52,0x80

# xmm forms with a memory source. Here the displacement byte 0x7f is expected
# to print as 2032, and 0x80 on the {1to8} form as -256.
# ATT:   vfmadd132bf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vfmadd132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0x98,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmadd132bf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vfmadd132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0x98,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmadd132bf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vfmadd132bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0x98,0x10

# ATT:   vfmadd132bf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vfmadd132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0x98,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vfmadd132bf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmadd132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0x98,0x51,0x7f

# ATT:   vfmadd132bf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmadd132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0x98,0x52,0x80

# vfmadd213bf16 test vectors. Every encoding in this group begins
# 0x62,0xf6,0x64 and has 0xa8 as its fifth byte; the fourth byte varies with
# the vector width, the {%k7} / {z} decorations and the {1toN} broadcast
# forms.
#
# Register-source forms: ymm, zmm, then xmm, each unmasked, masked and
# zero-masked.
# ATT:   vfmadd213bf16 %ymm4, %ymm3, %ymm2
# INTEL: vfmadd213bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0xa8,0xd4

# ATT:   vfmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vfmadd213bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0xa8,0xd4

# ATT:   vfmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmadd213bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0xa8,0xd4

# ATT:   vfmadd213bf16 %zmm4, %zmm3, %zmm2
# INTEL: vfmadd213bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0xa8,0xd4

# ATT:   vfmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vfmadd213bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0xa8,0xd4

# ATT:   vfmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmadd213bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0xa8,0xd4

# ATT:   vfmadd213bf16 %xmm4, %xmm3, %xmm2
# INTEL: vfmadd213bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0xa8,0xd4

# ATT:   vfmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vfmadd213bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0xa8,0xd4

# ATT:   vfmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmadd213bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0xa8,0xd4

# zmm forms with a memory source. The one-byte displacement 0x7f is expected
# to print as 8128, and 0x80 on the {1to32} form as -256.
# ATT:   vfmadd213bf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vfmadd213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmadd213bf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vfmadd213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmadd213bf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vfmadd213bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0xa8,0x10

# ATT:   vfmadd213bf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vfmadd213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0xa8,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vfmadd213bf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmadd213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0xa8,0x51,0x7f

# ATT:   vfmadd213bf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmadd213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0xa8,0x52,0x80

# ymm forms with a memory source. Here the displacement byte 0x7f is expected
# to print as 4064, and 0x80 on the {1to16} form as -256.
# ATT:   vfmadd213bf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vfmadd213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmadd213bf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vfmadd213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmadd213bf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vfmadd213bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0xa8,0x10

# ATT:   vfmadd213bf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vfmadd213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0xa8,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vfmadd213bf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmadd213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0xa8,0x51,0x7f

# ATT:   vfmadd213bf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmadd213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0xa8,0x52,0x80

# xmm forms with a memory source. Here the displacement byte 0x7f is expected
# to print as 2032, and 0x80 on the {1to8} form as -256.
# ATT:   vfmadd213bf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vfmadd213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0xa8,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmadd213bf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vfmadd213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0xa8,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmadd213bf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vfmadd213bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0xa8,0x10

# ATT:   vfmadd213bf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vfmadd213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0xa8,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vfmadd213bf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmadd213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0xa8,0x51,0x7f

# ATT:   vfmadd213bf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmadd213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0xa8,0x52,0x80

# vfmadd231bf16 test vectors. Every encoding in this group begins
# 0x62,0xf6,0x64 and has 0xb8 as its fifth byte; the fourth byte varies with
# the vector width, the {%k7} / {z} decorations and the {1toN} broadcast
# forms.
#
# Register-source forms: ymm, zmm, then xmm, each unmasked, masked and
# zero-masked.
# ATT:   vfmadd231bf16 %ymm4, %ymm3, %ymm2
# INTEL: vfmadd231bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0xb8,0xd4

# ATT:   vfmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vfmadd231bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0xb8,0xd4

# ATT:   vfmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmadd231bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0xb8,0xd4

# ATT:   vfmadd231bf16 %zmm4, %zmm3, %zmm2
# INTEL: vfmadd231bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0xb8,0xd4

# ATT:   vfmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vfmadd231bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0xb8,0xd4

# ATT:   vfmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmadd231bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0xb8,0xd4

# ATT:   vfmadd231bf16 %xmm4, %xmm3, %xmm2
# INTEL: vfmadd231bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0xb8,0xd4

# ATT:   vfmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vfmadd231bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0xb8,0xd4

# ATT:   vfmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmadd231bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0xb8,0xd4

# zmm forms with a memory source. The one-byte displacement 0x7f is expected
# to print as 8128, and 0x80 on the {1to32} form as -256.
# ATT:   vfmadd231bf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vfmadd231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmadd231bf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vfmadd231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmadd231bf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vfmadd231bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0xb8,0x10

# ATT:   vfmadd231bf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vfmadd231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0xb8,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vfmadd231bf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmadd231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0xb8,0x51,0x7f

# ATT:   vfmadd231bf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmadd231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0xb8,0x52,0x80

# ymm forms with a memory source. Here the displacement byte 0x7f is expected
# to print as 4064, and 0x80 on the {1to16} form as -256.
# ATT:   vfmadd231bf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vfmadd231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmadd231bf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vfmadd231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmadd231bf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vfmadd231bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0xb8,0x10

# ATT:   vfmadd231bf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vfmadd231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0xb8,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vfmadd231bf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmadd231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0xb8,0x51,0x7f

# ATT:   vfmadd231bf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmadd231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0xb8,0x52,0x80

# xmm forms with a memory source. Here the displacement byte 0x7f is expected
# to print as 2032, and 0x80 on the {1to8} form as -256.
# ATT:   vfmadd231bf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vfmadd231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0xb8,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmadd231bf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vfmadd231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0xb8,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmadd231bf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vfmadd231bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0xb8,0x10

# ATT:   vfmadd231bf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vfmadd231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0xb8,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vfmadd231bf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmadd231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0xb8,0x51,0x7f

# ATT:   vfmadd231bf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmadd231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0xb8,0x52,0x80

# vfmsub132bf16 test vectors. Every encoding in this group begins
# 0x62,0xf6,0x64 and has 0x9a as its fifth byte; the fourth byte varies with
# the vector width, the {%k7} / {z} decorations and the {1toN} broadcast
# forms.
#
# Register-source forms: ymm, zmm, then xmm, each unmasked, masked and
# zero-masked.
# ATT:   vfmsub132bf16 %ymm4, %ymm3, %ymm2
# INTEL: vfmsub132bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0x9a,0xd4

# ATT:   vfmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vfmsub132bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0x9a,0xd4

# ATT:   vfmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmsub132bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0x9a,0xd4

# ATT:   vfmsub132bf16 %zmm4, %zmm3, %zmm2
# INTEL: vfmsub132bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0x9a,0xd4

# ATT:   vfmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vfmsub132bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0x9a,0xd4

# ATT:   vfmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmsub132bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0x9a,0xd4

# ATT:   vfmsub132bf16 %xmm4, %xmm3, %xmm2
# INTEL: vfmsub132bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0x9a,0xd4

# ATT:   vfmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vfmsub132bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0x9a,0xd4

# ATT:   vfmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmsub132bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0x9a,0xd4

# zmm forms with a memory source. The one-byte displacement 0x7f is expected
# to print as 8128, and 0x80 on the {1to32} form as -256.
# ATT:   vfmsub132bf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vfmsub132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmsub132bf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vfmsub132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmsub132bf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vfmsub132bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0x9a,0x10

# ATT:   vfmsub132bf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vfmsub132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0x9a,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vfmsub132bf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmsub132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0x9a,0x51,0x7f

# ATT:   vfmsub132bf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmsub132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0x9a,0x52,0x80

# ymm forms with a memory source. Here the displacement byte 0x7f is expected
# to print as 4064, and 0x80 on the {1to16} form as -256.
# ATT:   vfmsub132bf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vfmsub132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmsub132bf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vfmsub132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmsub132bf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vfmsub132bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0x9a,0x10

# ATT:   vfmsub132bf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vfmsub132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0x9a,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vfmsub132bf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmsub132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0x9a,0x51,0x7f

# ATT:   vfmsub132bf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmsub132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0x9a,0x52,0x80

# xmm forms with a memory source. Here the displacement byte 0x7f is expected
# to print as 2032, and 0x80 on the {1to8} form as -256.
# ATT:   vfmsub132bf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vfmsub132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0x9a,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmsub132bf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vfmsub132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0x9a,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmsub132bf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vfmsub132bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0x9a,0x10

# ATT:   vfmsub132bf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vfmsub132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0x9a,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vfmsub132bf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmsub132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0x9a,0x51,0x7f

# ATT:   vfmsub132bf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmsub132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0x9a,0x52,0x80

# vfmsub213bf16 test vectors. Every encoding in this group begins
# 0x62,0xf6,0x64 and has 0xaa as its fifth byte; the fourth byte varies with
# the vector width, the {%k7} / {z} decorations and the {1toN} broadcast
# forms.
#
# Register-source forms: ymm, zmm, then xmm, each unmasked, masked and
# zero-masked.
# ATT:   vfmsub213bf16 %ymm4, %ymm3, %ymm2
# INTEL: vfmsub213bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0xaa,0xd4

# ATT:   vfmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vfmsub213bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0xaa,0xd4

# ATT:   vfmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmsub213bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0xaa,0xd4

# ATT:   vfmsub213bf16 %zmm4, %zmm3, %zmm2
# INTEL: vfmsub213bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0xaa,0xd4

# ATT:   vfmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vfmsub213bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0xaa,0xd4

# ATT:   vfmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmsub213bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0xaa,0xd4

# ATT:   vfmsub213bf16 %xmm4, %xmm3, %xmm2
# INTEL: vfmsub213bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0xaa,0xd4

# ATT:   vfmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vfmsub213bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0xaa,0xd4

# ATT:   vfmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmsub213bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0xaa,0xd4

# zmm forms with a memory source. The one-byte displacement 0x7f is expected
# to print as 8128, and 0x80 on the {1to32} form as -256.
# ATT:   vfmsub213bf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vfmsub213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmsub213bf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vfmsub213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmsub213bf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vfmsub213bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0xaa,0x10

# ATT:   vfmsub213bf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vfmsub213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0xaa,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vfmsub213bf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmsub213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0xaa,0x51,0x7f

# ATT:   vfmsub213bf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmsub213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0xaa,0x52,0x80

# ymm forms with a memory source. Here the displacement byte 0x7f is expected
# to print as 4064, and 0x80 on the {1to16} form as -256.
# ATT:   vfmsub213bf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vfmsub213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmsub213bf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vfmsub213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmsub213bf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vfmsub213bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0xaa,0x10

# ATT:   vfmsub213bf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vfmsub213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0xaa,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vfmsub213bf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmsub213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0xaa,0x51,0x7f

# ATT:   vfmsub213bf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmsub213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0xaa,0x52,0x80

# xmm forms with a memory source. Here the displacement byte 0x7f is expected
# to print as 2032, and 0x80 on the {1to8} form as -256.
# ATT:   vfmsub213bf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vfmsub213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0xaa,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmsub213bf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vfmsub213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0xaa,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmsub213bf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vfmsub213bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0xaa,0x10

# ATT:   vfmsub213bf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vfmsub213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0xaa,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vfmsub213bf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmsub213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0xaa,0x51,0x7f

# ATT:   vfmsub213bf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmsub213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0xaa,0x52,0x80

# ATT:   vfmsub231bf16 %ymm4, %ymm3, %ymm2
# INTEL: vfmsub231bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0xba,0xd4

# ATT:   vfmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vfmsub231bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0xba,0xd4

# ATT:   vfmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmsub231bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0xba,0xd4

# ATT:   vfmsub231bf16 %zmm4, %zmm3, %zmm2
# INTEL: vfmsub231bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0xba,0xd4

# ATT:   vfmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vfmsub231bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0xba,0xd4

# ATT:   vfmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmsub231bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0xba,0xd4

# ATT:   vfmsub231bf16 %xmm4, %xmm3, %xmm2
# INTEL: vfmsub231bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0xba,0xd4

# ATT:   vfmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vfmsub231bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0xba,0xd4

# ATT:   vfmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmsub231bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0xba,0xd4

# ATT:   vfmsub231bf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vfmsub231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0xba,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmsub231bf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vfmsub231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0xba,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmsub231bf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vfmsub231bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0xba,0x10

# ATT:   vfmsub231bf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vfmsub231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0xba,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vfmsub231bf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmsub231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0xba,0x51,0x7f

# ATT:   vfmsub231bf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfmsub231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0xba,0x52,0x80

# ATT:   vfmsub231bf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vfmsub231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0xba,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmsub231bf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vfmsub231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0xba,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmsub231bf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vfmsub231bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0xba,0x10

# ATT:   vfmsub231bf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vfmsub231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0xba,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vfmsub231bf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmsub231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0xba,0x51,0x7f

# ATT:   vfmsub231bf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfmsub231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0xba,0x52,0x80

# ATT:   vfmsub231bf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vfmsub231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0xba,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfmsub231bf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vfmsub231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0xba,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfmsub231bf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vfmsub231bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0xba,0x10

# ATT:   vfmsub231bf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vfmsub231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0xba,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vfmsub231bf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmsub231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0xba,0x51,0x7f

# ATT:   vfmsub231bf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfmsub231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0xba,0x52,0x80

# ATT:   vfnmadd132bf16 %ymm4, %ymm3, %ymm2
# INTEL: vfnmadd132bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0x9c,0xd4

# ATT:   vfnmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vfnmadd132bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0x9c,0xd4

# ATT:   vfnmadd132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmadd132bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0x9c,0xd4

# ATT:   vfnmadd132bf16 %zmm4, %zmm3, %zmm2
# INTEL: vfnmadd132bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0x9c,0xd4

# ATT:   vfnmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vfnmadd132bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0x9c,0xd4

# ATT:   vfnmadd132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmadd132bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0x9c,0xd4

# ATT:   vfnmadd132bf16 %xmm4, %xmm3, %xmm2
# INTEL: vfnmadd132bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0x9c,0xd4

# ATT:   vfnmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vfnmadd132bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0x9c,0xd4

# ATT:   vfnmadd132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmadd132bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0x9c,0xd4

# ATT:   vfnmadd132bf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vfnmadd132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmadd132bf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vfnmadd132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmadd132bf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vfnmadd132bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0x9c,0x10

# ATT:   vfnmadd132bf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vfnmadd132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0x9c,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vfnmadd132bf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmadd132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0x9c,0x51,0x7f

# ATT:   vfnmadd132bf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmadd132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0x9c,0x52,0x80

# ATT:   vfnmadd132bf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vfnmadd132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmadd132bf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vfnmadd132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmadd132bf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vfnmadd132bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0x9c,0x10

# ATT:   vfnmadd132bf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vfnmadd132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0x9c,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vfnmadd132bf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmadd132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0x9c,0x51,0x7f

# ATT:   vfnmadd132bf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmadd132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0x9c,0x52,0x80

# ATT:   vfnmadd132bf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vfnmadd132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0x9c,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmadd132bf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vfnmadd132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0x9c,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmadd132bf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vfnmadd132bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0x9c,0x10

# ATT:   vfnmadd132bf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vfnmadd132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0x9c,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vfnmadd132bf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmadd132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0x9c,0x51,0x7f

# ATT:   vfnmadd132bf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmadd132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0x9c,0x52,0x80

# ATT:   vfnmadd213bf16 %ymm4, %ymm3, %ymm2
# INTEL: vfnmadd213bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0xac,0xd4

# ATT:   vfnmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vfnmadd213bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0xac,0xd4

# ATT:   vfnmadd213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmadd213bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0xac,0xd4

# ATT:   vfnmadd213bf16 %zmm4, %zmm3, %zmm2
# INTEL: vfnmadd213bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0xac,0xd4

# ATT:   vfnmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vfnmadd213bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0xac,0xd4

# ATT:   vfnmadd213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmadd213bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0xac,0xd4

# ATT:   vfnmadd213bf16 %xmm4, %xmm3, %xmm2
# INTEL: vfnmadd213bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0xac,0xd4

# ATT:   vfnmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vfnmadd213bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0xac,0xd4

# ATT:   vfnmadd213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmadd213bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0xac,0xd4

# ATT:   vfnmadd213bf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vfnmadd213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0xac,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmadd213bf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vfnmadd213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0xac,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmadd213bf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vfnmadd213bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0xac,0x10

# ATT:   vfnmadd213bf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vfnmadd213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0xac,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vfnmadd213bf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmadd213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0xac,0x51,0x7f

# ATT:   vfnmadd213bf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmadd213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0xac,0x52,0x80

# ATT:   vfnmadd213bf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vfnmadd213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0xac,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmadd213bf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vfnmadd213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0xac,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmadd213bf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vfnmadd213bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0xac,0x10

# ATT:   vfnmadd213bf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vfnmadd213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0xac,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vfnmadd213bf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmadd213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0xac,0x51,0x7f

# ATT:   vfnmadd213bf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmadd213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0xac,0x52,0x80

# ATT:   vfnmadd213bf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vfnmadd213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0xac,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmadd213bf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vfnmadd213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0xac,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmadd213bf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vfnmadd213bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0xac,0x10

# ATT:   vfnmadd213bf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vfnmadd213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0xac,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vfnmadd213bf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmadd213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0xac,0x51,0x7f

# ATT:   vfnmadd213bf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmadd213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0xac,0x52,0x80

# ATT:   vfnmadd231bf16 %ymm4, %ymm3, %ymm2
# INTEL: vfnmadd231bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0xbc,0xd4

# ATT:   vfnmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vfnmadd231bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0xbc,0xd4

# ATT:   vfnmadd231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmadd231bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0xbc,0xd4

# ATT:   vfnmadd231bf16 %zmm4, %zmm3, %zmm2
# INTEL: vfnmadd231bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0xbc,0xd4

# ATT:   vfnmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vfnmadd231bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0xbc,0xd4

# ATT:   vfnmadd231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmadd231bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0xbc,0xd4

# ATT:   vfnmadd231bf16 %xmm4, %xmm3, %xmm2
# INTEL: vfnmadd231bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0xbc,0xd4

# ATT:   vfnmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vfnmadd231bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0xbc,0xd4

# ATT:   vfnmadd231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmadd231bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0xbc,0xd4

# ATT:   vfnmadd231bf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vfnmadd231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmadd231bf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vfnmadd231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmadd231bf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vfnmadd231bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0xbc,0x10

# ATT:   vfnmadd231bf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vfnmadd231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0xbc,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vfnmadd231bf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmadd231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0xbc,0x51,0x7f

# ATT:   vfnmadd231bf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmadd231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0xbc,0x52,0x80

# ATT:   vfnmadd231bf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vfnmadd231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmadd231bf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vfnmadd231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmadd231bf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vfnmadd231bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0xbc,0x10

# ATT:   vfnmadd231bf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vfnmadd231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0xbc,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vfnmadd231bf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmadd231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0xbc,0x51,0x7f

# ATT:   vfnmadd231bf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmadd231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0xbc,0x52,0x80

# ATT:   vfnmadd231bf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vfnmadd231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0xbc,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmadd231bf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vfnmadd231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0xbc,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmadd231bf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vfnmadd231bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0xbc,0x10

# ATT:   vfnmadd231bf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vfnmadd231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0xbc,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vfnmadd231bf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmadd231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0xbc,0x51,0x7f

# ATT:   vfnmadd231bf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmadd231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0xbc,0x52,0x80

# ATT:   vfnmsub132bf16 %ymm4, %ymm3, %ymm2
# INTEL: vfnmsub132bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0x9e,0xd4

# ATT:   vfnmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vfnmsub132bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0x9e,0xd4

# ATT:   vfnmsub132bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmsub132bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0x9e,0xd4

# ATT:   vfnmsub132bf16 %zmm4, %zmm3, %zmm2
# INTEL: vfnmsub132bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0x9e,0xd4

# ATT:   vfnmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vfnmsub132bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0x9e,0xd4

# ATT:   vfnmsub132bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmsub132bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0x9e,0xd4

# ATT:   vfnmsub132bf16 %xmm4, %xmm3, %xmm2
# INTEL: vfnmsub132bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0x9e,0xd4

# ATT:   vfnmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vfnmsub132bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0x9e,0xd4

# ATT:   vfnmsub132bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmsub132bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0x9e,0xd4

# ATT:   vfnmsub132bf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vfnmsub132bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmsub132bf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vfnmsub132bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmsub132bf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vfnmsub132bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0x9e,0x10

# ATT:   vfnmsub132bf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vfnmsub132bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0x9e,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vfnmsub132bf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmsub132bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0x9e,0x51,0x7f

# ATT:   vfnmsub132bf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmsub132bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0x9e,0x52,0x80

# ATT:   vfnmsub132bf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vfnmsub132bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmsub132bf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vfnmsub132bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmsub132bf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vfnmsub132bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0x9e,0x10

# ATT:   vfnmsub132bf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vfnmsub132bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0x9e,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vfnmsub132bf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmsub132bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0x9e,0x51,0x7f

# ATT:   vfnmsub132bf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmsub132bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0x9e,0x52,0x80

# ATT:   vfnmsub132bf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vfnmsub132bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0x9e,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmsub132bf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vfnmsub132bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0x9e,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmsub132bf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vfnmsub132bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0x9e,0x10

# ATT:   vfnmsub132bf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vfnmsub132bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0x9e,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vfnmsub132bf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmsub132bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0x9e,0x51,0x7f

# ATT:   vfnmsub132bf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmsub132bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0x9e,0x52,0x80

# ATT:   vfnmsub213bf16 %ymm4, %ymm3, %ymm2
# INTEL: vfnmsub213bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0xae,0xd4

# ATT:   vfnmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vfnmsub213bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0xae,0xd4

# ATT:   vfnmsub213bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmsub213bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0xae,0xd4

# ATT:   vfnmsub213bf16 %zmm4, %zmm3, %zmm2
# INTEL: vfnmsub213bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0xae,0xd4

# ATT:   vfnmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vfnmsub213bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0xae,0xd4

# ATT:   vfnmsub213bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmsub213bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0xae,0xd4

# ATT:   vfnmsub213bf16 %xmm4, %xmm3, %xmm2
# INTEL: vfnmsub213bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0xae,0xd4

# ATT:   vfnmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vfnmsub213bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0xae,0xd4

# ATT:   vfnmsub213bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmsub213bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0xae,0xd4

# ATT:   vfnmsub213bf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vfnmsub213bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0xae,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmsub213bf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vfnmsub213bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0xae,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmsub213bf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vfnmsub213bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0xae,0x10

# ATT:   vfnmsub213bf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vfnmsub213bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0xae,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vfnmsub213bf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmsub213bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0xae,0x51,0x7f

# ATT:   vfnmsub213bf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmsub213bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0xae,0x52,0x80

# ATT:   vfnmsub213bf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vfnmsub213bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0xae,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmsub213bf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vfnmsub213bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0xae,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmsub213bf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vfnmsub213bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0xae,0x10

# ATT:   vfnmsub213bf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vfnmsub213bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0xae,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vfnmsub213bf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmsub213bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0xae,0x51,0x7f

# ATT:   vfnmsub213bf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmsub213bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0xae,0x52,0x80

# ATT:   vfnmsub213bf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vfnmsub213bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0xae,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmsub213bf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vfnmsub213bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0xae,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmsub213bf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vfnmsub213bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0xae,0x10

# ATT:   vfnmsub213bf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vfnmsub213bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0xae,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vfnmsub213bf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmsub213bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0xae,0x51,0x7f

# ATT:   vfnmsub213bf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmsub213bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0xae,0x52,0x80

# ATT:   vfnmsub231bf16 %ymm4, %ymm3, %ymm2
# INTEL: vfnmsub231bf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0xbe,0xd4

# ATT:   vfnmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vfnmsub231bf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0xbe,0xd4

# ATT:   vfnmsub231bf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmsub231bf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0xbe,0xd4

# ATT:   vfnmsub231bf16 %zmm4, %zmm3, %zmm2
# INTEL: vfnmsub231bf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0xbe,0xd4

# ATT:   vfnmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vfnmsub231bf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0xbe,0xd4

# ATT:   vfnmsub231bf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmsub231bf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0xbe,0xd4

# ATT:   vfnmsub231bf16 %xmm4, %xmm3, %xmm2
# INTEL: vfnmsub231bf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0xbe,0xd4

# ATT:   vfnmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vfnmsub231bf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0xbe,0xd4

# ATT:   vfnmsub231bf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmsub231bf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0xbe,0xd4

# ATT:   vfnmsub231bf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vfnmsub231bf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmsub231bf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vfnmsub231bf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmsub231bf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vfnmsub231bf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0xbe,0x10

# ATT:   vfnmsub231bf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vfnmsub231bf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0xbe,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vfnmsub231bf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmsub231bf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0xbe,0x51,0x7f

# ATT:   vfnmsub231bf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vfnmsub231bf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0xbe,0x52,0x80

# ATT:   vfnmsub231bf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vfnmsub231bf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmsub231bf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vfnmsub231bf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmsub231bf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vfnmsub231bf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0xbe,0x10

# ATT:   vfnmsub231bf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vfnmsub231bf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0xbe,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vfnmsub231bf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmsub231bf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0xbe,0x51,0x7f

# ATT:   vfnmsub231bf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vfnmsub231bf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0xbe,0x52,0x80

# ATT:   vfnmsub231bf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vfnmsub231bf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0xbe,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vfnmsub231bf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vfnmsub231bf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0xbe,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vfnmsub231bf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vfnmsub231bf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0xbe,0x10

# ATT:   vfnmsub231bf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vfnmsub231bf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0xbe,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vfnmsub231bf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmsub231bf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0xbe,0x51,0x7f

# ATT:   vfnmsub231bf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vfnmsub231bf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0xbe,0x52,0x80

# vfpclassbf16 test vectors.
# Every encoding below has opcode byte 0x66 after the four-byte 0x62 prefix
# and ends with the immediate byte 0x7b, printed as 123. The destination is
# mask register k5, shown with and without the {k7} mask.
# Fourth byte: 0x08/0x28/0x48 pairs with xmm/ymm/zmm, the low bits 0x07 pair
# with {k7}, and 0x10 pairs with a {1toN} broadcast operand.
# Register-source forms first (zmm, ymm, xmm).
# ATT:   vfpclassbf16 $123, %zmm3, %k5
# INTEL: vfpclassbf16 k5, zmm3, 123
0x62,0xf3,0x7f,0x48,0x66,0xeb,0x7b

# ATT:   vfpclassbf16 $123, %zmm3, %k5 {%k7}
# INTEL: vfpclassbf16 k5 {k7}, zmm3, 123
0x62,0xf3,0x7f,0x4f,0x66,0xeb,0x7b

# ATT:   vfpclassbf16 $123, %ymm3, %k5
# INTEL: vfpclassbf16 k5, ymm3, 123
0x62,0xf3,0x7f,0x28,0x66,0xeb,0x7b

# ATT:   vfpclassbf16 $123, %ymm3, %k5 {%k7}
# INTEL: vfpclassbf16 k5 {k7}, ymm3, 123
0x62,0xf3,0x7f,0x2f,0x66,0xeb,0x7b

# ATT:   vfpclassbf16 $123, %xmm3, %k5
# INTEL: vfpclassbf16 k5, xmm3, 123
0x62,0xf3,0x7f,0x08,0x66,0xeb,0x7b

# ATT:   vfpclassbf16 $123, %xmm3, %k5 {%k7}
# INTEL: vfpclassbf16 k5 {k7}, xmm3, 123
0x62,0xf3,0x7f,0x0f,0x66,0xeb,0x7b

# Memory-source forms. With a full-vector memory operand the AT&T output
# carries an x/y/z mnemonic suffix, while the Intel-syntax output shows
# xmmword/ymmword/zmmword ptr instead; {1toN} broadcast operands print with
# no suffix. A one-byte displacement prints scaled by the operand size:
# 0x7f appears as 2032/4064/8128 and 0x80 as -256 for the word broadcast.
# ATT:   vfpclassbf16x  $123, 268435456(%esp,%esi,8), %k5
# INTEL: vfpclassbf16 k5, xmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x08,0x66,0xac,0xf4,0x00,0x00,0x00,0x10,0x7b

# ATT:   vfpclassbf16x  $123, 291(%edi,%eax,4), %k5 {%k7}
# INTEL: vfpclassbf16 k5 {k7}, xmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x0f,0x66,0xac,0x87,0x23,0x01,0x00,0x00,0x7b

# ATT:   vfpclassbf16  $123, (%eax){1to8}, %k5
# INTEL: vfpclassbf16 k5, word ptr [eax]{1to8}, 123
0x62,0xf3,0x7f,0x18,0x66,0x28,0x7b

# ATT:   vfpclassbf16x  $123, -512(,%ebp,2), %k5
# INTEL: vfpclassbf16 k5, xmmword ptr [2*ebp - 512], 123
0x62,0xf3,0x7f,0x08,0x66,0x2c,0x6d,0x00,0xfe,0xff,0xff,0x7b

# ATT:   vfpclassbf16x  $123, 2032(%ecx), %k5 {%k7}
# INTEL: vfpclassbf16 k5 {k7}, xmmword ptr [ecx + 2032], 123
0x62,0xf3,0x7f,0x0f,0x66,0x69,0x7f,0x7b

# ATT:   vfpclassbf16  $123, -256(%edx){1to8}, %k5 {%k7}
# INTEL: vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to8}, 123
0x62,0xf3,0x7f,0x1f,0x66,0x6a,0x80,0x7b

# ATT:   vfpclassbf16  $123, (%eax){1to16}, %k5
# INTEL: vfpclassbf16 k5, word ptr [eax]{1to16}, 123
0x62,0xf3,0x7f,0x38,0x66,0x28,0x7b

# ATT:   vfpclassbf16y  $123, -1024(,%ebp,2), %k5
# INTEL: vfpclassbf16 k5, ymmword ptr [2*ebp - 1024], 123
0x62,0xf3,0x7f,0x28,0x66,0x2c,0x6d,0x00,0xfc,0xff,0xff,0x7b

# ATT:   vfpclassbf16y  $123, 4064(%ecx), %k5 {%k7}
# INTEL: vfpclassbf16 k5 {k7}, ymmword ptr [ecx + 4064], 123
0x62,0xf3,0x7f,0x2f,0x66,0x69,0x7f,0x7b

# ATT:   vfpclassbf16  $123, -256(%edx){1to16}, %k5 {%k7}
# INTEL: vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to16}, 123
0x62,0xf3,0x7f,0x3f,0x66,0x6a,0x80,0x7b

# ATT:   vfpclassbf16  $123, (%eax){1to32}, %k5
# INTEL: vfpclassbf16 k5, word ptr [eax]{1to32}, 123
0x62,0xf3,0x7f,0x58,0x66,0x28,0x7b

# ATT:   vfpclassbf16z  $123, -2048(,%ebp,2), %k5
# INTEL: vfpclassbf16 k5, zmmword ptr [2*ebp - 2048], 123
0x62,0xf3,0x7f,0x48,0x66,0x2c,0x6d,0x00,0xf8,0xff,0xff,0x7b

# ATT:   vfpclassbf16z  $123, 8128(%ecx), %k5 {%k7}
# INTEL: vfpclassbf16 k5 {k7}, zmmword ptr [ecx + 8128], 123
0x62,0xf3,0x7f,0x4f,0x66,0x69,0x7f,0x7b

# ATT:   vfpclassbf16  $123, -256(%edx){1to32}, %k5 {%k7}
# INTEL: vfpclassbf16 k5 {k7}, word ptr [edx - 256]{1to32}, 123
0x62,0xf3,0x7f,0x5f,0x66,0x6a,0x80,0x7b

# vgetexpbf16 test vectors (one source, one destination).
# Every encoding below has opcode byte 0x42 after the four-byte 0x62 prefix.
# Fourth byte: 0x08/0x28/0x48 pairs with xmm/ymm/zmm, the low bits 0x07 pair
# with {k7}, 0x80 pairs with {z}, and 0x10 pairs with a {1toN} broadcast.
# Register-source forms first (xmm, zmm, ymm), each unmasked, with {k7},
# and with {k7} {z}.
# ATT:   vgetexpbf16 %xmm3, %xmm2
# INTEL: vgetexpbf16 xmm2, xmm3
0x62,0xf5,0x7d,0x08,0x42,0xd3

# ATT:   vgetexpbf16 %xmm3, %xmm2 {%k7}
# INTEL: vgetexpbf16 xmm2 {k7}, xmm3
0x62,0xf5,0x7d,0x0f,0x42,0xd3

# ATT:   vgetexpbf16 %xmm3, %xmm2 {%k7} {z}
# INTEL: vgetexpbf16 xmm2 {k7} {z}, xmm3
0x62,0xf5,0x7d,0x8f,0x42,0xd3

# ATT:   vgetexpbf16 %zmm3, %zmm2
# INTEL: vgetexpbf16 zmm2, zmm3
0x62,0xf5,0x7d,0x48,0x42,0xd3

# ATT:   vgetexpbf16 %zmm3, %zmm2 {%k7}
# INTEL: vgetexpbf16 zmm2 {k7}, zmm3
0x62,0xf5,0x7d,0x4f,0x42,0xd3

# ATT:   vgetexpbf16 %zmm3, %zmm2 {%k7} {z}
# INTEL: vgetexpbf16 zmm2 {k7} {z}, zmm3
0x62,0xf5,0x7d,0xcf,0x42,0xd3

# ATT:   vgetexpbf16 %ymm3, %ymm2
# INTEL: vgetexpbf16 ymm2, ymm3
0x62,0xf5,0x7d,0x28,0x42,0xd3

# ATT:   vgetexpbf16 %ymm3, %ymm2 {%k7}
# INTEL: vgetexpbf16 ymm2 {k7}, ymm3
0x62,0xf5,0x7d,0x2f,0x42,0xd3

# ATT:   vgetexpbf16 %ymm3, %ymm2 {%k7} {z}
# INTEL: vgetexpbf16 ymm2 {k7} {z}, ymm3
0x62,0xf5,0x7d,0xaf,0x42,0xd3

# Memory-source forms, grouped by destination width (xmm, ymm, zmm).
# A one-byte displacement prints scaled by the operand size: 0x7f appears as
# 2032/4064/8128 for xmmword/ymmword/zmmword operands and 0x80 as -256 for a
# {1toN} word broadcast.
# ATT:   vgetexpbf16  268435456(%esp,%esi,8), %xmm2
# INTEL: vgetexpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x7d,0x08,0x42,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vgetexpbf16  291(%edi,%eax,4), %xmm2 {%k7}
# INTEL: vgetexpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x7d,0x0f,0x42,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vgetexpbf16  (%eax){1to8}, %xmm2
# INTEL: vgetexpbf16 xmm2, word ptr [eax]{1to8}
0x62,0xf5,0x7d,0x18,0x42,0x10

# ATT:   vgetexpbf16  -512(,%ebp,2), %xmm2
# INTEL: vgetexpbf16 xmm2, xmmword ptr [2*ebp - 512]
0x62,0xf5,0x7d,0x08,0x42,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vgetexpbf16  2032(%ecx), %xmm2 {%k7} {z}
# INTEL: vgetexpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
0x62,0xf5,0x7d,0x8f,0x42,0x51,0x7f

# ATT:   vgetexpbf16  -256(%edx){1to8}, %xmm2 {%k7} {z}
# INTEL: vgetexpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
0x62,0xf5,0x7d,0x9f,0x42,0x52,0x80

# ATT:   vgetexpbf16  268435456(%esp,%esi,8), %ymm2
# INTEL: vgetexpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x7d,0x28,0x42,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vgetexpbf16  291(%edi,%eax,4), %ymm2 {%k7}
# INTEL: vgetexpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x7d,0x2f,0x42,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vgetexpbf16  (%eax){1to16}, %ymm2
# INTEL: vgetexpbf16 ymm2, word ptr [eax]{1to16}
0x62,0xf5,0x7d,0x38,0x42,0x10

# ATT:   vgetexpbf16  -1024(,%ebp,2), %ymm2
# INTEL: vgetexpbf16 ymm2, ymmword ptr [2*ebp - 1024]
0x62,0xf5,0x7d,0x28,0x42,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vgetexpbf16  4064(%ecx), %ymm2 {%k7} {z}
# INTEL: vgetexpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
0x62,0xf5,0x7d,0xaf,0x42,0x51,0x7f

# ATT:   vgetexpbf16  -256(%edx){1to16}, %ymm2 {%k7} {z}
# INTEL: vgetexpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
0x62,0xf5,0x7d,0xbf,0x42,0x52,0x80

# ATT:   vgetexpbf16  268435456(%esp,%esi,8), %zmm2
# INTEL: vgetexpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x7d,0x48,0x42,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vgetexpbf16  291(%edi,%eax,4), %zmm2 {%k7}
# INTEL: vgetexpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x7d,0x4f,0x42,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vgetexpbf16  (%eax){1to32}, %zmm2
# INTEL: vgetexpbf16 zmm2, word ptr [eax]{1to32}
0x62,0xf5,0x7d,0x58,0x42,0x10

# ATT:   vgetexpbf16  -2048(,%ebp,2), %zmm2
# INTEL: vgetexpbf16 zmm2, zmmword ptr [2*ebp - 2048]
0x62,0xf5,0x7d,0x48,0x42,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vgetexpbf16  8128(%ecx), %zmm2 {%k7} {z}
# INTEL: vgetexpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
0x62,0xf5,0x7d,0xcf,0x42,0x51,0x7f

# ATT:   vgetexpbf16  -256(%edx){1to32}, %zmm2 {%k7} {z}
# INTEL: vgetexpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
0x62,0xf5,0x7d,0xdf,0x42,0x52,0x80

# vgetmantbf16 test vectors (immediate, one source, one destination).
# Every encoding below has opcode byte 0x26 after the four-byte 0x62 prefix
# and ends with the immediate byte 0x7b, printed as 123.
# Fourth byte: 0x08/0x28/0x48 pairs with xmm/ymm/zmm, the low bits 0x07 pair
# with {k7}, 0x80 pairs with {z}, and 0x10 pairs with a {1toN} broadcast.
# Register-source forms first (zmm, ymm, xmm), each unmasked, with {k7},
# and with {k7} {z}.
# ATT:   vgetmantbf16 $123, %zmm3, %zmm2
# INTEL: vgetmantbf16 zmm2, zmm3, 123
0x62,0xf3,0x7f,0x48,0x26,0xd3,0x7b

# ATT:   vgetmantbf16 $123, %zmm3, %zmm2 {%k7}
# INTEL: vgetmantbf16 zmm2 {k7}, zmm3, 123
0x62,0xf3,0x7f,0x4f,0x26,0xd3,0x7b

# ATT:   vgetmantbf16 $123, %zmm3, %zmm2 {%k7} {z}
# INTEL: vgetmantbf16 zmm2 {k7} {z}, zmm3, 123
0x62,0xf3,0x7f,0xcf,0x26,0xd3,0x7b

# ATT:   vgetmantbf16 $123, %ymm3, %ymm2
# INTEL: vgetmantbf16 ymm2, ymm3, 123
0x62,0xf3,0x7f,0x28,0x26,0xd3,0x7b

# ATT:   vgetmantbf16 $123, %ymm3, %ymm2 {%k7}
# INTEL: vgetmantbf16 ymm2 {k7}, ymm3, 123
0x62,0xf3,0x7f,0x2f,0x26,0xd3,0x7b

# ATT:   vgetmantbf16 $123, %ymm3, %ymm2 {%k7} {z}
# INTEL: vgetmantbf16 ymm2 {k7} {z}, ymm3, 123
0x62,0xf3,0x7f,0xaf,0x26,0xd3,0x7b

# ATT:   vgetmantbf16 $123, %xmm3, %xmm2
# INTEL: vgetmantbf16 xmm2, xmm3, 123
0x62,0xf3,0x7f,0x08,0x26,0xd3,0x7b

# ATT:   vgetmantbf16 $123, %xmm3, %xmm2 {%k7}
# INTEL: vgetmantbf16 xmm2 {k7}, xmm3, 123
0x62,0xf3,0x7f,0x0f,0x26,0xd3,0x7b

# ATT:   vgetmantbf16 $123, %xmm3, %xmm2 {%k7} {z}
# INTEL: vgetmantbf16 xmm2 {k7} {z}, xmm3, 123
0x62,0xf3,0x7f,0x8f,0x26,0xd3,0x7b

# Memory-source forms, grouped by destination width (xmm, ymm, zmm).
# A one-byte displacement prints scaled by the operand size: 0x7f appears as
# 2032/4064/8128 for xmmword/ymmword/zmmword operands and 0x80 as -256 for a
# {1toN} word broadcast.
# ATT:   vgetmantbf16  $123, 268435456(%esp,%esi,8), %xmm2
# INTEL: vgetmantbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x08,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b

# ATT:   vgetmantbf16  $123, 291(%edi,%eax,4), %xmm2 {%k7}
# INTEL: vgetmantbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x0f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b

# ATT:   vgetmantbf16  $123, (%eax){1to8}, %xmm2
# INTEL: vgetmantbf16 xmm2, word ptr [eax]{1to8}, 123
0x62,0xf3,0x7f,0x18,0x26,0x10,0x7b

# ATT:   vgetmantbf16  $123, -512(,%ebp,2), %xmm2
# INTEL: vgetmantbf16 xmm2, xmmword ptr [2*ebp - 512], 123
0x62,0xf3,0x7f,0x08,0x26,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b

# ATT:   vgetmantbf16  $123, 2032(%ecx), %xmm2 {%k7} {z}
# INTEL: vgetmantbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
0x62,0xf3,0x7f,0x8f,0x26,0x51,0x7f,0x7b

# ATT:   vgetmantbf16  $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
# INTEL: vgetmantbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
0x62,0xf3,0x7f,0x9f,0x26,0x52,0x80,0x7b

# ATT:   vgetmantbf16  $123, 268435456(%esp,%esi,8), %ymm2
# INTEL: vgetmantbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x28,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b

# ATT:   vgetmantbf16  $123, 291(%edi,%eax,4), %ymm2 {%k7}
# INTEL: vgetmantbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x2f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b

# ATT:   vgetmantbf16  $123, (%eax){1to16}, %ymm2
# INTEL: vgetmantbf16 ymm2, word ptr [eax]{1to16}, 123
0x62,0xf3,0x7f,0x38,0x26,0x10,0x7b

# ATT:   vgetmantbf16  $123, -1024(,%ebp,2), %ymm2
# INTEL: vgetmantbf16 ymm2, ymmword ptr [2*ebp - 1024], 123
0x62,0xf3,0x7f,0x28,0x26,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b

# ATT:   vgetmantbf16  $123, 4064(%ecx), %ymm2 {%k7} {z}
# INTEL: vgetmantbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
0x62,0xf3,0x7f,0xaf,0x26,0x51,0x7f,0x7b

# ATT:   vgetmantbf16  $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
# INTEL: vgetmantbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
0x62,0xf3,0x7f,0xbf,0x26,0x52,0x80,0x7b

# ATT:   vgetmantbf16  $123, 268435456(%esp,%esi,8), %zmm2
# INTEL: vgetmantbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x48,0x26,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b

# ATT:   vgetmantbf16  $123, 291(%edi,%eax,4), %zmm2 {%k7}
# INTEL: vgetmantbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x4f,0x26,0x94,0x87,0x23,0x01,0x00,0x00,0x7b

# ATT:   vgetmantbf16  $123, (%eax){1to32}, %zmm2
# INTEL: vgetmantbf16 zmm2, word ptr [eax]{1to32}, 123
0x62,0xf3,0x7f,0x58,0x26,0x10,0x7b

# ATT:   vgetmantbf16  $123, -2048(,%ebp,2), %zmm2
# INTEL: vgetmantbf16 zmm2, zmmword ptr [2*ebp - 2048], 123
0x62,0xf3,0x7f,0x48,0x26,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b

# ATT:   vgetmantbf16  $123, 8128(%ecx), %zmm2 {%k7} {z}
# INTEL: vgetmantbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
0x62,0xf3,0x7f,0xcf,0x26,0x51,0x7f,0x7b

# ATT:   vgetmantbf16  $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
# INTEL: vgetmantbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
0x62,0xf3,0x7f,0xdf,0x26,0x52,0x80,0x7b

# vmaxbf16 test vectors (two sources, one destination).
# Every encoding below has opcode byte 0x5f after the four-byte 0x62 prefix.
# Fourth byte: 0x08/0x28/0x48 pairs with xmm/ymm/zmm, the low bits 0x07 pair
# with {k7}, 0x80 pairs with {z}, and 0x10 pairs with a {1toN} broadcast.
# Register-source forms first (ymm, zmm, xmm), each unmasked, with {k7},
# and with {k7} {z}.
# ATT:   vmaxbf16 %ymm4, %ymm3, %ymm2
# INTEL: vmaxbf16 ymm2, ymm3, ymm4
0x62,0xf5,0x65,0x28,0x5f,0xd4

# ATT:   vmaxbf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vmaxbf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf5,0x65,0x2f,0x5f,0xd4

# ATT:   vmaxbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vmaxbf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf5,0x65,0xaf,0x5f,0xd4

# ATT:   vmaxbf16 %zmm4, %zmm3, %zmm2
# INTEL: vmaxbf16 zmm2, zmm3, zmm4
0x62,0xf5,0x65,0x48,0x5f,0xd4

# ATT:   vmaxbf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vmaxbf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf5,0x65,0x4f,0x5f,0xd4

# ATT:   vmaxbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vmaxbf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf5,0x65,0xcf,0x5f,0xd4

# ATT:   vmaxbf16 %xmm4, %xmm3, %xmm2
# INTEL: vmaxbf16 xmm2, xmm3, xmm4
0x62,0xf5,0x65,0x08,0x5f,0xd4

# ATT:   vmaxbf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vmaxbf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf5,0x65,0x0f,0x5f,0xd4

# ATT:   vmaxbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vmaxbf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf5,0x65,0x8f,0x5f,0xd4

# Memory-source forms, grouped by destination width (zmm, ymm, xmm).
# A one-byte displacement prints scaled by the operand size: 0x7f appears as
# 8128/4064/2032 for zmmword/ymmword/xmmword operands and 0x80 as -256 for a
# {1toN} word broadcast.
# ATT:   vmaxbf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vmaxbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x48,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vmaxbf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vmaxbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x4f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vmaxbf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vmaxbf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf5,0x65,0x58,0x5f,0x10

# ATT:   vmaxbf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vmaxbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf5,0x65,0x48,0x5f,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vmaxbf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vmaxbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf5,0x65,0xcf,0x5f,0x51,0x7f

# ATT:   vmaxbf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vmaxbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf5,0x65,0xdf,0x5f,0x52,0x80

# ATT:   vmaxbf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vmaxbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x28,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vmaxbf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vmaxbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x2f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vmaxbf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vmaxbf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf5,0x65,0x38,0x5f,0x10

# ATT:   vmaxbf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vmaxbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf5,0x65,0x28,0x5f,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vmaxbf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vmaxbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf5,0x65,0xaf,0x5f,0x51,0x7f

# ATT:   vmaxbf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vmaxbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf5,0x65,0xbf,0x5f,0x52,0x80

# ATT:   vmaxbf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vmaxbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x08,0x5f,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vmaxbf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vmaxbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x0f,0x5f,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vmaxbf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vmaxbf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf5,0x65,0x18,0x5f,0x10

# ATT:   vmaxbf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vmaxbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf5,0x65,0x08,0x5f,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vmaxbf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vmaxbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf5,0x65,0x8f,0x5f,0x51,0x7f

# ATT:   vmaxbf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vmaxbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf5,0x65,0x9f,0x5f,0x52,0x80

# vminbf16 test vectors (two sources, one destination).
# Every encoding below has opcode byte 0x5d after the four-byte 0x62 prefix.
# Fourth byte: 0x08/0x28/0x48 pairs with xmm/ymm/zmm, the low bits 0x07 pair
# with {k7}, 0x80 pairs with {z}, and 0x10 pairs with a {1toN} broadcast.
# Register-source forms first (ymm, zmm, xmm), each unmasked, with {k7},
# and with {k7} {z}.
# ATT:   vminbf16 %ymm4, %ymm3, %ymm2
# INTEL: vminbf16 ymm2, ymm3, ymm4
0x62,0xf5,0x65,0x28,0x5d,0xd4

# ATT:   vminbf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vminbf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf5,0x65,0x2f,0x5d,0xd4

# ATT:   vminbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vminbf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf5,0x65,0xaf,0x5d,0xd4

# ATT:   vminbf16 %zmm4, %zmm3, %zmm2
# INTEL: vminbf16 zmm2, zmm3, zmm4
0x62,0xf5,0x65,0x48,0x5d,0xd4

# ATT:   vminbf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vminbf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf5,0x65,0x4f,0x5d,0xd4

# ATT:   vminbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vminbf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf5,0x65,0xcf,0x5d,0xd4

# ATT:   vminbf16 %xmm4, %xmm3, %xmm2
# INTEL: vminbf16 xmm2, xmm3, xmm4
0x62,0xf5,0x65,0x08,0x5d,0xd4

# ATT:   vminbf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vminbf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf5,0x65,0x0f,0x5d,0xd4

# ATT:   vminbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vminbf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf5,0x65,0x8f,0x5d,0xd4

# Memory-source forms, grouped by destination width (zmm, ymm, xmm).
# A one-byte displacement prints scaled by the operand size: 0x7f appears as
# 8128/4064/2032 for zmmword/ymmword/xmmword operands and 0x80 as -256 for a
# {1toN} word broadcast.
# ATT:   vminbf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vminbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x48,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vminbf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vminbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x4f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vminbf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vminbf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf5,0x65,0x58,0x5d,0x10

# ATT:   vminbf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vminbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf5,0x65,0x48,0x5d,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vminbf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vminbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf5,0x65,0xcf,0x5d,0x51,0x7f

# ATT:   vminbf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vminbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf5,0x65,0xdf,0x5d,0x52,0x80

# ATT:   vminbf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vminbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x28,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vminbf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vminbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x2f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vminbf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vminbf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf5,0x65,0x38,0x5d,0x10

# ATT:   vminbf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vminbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf5,0x65,0x28,0x5d,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vminbf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vminbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf5,0x65,0xaf,0x5d,0x51,0x7f

# ATT:   vminbf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vminbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf5,0x65,0xbf,0x5d,0x52,0x80

# ATT:   vminbf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vminbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x08,0x5d,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vminbf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vminbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x0f,0x5d,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vminbf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vminbf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf5,0x65,0x18,0x5d,0x10

# ATT:   vminbf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vminbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf5,0x65,0x08,0x5d,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vminbf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vminbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf5,0x65,0x8f,0x5d,0x51,0x7f

# ATT:   vminbf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vminbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf5,0x65,0x9f,0x5d,0x52,0x80

# vmulbf16 test vectors (two sources, one destination).
# Every encoding below has opcode byte 0x59 after the four-byte 0x62 prefix.
# Fourth byte: 0x08/0x28/0x48 pairs with xmm/ymm/zmm, the low bits 0x07 pair
# with {k7}, 0x80 pairs with {z}, and 0x10 pairs with a {1toN} broadcast.
# Register-source forms first (ymm, zmm, xmm), each unmasked, with {k7},
# and with {k7} {z}.
# ATT:   vmulbf16 %ymm4, %ymm3, %ymm2
# INTEL: vmulbf16 ymm2, ymm3, ymm4
0x62,0xf5,0x65,0x28,0x59,0xd4

# ATT:   vmulbf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vmulbf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf5,0x65,0x2f,0x59,0xd4

# ATT:   vmulbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vmulbf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf5,0x65,0xaf,0x59,0xd4

# ATT:   vmulbf16 %zmm4, %zmm3, %zmm2
# INTEL: vmulbf16 zmm2, zmm3, zmm4
0x62,0xf5,0x65,0x48,0x59,0xd4

# ATT:   vmulbf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vmulbf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf5,0x65,0x4f,0x59,0xd4

# ATT:   vmulbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vmulbf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf5,0x65,0xcf,0x59,0xd4

# ATT:   vmulbf16 %xmm4, %xmm3, %xmm2
# INTEL: vmulbf16 xmm2, xmm3, xmm4
0x62,0xf5,0x65,0x08,0x59,0xd4

# ATT:   vmulbf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vmulbf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf5,0x65,0x0f,0x59,0xd4

# ATT:   vmulbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vmulbf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf5,0x65,0x8f,0x59,0xd4

# Memory-source forms, grouped by destination width (zmm, ymm, xmm).
# A one-byte displacement prints scaled by the operand size: 0x7f appears as
# 8128/4064/2032 for zmmword/ymmword/xmmword operands and 0x80 as -256 for a
# {1toN} word broadcast.
# ATT:   vmulbf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vmulbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x48,0x59,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vmulbf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vmulbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x4f,0x59,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vmulbf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vmulbf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf5,0x65,0x58,0x59,0x10

# ATT:   vmulbf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vmulbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf5,0x65,0x48,0x59,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vmulbf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vmulbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf5,0x65,0xcf,0x59,0x51,0x7f

# ATT:   vmulbf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vmulbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf5,0x65,0xdf,0x59,0x52,0x80

# ATT:   vmulbf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vmulbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x28,0x59,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vmulbf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vmulbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x2f,0x59,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vmulbf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vmulbf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf5,0x65,0x38,0x59,0x10

# ATT:   vmulbf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vmulbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf5,0x65,0x28,0x59,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vmulbf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vmulbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf5,0x65,0xaf,0x59,0x51,0x7f

# ATT:   vmulbf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vmulbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf5,0x65,0xbf,0x59,0x52,0x80

# ATT:   vmulbf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vmulbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x08,0x59,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vmulbf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vmulbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x0f,0x59,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vmulbf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vmulbf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf5,0x65,0x18,0x59,0x10

# ATT:   vmulbf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vmulbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf5,0x65,0x08,0x59,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vmulbf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vmulbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf5,0x65,0x8f,0x59,0x51,0x7f

# ATT:   vmulbf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vmulbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf5,0x65,0x9f,0x59,0x52,0x80

# vrcpbf16 test vectors (one source, one destination).
# Every encoding below has opcode byte 0x4c after the four-byte 0x62 prefix.
# Fourth byte: 0x08/0x28/0x48 pairs with xmm/ymm/zmm, the low bits 0x07 pair
# with {k7}, 0x80 pairs with {z}, and 0x10 pairs with a {1toN} broadcast.
# Register-source forms first (xmm, zmm, ymm), each unmasked, with {k7},
# and with {k7} {z}.
# ATT:   vrcpbf16 %xmm3, %xmm2
# INTEL: vrcpbf16 xmm2, xmm3
0x62,0xf6,0x7c,0x08,0x4c,0xd3

# ATT:   vrcpbf16 %xmm3, %xmm2 {%k7}
# INTEL: vrcpbf16 xmm2 {k7}, xmm3
0x62,0xf6,0x7c,0x0f,0x4c,0xd3

# ATT:   vrcpbf16 %xmm3, %xmm2 {%k7} {z}
# INTEL: vrcpbf16 xmm2 {k7} {z}, xmm3
0x62,0xf6,0x7c,0x8f,0x4c,0xd3

# ATT:   vrcpbf16 %zmm3, %zmm2
# INTEL: vrcpbf16 zmm2, zmm3
0x62,0xf6,0x7c,0x48,0x4c,0xd3

# ATT:   vrcpbf16 %zmm3, %zmm2 {%k7}
# INTEL: vrcpbf16 zmm2 {k7}, zmm3
0x62,0xf6,0x7c,0x4f,0x4c,0xd3

# ATT:   vrcpbf16 %zmm3, %zmm2 {%k7} {z}
# INTEL: vrcpbf16 zmm2 {k7} {z}, zmm3
0x62,0xf6,0x7c,0xcf,0x4c,0xd3

# ATT:   vrcpbf16 %ymm3, %ymm2
# INTEL: vrcpbf16 ymm2, ymm3
0x62,0xf6,0x7c,0x28,0x4c,0xd3

# ATT:   vrcpbf16 %ymm3, %ymm2 {%k7}
# INTEL: vrcpbf16 ymm2 {k7}, ymm3
0x62,0xf6,0x7c,0x2f,0x4c,0xd3

# ATT:   vrcpbf16 %ymm3, %ymm2 {%k7} {z}
# INTEL: vrcpbf16 ymm2 {k7} {z}, ymm3
0x62,0xf6,0x7c,0xaf,0x4c,0xd3

# Memory-source forms, grouped by destination width (xmm, ymm, zmm).
# A one-byte displacement prints scaled by the operand size: 0x7f appears as
# 2032/4064/8128 for xmmword/ymmword/zmmword operands and 0x80 as -256 for a
# {1toN} word broadcast.
# ATT:   vrcpbf16  268435456(%esp,%esi,8), %xmm2
# INTEL: vrcpbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x7c,0x08,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vrcpbf16  291(%edi,%eax,4), %xmm2 {%k7}
# INTEL: vrcpbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x7c,0x0f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vrcpbf16  (%eax){1to8}, %xmm2
# INTEL: vrcpbf16 xmm2, word ptr [eax]{1to8}
0x62,0xf6,0x7c,0x18,0x4c,0x10

# ATT:   vrcpbf16  -512(,%ebp,2), %xmm2
# INTEL: vrcpbf16 xmm2, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x7c,0x08,0x4c,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vrcpbf16  2032(%ecx), %xmm2 {%k7} {z}
# INTEL: vrcpbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
0x62,0xf6,0x7c,0x8f,0x4c,0x51,0x7f

# ATT:   vrcpbf16  -256(%edx){1to8}, %xmm2 {%k7} {z}
# INTEL: vrcpbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
0x62,0xf6,0x7c,0x9f,0x4c,0x52,0x80

# ATT:   vrcpbf16  268435456(%esp,%esi,8), %ymm2
# INTEL: vrcpbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x7c,0x28,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vrcpbf16  291(%edi,%eax,4), %ymm2 {%k7}
# INTEL: vrcpbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x7c,0x2f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vrcpbf16  (%eax){1to16}, %ymm2
# INTEL: vrcpbf16 ymm2, word ptr [eax]{1to16}
0x62,0xf6,0x7c,0x38,0x4c,0x10

# ATT:   vrcpbf16  -1024(,%ebp,2), %ymm2
# INTEL: vrcpbf16 ymm2, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x7c,0x28,0x4c,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vrcpbf16  4064(%ecx), %ymm2 {%k7} {z}
# INTEL: vrcpbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
0x62,0xf6,0x7c,0xaf,0x4c,0x51,0x7f

# ATT:   vrcpbf16  -256(%edx){1to16}, %ymm2 {%k7} {z}
# INTEL: vrcpbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
0x62,0xf6,0x7c,0xbf,0x4c,0x52,0x80

# ATT:   vrcpbf16  268435456(%esp,%esi,8), %zmm2
# INTEL: vrcpbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x7c,0x48,0x4c,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vrcpbf16  291(%edi,%eax,4), %zmm2 {%k7}
# INTEL: vrcpbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x7c,0x4f,0x4c,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vrcpbf16  (%eax){1to32}, %zmm2
# INTEL: vrcpbf16 zmm2, word ptr [eax]{1to32}
0x62,0xf6,0x7c,0x58,0x4c,0x10

# ATT:   vrcpbf16  -2048(,%ebp,2), %zmm2
# INTEL: vrcpbf16 zmm2, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x7c,0x48,0x4c,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vrcpbf16  8128(%ecx), %zmm2 {%k7} {z}
# INTEL: vrcpbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
0x62,0xf6,0x7c,0xcf,0x4c,0x51,0x7f

# ATT:   vrcpbf16  -256(%edx){1to32}, %zmm2 {%k7} {z}
# INTEL: vrcpbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
0x62,0xf6,0x7c,0xdf,0x4c,0x52,0x80

# vreducebf16 test vectors (immediate, one source, one destination).
# Every encoding below has opcode byte 0x56 after the four-byte 0x62 prefix
# and ends with the immediate byte 0x7b, printed as 123.
# Fourth byte: 0x08/0x28/0x48 pairs with xmm/ymm/zmm, the low bits 0x07 pair
# with {k7}, 0x80 pairs with {z}, and 0x10 pairs with a {1toN} broadcast.
# Register-source forms first (zmm, ymm, xmm), each unmasked, with {k7},
# and with {k7} {z}.
# ATT:   vreducebf16 $123, %zmm3, %zmm2
# INTEL: vreducebf16 zmm2, zmm3, 123
0x62,0xf3,0x7f,0x48,0x56,0xd3,0x7b

# ATT:   vreducebf16 $123, %zmm3, %zmm2 {%k7}
# INTEL: vreducebf16 zmm2 {k7}, zmm3, 123
0x62,0xf3,0x7f,0x4f,0x56,0xd3,0x7b

# ATT:   vreducebf16 $123, %zmm3, %zmm2 {%k7} {z}
# INTEL: vreducebf16 zmm2 {k7} {z}, zmm3, 123
0x62,0xf3,0x7f,0xcf,0x56,0xd3,0x7b

# ATT:   vreducebf16 $123, %ymm3, %ymm2
# INTEL: vreducebf16 ymm2, ymm3, 123
0x62,0xf3,0x7f,0x28,0x56,0xd3,0x7b

# ATT:   vreducebf16 $123, %ymm3, %ymm2 {%k7}
# INTEL: vreducebf16 ymm2 {k7}, ymm3, 123
0x62,0xf3,0x7f,0x2f,0x56,0xd3,0x7b

# ATT:   vreducebf16 $123, %ymm3, %ymm2 {%k7} {z}
# INTEL: vreducebf16 ymm2 {k7} {z}, ymm3, 123
0x62,0xf3,0x7f,0xaf,0x56,0xd3,0x7b

# ATT:   vreducebf16 $123, %xmm3, %xmm2
# INTEL: vreducebf16 xmm2, xmm3, 123
0x62,0xf3,0x7f,0x08,0x56,0xd3,0x7b

# ATT:   vreducebf16 $123, %xmm3, %xmm2 {%k7}
# INTEL: vreducebf16 xmm2 {k7}, xmm3, 123
0x62,0xf3,0x7f,0x0f,0x56,0xd3,0x7b

# ATT:   vreducebf16 $123, %xmm3, %xmm2 {%k7} {z}
# INTEL: vreducebf16 xmm2 {k7} {z}, xmm3, 123
0x62,0xf3,0x7f,0x8f,0x56,0xd3,0x7b

# Memory-source forms, grouped by destination width (xmm, ymm, zmm).
# A one-byte displacement prints scaled by the operand size: 0x7f appears as
# 2032/4064/8128 for xmmword/ymmword/zmmword operands and 0x80 as -256 for a
# {1toN} word broadcast.
# ATT:   vreducebf16  $123, 268435456(%esp,%esi,8), %xmm2
# INTEL: vreducebf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x08,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b

# ATT:   vreducebf16  $123, 291(%edi,%eax,4), %xmm2 {%k7}
# INTEL: vreducebf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x0f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b

# ATT:   vreducebf16  $123, (%eax){1to8}, %xmm2
# INTEL: vreducebf16 xmm2, word ptr [eax]{1to8}, 123
0x62,0xf3,0x7f,0x18,0x56,0x10,0x7b

# ATT:   vreducebf16  $123, -512(,%ebp,2), %xmm2
# INTEL: vreducebf16 xmm2, xmmword ptr [2*ebp - 512], 123
0x62,0xf3,0x7f,0x08,0x56,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b

# ATT:   vreducebf16  $123, 2032(%ecx), %xmm2 {%k7} {z}
# INTEL: vreducebf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
0x62,0xf3,0x7f,0x8f,0x56,0x51,0x7f,0x7b

# ATT:   vreducebf16  $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
# INTEL: vreducebf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
0x62,0xf3,0x7f,0x9f,0x56,0x52,0x80,0x7b

# ATT:   vreducebf16  $123, 268435456(%esp,%esi,8), %ymm2
# INTEL: vreducebf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x28,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b

# ATT:   vreducebf16  $123, 291(%edi,%eax,4), %ymm2 {%k7}
# INTEL: vreducebf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x2f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b

# ATT:   vreducebf16  $123, (%eax){1to16}, %ymm2
# INTEL: vreducebf16 ymm2, word ptr [eax]{1to16}, 123
0x62,0xf3,0x7f,0x38,0x56,0x10,0x7b

# ATT:   vreducebf16  $123, -1024(,%ebp,2), %ymm2
# INTEL: vreducebf16 ymm2, ymmword ptr [2*ebp - 1024], 123
0x62,0xf3,0x7f,0x28,0x56,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b

# ATT:   vreducebf16  $123, 4064(%ecx), %ymm2 {%k7} {z}
# INTEL: vreducebf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
0x62,0xf3,0x7f,0xaf,0x56,0x51,0x7f,0x7b

# ATT:   vreducebf16  $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
# INTEL: vreducebf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
0x62,0xf3,0x7f,0xbf,0x56,0x52,0x80,0x7b

# ATT:   vreducebf16  $123, 268435456(%esp,%esi,8), %zmm2
# INTEL: vreducebf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x48,0x56,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b

# ATT:   vreducebf16  $123, 291(%edi,%eax,4), %zmm2 {%k7}
# INTEL: vreducebf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x4f,0x56,0x94,0x87,0x23,0x01,0x00,0x00,0x7b

# ATT:   vreducebf16  $123, (%eax){1to32}, %zmm2
# INTEL: vreducebf16 zmm2, word ptr [eax]{1to32}, 123
0x62,0xf3,0x7f,0x58,0x56,0x10,0x7b

# ATT:   vreducebf16  $123, -2048(,%ebp,2), %zmm2
# INTEL: vreducebf16 zmm2, zmmword ptr [2*ebp - 2048], 123
0x62,0xf3,0x7f,0x48,0x56,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b

# ATT:   vreducebf16  $123, 8128(%ecx), %zmm2 {%k7} {z}
# INTEL: vreducebf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
0x62,0xf3,0x7f,0xcf,0x56,0x51,0x7f,0x7b

# ATT:   vreducebf16  $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
# INTEL: vreducebf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
0x62,0xf3,0x7f,0xdf,0x56,0x52,0x80,0x7b

# vrndscalebf16 test vectors (immediate, one source, one destination).
# Every encoding below has opcode byte 0x08 after the four-byte 0x62 prefix
# and ends with the immediate byte 0x7b, printed as 123. Note that the
# fourth byte of the xmm unmasked forms is also 0x08.
# Fourth byte: 0x08/0x28/0x48 pairs with xmm/ymm/zmm, the low bits 0x07 pair
# with {k7}, 0x80 pairs with {z}, and 0x10 pairs with a {1toN} broadcast.
# Register-source forms first (zmm, ymm, xmm), each unmasked, with {k7},
# and with {k7} {z}.
# ATT:   vrndscalebf16 $123, %zmm3, %zmm2
# INTEL: vrndscalebf16 zmm2, zmm3, 123
0x62,0xf3,0x7f,0x48,0x08,0xd3,0x7b

# ATT:   vrndscalebf16 $123, %zmm3, %zmm2 {%k7}
# INTEL: vrndscalebf16 zmm2 {k7}, zmm3, 123
0x62,0xf3,0x7f,0x4f,0x08,0xd3,0x7b

# ATT:   vrndscalebf16 $123, %zmm3, %zmm2 {%k7} {z}
# INTEL: vrndscalebf16 zmm2 {k7} {z}, zmm3, 123
0x62,0xf3,0x7f,0xcf,0x08,0xd3,0x7b

# ATT:   vrndscalebf16 $123, %ymm3, %ymm2
# INTEL: vrndscalebf16 ymm2, ymm3, 123
0x62,0xf3,0x7f,0x28,0x08,0xd3,0x7b

# ATT:   vrndscalebf16 $123, %ymm3, %ymm2 {%k7}
# INTEL: vrndscalebf16 ymm2 {k7}, ymm3, 123
0x62,0xf3,0x7f,0x2f,0x08,0xd3,0x7b

# ATT:   vrndscalebf16 $123, %ymm3, %ymm2 {%k7} {z}
# INTEL: vrndscalebf16 ymm2 {k7} {z}, ymm3, 123
0x62,0xf3,0x7f,0xaf,0x08,0xd3,0x7b

# ATT:   vrndscalebf16 $123, %xmm3, %xmm2
# INTEL: vrndscalebf16 xmm2, xmm3, 123
0x62,0xf3,0x7f,0x08,0x08,0xd3,0x7b

# ATT:   vrndscalebf16 $123, %xmm3, %xmm2 {%k7}
# INTEL: vrndscalebf16 xmm2 {k7}, xmm3, 123
0x62,0xf3,0x7f,0x0f,0x08,0xd3,0x7b

# ATT:   vrndscalebf16 $123, %xmm3, %xmm2 {%k7} {z}
# INTEL: vrndscalebf16 xmm2 {k7} {z}, xmm3, 123
0x62,0xf3,0x7f,0x8f,0x08,0xd3,0x7b

# Memory-source forms, grouped by destination width (xmm, ymm, zmm).
# A one-byte displacement prints scaled by the operand size: 0x7f appears as
# 2032/4064/8128 for xmmword/ymmword/zmmword operands and 0x80 as -256 for a
# {1toN} word broadcast.
# ATT:   vrndscalebf16  $123, 268435456(%esp,%esi,8), %xmm2
# INTEL: vrndscalebf16 xmm2, xmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x08,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b

# ATT:   vrndscalebf16  $123, 291(%edi,%eax,4), %xmm2 {%k7}
# INTEL: vrndscalebf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x0f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b

# ATT:   vrndscalebf16  $123, (%eax){1to8}, %xmm2
# INTEL: vrndscalebf16 xmm2, word ptr [eax]{1to8}, 123
0x62,0xf3,0x7f,0x18,0x08,0x10,0x7b

# ATT:   vrndscalebf16  $123, -512(,%ebp,2), %xmm2
# INTEL: vrndscalebf16 xmm2, xmmword ptr [2*ebp - 512], 123
0x62,0xf3,0x7f,0x08,0x08,0x14,0x6d,0x00,0xfe,0xff,0xff,0x7b

# ATT:   vrndscalebf16  $123, 2032(%ecx), %xmm2 {%k7} {z}
# INTEL: vrndscalebf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032], 123
0x62,0xf3,0x7f,0x8f,0x08,0x51,0x7f,0x7b

# ATT:   vrndscalebf16  $123, -256(%edx){1to8}, %xmm2 {%k7} {z}
# INTEL: vrndscalebf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}, 123
0x62,0xf3,0x7f,0x9f,0x08,0x52,0x80,0x7b

# ATT:   vrndscalebf16  $123, 268435456(%esp,%esi,8), %ymm2
# INTEL: vrndscalebf16 ymm2, ymmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x28,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b

# ATT:   vrndscalebf16  $123, 291(%edi,%eax,4), %ymm2 {%k7}
# INTEL: vrndscalebf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x2f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b

# ATT:   vrndscalebf16  $123, (%eax){1to16}, %ymm2
# INTEL: vrndscalebf16 ymm2, word ptr [eax]{1to16}, 123
0x62,0xf3,0x7f,0x38,0x08,0x10,0x7b

# ATT:   vrndscalebf16  $123, -1024(,%ebp,2), %ymm2
# INTEL: vrndscalebf16 ymm2, ymmword ptr [2*ebp - 1024], 123
0x62,0xf3,0x7f,0x28,0x08,0x14,0x6d,0x00,0xfc,0xff,0xff,0x7b

# ATT:   vrndscalebf16  $123, 4064(%ecx), %ymm2 {%k7} {z}
# INTEL: vrndscalebf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064], 123
0x62,0xf3,0x7f,0xaf,0x08,0x51,0x7f,0x7b

# ATT:   vrndscalebf16  $123, -256(%edx){1to16}, %ymm2 {%k7} {z}
# INTEL: vrndscalebf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}, 123
0x62,0xf3,0x7f,0xbf,0x08,0x52,0x80,0x7b

# ATT:   vrndscalebf16  $123, 268435456(%esp,%esi,8), %zmm2
# INTEL: vrndscalebf16 zmm2, zmmword ptr [esp + 8*esi + 268435456], 123
0x62,0xf3,0x7f,0x48,0x08,0x94,0xf4,0x00,0x00,0x00,0x10,0x7b

# ATT:   vrndscalebf16  $123, 291(%edi,%eax,4), %zmm2 {%k7}
# INTEL: vrndscalebf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291], 123
0x62,0xf3,0x7f,0x4f,0x08,0x94,0x87,0x23,0x01,0x00,0x00,0x7b

# ATT:   vrndscalebf16  $123, (%eax){1to32}, %zmm2
# INTEL: vrndscalebf16 zmm2, word ptr [eax]{1to32}, 123
0x62,0xf3,0x7f,0x58,0x08,0x10,0x7b

# ATT:   vrndscalebf16  $123, -2048(,%ebp,2), %zmm2
# INTEL: vrndscalebf16 zmm2, zmmword ptr [2*ebp - 2048], 123
0x62,0xf3,0x7f,0x48,0x08,0x14,0x6d,0x00,0xf8,0xff,0xff,0x7b

# ATT:   vrndscalebf16  $123, 8128(%ecx), %zmm2 {%k7} {z}
# INTEL: vrndscalebf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128], 123
0x62,0xf3,0x7f,0xcf,0x08,0x51,0x7f,0x7b

# ATT:   vrndscalebf16  $123, -256(%edx){1to32}, %zmm2 {%k7} {z}
# INTEL: vrndscalebf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}, 123
0x62,0xf3,0x7f,0xdf,0x08,0x52,0x80,0x7b

# vrsqrtbf16, register source (xmm, zmm, ymm). Each width is checked unmasked,
# merge-masked with k7, and zero-masked with k7; only the fourth byte differs
# between the three (e.g. 0x08 / 0x0f / 0x8f for xmm).

# ATT:   vrsqrtbf16 %xmm3, %xmm2
# INTEL: vrsqrtbf16 xmm2, xmm3
0x62,0xf6,0x7c,0x08,0x4e,0xd3

# ATT:   vrsqrtbf16 %xmm3, %xmm2 {%k7}
# INTEL: vrsqrtbf16 xmm2 {k7}, xmm3
0x62,0xf6,0x7c,0x0f,0x4e,0xd3

# ATT:   vrsqrtbf16 %xmm3, %xmm2 {%k7} {z}
# INTEL: vrsqrtbf16 xmm2 {k7} {z}, xmm3
0x62,0xf6,0x7c,0x8f,0x4e,0xd3

# ATT:   vrsqrtbf16 %zmm3, %zmm2
# INTEL: vrsqrtbf16 zmm2, zmm3
0x62,0xf6,0x7c,0x48,0x4e,0xd3

# ATT:   vrsqrtbf16 %zmm3, %zmm2 {%k7}
# INTEL: vrsqrtbf16 zmm2 {k7}, zmm3
0x62,0xf6,0x7c,0x4f,0x4e,0xd3

# ATT:   vrsqrtbf16 %zmm3, %zmm2 {%k7} {z}
# INTEL: vrsqrtbf16 zmm2 {k7} {z}, zmm3
0x62,0xf6,0x7c,0xcf,0x4e,0xd3

# ATT:   vrsqrtbf16 %ymm3, %ymm2
# INTEL: vrsqrtbf16 ymm2, ymm3
0x62,0xf6,0x7c,0x28,0x4e,0xd3

# ATT:   vrsqrtbf16 %ymm3, %ymm2 {%k7}
# INTEL: vrsqrtbf16 ymm2 {k7}, ymm3
0x62,0xf6,0x7c,0x2f,0x4e,0xd3

# ATT:   vrsqrtbf16 %ymm3, %ymm2 {%k7} {z}
# INTEL: vrsqrtbf16 ymm2 {k7} {z}, ymm3
0x62,0xf6,0x7c,0xaf,0x4e,0xd3

# vrsqrtbf16, memory source (xmm, ymm, zmm). Six addressing shapes per width:
# base+index*scale+disp32, base+index*scale+disp32 with k7, {1toN} broadcast
# from (%eax), index-only with disp32, one-byte displacement 0x7f with k7 {z},
# and one-byte displacement 0x80 with broadcast and k7 {z}.
# The one-byte displacement is printed scaled: 0x7f appears as 2032 / 4064 /
# 8128 for xmm / ymm / zmm, and 0x80 appears as -256 in every broadcast case.

# ATT:   vrsqrtbf16  268435456(%esp,%esi,8), %xmm2
# INTEL: vrsqrtbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x7c,0x08,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vrsqrtbf16  291(%edi,%eax,4), %xmm2 {%k7}
# INTEL: vrsqrtbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x7c,0x0f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vrsqrtbf16  (%eax){1to8}, %xmm2
# INTEL: vrsqrtbf16 xmm2, word ptr [eax]{1to8}
0x62,0xf6,0x7c,0x18,0x4e,0x10

# ATT:   vrsqrtbf16  -512(,%ebp,2), %xmm2
# INTEL: vrsqrtbf16 xmm2, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x7c,0x08,0x4e,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vrsqrtbf16  2032(%ecx), %xmm2 {%k7} {z}
# INTEL: vrsqrtbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
0x62,0xf6,0x7c,0x8f,0x4e,0x51,0x7f

# ATT:   vrsqrtbf16  -256(%edx){1to8}, %xmm2 {%k7} {z}
# INTEL: vrsqrtbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
0x62,0xf6,0x7c,0x9f,0x4e,0x52,0x80

# ATT:   vrsqrtbf16  268435456(%esp,%esi,8), %ymm2
# INTEL: vrsqrtbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x7c,0x28,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vrsqrtbf16  291(%edi,%eax,4), %ymm2 {%k7}
# INTEL: vrsqrtbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x7c,0x2f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vrsqrtbf16  (%eax){1to16}, %ymm2
# INTEL: vrsqrtbf16 ymm2, word ptr [eax]{1to16}
0x62,0xf6,0x7c,0x38,0x4e,0x10

# ATT:   vrsqrtbf16  -1024(,%ebp,2), %ymm2
# INTEL: vrsqrtbf16 ymm2, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x7c,0x28,0x4e,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vrsqrtbf16  4064(%ecx), %ymm2 {%k7} {z}
# INTEL: vrsqrtbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
0x62,0xf6,0x7c,0xaf,0x4e,0x51,0x7f

# ATT:   vrsqrtbf16  -256(%edx){1to16}, %ymm2 {%k7} {z}
# INTEL: vrsqrtbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
0x62,0xf6,0x7c,0xbf,0x4e,0x52,0x80

# ATT:   vrsqrtbf16  268435456(%esp,%esi,8), %zmm2
# INTEL: vrsqrtbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x7c,0x48,0x4e,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vrsqrtbf16  291(%edi,%eax,4), %zmm2 {%k7}
# INTEL: vrsqrtbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x7c,0x4f,0x4e,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vrsqrtbf16  (%eax){1to32}, %zmm2
# INTEL: vrsqrtbf16 zmm2, word ptr [eax]{1to32}
0x62,0xf6,0x7c,0x58,0x4e,0x10

# ATT:   vrsqrtbf16  -2048(,%ebp,2), %zmm2
# INTEL: vrsqrtbf16 zmm2, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x7c,0x48,0x4e,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vrsqrtbf16  8128(%ecx), %zmm2 {%k7} {z}
# INTEL: vrsqrtbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
0x62,0xf6,0x7c,0xcf,0x4e,0x51,0x7f

# ATT:   vrsqrtbf16  -256(%edx){1to32}, %zmm2 {%k7} {z}
# INTEL: vrsqrtbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
0x62,0xf6,0x7c,0xdf,0x4e,0x52,0x80

# vscalefbf16, three-operand register forms (ymm, zmm, xmm). Each width is
# checked unmasked, merge-masked with k7, and zero-masked with k7; only the
# fourth byte differs between the three (e.g. 0x28 / 0x2f / 0xaf for ymm).

# ATT:   vscalefbf16 %ymm4, %ymm3, %ymm2
# INTEL: vscalefbf16 ymm2, ymm3, ymm4
0x62,0xf6,0x64,0x28,0x2c,0xd4

# ATT:   vscalefbf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vscalefbf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf6,0x64,0x2f,0x2c,0xd4

# ATT:   vscalefbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vscalefbf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf6,0x64,0xaf,0x2c,0xd4

# ATT:   vscalefbf16 %zmm4, %zmm3, %zmm2
# INTEL: vscalefbf16 zmm2, zmm3, zmm4
0x62,0xf6,0x64,0x48,0x2c,0xd4

# ATT:   vscalefbf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vscalefbf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf6,0x64,0x4f,0x2c,0xd4

# ATT:   vscalefbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vscalefbf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf6,0x64,0xcf,0x2c,0xd4

# ATT:   vscalefbf16 %xmm4, %xmm3, %xmm2
# INTEL: vscalefbf16 xmm2, xmm3, xmm4
0x62,0xf6,0x64,0x08,0x2c,0xd4

# ATT:   vscalefbf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vscalefbf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf6,0x64,0x0f,0x2c,0xd4

# ATT:   vscalefbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vscalefbf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf6,0x64,0x8f,0x2c,0xd4

# vscalefbf16, memory as the last source (zmm, ymm, xmm). Six addressing shapes
# per width: base+index*scale+disp32, base+index*scale+disp32 with k7, {1toN}
# broadcast from (%eax), index-only with disp32, one-byte displacement 0x7f
# with k7 {z}, and one-byte displacement 0x80 with broadcast and k7 {z}.
# The one-byte displacement is printed scaled: 0x7f appears as 8128 / 4064 /
# 2032 for zmm / ymm / xmm, and 0x80 appears as -256 in every broadcast case.

# ATT:   vscalefbf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vscalefbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x48,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vscalefbf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vscalefbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x4f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vscalefbf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vscalefbf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf6,0x64,0x58,0x2c,0x10

# ATT:   vscalefbf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vscalefbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf6,0x64,0x48,0x2c,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vscalefbf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vscalefbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf6,0x64,0xcf,0x2c,0x51,0x7f

# ATT:   vscalefbf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vscalefbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf6,0x64,0xdf,0x2c,0x52,0x80

# ATT:   vscalefbf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vscalefbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x28,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vscalefbf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vscalefbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x2f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vscalefbf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vscalefbf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf6,0x64,0x38,0x2c,0x10

# ATT:   vscalefbf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vscalefbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf6,0x64,0x28,0x2c,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vscalefbf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vscalefbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf6,0x64,0xaf,0x2c,0x51,0x7f

# ATT:   vscalefbf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vscalefbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf6,0x64,0xbf,0x2c,0x52,0x80

# ATT:   vscalefbf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vscalefbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf6,0x64,0x08,0x2c,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vscalefbf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vscalefbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf6,0x64,0x0f,0x2c,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vscalefbf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vscalefbf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf6,0x64,0x18,0x2c,0x10

# ATT:   vscalefbf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vscalefbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf6,0x64,0x08,0x2c,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vscalefbf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vscalefbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf6,0x64,0x8f,0x2c,0x51,0x7f

# ATT:   vscalefbf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vscalefbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf6,0x64,0x9f,0x2c,0x52,0x80

# vsqrtbf16, register source (xmm, zmm, ymm). Each width is checked unmasked,
# merge-masked with k7, and zero-masked with k7; only the fourth byte differs
# between the three (e.g. 0x08 / 0x0f / 0x8f for xmm).

# ATT:   vsqrtbf16 %xmm3, %xmm2
# INTEL: vsqrtbf16 xmm2, xmm3
0x62,0xf5,0x7d,0x08,0x51,0xd3

# ATT:   vsqrtbf16 %xmm3, %xmm2 {%k7}
# INTEL: vsqrtbf16 xmm2 {k7}, xmm3
0x62,0xf5,0x7d,0x0f,0x51,0xd3

# ATT:   vsqrtbf16 %xmm3, %xmm2 {%k7} {z}
# INTEL: vsqrtbf16 xmm2 {k7} {z}, xmm3
0x62,0xf5,0x7d,0x8f,0x51,0xd3

# ATT:   vsqrtbf16 %zmm3, %zmm2
# INTEL: vsqrtbf16 zmm2, zmm3
0x62,0xf5,0x7d,0x48,0x51,0xd3

# ATT:   vsqrtbf16 %zmm3, %zmm2 {%k7}
# INTEL: vsqrtbf16 zmm2 {k7}, zmm3
0x62,0xf5,0x7d,0x4f,0x51,0xd3

# ATT:   vsqrtbf16 %zmm3, %zmm2 {%k7} {z}
# INTEL: vsqrtbf16 zmm2 {k7} {z}, zmm3
0x62,0xf5,0x7d,0xcf,0x51,0xd3

# ATT:   vsqrtbf16 %ymm3, %ymm2
# INTEL: vsqrtbf16 ymm2, ymm3
0x62,0xf5,0x7d,0x28,0x51,0xd3

# ATT:   vsqrtbf16 %ymm3, %ymm2 {%k7}
# INTEL: vsqrtbf16 ymm2 {k7}, ymm3
0x62,0xf5,0x7d,0x2f,0x51,0xd3

# ATT:   vsqrtbf16 %ymm3, %ymm2 {%k7} {z}
# INTEL: vsqrtbf16 ymm2 {k7} {z}, ymm3
0x62,0xf5,0x7d,0xaf,0x51,0xd3

# vsqrtbf16, memory source (xmm, ymm, zmm). Six addressing shapes per width:
# base+index*scale+disp32, base+index*scale+disp32 with k7, {1toN} broadcast
# from (%eax), index-only with disp32, one-byte displacement 0x7f with k7 {z},
# and one-byte displacement 0x80 with broadcast and k7 {z}.
# The one-byte displacement is printed scaled: 0x7f appears as 2032 / 4064 /
# 8128 for xmm / ymm / zmm, and 0x80 appears as -256 in every broadcast case.

# ATT:   vsqrtbf16  268435456(%esp,%esi,8), %xmm2
# INTEL: vsqrtbf16 xmm2, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x7d,0x08,0x51,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vsqrtbf16  291(%edi,%eax,4), %xmm2 {%k7}
# INTEL: vsqrtbf16 xmm2 {k7}, xmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x7d,0x0f,0x51,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vsqrtbf16  (%eax){1to8}, %xmm2
# INTEL: vsqrtbf16 xmm2, word ptr [eax]{1to8}
0x62,0xf5,0x7d,0x18,0x51,0x10

# ATT:   vsqrtbf16  -512(,%ebp,2), %xmm2
# INTEL: vsqrtbf16 xmm2, xmmword ptr [2*ebp - 512]
0x62,0xf5,0x7d,0x08,0x51,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vsqrtbf16  2032(%ecx), %xmm2 {%k7} {z}
# INTEL: vsqrtbf16 xmm2 {k7} {z}, xmmword ptr [ecx + 2032]
0x62,0xf5,0x7d,0x8f,0x51,0x51,0x7f

# ATT:   vsqrtbf16  -256(%edx){1to8}, %xmm2 {%k7} {z}
# INTEL: vsqrtbf16 xmm2 {k7} {z}, word ptr [edx - 256]{1to8}
0x62,0xf5,0x7d,0x9f,0x51,0x52,0x80

# ATT:   vsqrtbf16  268435456(%esp,%esi,8), %ymm2
# INTEL: vsqrtbf16 ymm2, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x7d,0x28,0x51,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vsqrtbf16  291(%edi,%eax,4), %ymm2 {%k7}
# INTEL: vsqrtbf16 ymm2 {k7}, ymmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x7d,0x2f,0x51,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vsqrtbf16  (%eax){1to16}, %ymm2
# INTEL: vsqrtbf16 ymm2, word ptr [eax]{1to16}
0x62,0xf5,0x7d,0x38,0x51,0x10

# ATT:   vsqrtbf16  -1024(,%ebp,2), %ymm2
# INTEL: vsqrtbf16 ymm2, ymmword ptr [2*ebp - 1024]
0x62,0xf5,0x7d,0x28,0x51,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vsqrtbf16  4064(%ecx), %ymm2 {%k7} {z}
# INTEL: vsqrtbf16 ymm2 {k7} {z}, ymmword ptr [ecx + 4064]
0x62,0xf5,0x7d,0xaf,0x51,0x51,0x7f

# ATT:   vsqrtbf16  -256(%edx){1to16}, %ymm2 {%k7} {z}
# INTEL: vsqrtbf16 ymm2 {k7} {z}, word ptr [edx - 256]{1to16}
0x62,0xf5,0x7d,0xbf,0x51,0x52,0x80

# ATT:   vsqrtbf16  268435456(%esp,%esi,8), %zmm2
# INTEL: vsqrtbf16 zmm2, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x7d,0x48,0x51,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vsqrtbf16  291(%edi,%eax,4), %zmm2 {%k7}
# INTEL: vsqrtbf16 zmm2 {k7}, zmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x7d,0x4f,0x51,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vsqrtbf16  (%eax){1to32}, %zmm2
# INTEL: vsqrtbf16 zmm2, word ptr [eax]{1to32}
0x62,0xf5,0x7d,0x58,0x51,0x10

# ATT:   vsqrtbf16  -2048(,%ebp,2), %zmm2
# INTEL: vsqrtbf16 zmm2, zmmword ptr [2*ebp - 2048]
0x62,0xf5,0x7d,0x48,0x51,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vsqrtbf16  8128(%ecx), %zmm2 {%k7} {z}
# INTEL: vsqrtbf16 zmm2 {k7} {z}, zmmword ptr [ecx + 8128]
0x62,0xf5,0x7d,0xcf,0x51,0x51,0x7f

# ATT:   vsqrtbf16  -256(%edx){1to32}, %zmm2 {%k7} {z}
# INTEL: vsqrtbf16 zmm2 {k7} {z}, word ptr [edx - 256]{1to32}
0x62,0xf5,0x7d,0xdf,0x51,0x52,0x80

# vsubbf16, three-operand register forms (ymm, zmm, xmm). Each width is checked
# unmasked, merge-masked with k7, and zero-masked with k7; only the fourth byte
# differs between the three (e.g. 0x28 / 0x2f / 0xaf for ymm).

# ATT:   vsubbf16 %ymm4, %ymm3, %ymm2
# INTEL: vsubbf16 ymm2, ymm3, ymm4
0x62,0xf5,0x65,0x28,0x5c,0xd4

# ATT:   vsubbf16 %ymm4, %ymm3, %ymm2 {%k7}
# INTEL: vsubbf16 ymm2 {k7}, ymm3, ymm4
0x62,0xf5,0x65,0x2f,0x5c,0xd4

# ATT:   vsubbf16 %ymm4, %ymm3, %ymm2 {%k7} {z}
# INTEL: vsubbf16 ymm2 {k7} {z}, ymm3, ymm4
0x62,0xf5,0x65,0xaf,0x5c,0xd4

# ATT:   vsubbf16 %zmm4, %zmm3, %zmm2
# INTEL: vsubbf16 zmm2, zmm3, zmm4
0x62,0xf5,0x65,0x48,0x5c,0xd4

# ATT:   vsubbf16 %zmm4, %zmm3, %zmm2 {%k7}
# INTEL: vsubbf16 zmm2 {k7}, zmm3, zmm4
0x62,0xf5,0x65,0x4f,0x5c,0xd4

# ATT:   vsubbf16 %zmm4, %zmm3, %zmm2 {%k7} {z}
# INTEL: vsubbf16 zmm2 {k7} {z}, zmm3, zmm4
0x62,0xf5,0x65,0xcf,0x5c,0xd4

# ATT:   vsubbf16 %xmm4, %xmm3, %xmm2
# INTEL: vsubbf16 xmm2, xmm3, xmm4
0x62,0xf5,0x65,0x08,0x5c,0xd4

# ATT:   vsubbf16 %xmm4, %xmm3, %xmm2 {%k7}
# INTEL: vsubbf16 xmm2 {k7}, xmm3, xmm4
0x62,0xf5,0x65,0x0f,0x5c,0xd4

# ATT:   vsubbf16 %xmm4, %xmm3, %xmm2 {%k7} {z}
# INTEL: vsubbf16 xmm2 {k7} {z}, xmm3, xmm4
0x62,0xf5,0x65,0x8f,0x5c,0xd4

# vsubbf16, memory as the last source (zmm, ymm, xmm). Six addressing shapes
# per width: base+index*scale+disp32, base+index*scale+disp32 with k7, {1toN}
# broadcast from (%eax), index-only with disp32, one-byte displacement 0x7f
# with k7 {z}, and one-byte displacement 0x80 with broadcast and k7 {z}.
# The one-byte displacement is printed scaled: 0x7f appears as 8128 / 4064 /
# 2032 for zmm / ymm / xmm, and 0x80 appears as -256 in every broadcast case.

# ATT:   vsubbf16  268435456(%esp,%esi,8), %zmm3, %zmm2
# INTEL: vsubbf16 zmm2, zmm3, zmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x48,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vsubbf16  291(%edi,%eax,4), %zmm3, %zmm2 {%k7}
# INTEL: vsubbf16 zmm2 {k7}, zmm3, zmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x4f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vsubbf16  (%eax){1to32}, %zmm3, %zmm2
# INTEL: vsubbf16 zmm2, zmm3, word ptr [eax]{1to32}
0x62,0xf5,0x65,0x58,0x5c,0x10

# ATT:   vsubbf16  -2048(,%ebp,2), %zmm3, %zmm2
# INTEL: vsubbf16 zmm2, zmm3, zmmword ptr [2*ebp - 2048]
0x62,0xf5,0x65,0x48,0x5c,0x14,0x6d,0x00,0xf8,0xff,0xff

# ATT:   vsubbf16  8128(%ecx), %zmm3, %zmm2 {%k7} {z}
# INTEL: vsubbf16 zmm2 {k7} {z}, zmm3, zmmword ptr [ecx + 8128]
0x62,0xf5,0x65,0xcf,0x5c,0x51,0x7f

# ATT:   vsubbf16  -256(%edx){1to32}, %zmm3, %zmm2 {%k7} {z}
# INTEL: vsubbf16 zmm2 {k7} {z}, zmm3, word ptr [edx - 256]{1to32}
0x62,0xf5,0x65,0xdf,0x5c,0x52,0x80

# ATT:   vsubbf16  268435456(%esp,%esi,8), %ymm3, %ymm2
# INTEL: vsubbf16 ymm2, ymm3, ymmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x28,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vsubbf16  291(%edi,%eax,4), %ymm3, %ymm2 {%k7}
# INTEL: vsubbf16 ymm2 {k7}, ymm3, ymmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x2f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vsubbf16  (%eax){1to16}, %ymm3, %ymm2
# INTEL: vsubbf16 ymm2, ymm3, word ptr [eax]{1to16}
0x62,0xf5,0x65,0x38,0x5c,0x10

# ATT:   vsubbf16  -1024(,%ebp,2), %ymm3, %ymm2
# INTEL: vsubbf16 ymm2, ymm3, ymmword ptr [2*ebp - 1024]
0x62,0xf5,0x65,0x28,0x5c,0x14,0x6d,0x00,0xfc,0xff,0xff

# ATT:   vsubbf16  4064(%ecx), %ymm3, %ymm2 {%k7} {z}
# INTEL: vsubbf16 ymm2 {k7} {z}, ymm3, ymmword ptr [ecx + 4064]
0x62,0xf5,0x65,0xaf,0x5c,0x51,0x7f

# ATT:   vsubbf16  -256(%edx){1to16}, %ymm3, %ymm2 {%k7} {z}
# INTEL: vsubbf16 ymm2 {k7} {z}, ymm3, word ptr [edx - 256]{1to16}
0x62,0xf5,0x65,0xbf,0x5c,0x52,0x80

# ATT:   vsubbf16  268435456(%esp,%esi,8), %xmm3, %xmm2
# INTEL: vsubbf16 xmm2, xmm3, xmmword ptr [esp + 8*esi + 268435456]
0x62,0xf5,0x65,0x08,0x5c,0x94,0xf4,0x00,0x00,0x00,0x10

# ATT:   vsubbf16  291(%edi,%eax,4), %xmm3, %xmm2 {%k7}
# INTEL: vsubbf16 xmm2 {k7}, xmm3, xmmword ptr [edi + 4*eax + 291]
0x62,0xf5,0x65,0x0f,0x5c,0x94,0x87,0x23,0x01,0x00,0x00

# ATT:   vsubbf16  (%eax){1to8}, %xmm3, %xmm2
# INTEL: vsubbf16 xmm2, xmm3, word ptr [eax]{1to8}
0x62,0xf5,0x65,0x18,0x5c,0x10

# ATT:   vsubbf16  -512(,%ebp,2), %xmm3, %xmm2
# INTEL: vsubbf16 xmm2, xmm3, xmmword ptr [2*ebp - 512]
0x62,0xf5,0x65,0x08,0x5c,0x14,0x6d,0x00,0xfe,0xff,0xff

# ATT:   vsubbf16  2032(%ecx), %xmm3, %xmm2 {%k7} {z}
# INTEL: vsubbf16 xmm2 {k7} {z}, xmm3, xmmword ptr [ecx + 2032]
0x62,0xf5,0x65,0x8f,0x5c,0x51,0x7f

# ATT:   vsubbf16  -256(%edx){1to8}, %xmm3, %xmm2 {%k7} {z}
# INTEL: vsubbf16 xmm2 {k7} {z}, xmm3, word ptr [edx - 256]{1to8}
0x62,0xf5,0x65,0x9f,0x5c,0x52,0x80

