aarch64: Add support for FEAT_SME_B16B16 feature.

This patch adds support for SME ZA-targeting non-widening BFloat16 instructions,
under tick FEAT_SME_B16B16 and command line flag "+sme-b16b16".

FEAT_SME_B16B16 implements FEAT_SME2 and FEAT_SVE_B16B16, in accordance with that
"+sme-b16b16" enables "+sme2" and "+sve-b16b16".

Also the test files related to FEAT_SME_B16B16 are prefixed with sme-b16b16*.
eg: sme-b16b16-1.s, sme-b16b16-1.d.

The spec for this feature and instructions is availabe here [1]:
[1]: https://developer.arm.com/documentation/ddi0602/2024-06/SME-Instructions?lang=en
This commit is contained in:
Srinath Parvathaneni
2025-01-10 16:47:32 +00:00
parent 150bfae1d7
commit 308d7670f0
11 changed files with 1182 additions and 311 deletions

View File

@@ -2,6 +2,9 @@
* Add support for the x86 Zhaoxin PadLock RNG2 instruction.
* Add support for AArch64 SME and SVE non-widening BFloat16 (SVE_B16B16 and
SME_B16B16) instructions.
* Add support for the x86 Intel AVX10.2 instructions.
* Add support for the x86 Intel SM4 AVX10.2 instructions.

View File

@@ -10764,6 +10764,8 @@ static const struct aarch64_option_cpu_value_table aarch64_features[] = {
{"sme-f8f16", AARCH64_FEATURE (SME_F8F16),
AARCH64_FEATURE (SME_F8F32)},
{"sme-f16f16", AARCH64_FEATURE (SME_F16F16), AARCH64_FEATURE (SME2)},
{"sme-b16b16", AARCH64_FEATURE (SME_B16B16),
AARCH64_FEATURES (2, SVE_B16B16, SME2)},
{NULL, AARCH64_NO_FEATURES, AARCH64_NO_FEATURES},
};

View File

@@ -269,6 +269,8 @@ automatically cause those extensions to be disabled.
@tab Enable the SM3 and SM4 cryptographic extensions.
@item @code{sme} @tab @code{sve2}, @code{bf16}
@tab Enable the Scalable Matrix Extension.
@item @code{sme-b16b16} @tab @code{sme2}, @code{sve-b16b16}
@tab Enable SME ZA-targeting non-widening BFloat16 instructions.
@item @code{sme-f8f16} @tab @code{sme-f8f32}
@tab Enable the SME F8F16 Extension.
@item @code{sme-f8f32} @tab @code{sme2}, @code{fp8}

View File

@@ -0,0 +1,126 @@
#name: Test of SME2 non-widening BFloat16 instructions.
#as: -march=armv8-a+sme-b16b16
#objdump: -dr
[^:]+: file format .*
[^:]+:
[^:]+:
.*: c1e41c00 bfadd za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}
.*: c1e47c00 bfadd za.h\[w11, 0, vgx2\], { ?z0.h-z1.h ?}
.*: c1e41c07 bfadd za.h\[w8, 7, vgx2\], { ?z0.h-z1.h ?}
.*: c1e41fc0 bfadd za.h\[w8, 0, vgx2\], { ?z30.h-z31.h ?}
.*: c1e41fc3 bfadd za.h\[w8, 3, vgx2\], { ?z30.h-z31.h ?}
.*: c1e51c00 bfadd za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}
.*: c1e57c00 bfadd za.h\[w11, 0, vgx4\], { ?z0.h-z3.h ?}
.*: c1e51c07 bfadd za.h\[w8, 7, vgx4\], { ?z0.h-z3.h ?}
.*: c1e51f80 bfadd za.h\[w8, 0, vgx4\], { ?z28.h-z31.h ?}
.*: c1e51f83 bfadd za.h\[w8, 3, vgx4\], { ?z28.h-z31.h ?}
.*: c1e41c08 bfsub za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}
.*: c1e47c08 bfsub za.h\[w11, 0, vgx2\], { ?z0.h-z1.h ?}
.*: c1e41c0f bfsub za.h\[w8, 7, vgx2\], { ?z0.h-z1.h ?}
.*: c1e41fc8 bfsub za.h\[w8, 0, vgx2\], { ?z30.h-z31.h ?}
.*: c1e41fcb bfsub za.h\[w8, 3, vgx2\], { ?z30.h-z31.h ?}
.*: c1e51c08 bfsub za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}
.*: c1e57c08 bfsub za.h\[w11, 0, vgx4\], { ?z0.h-z3.h ?}
.*: c1e51c0f bfsub za.h\[w8, 7, vgx4\], { ?z0.h-z3.h ?}
.*: c1e51f88 bfsub za.h\[w8, 0, vgx4\], { ?z28.h-z31.h ?}
.*: c1e51f8b bfsub za.h\[w8, 3, vgx4\], { ?z28.h-z31.h ?}
.*: c1101020 bfmla za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, z0.h\[0\]
.*: c1107020 bfmla za.h\[w11, 0, vgx2\], { ?z0.h-z1.h ?}, z0.h\[0\]
.*: c1101027 bfmla za.h\[w8, 7, vgx2\], { ?z0.h-z1.h ?}, z0.h\[0\]
.*: c11013e0 bfmla za.h\[w8, 0, vgx2\], { ?z30.h-z31.h ?}, z0.h\[0\]
.*: c11f1020 bfmla za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, z15.h\[0\]
.*: c1101c28 bfmla za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, z0.h\[7\]
.*: c1101428 bfmla za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, z0.h\[3\]
.*: c1101c2b bfmla za.h\[w8, 3, vgx2\], { ?z0.h-z1.h ?}, z0.h\[7\]
.*: c1109020 bfmla za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}, z0.h\[0\]
.*: c110f020 bfmla za.h\[w11, 0, vgx4\], { ?z0.h-z3.h ?}, z0.h\[0\]
.*: c1109027 bfmla za.h\[w8, 7, vgx4\], { ?z0.h-z3.h ?}, z0.h\[0\]
.*: c11093a0 bfmla za.h\[w8, 0, vgx4\], { ?z28.h-z31.h ?}, z0.h\[0\]
.*: c11f9020 bfmla za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}, z15.h\[0\]
.*: c1109c28 bfmla za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}, z0.h\[7\]
.*: c1109428 bfmla za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}, z0.h\[3\]
.*: c1109c2b bfmla za.h\[w8, 3, vgx4\], { ?z0.h-z3.h ?}, z0.h\[7\]
.*: c1601c00 bfmla za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, z0.h
.*: c1607c00 bfmla za.h\[w11, 0, vgx2\], { ?z0.h-z1.h ?}, z0.h
.*: c1601c07 bfmla za.h\[w8, 7, vgx2\], { ?z0.h-z1.h ?}, z0.h
.*: c1601fe0 bfmla za.h\[w8, 0, vgx2\], { ?z31.h-z0.h ?}, z0.h
.*: c16f1c00 bfmla za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, z15.h
.*: c16f1c03 bfmla za.h\[w8, 3, vgx2\], { ?z0.h-z1.h ?}, z15.h
.*: c1701c00 bfmla za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}, z0.h
.*: c1707c00 bfmla za.h\[w11, 0, vgx4\], { ?z0.h-z3.h ?}, z0.h
.*: c1701c07 bfmla za.h\[w8, 7, vgx4\], { ?z0.h-z3.h ?}, z0.h
.*: c1701fe0 bfmla za.h\[w8, 0, vgx4\], { ?z31.h-z2.h ?}, z0.h
.*: c17f1c00 bfmla za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}, z15.h
.*: c17f1c03 bfmla za.h\[w8, 3, vgx4\], { ?z0.h-z3.h ?}, z15.h
.*: c1e01008 bfmla za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, { ?z0.h-z1.h ?}
.*: c1e07008 bfmla za.h\[w11, 0, vgx2\], { ?z0.h-z1.h ?}, { ?z0.h-z1.h ?}
.*: c1e0100f bfmla za.h\[w8, 7, vgx2\], { ?z0.h-z1.h ?}, { ?z0.h-z1.h ?}
.*: c1e013c8 bfmla za.h\[w8, 0, vgx2\], { ?z30.h-z31.h ?}, { ?z0.h-z1.h ?}
.*: c1fe1008 bfmla za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, { ?z30.h-z31.h ?}
.*: c1fe100b bfmla za.h\[w8, 3, vgx2\], { ?z0.h-z1.h ?}, { ?z30.h-z31.h ?}
.*: c1e11008 bfmla za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}, { ?z0.h-z3.h ?}
.*: c1e17008 bfmla za.h\[w11, 0, vgx4\], { ?z0.h-z3.h ?}, { ?z0.h-z3.h ?}
.*: c1e1100f bfmla za.h\[w8, 7, vgx4\], { ?z0.h-z3.h ?}, { ?z0.h-z3.h ?}
.*: c1e11388 bfmla za.h\[w8, 0, vgx4\], { ?z28.h-z31.h ?}, { ?z0.h-z3.h ?}
.*: c1fd1008 bfmla za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}, { ?z28.h-z31.h ?}
.*: c1fd100b bfmla za.h\[w8, 3, vgx4\], { ?z0.h-z3.h ?}, { ?z28.h-z31.h ?}
.*: c1101030 bfmls za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, z0.h\[0\]
.*: c1107030 bfmls za.h\[w11, 0, vgx2\], { ?z0.h-z1.h ?}, z0.h\[0\]
.*: c1101037 bfmls za.h\[w8, 7, vgx2\], { ?z0.h-z1.h ?}, z0.h\[0\]
.*: c11013f0 bfmls za.h\[w8, 0, vgx2\], { ?z30.h-z31.h ?}, z0.h\[0\]
.*: c11f1030 bfmls za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, z15.h\[0\]
.*: c1101c38 bfmls za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, z0.h\[7\]
.*: c1101438 bfmls za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, z0.h\[3\]
.*: c1101c3b bfmls za.h\[w8, 3, vgx2\], { ?z0.h-z1.h ?}, z0.h\[7\]
.*: c1109030 bfmls za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}, z0.h\[0\]
.*: c110f030 bfmls za.h\[w11, 0, vgx4\], { ?z0.h-z3.h ?}, z0.h\[0\]
.*: c1109037 bfmls za.h\[w8, 7, vgx4\], { ?z0.h-z3.h ?}, z0.h\[0\]
.*: c11093b0 bfmls za.h\[w8, 0, vgx4\], { ?z28.h-z31.h ?}, z0.h\[0\]
.*: c11f9030 bfmls za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}, z15.h\[0\]
.*: c1109c38 bfmls za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}, z0.h\[7\]
.*: c1109438 bfmls za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}, z0.h\[3\]
.*: c1109c3b bfmls za.h\[w8, 3, vgx4\], { ?z0.h-z3.h ?}, z0.h\[7\]
.*: c1601c08 bfmls za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, z0.h
.*: c1607c08 bfmls za.h\[w11, 0, vgx2\], { ?z0.h-z1.h ?}, z0.h
.*: c1601c0f bfmls za.h\[w8, 7, vgx2\], { ?z0.h-z1.h ?}, z0.h
.*: c1601fe8 bfmls za.h\[w8, 0, vgx2\], { ?z31.h-z0.h ?}, z0.h
.*: c16f1c08 bfmls za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, z15.h
.*: c16f1c0b bfmls za.h\[w8, 3, vgx2\], { ?z0.h-z1.h ?}, z15.h
.*: c1701c08 bfmls za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}, z0.h
.*: c1707c08 bfmls za.h\[w11, 0, vgx4\], { ?z0.h-z3.h ?}, z0.h
.*: c1701c0f bfmls za.h\[w8, 7, vgx4\], { ?z0.h-z3.h ?}, z0.h
.*: c1701fe8 bfmls za.h\[w8, 0, vgx4\], { ?z31.h-z2.h ?}, z0.h
.*: c17f1c08 bfmls za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}, z15.h
.*: c17f1c0b bfmls za.h\[w8, 3, vgx4\], { ?z0.h-z3.h ?}, z15.h
.*: c1e01018 bfmls za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, { ?z0.h-z1.h ?}
.*: c1e07018 bfmls za.h\[w11, 0, vgx2\], { ?z0.h-z1.h ?}, { ?z0.h-z1.h ?}
.*: c1e0101f bfmls za.h\[w8, 7, vgx2\], { ?z0.h-z1.h ?}, { ?z0.h-z1.h ?}
.*: c1e013d8 bfmls za.h\[w8, 0, vgx2\], { ?z30.h-z31.h ?}, { ?z0.h-z1.h ?}
.*: c1fe1018 bfmls za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, { ?z30.h-z31.h ?}
.*: c1fe101b bfmls za.h\[w8, 3, vgx2\], { ?z0.h-z1.h ?}, { ?z30.h-z31.h ?}
.*: c1e11018 bfmls za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}, { ?z0.h-z3.h ?}
.*: c1e17018 bfmls za.h\[w11, 0, vgx4\], { ?z0.h-z3.h ?}, { ?z0.h-z3.h ?}
.*: c1e1101f bfmls za.h\[w8, 7, vgx4\], { ?z0.h-z3.h ?}, { ?z0.h-z3.h ?}
.*: c1e11398 bfmls za.h\[w8, 0, vgx4\], { ?z28.h-z31.h ?}, { ?z0.h-z3.h ?}
.*: c1fd1018 bfmls za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}, { ?z28.h-z31.h ?}
.*: c1fd101b bfmls za.h\[w8, 3, vgx4\], { ?z0.h-z3.h ?}, { ?z28.h-z31.h ?}
.*: 81a00008 bfmopa za0.h, p0/m, p0/m, z0.h, z0.h
.*: 81a00009 bfmopa za1.h, p0/m, p0/m, z0.h, z0.h
.*: 81a01c08 bfmopa za0.h, p7/m, p0/m, z0.h, z0.h
.*: 81a0e008 bfmopa za0.h, p0/m, p7/m, z0.h, z0.h
.*: 81a003e8 bfmopa za0.h, p0/m, p0/m, z31.h, z0.h
.*: 81bf0008 bfmopa za0.h, p0/m, p0/m, z0.h, z31.h
.*: 81afad48 bfmopa za0.h, p3/m, p5/m, z10.h, z15.h
.*: 81b965e9 bfmopa za1.h, p1/m, p3/m, z15.h, z25.h
.*: 81a00018 bfmops za0.h, p0/m, p0/m, z0.h, z0.h
.*: 81a00019 bfmops za1.h, p0/m, p0/m, z0.h, z0.h
.*: 81a01c18 bfmops za0.h, p7/m, p0/m, z0.h, z0.h
.*: 81a0e018 bfmops za0.h, p0/m, p7/m, z0.h, z0.h
.*: 81a003f8 bfmops za0.h, p0/m, p0/m, z31.h, z0.h
.*: 81bf0018 bfmops za0.h, p0/m, p0/m, z0.h, z31.h
.*: 81afad58 bfmops za0.h, p3/m, p5/m, z10.h, z15.h
.*: 81b965f9 bfmops za1.h, p1/m, p3/m, z15.h, z25.h

View File

@@ -0,0 +1,143 @@
/* BFADD. */
bfadd za.h[w8, 0, vgx2], {z0.h - z1.h}
bfadd za.h[w11, 0, vgx2], {z0.h - z1.h}
bfadd za.h[w8, 7, vgx2], {z0.h - z1.h}
bfadd za.h[w8, 0, vgx2], {z30.h - z31.h}
bfadd za.h[w8, 3], {z30.h - z31.h}
bfadd za.h[w8, 0, vgx4], {z0.h - z3.h}
bfadd za.h[w11, 0, vgx4], {z0.h - z3.h}
bfadd za.h[w8, 7, vgx4], {z0.h - z3.h}
bfadd za.h[w8, 0, vgx4], {z28.h - z31.h}
bfadd za.h[w8, 3], {z28.h - z31.h}
/* BFSUB. */
bfsub za.h[w8, 0, vgx2], {z0.h - z1.h}
bfsub za.h[w11, 0, vgx2], {z0.h - z1.h}
bfsub za.h[w8, 7, vgx2], {z0.h - z1.h}
bfsub za.h[w8, 0, vgx2], {z30.h - z31.h}
bfsub za.h[w8, 3], {z30.h - z31.h}
bfsub za.h[w8, 0, vgx4], {z0.h - z3.h}
bfsub za.h[w11, 0, vgx4], {z0.h - z3.h}
bfsub za.h[w8, 7, vgx4], {z0.h - z3.h}
bfsub za.h[w8, 0, vgx4], {z28.h - z31.h}
bfsub za.h[w8, 3], {z28.h - z31.h}
/* BFMLA (multiple and indexed vector). */
bfmla za.h[w8, 0, vgx2], {z0.h - z1.h}, z0.h[0]
bfmla za.h[w11, 0, vgx2], {z0.h - z1.h}, z0.h[0]
bfmla za.h[w8, 7, vgx2], {z0.h - z1.h}, z0.h[0]
bfmla za.h[w8, 0, vgx2], {z30.h - z31.h}, z0.h[0]
bfmla za.h[w8, 0, vgx2], {z0.h - z1.h}, z15.h[0]
bfmla za.h[w8, 0, vgx2], {z0.h - z1.h}, z0.h[7]
bfmla za.h[w8, 0, vgx2], {z0.h - z1.h}, z0.h[3]
bfmla za.h[w8, 3], {z0.h - z1.h}, z0.h[7]
bfmla za.h[w8, 0, vgx4], {z0.h - z3.h}, z0.h[0]
bfmla za.h[w11, 0, vgx4], {z0.h - z3.h}, z0.h[0]
bfmla za.h[w8, 7, vgx4], {z0.h - z3.h}, z0.h[0]
bfmla za.h[w8, 0, vgx4], {z28.h - z31.h}, z0.h[0]
bfmla za.h[w8, 0, vgx4], {z0.h - z3.h}, z15.h[0]
bfmla za.h[w8, 0, vgx4], {z0.h - z3.h}, z0.h[7]
bfmla za.h[w8, 0, vgx4], {z0.h - z3.h}, z0.h[3]
bfmla za.h[w8, 3], {z0.h - z3.h}, z0.h[7]
/* BFMLA (multiple and single vector). */
bfmla za.h[w8, 0, vgx2], {z0.h - z1.h}, z0.h
bfmla za.h[w11, 0, vgx2], {z0.h - z1.h}, z0.h
bfmla za.h[w8, 7, vgx2], {z0.h - z1.h}, z0.h
bfmla za.h[w8, 0, vgx2], {z31.h - z0.h}, z0.h
bfmla za.h[w8, 0, vgx2], {z0.h - z1.h}, z15.h
bfmla za.h[w8, 3], {z0.h - z1.h}, z15.h
bfmla za.h[w8, 0, vgx4], {z0.h - z3.h}, z0.h
bfmla za.h[w11, 0, vgx4], {z0.h - z3.h}, z0.h
bfmla za.h[w8, 7, vgx4], {z0.h - z3.h}, z0.h
bfmla za.h[w8, 0, vgx4], {z31.h - z2.h}, z0.h
bfmla za.h[w8, 0, vgx4], {z0.h - z3.h}, z15.h
bfmla za.h[w8, 3], {z0.h - z3.h}, z15.h
/* BFMLA (multiple vectors). */
bfmla za.h[w8, 0, vgx2], {z0.h - z1.h}, {z0.h - z1.h}
bfmla za.h[w11, 0, vgx2], {z0.h - z1.h}, {z0.h - z1.h}
bfmla za.h[w8, 7, vgx2], {z0.h - z1.h}, {z0.h - z1.h}
bfmla za.h[w8, 0, vgx2], {z30.h - z31.h}, {z0.h - z1.h}
bfmla za.h[w8, 0, vgx2], {z0.h - z1.h}, {z30.h - z31.h}
bfmla za.h[w8, 3], {z0.h - z1.h}, {z30.h - z31.h}
bfmla za.h[w8, 0, vgx4], {z0.h - z3.h}, {z0.h - z3.h}
bfmla za.h[w11, 0, vgx4], {z0.h - z3.h}, {z0.h - z3.h}
bfmla za.h[w8, 7, vgx4], {z0.h - z3.h}, {z0.h - z3.h}
bfmla za.h[w8, 0, vgx4], {z28.h - z31.h}, {z0.h - z3.h}
bfmla za.h[w8, 0, vgx4], {z0.h - z3.h}, {z28.h - z31.h}
bfmla za.h[w8, 3], {z0.h - z3.h}, {z28.h - z31.h}
/* BFMLS (multiple and indexed vector). */
bfmls za.h[w8, 0, vgx2], {z0.h - z1.h}, z0.h[0]
bfmls za.h[w11, 0, vgx2], {z0.h - z1.h}, z0.h[0]
bfmls za.h[w8, 7, vgx2], {z0.h - z1.h}, z0.h[0]
bfmls za.h[w8, 0, vgx2], {z30.h - z31.h}, z0.h[0]
bfmls za.h[w8, 0, vgx2], {z0.h - z1.h}, z15.h[0]
bfmls za.h[w8, 0, vgx2], {z0.h - z1.h}, z0.h[7]
bfmls za.h[w8, 0, vgx2], {z0.h - z1.h}, z0.h[3]
bfmls za.h[w8, 3], {z0.h - z1.h}, z0.h[7]
bfmls za.h[w8, 0, vgx4], {z0.h - z3.h}, z0.h[0]
bfmls za.h[w11, 0, vgx4], {z0.h - z3.h}, z0.h[0]
bfmls za.h[w8, 7, vgx4], {z0.h - z3.h}, z0.h[0]
bfmls za.h[w8, 0, vgx4], {z28.h - z31.h}, z0.h[0]
bfmls za.h[w8, 0, vgx4], {z0.h - z3.h}, z15.h[0]
bfmls za.h[w8, 0, vgx4], {z0.h - z3.h}, z0.h[7]
bfmls za.h[w8, 0, vgx4], {z0.h - z3.h}, z0.h[3]
bfmls za.h[w8, 3], {z0.h - z3.h}, z0.h[7]
/* BFMLS (multiple and single vector). */
bfmls za.h[w8, 0, vgx2], {z0.h - z1.h}, z0.h
bfmls za.h[w11, 0, vgx2], {z0.h - z1.h}, z0.h
bfmls za.h[w8, 7, vgx2], {z0.h - z1.h}, z0.h
bfmls za.h[w8, 0, vgx2], {z31.h - z0.h}, z0.h
bfmls za.h[w8, 0, vgx2], {z0.h - z1.h}, z15.h
bfmls za.h[w8, 3], {z0.h - z1.h}, z15.h
bfmls za.h[w8, 0, vgx4], {z0.h - z3.h}, z0.h
bfmls za.h[w11, 0, vgx4], {z0.h - z3.h}, z0.h
bfmls za.h[w8, 7, vgx4], {z0.h - z3.h}, z0.h
bfmls za.h[w8, 0, vgx4], {z31.h - z2.h}, z0.h
bfmls za.h[w8, 0, vgx4], {z0.h - z3.h}, z15.h
bfmls za.h[w8, 3], {z0.h - z3.h}, z15.h
/* BFMLS (multiple vectors). */
bfmls za.h[w8, 0, vgx2], {z0.h - z1.h}, {z0.h - z1.h}
bfmls za.h[w11, 0, vgx2], {z0.h - z1.h}, {z0.h - z1.h}
bfmls za.h[w8, 7, vgx2], {z0.h - z1.h}, {z0.h - z1.h}
bfmls za.h[w8, 0, vgx2], {z30.h - z31.h}, {z0.h - z1.h}
bfmls za.h[w8, 0, vgx2], {z0.h - z1.h}, {z30.h - z31.h}
bfmls za.h[w8, 3], {z0.h - z1.h}, {z30.h - z31.h}
bfmls za.h[w8, 0, vgx4], {z0.h - z3.h}, {z0.h - z3.h}
bfmls za.h[w11, 0, vgx4], {z0.h - z3.h}, {z0.h - z3.h}
bfmls za.h[w8, 7, vgx4], {z0.h - z3.h}, {z0.h - z3.h}
bfmls za.h[w8, 0, vgx4], {z28.h - z31.h}, {z0.h - z3.h}
bfmls za.h[w8, 0, vgx4], {z0.h - z3.h}, {z28.h - z31.h}
bfmls za.h[w8, 3], {z0.h - z3.h}, {z28.h - z31.h}
/* BFMOPA. */
bfmopa ZA0.h, p0/m, p0/m, z0.h, z0.h
bfmopa ZA1.h, p0/m, p0/m, z0.h, z0.h
bfmopa ZA0.h, p7/m, p0/m, z0.h, z0.h
bfmopa ZA0.h, p0/m, p7/m, z0.h, z0.h
bfmopa ZA0.h, p0/m, p0/m, z31.h, z0.h
bfmopa ZA0.h, p0/m, p0/m, z0.h, z31.h
bfmopa ZA0.h, p3/m, p5/m, z10.h, z15.h
bfmopa ZA1.h, p1/m, p3/m, z15.h, z25.h
/* BFMOPS. */
bfmops ZA0.h, p0/m, p0/m, z0.h, z0.h
bfmops ZA1.h, p0/m, p0/m, z0.h, z0.h
bfmops ZA0.h, p7/m, p0/m, z0.h, z0.h
bfmops ZA0.h, p0/m, p7/m, z0.h, z0.h
bfmops ZA0.h, p0/m, p0/m, z31.h, z0.h
bfmops ZA0.h, p0/m, p0/m, z0.h, z31.h
bfmops ZA0.h, p3/m, p5/m, z10.h, z15.h
bfmops ZA1.h, p1/m, p3/m, z15.h, z25.h

View File

@@ -0,0 +1,3 @@
#name: Test of invalid SME2 non-widening BFloat16 instructions.
#as: -march=armv8-a+sme-b16b16
#error_output: sme-b16b16-bad-1.l

View File

@@ -0,0 +1,193 @@
.*: Assembler messages:
.*: Error: operand mismatch -- `bfadd za.s\[w8,0,vgx2\],{ ?z0.h-z1.h ?}'
.*: Info: did you mean this\?
.*: Info: bfadd za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}
.*: Error: too many registers in vector register list at operand 2 -- `bfadd za.h\[w13,0,vgx2\],{ ?z1.h-z0.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfadd za.h\[w8,11,vgx3\],{ ?z0.h-z1.h ?}'
.*: Error: too many registers in vector register list at operand 2 -- `bfadd za.h\[w8,0,vgx2\],{ ?z0.h-z4.h ?}'
.*: Error: operand mismatch -- `bfadd za.s\[w8,0,vgx4\],{ ?z0.h-z3.h ?}'
.*: Info: did you mean this\?
.*: Info: bfadd za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}
.*: Error: too many registers in vector register list at operand 2 -- `bfadd za.h\[w14,0,vgx4\],{ ?z10.h-z3.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfadd za.h\[w8,15,vgx1\],{ ?z3.h-z2.h ?}'
.*: Error: expected a list of 4 registers at operand 2 -- `bfadd za.h\[w8,0,vgx4\],{ ?z30.h-z31.h ?}'
.*: Error: operand mismatch -- `bfsub za.s\[w8,0,vgx2\],{ ?z0.h-z1.h ?}'
.*: Info: did you mean this\?
.*: Info: bfsub za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}
.*: Error: too many registers in vector register list at operand 2 -- `bfsub za.h\[w13,0,vgx2\],{ ?z1.h-z0.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfsub za.h\[w8,11,vgx3\],{ ?z0.h-z1.h ?}'
.*: Error: too many registers in vector register list at operand 2 -- `bfsub za.h\[w8,0,vgx2\],{ ?z0.h-z4.h ?}'
.*: Error: operand mismatch -- `bfsub za.s\[w8,0,vgx4\],{ ?z0.h-z3.h ?}'
.*: Info: did you mean this\?
.*: Info: bfsub za.h\[w8, 0, vgx4\], { ?z0.h-z3.h ?}
.*: Error: too many registers in vector register list at operand 2 -- `bfsub za.h\[w14,0,vgx4\],{ ?z10.h-z3.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfsub za.h\[w8,15,vgx1\],{ ?z3.h-z2.h ?}'
.*: Error: expected a list of 4 registers at operand 2 -- `bfsub za.h\[w8,0,vgx4\],{ ?z30.h-z31.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.s\[w8,0,vgx3\],{ ?z0.h-z1.h ?},z0.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w14,0,vgx3\],{ ?z10.h-z1.h ?},z0.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w8,15,vgx3\],{ ?z0.h-z1.h ?},z0.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.d\[w8,0,vgx3\],{ ?z30.h-z31.h ?},z0.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w8,0,vgx3\],{ ?z0.h-z1.h ?},z15.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w8,0,vgx3\],{ ?z0.h-z1.h ?},z0.h\[7\]'
.*: Error: expected a list of 2 registers at operand 2 -- `bfmla za.h\[w8,0,vgx2\],{ ?z0.h ?},z0.h\[7\]'
.*: Error: expected a list of 2 registers at operand 2 -- `bfmla za.h\[w8,0,vgx2\],{ ?z0.h ?},z0.h'
.*: Error: missing type suffix at operand 2 -- `bfmla za.h\[w8,0,vgx2\],{ ?z0-z1},z0.h\[7\]'
.*: Error: missing type suffix at operand 2 -- `bfmla za.h\[w8,0,vgx2\],{ ?z0-z1}'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.b\[w8,0,vgx1\],{ ?z0.h-z1.h ?},z0.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w14,0,vgx1\],{ ?z10.h-z1.h ?},z0.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w8,15,vgx1\],{ ?z0.h-z1.h ?},z0.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w8,0,vgx1\],{ ?z30.h-z31.h ?},z0.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.s\[w8,0,vgx1\],{ ?z0.h-z1.h ?},z15.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w8,0,vgx1\],{ ?z0.h-z1.h ?},z0.h\[7\]'
.*: Error: expected a list of 4 registers at operand 2 -- `bfmla za.h\[w8,0,vgx4\],{ ?z0.h ?},z0.h\[7\]'
.*: Error: expected a list of 4 registers at operand 2 -- `bfmla za.h\[w8,0,vgx4\],{ ?z0.h ?},z0.h'
.*: Error: missing type suffix at operand 2 -- `bfmla za.h\[w8,0,vgx4\],{ ?z0-z1},z0.h\[7\]'
.*: Error: missing type suffix at operand 2 -- `bfmla za.h\[w8,0,vgx4\],{ ?z0-z1}'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.s\[w8,0,vgx3\],{ ?z0.h-z1.h ?},z0.h'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w14,0,vgx3\],{ ?z10.h-z1.h ?},z0.h'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w8,15,vgx3\],{ ?z0.h-z1.h ?},z0.h'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.d\[w8,0,vgx3\],{ ?z31.h-z0.h ?},z0.h'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w8,0,vgx3\],{ ?z0.h-z1.h ?},z15.h'
.*: Error: expected a list of 2 registers at operand 2 -- `bfmla za.h\[w8,0,vgx2\],{ ?z0.h ?},z15.h'
.*: Error: operand mismatch -- `bfmla za.h\[w8,0,vgx2\],{ ?z0.h-z1.h ?},z15'
.*: Info: did you mean this\?
.*: Info: bfmla za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, z15.h
.*: Error: operand mismatch -- `bfmla za.h\[w8,0,vgx2\],{ ?z0.h-z1.h ?},z20'
.*: Info: did you mean this\?
.*: Info: bfmla za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, z20.h
.*: Error: comma expected between operands at operand 3 -- `bfmla za.h\[w8,0,vgx2\],{ ?z0.h-z1.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w8,0,vgx1\],{ ?z0.h-z1.h ?},z0.h'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.s\[w14,0,vgx1\],{ ?z10.h-z1.h ?},z0.h'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w8,15,vgx1\],{ ?z0.h-z1.h ?},z0.h'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w8,0,vgx1\],{ ?z31.h-z2.h ?},z0.h'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.b\[w8,0,vgx1\],{ ?z0.h-z1.h ?},z15.h'
.*: Error: expected a list of 4 registers at operand 2 -- `bfmla za.h\[w8,0,vgx4\],{ ?z0.h ?},z15.h'
.*: Error: operand mismatch -- `bfmla za.h\[w8,0,vgx4\],{ ?z0.h-z1.h ?},z15'
.*: Info: did you mean this\?
.*: Info: bfmla za.h\[w8, 0, vgx4\], { ?z0.h-z1.h ?}, z15.h
.*: Error: operand mismatch -- `bfmla za.h\[w8,0,vgx4\],{ ?z0.h-z1.h ?},z20'
.*: Info: did you mean this\?
.*: Info: bfmla za.h\[w8, 0, vgx4\], { ?z0.h-z1.h ?}, z20.h
.*: Error: comma expected between operands at operand 3 -- `bfmla za.h\[w8,0,vgx4\],{ ?z0.h-z1.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.s\[w8,0,vgx3\],{ ?z0.h-z1.h ?},{ ?z0.h-z1.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w14,0,vgx3\],{ ?z10.h-z1.h ?},{ ?z0.h-z1.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.d\[w8,15,vgx3\],{ ?z0.h-z1.h ?},{ ?z0.h-z1.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w8,0,vgx3\],{ ?z30.h-z31.h ?},{ ?z0.h-z1.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.b\[w8,0,vgx3\],{ ?z0.h-z1.h ?},{ ?z30.h-z31.h ?}'
.*: Error: expected a list of 2 registers at operand 2 -- `bfmla za.h\[w8,0,vgx2\],{ ?z0.h ?},{ ?z30.h-z31.h ?}'
.*: Error: expected a list of 2 registers at operand 3 -- `bfmla za.h\[w8,0,vgx2\],{ ?z0.h-z1.h ?},{ ?z30.h ?}'
.*: Error: expected a list of 2 registers at operand 2 -- `bfmla za.h\[w8,0,vgx2\],{ ?z0.h ?},{ ?z30.h ?}'
.*: Error: expected a list of 2 registers at operand 2 -- `bfmla za.h\[w8,0,vgx2\],{ ?z0.h ?},{ ?z30.h ?}'
.*: Error: operand mismatch -- `bfmla za.b\[w8,20,vgx2\],{ ?z0.h ?},{ ?z30.h ?}'
.*: Info: did you mean this\?
.*: Info: bfmla za.h\[w8, 20, vgx2\], { ?z0.h ?}, { ?z30.h ?}
.*: Error: invalid vector group size at operand 1 -- `bfmla za.s\[w8,0,vgx1\],{ ?z0.h-z1.h ?},{ ?z0.h-z3.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w14,0,vgx1\],{ ?z10.h-z1.h ?},{ ?z0.h-z3.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.s\[w8,15,vgx1\],{ ?z0.h-z1.h ?},{ ?z0.h-z3.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.h\[w8,0,vgx1\],{ ?z30.h-z31.h ?},{ ?z0.h-z1.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmla za.b\[w8,0,vgx1\],{ ?z0.h-z1.h ?},{ ?z30.h-z31.h ?}'
.*: Error: expected a list of 4 registers at operand 2 -- `bfmla za.h\[w8,0,vgx4\],{ ?z0.h ?},{ ?z30.h-z31.h ?}'
.*: Error: expected a list of 4 registers at operand 2 -- `bfmla za.h\[w8,0,vgx4\],{ ?z0.h-z1.h ?},{ ?z30.h ?}'
.*: Error: expected a list of 4 registers at operand 2 -- `bfmla za.h\[w8,0,vgx4\],{ ?z0.h ?},{ ?z30.h ?}'
.*: Error: expected a list of 4 registers at operand 2 -- `bfmla za.h\[w8,0,vgx4\],{ ?z0.h ?},{ ?z30.h ?}'
.*: Error: operand mismatch -- `bfmla za.b\[w8,20,vgx4\],{ ?z0.h ?},{ ?z30.h ?}'
.*: Info: did you mean this\?
.*: Info: bfmla za.h\[w8, 20, vgx4\], { ?z0.h ?}, { ?z30.h ?}
.*: Error: invalid vector group size at operand 1 -- `bfmls za.s\[w8,0,vgx3\],{ ?z0.h-z1.h ?},z0.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w14,0,vgx3\],{ ?z10.h-z1.h ?},z0.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w8,15,vgx3\],{ ?z0.h-z1.h ?},z0.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.d\[w8,0,vgx3\],{ ?z30.h-z31.h ?},z0.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w8,0,vgx3\],{ ?z0.h-z1.h ?},z15.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w8,0,vgx3\],{ ?z0.h-z1.h ?},z0.h\[7\]'
.*: Error: expected a list of 2 registers at operand 2 -- `bfmls za.h\[w8,0,vgx2\],{ ?z0.h ?},z0.h\[7\]'
.*: Error: expected a list of 2 registers at operand 2 -- `bfmls za.h\[w8,0,vgx2\],{ ?z0.h ?},z0.h'
.*: Error: missing type suffix at operand 2 -- `bfmls za.h\[w8,0,vgx2\],{ ?z0-z1},z0.h\[7\]'
.*: Error: missing type suffix at operand 2 -- `bfmls za.h\[w8,0,vgx2\],{ ?z0-z1}'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.b\[w8,0,vgx1\],{ ?z0.h-z1.h ?},z0.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w14,0,vgx1\],{ ?z10.h-z1.h ?},z0.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w8,15,vgx1\],{ ?z0.h-z1.h ?},z0.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w8,0,vgx1\],{ ?z30.h-z31.h ?},z0.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.s\[w8,0,vgx1\],{ ?z0.h-z1.h ?},z15.h\[0\]'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w8,0,vgx1\],{ ?z0.h-z1.h ?},z0.h\[7\]'
.*: Error: expected a list of 4 registers at operand 2 -- `bfmls za.h\[w8,0,vgx4\],{ ?z0.h ?},z0.h\[7\]'
.*: Error: expected a list of 4 registers at operand 2 -- `bfmls za.h\[w8,0,vgx4\],{ ?z0.h ?},z0.h'
.*: Error: missing type suffix at operand 2 -- `bfmls za.h\[w8,0,vgx4\],{ ?z0-z1},z0.h\[7\]'
.*: Error: missing type suffix at operand 2 -- `bfmls za.h\[w8,0,vgx4\],{ ?z0-z1}'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.s\[w8,0,vgx3\],{ ?z0.h-z1.h ?},z0.h'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w14,0,vgx3\],{ ?z10.h-z1.h ?},z0.h'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w8,15,vgx3\],{ ?z0.h-z1.h ?},z0.h'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.d\[w8,0,vgx3\],{ ?z31.h-z0.h ?},z0.h'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w8,0,vgx3\],{ ?z0.h-z1.h ?},z15.h'
.*: Error: expected a list of 2 registers at operand 2 -- `bfmls za.h\[w8,0,vgx2\],{ ?z0.h ?},z15.h'
.*: Error: operand mismatch -- `bfmls za.h\[w8,0,vgx2\],{ ?z0.h-z1.h ?},z15'
.*: Info: did you mean this\?
.*: Info: bfmls za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, z15.h
.*: Error: operand mismatch -- `bfmls za.h\[w8,0,vgx2\],{ ?z0.h-z1.h ?},z20'
.*: Info: did you mean this\?
.*: Info: bfmls za.h\[w8, 0, vgx2\], { ?z0.h-z1.h ?}, z20.h
.*: Error: comma expected between operands at operand 3 -- `bfmls za.h\[w8,0,vgx2\],{ ?z0.h-z1.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w8,0,vgx1\],{ ?z0.h-z1.h ?},z0.h'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.s\[w14,0,vgx1\],{ ?z10.h-z1.h ?},z0.h'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w8,15,vgx1\],{ ?z0.h-z1.h ?},z0.h'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w8,0,vgx1\],{ ?z31.h-z2.h ?},z0.h'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.b\[w8,0,vgx1\],{ ?z0.h-z1.h ?},z15.h'
.*: Error: expected a list of 4 registers at operand 2 -- `bfmls za.h\[w8,0,vgx4\],{ ?z0.h ?},z15.h'
.*: Error: operand mismatch -- `bfmls za.h\[w8,0,vgx4\],{ ?z0.h-z1.h ?},z15'
.*: Info: did you mean this\?
.*: Info: bfmls za.h\[w8, 0, vgx4\], { ?z0.h-z1.h ?}, z15.h
.*: Error: operand mismatch -- `bfmls za.h\[w8,0,vgx4\],{ ?z0.h-z1.h ?},z20'
.*: Info: did you mean this\?
.*: Info: bfmls za.h\[w8, 0, vgx4\], { ?z0.h-z1.h ?}, z20.h
.*: Error: comma expected between operands at operand 3 -- `bfmls za.h\[w8,0,vgx4\],{ ?z0.h-z1.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.s\[w8,0,vgx3\],{ ?z0.h-z1.h ?},{ ?z0.h-z1.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w14,0,vgx3\],{ ?z10.h-z1.h ?},{ ?z0.h-z1.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.d\[w8,15,vgx3\],{ ?z0.h-z1.h ?},{ ?z0.h-z1.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w8,0,vgx3\],{ ?z30.h-z31.h ?},{ ?z0.h-z1.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.b\[w8,0,vgx3\],{ ?z0.h-z1.h ?},{ ?z30.h-z31.h ?}'
.*: Error: expected a list of 2 registers at operand 2 -- `bfmls za.h\[w8,0,vgx2\],{ ?z0.h ?},{ ?z30.h-z31.h ?}'
.*: Error: expected a list of 2 registers at operand 3 -- `bfmls za.h\[w8,0,vgx2\],{ ?z0.h-z1.h ?},{ ?z30.h ?}'
.*: Error: expected a list of 2 registers at operand 2 -- `bfmls za.h\[w8,0,vgx2\],{ ?z0.h ?},{ ?z30.h ?}'
.*: Error: expected a list of 2 registers at operand 2 -- `bfmls za.h\[w8,0,vgx2\],{ ?z0.h ?},{ ?z30.h ?}'
.*: Error: operand mismatch -- `bfmls za.b\[w8,20,vgx2\],{ ?z0.h ?},{ ?z30.h ?}'
.*: Info: did you mean this\?
.*: Info: bfmls za.h\[w8, 20, vgx2\], { ?z0.h ?}, { ?z30.h ?}
.*: Error: invalid vector group size at operand 1 -- `bfmls za.s\[w8,0,vgx1\],{ ?z0.h-z1.h ?},{ ?z0.h-z3.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w14,0,vgx1\],{ ?z10.h-z1.h ?},{ ?z0.h-z3.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.s\[w8,15,vgx1\],{ ?z0.h-z1.h ?},{ ?z0.h-z3.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.h\[w8,0,vgx1\],{ ?z30.h-z31.h ?},{ ?z0.h-z1.h ?}'
.*: Error: invalid vector group size at operand 1 -- `bfmls za.b\[w8,0,vgx1\],{ ?z0.h-z1.h ?},{ ?z30.h-z31.h ?}'
.*: Error: expected a list of 4 registers at operand 2 -- `bfmls za.h\[w8,0,vgx4\],{ ?z0.h ?},{ ?z30.h-z31.h ?}'
.*: Error: expected a list of 4 registers at operand 2 -- `bfmls za.h\[w8,0,vgx4\],{ ?z0.h-z1.h ?},{ ?z30.h ?}'
.*: Error: expected a list of 4 registers at operand 2 -- `bfmls za.h\[w8,0,vgx4\],{ ?z0.h ?},{ ?z30.h ?}'
.*: Error: expected a list of 4 registers at operand 2 -- `bfmls za.h\[w8,0,vgx4\],{ ?z0.h ?},{ ?z30.h ?}'
.*: Error: operand mismatch -- `bfmls za.b\[w8,20,vgx4\],{ ?z0.h ?},{ ?z30.h ?}'
.*: Info: did you mean this\?
.*: Info: bfmls za.h\[w8, 20, vgx4\], { ?z0.h ?}, { ?z30.h ?}
.*: Error: operand mismatch -- `bfmopa ZA1.h,p0,p0/m,z0.h,z0.h'
.*: Info: did you mean this\?
.*: Info: bfmopa za1.h, p0/m, p0/m, z0.h, z0.h
.*: Error: operand mismatch -- `bfmopa ZA0.h,p7/m,p0,z0.h,z0.h'
.*: Info: did you mean this\?
.*: Info: bfmopa za0.h, p7/m, p0/m, z0.h, z0.h
.*: Error: operand mismatch -- `bfmopa ZA0.h,p0/m,p7/m,z0.s,z0.s'
.*: Info: did you mean this\?
.*: Info: bfmopa za0.h, p0/m, p7/m, z0.h, z0.h
.*: Error: operand mismatch -- `bfmopa ZA0.h,p0/m,p0/m,z31.d,z0.d'
.*: Info: did you mean this\?
.*: Info: bfmopa za0.h, p0/m, p0/m, z31.h, z0.h
.*: Error: ZA tile number out of range at operand 1 -- `bfmopa ZA2.h,p0/m,p8/m,z0.s,z31.b'
.*: Error: ZA tile number out of range at operand 1 -- `bfmopa ZA4.h,p15/m,p11/m,z0.s,z31.b'
.*: Error: operand mismatch -- `bfmops ZA1.h,p0,p0/m,z0.h,z0.h'
.*: Info: did you mean this\?
.*: Info: bfmops za1.h, p0/m, p0/m, z0.h, z0.h
.*: Error: operand mismatch -- `bfmops ZA0.h,p7/m,p0,z0.h,z0.h'
.*: Info: did you mean this\?
.*: Info: bfmops za0.h, p7/m, p0/m, z0.h, z0.h
.*: Error: operand mismatch -- `bfmops ZA0.h,p0/m,p7/m,z0.s,z0.s'
.*: Info: did you mean this\?
.*: Info: bfmops za0.h, p0/m, p7/m, z0.h, z0.h
.*: Error: operand mismatch -- `bfmops ZA0.h,p0/m,p0/m,z31.d,z0.d'
.*: Info: did you mean this\?
.*: Info: bfmops za0.h, p0/m, p0/m, z31.h, z0.h
.*: Error: ZA tile number out of range at operand 1 -- `bfmops ZA2.h,p0/m,p8/m,z0.s,z31.b'
.*: Error: ZA tile number out of range at operand 1 -- `bfmops ZA4.h,p15/m,p11/m,z0.s,z31.b'

View File

@@ -0,0 +1,173 @@
/* BFADD. */
bfadd za.s[w8, 0, vgx2], {z0.h - z1.h}
bfadd za.h[w13, 0, vgx2], {z1.h - z0.h}
bfadd za.h[w8, 11, vgx3], {z0.h - z1.h}
bfadd za.h[w8, 0, vgx2], {z0.h - z4.h}
bfadd za.s[w8, 0, vgx4], {z0.h - z3.h}
bfadd za.h[w14, 0, vgx4], {z10.h - z3.h}
bfadd za.h[w8, 15, vgx1], {z3.h - z2.h}
bfadd za.h[w8, 0, vgx4], {z30.h - z31.h}
/* BFSUB. */
bfsub za.s[w8, 0, vgx2], {z0.h - z1.h}
bfsub za.h[w13, 0, vgx2], {z1.h - z0.h}
bfsub za.h[w8, 11, vgx3], {z0.h - z1.h}
bfsub za.h[w8, 0, vgx2], {z0.h - z4.h}
bfsub za.s[w8, 0, vgx4], {z0.h - z3.h}
bfsub za.h[w14, 0, vgx4], {z10.h - z3.h}
bfsub za.h[w8, 15, vgx1], {z3.h - z2.h}
bfsub za.h[w8, 0, vgx4], {z30.h - z31.h}
/* BFMLA (multiple and indexed vector). */
bfmla za.s[w8, 0, vgx3], {z0.h - z1.h}, z0.h[0]
bfmla za.h[w14, 0, vgx3], {z10.h - z1.h}, z0.h[0]
bfmla za.h[w8, 15, vgx3], {z0.h - z1.h}, z0.h[0]
bfmla za.d[w8, 0, vgx3], {z30.h - z31.h}, z0.h[0]
bfmla za.h[w8, 0, vgx3], {z0.h - z1.h}, z15.h[0]
bfmla za.h[w8, 0, vgx3], {z0.h - z1.h}, z0.h[7]
bfmla za.h[w8, 0, vgx2], {z0.h}, z0.h[7]
bfmla za.h[w8, 0, vgx2], {z0.h}, z0.h
bfmla za.h[w8, 0, vgx2], {z0 - z1}, z0.h[7]
bfmla za.h[w8, 0, vgx2], {z0 - z1}
bfmla za.b[w8, 0, vgx1], {z0.h - z1.h}, z0.h[0]
bfmla za.h[w14, 0, vgx1], {z10.h - z1.h}, z0.h[0]
bfmla za.h[w8, 15, vgx1], {z0.h - z1.h}, z0.h[0]
bfmla za.h[w8, 0, vgx1], {z30.h - z31.h}, z0.h[0]
bfmla za.s[w8, 0, vgx1], {z0.h - z1.h}, z15.h[0]
bfmla za.h[w8, 0, vgx1], {z0.h - z1.h}, z0.h[7]
bfmla za.h[w8, 0, vgx4], {z0.h}, z0.h[7]
bfmla za.h[w8, 0, vgx4], {z0.h}, z0.h
bfmla za.h[w8, 0, vgx4], {z0 - z1}, z0.h[7]
bfmla za.h[w8, 0, vgx4], {z0 - z1}
/* BFMLA (multiple and single vector). */
bfmla za.s[w8, 0, vgx3], {z0.h - z1.h}, z0.h
bfmla za.h[w14, 0, vgx3], {z10.h - z1.h}, z0.h
bfmla za.h[w8, 15, vgx3], {z0.h - z1.h}, z0.h
bfmla za.d[w8, 0, vgx3], {z31.h - z0.h}, z0.h
bfmla za.h[w8, 0, vgx3], {z0.h - z1.h}, z15.h
bfmla za.h[w8, 0, vgx2], {z0.h}, z15.h
bfmla za.h[w8, 0, vgx2], {z0.h -z1.h}, z15
bfmla za.h[w8, 0, vgx2], {z0.h -z1.h}, z20
bfmla za.h[w8, 0, vgx2], {z0.h -z1.h}
bfmla za.h[w8, 0, vgx1], {z0.h - z1.h}, z0.h
bfmla za.s[w14, 0, vgx1], {z10.h - z1.h}, z0.h
bfmla za.h[w8, 15, vgx1], {z0.h - z1.h}, z0.h
bfmla za.h[w8, 0, vgx1], {z31.h - z2.h}, z0.h
bfmla za.b[w8, 0, vgx1], {z0.h - z1.h}, z15.h
bfmla za.h[w8, 0, vgx4], {z0.h}, z15.h
bfmla za.h[w8, 0, vgx4], {z0.h -z1.h}, z15
bfmla za.h[w8, 0, vgx4], {z0.h -z1.h}, z20
bfmla za.h[w8, 0, vgx4], {z0.h -z1.h}
/* BFMLA (multiple vectors). */
bfmla za.s[w8, 0, vgx3], {z0.h - z1.h}, {z0.h - z1.h}
bfmla za.h[w14, 0, vgx3], {z10.h - z1.h}, {z0.h - z1.h}
bfmla za.d[w8, 15, vgx3], {z0.h - z1.h}, {z0.h - z1.h}
bfmla za.h[w8, 0, vgx3], {z30.h - z31.h}, {z0.h - z1.h}
bfmla za.b[w8, 0, vgx3], {z0.h - z1.h}, {z30.h - z31.h}
bfmla za.h[w8, 0, vgx2], {z0.h}, {z30.h - z31.h}
bfmla za.h[w8, 0, vgx2], {z0.h - z1.h}, {z30.h}
bfmla za.h[w8, 0, vgx2], {z0.h}, {z30.h}
bfmla za.h[w8, 0, vgx2], {z0.h}, {z30.h}
bfmla za.b[w8, 20, vgx2], {z0.h}, {z30.h}
bfmla za.s[w8, 0, vgx1], {z0.h - z1.h}, {z0.h - z3.h}
bfmla za.h[w14, 0, vgx1], {z10.h - z1.h}, {z0.h - z3.h}
bfmla za.s[w8, 15, vgx1], {z0.h - z1.h}, {z0.h - z3.h}
bfmla za.h[w8, 0, vgx1], {z30.h - z31.h}, {z0.h - z1.h}
bfmla za.b[w8, 0, vgx1], {z0.h - z1.h}, {z30.h - z31.h}
bfmla za.h[w8, 0, vgx4], {z0.h}, {z30.h - z31.h}
bfmla za.h[w8, 0, vgx4], {z0.h - z1.h}, {z30.h}
bfmla za.h[w8, 0, vgx4], {z0.h}, {z30.h}
bfmla za.h[w8, 0, vgx4], {z0.h}, {z30.h}
bfmla za.b[w8, 20, vgx4], {z0.h}, {z30.h}
/* BFMLS (multiple and indexed vector). */
bfmls za.s[w8, 0, vgx3], {z0.h - z1.h}, z0.h[0]
bfmls za.h[w14, 0, vgx3], {z10.h - z1.h}, z0.h[0]
bfmls za.h[w8, 15, vgx3], {z0.h - z1.h}, z0.h[0]
bfmls za.d[w8, 0, vgx3], {z30.h - z31.h}, z0.h[0]
bfmls za.h[w8, 0, vgx3], {z0.h - z1.h}, z15.h[0]
bfmls za.h[w8, 0, vgx3], {z0.h - z1.h}, z0.h[7]
bfmls za.h[w8, 0, vgx2], {z0.h}, z0.h[7]
bfmls za.h[w8, 0, vgx2], {z0.h}, z0.h
bfmls za.h[w8, 0, vgx2], {z0 - z1}, z0.h[7]
bfmls za.h[w8, 0, vgx2], {z0 - z1}
bfmls za.b[w8, 0, vgx1], {z0.h - z1.h}, z0.h[0]
bfmls za.h[w14, 0, vgx1], {z10.h - z1.h}, z0.h[0]
bfmls za.h[w8, 15, vgx1], {z0.h - z1.h}, z0.h[0]
bfmls za.h[w8, 0, vgx1], {z30.h - z31.h}, z0.h[0]
bfmls za.s[w8, 0, vgx1], {z0.h - z1.h}, z15.h[0]
bfmls za.h[w8, 0, vgx1], {z0.h - z1.h}, z0.h[7]
bfmls za.h[w8, 0, vgx4], {z0.h}, z0.h[7]
bfmls za.h[w8, 0, vgx4], {z0.h}, z0.h
bfmls za.h[w8, 0, vgx4], {z0 - z1}, z0.h[7]
bfmls za.h[w8, 0, vgx4], {z0 - z1}
/* BFMLS (multiple and single vector). */
bfmls za.s[w8, 0, vgx3], {z0.h - z1.h}, z0.h
bfmls za.h[w14, 0, vgx3], {z10.h - z1.h}, z0.h
bfmls za.h[w8, 15, vgx3], {z0.h - z1.h}, z0.h
bfmls za.d[w8, 0, vgx3], {z31.h - z0.h}, z0.h
bfmls za.h[w8, 0, vgx3], {z0.h - z1.h}, z15.h
bfmls za.h[w8, 0, vgx2], {z0.h}, z15.h
bfmls za.h[w8, 0, vgx2], {z0.h -z1.h}, z15
bfmls za.h[w8, 0, vgx2], {z0.h -z1.h}, z20
bfmls za.h[w8, 0, vgx2], {z0.h -z1.h}
bfmls za.h[w8, 0, vgx1], {z0.h - z1.h}, z0.h
bfmls za.s[w14, 0, vgx1], {z10.h - z1.h}, z0.h
bfmls za.h[w8, 15, vgx1], {z0.h - z1.h}, z0.h
bfmls za.h[w8, 0, vgx1], {z31.h - z2.h}, z0.h
bfmls za.b[w8, 0, vgx1], {z0.h - z1.h}, z15.h
bfmls za.h[w8, 0, vgx4], {z0.h}, z15.h
bfmls za.h[w8, 0, vgx4], {z0.h -z1.h}, z15
bfmls za.h[w8, 0, vgx4], {z0.h -z1.h}, z20
bfmls za.h[w8, 0, vgx4], {z0.h -z1.h}
/* BFMLS (multiple vectors). */
bfmls za.s[w8, 0, vgx3], {z0.h - z1.h}, {z0.h - z1.h}
bfmls za.h[w14, 0, vgx3], {z10.h - z1.h}, {z0.h - z1.h}
bfmls za.d[w8, 15, vgx3], {z0.h - z1.h}, {z0.h - z1.h}
bfmls za.h[w8, 0, vgx3], {z30.h - z31.h}, {z0.h - z1.h}
bfmls za.b[w8, 0, vgx3], {z0.h - z1.h}, {z30.h - z31.h}
bfmls za.h[w8, 0, vgx2], {z0.h}, {z30.h - z31.h}
bfmls za.h[w8, 0, vgx2], {z0.h - z1.h}, {z30.h}
bfmls za.h[w8, 0, vgx2], {z0.h}, {z30.h}
bfmls za.h[w8, 0, vgx2], {z0.h}, {z30.h}
bfmls za.b[w8, 20, vgx2], {z0.h}, {z30.h}
bfmls za.s[w8, 0, vgx1], {z0.h - z1.h}, {z0.h - z3.h}
bfmls za.h[w14, 0, vgx1], {z10.h - z1.h}, {z0.h - z3.h}
bfmls za.s[w8, 15, vgx1], {z0.h - z1.h}, {z0.h - z3.h}
bfmls za.h[w8, 0, vgx1], {z30.h - z31.h}, {z0.h - z1.h}
bfmls za.b[w8, 0, vgx1], {z0.h - z1.h}, {z30.h - z31.h}
bfmls za.h[w8, 0, vgx4], {z0.h}, {z30.h - z31.h}
bfmls za.h[w8, 0, vgx4], {z0.h - z1.h}, {z30.h}
bfmls za.h[w8, 0, vgx4], {z0.h}, {z30.h}
bfmls za.h[w8, 0, vgx4], {z0.h}, {z30.h}
bfmls za.b[w8, 20, vgx4], {z0.h}, {z30.h}
/* BFMOPA. */
bfmopa ZA0.s, p0/m, p0/m, z0.h, z0.h
bfmopa ZA1.h, p0, p0/m, z0.h, z0.h
bfmopa ZA0.h, p7/m, p0, z0.h, z0.h
bfmopa ZA0.h, p0/m, p7/m, z0.s, z0.s
bfmopa ZA0.h, p0/m, p0/m, z31.d, z0.d
bfmopa ZA2.h, p0/m, p8/m, z0.s, z31.b
bfmopa ZA4.h, p15/m, p11/m, z0.s, z31.b
/* BFMOPS. */
bfmops ZA0.s, p0/m, p0/m, z0.h, z0.h
bfmops ZA1.h, p0, p0/m, z0.h, z0.h
bfmops ZA0.h, p7/m, p0, z0.h, z0.h
bfmops ZA0.h, p0/m, p7/m, z0.s, z0.s
bfmops ZA0.h, p0/m, p0/m, z31.d, z0.d
bfmops ZA2.h, p0/m, p8/m, z0.s, z31.b
bfmops ZA4.h, p15/m, p11/m, z0.s, z31.b

View File

@@ -266,6 +266,8 @@ enum aarch64_feature_bit {
AARCH64_FEATURE_SME_F16F16,
/* SVE Z-targeting non-widening BFloat16 instructions. */
AARCH64_FEATURE_SVE_B16B16,
/* SME non-widening BFloat16 instructions. */
AARCH64_FEATURE_SME_B16B16,
/* Virtual features. These are used to gate instructions that are enabled
by either of two (or more) sets of command line flags. */

File diff suppressed because it is too large Load Diff

View File

@@ -2809,6 +2809,8 @@ static const aarch64_feature_set aarch64_feature_sve_b16b16_sve2 =
AARCH64_FEATURES (2, SVE_B16B16, SVE2);
static const aarch64_feature_set aarch64_feature_sve_b16b16_sme2 =
AARCH64_FEATURES (2, SVE_B16B16, SME2);
static const aarch64_feature_set aarch64_feature_sme_b16b16 =
AARCH64_FEATURES (2, SME_B16B16, SME2);
static const aarch64_feature_set aarch64_feature_sme2p1 =
AARCH64_FEATURE (SME2p1);
static const aarch64_feature_set aarch64_feature_sve2p1 =
@@ -2925,6 +2927,7 @@ static const aarch64_feature_set aarch64_feature_sme_f16f16 =
#define D128_THE &aarch64_feature_d128_the
#define B16B16_SVE2 &aarch64_feature_sve_b16b16_sve2
#define SVE_B16B16_SME &aarch64_feature_sve_b16b16_sme2
#define SME_B16B16 &aarch64_feature_sme_b16b16
#define SME2p1 &aarch64_feature_sme2p1
#define SVE2p1 &aarch64_feature_sve2p1
#define RCPC3 &aarch64_feature_rcpc3
@@ -3035,6 +3038,9 @@ static const aarch64_feature_set aarch64_feature_sme_f16f16 =
#define SVE_B16B16_SME_INSNC(NAME,OPCODE,MASK,CLASS,OP,OPS,QUALS,FLAGS,CONSTRAINTS,TIED) \
{ NAME, OPCODE, MASK, CLASS, OP, SVE_B16B16_SME, OPS, QUALS, \
FLAGS | F_STRICT, CONSTRAINTS, TIED, NULL }
#define SME_B16B16_INSN(NAME,OPCODE,MASK,CLASS,OP,OPS,QUALS,FLAGS,TIED) \
{ NAME, OPCODE, MASK, CLASS, OP, SME_B16B16, OPS, QUALS, \
FLAGS | F_STRICT, 0, TIED, NULL }
#define SVE2p1_INSN(NAME,OPCODE,MASK,CLASS,OP,OPS,QUALS,FLAGS,TIED) \
{ NAME, OPCODE, MASK, CLASS, OP, SVE2p1, OPS, QUALS, \
FLAGS | F_STRICT, 0, TIED, NULL }
@@ -6678,6 +6684,26 @@ const struct aarch64_opcode aarch64_opcode_table[] =
SVE_B16B16_SME_INSN("bfclamp", 0xc120c000, 0xffe0fc01, sme_misc, 0, OP3 (SME_Zdnx2, SVE_Zn, SVE_Zm_16), OP_SVE_HHH, 0, 0),
SVE_B16B16_SME_INSN("bfclamp", 0xc120c800, 0xffe0fc03, sme_misc, 0, OP3 (SME_Zdnx4, SVE_Zn, SVE_Zm_16), OP_SVE_HHH,0, 0),
/* SME ZA-targeting non-widening BFloat16 instructions. */
SME_B16B16_INSN("bfadd", 0xc1e41c00, 0xffff9c38, sme_misc, 0, OP2 (SME_ZA_array_off3_0, SME_Znx2), OP_SVE_HH, F_OD(2), 0),
SME_B16B16_INSN("bfadd", 0xc1e51c00, 0xffff9c78, sme_misc, 0, OP2 (SME_ZA_array_off3_0, SME_Znx4), OP_SVE_HH, F_OD(4), 0),
SME_B16B16_INSN("bfsub", 0xc1e41c08, 0xffff9c38, sme_misc, 0, OP2 (SME_ZA_array_off3_0, SME_Znx2), OP_SVE_HH, F_OD(2), 0),
SME_B16B16_INSN("bfsub", 0xc1e51c08, 0xffff9c78, sme_misc, 0, OP2 (SME_ZA_array_off3_0, SME_Znx4), OP_SVE_HH, F_OD(4), 0),
SME_B16B16_INSN("bfmla", 0xc1101020, 0xfff09030, sme_misc, 0, OP3 (SME_ZA_array_off3_0, SME_Znx2, SME_Zm_INDEX3_3), OP_SVE_HHH, F_OD(2), 0),
SME_B16B16_INSN("bfmla", 0xc1109020, 0xfff09070, sme_misc, 0, OP3 (SME_ZA_array_off3_0, SME_Znx4, SME_Zm_INDEX3_3), OP_SVE_HHH, F_OD(4), 0),
SME_B16B16_INSN("bfmla", 0xc1601c00, 0xfff09c18, sme_misc, 0, OP3 (SME_ZA_array_off3_0, SVE_ZnxN, SME_Zm), OP_SVE_HHH, F_OD(2), 0),
SME_B16B16_INSN("bfmla", 0xc1701c00, 0xfff09c18, sme_misc, 0, OP3 (SME_ZA_array_off3_0, SVE_ZnxN, SME_Zm), OP_SVE_HHH, F_OD(4), 0),
SME_B16B16_INSN("bfmla", 0xc1e01008, 0xffe19c38, sme_misc, 0, OP3 (SME_ZA_array_off3_0, SME_Znx2, SME_Zmx2), OP_SVE_HHH, F_OD(2), 0),
SME_B16B16_INSN("bfmla", 0xc1e11008, 0xffe39c78, sme_misc, 0, OP3 (SME_ZA_array_off3_0, SME_Znx4, SME_Zmx4), OP_SVE_HHH, F_OD(4), 0),
SME_B16B16_INSN("bfmls", 0xc1101030, 0xfff09030, sme_misc, 0, OP3 (SME_ZA_array_off3_0, SME_Znx2, SME_Zm_INDEX3_3), OP_SVE_HHH, F_OD(2), 0),
SME_B16B16_INSN("bfmls", 0xc1109030, 0xfff09070, sme_misc, 0, OP3 (SME_ZA_array_off3_0, SME_Znx4, SME_Zm_INDEX3_3), OP_SVE_HHH, F_OD(4), 0),
SME_B16B16_INSN("bfmls", 0xc1601c08, 0xfff09c18, sme_misc, 0, OP3 (SME_ZA_array_off3_0, SVE_ZnxN, SME_Zm), OP_SVE_HHH, F_OD(2), 0),
SME_B16B16_INSN("bfmls", 0xc1701c08, 0xfff09c18, sme_misc, 0, OP3 (SME_ZA_array_off3_0, SVE_ZnxN, SME_Zm), OP_SVE_HHH, F_OD(4), 0),
SME_B16B16_INSN("bfmls", 0xc1e01018, 0xffe19c38, sme_misc, 0, OP3 (SME_ZA_array_off3_0, SME_Znx2, SME_Zmx2), OP_SVE_HHH, F_OD(2), 0),
SME_B16B16_INSN("bfmls", 0xc1e11018, 0xffe39c78, sme_misc, 0, OP3 (SME_ZA_array_off3_0, SME_Znx4, SME_Zmx4), OP_SVE_HHH, F_OD(4), 0),
SME_B16B16_INSN("bfmopa", 0x81a00008, 0xffe0001e, sme_misc, 0, OP5 (SME_ZAda_1b, SVE_Pg3, SME_Pm, SVE_Zn, SVE_Zm_16), OP_SVE_HMMHH, 0, 0),
SME_B16B16_INSN("bfmops", 0x81a00018, 0xffe0001e, sme_misc, 0, OP5 (SME_ZAda_1b, SVE_Pg3, SME_Pm, SVE_Zn, SVE_Zm_16), OP_SVE_HMMHH, 0, 0),
/* SME2.1 movaz instructions. */
SME2p1_INSN ("movaz", 0xc0060600, 0xffff1f83, sme2_movaz, 0, OP2 (SME_Zdnx4, SME_ZA_array_vrsb_2), OP_SVE_BB, 0, 0),
SME2p1_INSN ("movaz", 0xc0460600, 0xffff1f83, sme2_movaz, 0, OP2 (SME_Zdnx4, SME_ZA_array_vrsh_2), OP_SVE_HH, 0, 0),