AARCH64_FEATURES (2, MOPS, MEMTAG)},
{"sve2p3", AARCH64_FEATURE (SVE2p3), AARCH64_FEATURE (SVE2p2)},
{"sme2p3", AARCH64_FEATURE (SME2p3), AARCH64_FEATURES (2, SME2p2, SME_LUTv2)},
+ {"f16f32dot", AARCH64_FEATURE (F16F32DOT), AARCH64_FEATURE (SIMD)},
{NULL, AARCH64_NO_FEATURES, AARCH64_NO_FEATURES},
};
@tab Enable Armv8.2 16-bit floating-point multiplication variant support.
@item @code{fp16} @tab @code{fp}
@tab Enable Armv8.2 16-bit floating-point support.
+@item @code{f16f32dot} @tab @code{simd}
+ @tab Enable Armv9.7 f16f32dot instructions.
@item @code{fprcvt} @tab @code{fp}
@tab Enable Armv9.6 fprcvt instructions.
@item @code{frintts} @tab @code{fp}
--- /dev/null
+#as: -march=armv8-a+f16f32dot
+#objdump: -dr
+
+.*: file format .*
+
+Disassembly of section \.text:
+
+0+ <\.text>:
+ *[0-9a-f]+: 0f409000 fdot v0\.2s, v0\.4h, v0\.2h\[0]
+ *[0-9a-f]+: 0f60901f fdot v31\.2s, v0\.4h, v0\.2h\[1]
+ *[0-9a-f]+: 0f409be0 fdot v0\.2s, v31\.4h, v0\.2h\[2]
+ *[0-9a-f]+: 0f7f9800 fdot v0\.2s, v0\.4h, v31\.2h\[3]
+ *[0-9a-f]+: 4f409000 fdot v0\.4s, v0\.8h, v0\.2h\[0]
+ *[0-9a-f]+: 4f60901f fdot v31\.4s, v0\.8h, v0\.2h\[1]
+ *[0-9a-f]+: 4f409be0 fdot v0\.4s, v31\.8h, v0\.2h\[2]
+ *[0-9a-f]+: 4f7f9800 fdot v0\.4s, v0\.8h, v31\.2h\[3]
+ *[0-9a-f]+: 0e80fc00 fdot v0\.2s, v0\.4h, v0\.4h
+ *[0-9a-f]+: 0e80fc1f fdot v31\.2s, v0\.4h, v0\.4h
+ *[0-9a-f]+: 0e80ffe0 fdot v0\.2s, v31\.4h, v0\.4h
+ *[0-9a-f]+: 0e9ffc00 fdot v0\.2s, v0\.4h, v31\.4h
+ *[0-9a-f]+: 4e80fc00 fdot v0\.4s, v0\.8h, v0\.8h
+ *[0-9a-f]+: 4e80fc1f fdot v31\.4s, v0\.8h, v0\.8h
+ *[0-9a-f]+: 4e80ffe0 fdot v0\.4s, v31\.8h, v0\.8h
+ *[0-9a-f]+: 4e9ffc00 fdot v0\.4s, v0\.8h, v31\.8h
--- /dev/null
+fdot v0.2s, v0.4h, v0.2h[0]
+fdot v31.2s, v0.4h, v0.2h[1]
+fdot v0.2s, v31.4h, v0.2h[2]
+fdot v0.2s, v0.4h, v31.2h[3]
+
+fdot v0.4s, v0.8h, v0.2h[0]
+fdot v31.4s, v0.8h, v0.2h[1]
+fdot v0.4s, v31.8h, v0.2h[2]
+fdot v0.4s, v0.8h, v31.2h[3]
+
+fdot v0.2s, v0.4h, v0.4h
+fdot v31.2s, v0.4h, v0.4h
+fdot v0.2s, v31.4h, v0.4h
+fdot v0.2s, v0.4h, v31.4h
+
+fdot v0.4s, v0.8h, v0.8h
+fdot v31.4s, v0.8h, v0.8h
+fdot v0.4s, v31.8h, v0.8h
+fdot v0.4s, v0.8h, v31.8h
AARCH64_FEATURE_SVE2p3,
/* SME2.3. */
AARCH64_FEATURE_SME2p3,
+ /* F16F32DOT instructions. */
+ AARCH64_FEATURE_F16F32DOT,
/* Virtual features. These are used to gate instructions that are enabled
by either of two (or more) sets of command line flags. */
{
if (((word >> 22) & 0x1) == 0)
{
- /* 33222222222211111111110000000000
- 10987654321098765432109876543210
- 0x001110x00xxxxxx11111xxxxxxxxxx. */
- return A64_OPID_0e00fc00_fdot_Vd_Vn_Vm;
+ if (((word >> 23) & 0x1) == 0)
+ {
+ /* 33222222222211111111110000000000
+ 10987654321098765432109876543210
+ 0x001110000xxxxxx11111xxxxxxxxxx. */
+ return A64_OPID_0e00fc00_fdot_Vd_Vn_Vm;
+ }
+ else
+ {
+ /* 33222222222211111111110000000000
+ 10987654321098765432109876543210
+ 0x001110100xxxxxx11111xxxxxxxxxx. */
+ return A64_OPID_0e80fc00_fdot_Vd_Vn_Vm;
+ }
}
else
{
{
if (((word >> 23) & 0x1) == 0)
{
- if (((word >> 29) & 0x1) == 0)
+ if (((word >> 22) & 0x1) == 0)
{
- /* 33222222222211111111110000000000
- 10987654321098765432109876543210
- xx0011110xxxxxxx1001x0xxxxxxxxxx. */
- return A64_OPID_0f009000_fmul_Vd_Vn_Em16;
+ if (((word >> 29) & 0x1) == 0)
+ {
+ /* 33222222222211111111110000000000
+ 10987654321098765432109876543210
+ xx00111100xxxxxx1001x0xxxxxxxxxx. */
+ return A64_OPID_0f009000_fmul_Vd_Vn_Em16;
+ }
+ else
+ {
+ /* 33222222222211111111110000000000
+ 10987654321098765432109876543210
+ xx10111100xxxxxx1001x0xxxxxxxxxx. */
+ return A64_OPID_2f009000_fmulx_Vd_Vn_Em16;
+ }
}
else
{
/* 33222222222211111111110000000000
10987654321098765432109876543210
- xx1011110xxxxxxx1001x0xxxxxxxxxx. */
- return A64_OPID_2f009000_fmulx_Vd_Vn_Em16;
+ xxx0111101xxxxxx1001x0xxxxxxxxxx. */
+ return A64_OPID_0f409000_fdot_Vd_Vn_Em16;
}
}
else
A64_OPID_45a02000_sqshrun_SVE_Zd_SME_Znx2_SVE_SHRIMM_UNPRED_22,
A64_OPID_45a83800_uqrshrn_SVE_Zd_SME_Znx2_SME_SHRIMM3,
A64_OPID_45a01000_uqshrn_SVE_Zd_SME_Znx2_SVE_SHRIMM_UNPRED_22,
+ A64_OPID_0f409000_fdot_Vd_Vn_Em16,
+ A64_OPID_0e80fc00_fdot_Vd_Vn_Vm,
A64_OPID_MAX,
};
AARCH64_FEATURE (SME2p3);
static const aarch64_feature_set aarch64_feature_sve2p3_sme2p3 =
AARCH64_FEATURE (SVE2p3_SME2p3);
+static const aarch64_feature_set aarch64_feature_f16f32dot =
+ AARCH64_FEATURE (F16F32DOT);
#define CORE &aarch64_feature_v8
#define FP &aarch64_feature_fp
#define SVE2p3 &aarch64_feature_sve2p3
#define SME2p3 &aarch64_feature_sme2p3
#define SVE2p3_SME2p3 &aarch64_feature_sve2p3_sme2p3
+#define F16F32DOT &aarch64_feature_f16f32dot
#define CORE_INSN(NAME,OPCODE,MASK,CLASS,OP,OPS,QUALS,FLAGS) \
{ NAME, OPCODE, MASK, CLASS, OP, CORE, OPS, QUALS, FLAGS | F_INVALID_IMM_SYMS_1, 0, 0, NULL }
{ NAME, OPCODE, MASK, CLASS, OP, SVE2p3_SME2p3, OPS, QUALS, \
F_STRICT | F_INVALID_IMM_SYMS_3 | FLAGS, CONSTRAINTS, TIED, NULL }
+#define F16F32DOT_INSN(NAME,OPCODE,MASK,CLASS,OPS,QUALS,FLAGS) \
+ { NAME, OPCODE, MASK, CLASS, 0, F16F32DOT, OPS, QUALS, FLAGS, 0, 0, NULL }
#define MOPS_CPY_OP1_OP2_PME_INSN(NAME, OPCODE, MASK, FLAGS, CONSTRAINTS) \
MOPS_INSN (NAME, OPCODE, MASK, 0, \
SVE2p3_SME2p3_INSN ("uqrshrn", 0x45a83800, 0xfff8fc20, sve_misc, 0, OP3 (SVE_Zd, SME_Znx2, SME_SHRIMM3), OP_SVE_BHU, 0, 0, 0),
SVE2p3_SME2p3_INSN ("uqshrn", 0x45a01000, 0xffe0fc20, sve_shift_tsz_hsd, 0, OP3 (SVE_Zd, SME_Znx2, SVE_SHRIMM_UNPRED_22), OP_SVE_VVU_BH_HS, 0, 0, 0),
+ /* F16F32DOT instructions. */
+ F16F32DOT_INSN ("fdot", 0x0f409000, 0xbfc0f400, dotproduct, OP3 (Vd, Vn, Em16), QL_BFDOT64I, F_SIZEQ),
+ F16F32DOT_INSN ("fdot", 0x0e80fc00, 0xbfe0fc00, dotproduct, OP3 (Vd, Vn, Vm), QL_BFDOT64, F_SIZEQ),
+
{0, 0, 0, 0, 0, 0, {}, {}, 0, 0, 0, NULL},
};