aarch64: Fix up bfmlal lane pattern [PR104921]

author Alex Coplan <alex.coplan@arm.com>
Mon, 6 Feb 2023 14:32:21 +0000 (14:32 +0000)
committer Alex Coplan <alex.coplan@arm.com>
Mon, 20 Feb 2023 17:43:01 +0000 (17:43 +0000)
diff --git a/gcc/config/aarch64/aarch64-simd.md b/gcc/config/aarch64/aarch64-simd.md

index e16bc784bb4087dc9690ad17745c2c08f20fd642..45e72ba0761cde1707780ca2d431a20c94997645 100644 (file)
--- a/gcc/config/aarch64/aarch64-simd.md
+++ b/gcc/config/aarch64/aarch64-simd.md
@@ -7199,7 +7199,7 @@
    [(set (match_operand:V4SF 0 "register_operand" "=w")
          (plus: V4SF (match_operand:V4SF 1 "register_operand" "0")
                      (unspec:V4SF [(match_operand:V8BF 2 "register_operand" "w")
-                                  (match_operand:VBF 3 "register_operand" "w")
+                                  (match_operand:VBF 3 "register_operand" "x")
                                    (match_operand:SI 4 "const_int_operand" "n")]
                       BF_MLA)))]
    "TARGET_BF16_SIMD"
diff --git a/gcc/testsuite/gcc.target/aarch64/pr104921-1.c b/gcc/testsuite/gcc.target/aarch64/pr104921-1.c

new file mode 100644 (file)

index 0000000..dcf6fe7
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/pr104921-1.c
@@ -0,0 +1,12 @@
+/* { dg-do compile } */
+/* { dg-additional-options "-O2 -march=armv8.2-a+bf16 -std=gnu99 -save-temps" }  */
+/* { dg-final { check-function-bodies "**" "" } } */
+
+#include "pr104921.x"
+
+/*
+**foo:
+**     mov     v([0-9]|1[0-5])\.8b, v16\.8b
+**     bfmlalb v0\.4s, v1\.8h, v([0-9]|1[0-5])\.h\[0\]
+**     ret
+*/
diff --git a/gcc/testsuite/gcc.target/aarch64/pr104921-2.c b/gcc/testsuite/gcc.target/aarch64/pr104921-2.c

new file mode 100644 (file)

index 0000000..211fcd0
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/pr104921-2.c
@@ -0,0 +1,6 @@
+/* { dg-do assemble } */
+/* { dg-add-options arm_v8_2a_bf16_neon }  */
+/* { dg-additional-options "-O2 -std=gnu99" }  */
+/* { dg-require-effective-target arm_v8_2a_bf16_neon_ok } */
+
+#include "pr104921.x"
diff --git a/gcc/testsuite/gcc.target/aarch64/pr104921.x b/gcc/testsuite/gcc.target/aarch64/pr104921.x

new file mode 100644 (file)

index 0000000..1e1a6f2
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/pr104921.x
@@ -0,0 +1,9 @@
+#include <arm_neon.h>
+
+float32x4_t
+foo(float32x4_t x, bfloat16x8_t a)  /* Shared test body, included by pr104921-1.c and pr104921-2.c.  */
+{
+  register bfloat16x4_t b asm ("v16");  /* Pin the lane operand to v16; pr104921-1.c expects it to be copied into one of v0-v15 before use.  */
+  asm volatile ("" : "=w"(b));  /* Empty asm template with b as its only output, so b counts as written here.  */
+  return vbfmlalbq_lane_f32 (x, a, b, 0);  /* Lane 0 of b; pr104921-1.c expects a bfmlalb using element h[0].  */
+}
author	Alex Coplan <alex.coplan@arm.com>
	Mon, 6 Feb 2023 14:32:21 +0000 (14:32 +0000)
committer	Alex Coplan <alex.coplan@arm.com>
	Mon, 20 Feb 2023 17:43:01 +0000 (17:43 +0000)
gcc/config/aarch64/aarch64-simd.md		patch | blob | blame | history
gcc/testsuite/gcc.target/aarch64/pr104921-1.c	[new file with mode: 0644]	patch | blob
gcc/testsuite/gcc.target/aarch64/pr104921-2.c	[new file with mode: 0644]	patch | blob
gcc/testsuite/gcc.target/aarch64/pr104921.x	[new file with mode: 0644]	patch | blob