[gcc r12-2096] Add avx512 tests for MADDSUB and FMSUBADD SLP vectorization patterns.

public inbox for gcc-cvs@sourceware.org
help / color / mirror / Atom feed

* [gcc r12-2096] Add avx512 tests for MADDSUB and FMSUBADD SLP vectorization patterns.
@ 2021-07-07  7:30 hongtao Liu
  0 siblings, 0 replies; only message in thread
From: hongtao Liu @ 2021-07-07  7:30 UTC (permalink / raw)
  To: gcc-cvs

https://gcc.gnu.org/g:98bfd845e93937d92ca844d7fa7e853ad51c6193

commit r12-2096-g98bfd845e93937d92ca844d7fa7e853ad51c6193
Author: liuhongt <hongtao.liu@intel.com>
Date:   Wed Jul 7 15:19:42 2021 +0800

    Add avx512 tests for MADDSUB and FMSUBADD SLP vectorization patterns.
    
    gcc/testsuite/ChangeLog:
    
            * gcc.target/i386/avx512f-vect-fmaddsubXXXpd.c: New test.
            * gcc.target/i386/avx512f-vect-fmaddsubXXXps.c: New test.
            * gcc.target/i386/avx512f-vect-fmsubaddXXXpd.c: New test.
            * gcc.target/i386/avx512f-vect-fmsubaddXXXps.c: New test.

Diff:
---
 .../gcc.target/i386/avx512f-vect-fmaddsubXXXpd.c   | 41 ++++++++++++++++++
 .../gcc.target/i386/avx512f-vect-fmaddsubXXXps.c   | 50 ++++++++++++++++++++++
 .../gcc.target/i386/avx512f-vect-fmsubaddXXXpd.c   | 41 ++++++++++++++++++
 .../gcc.target/i386/avx512f-vect-fmsubaddXXXps.c   | 50 ++++++++++++++++++++++
 4 files changed, 182 insertions(+)

diff --git a/gcc/testsuite/gcc.target/i386/avx512f-vect-fmaddsubXXXpd.c b/gcc/testsuite/gcc.target/i386/avx512f-vect-fmaddsubXXXpd.c
new file mode 100644
index 00000000000..734f9e01443
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/avx512f-vect-fmaddsubXXXpd.c
@@ -0,0 +1,41 @@
+/* { dg-do run } */
+/* { dg-require-effective-target avx512f } */
+/* { dg-options "-O3 -mfma -save-temps -mavx512f -mprefer-vector-width=512" } */
+
+#include "fma-check.h"
+void __attribute__((noipa))
+check_fmaddsub (double * __restrict a, double *b, double *c, int n)
+{
+  for (int i = 0; i < n; ++i)
+    {
+      a[8*i + 0] = b[8*i + 0] * c[8*i + 0] - a[8*i + 0];
+      a[8*i + 1] = b[8*i + 1] * c[8*i + 1] + a[8*i + 1];
+      a[8*i + 2] = b[8*i + 2] * c[8*i + 2] - a[8*i + 2];
+      a[8*i + 3] = b[8*i + 3] * c[8*i + 3] + a[8*i + 3];
+      a[8*i + 4] = b[8*i + 4] * c[8*i + 4] - a[8*i + 4];
+      a[8*i + 5] = b[8*i + 5] * c[8*i + 5] + a[8*i + 5];
+      a[8*i + 6] = b[8*i + 6] * c[8*i + 6] - a[8*i + 6];
+      a[8*i + 7] = b[8*i + 7] * c[8*i + 7] + a[8*i + 7];
+    }
+}
+
+static void
+fma_test (void)
+{
+  if (!__builtin_cpu_supports ("avx512f"))
+    return;
+  double a[8], b[8], c[8];
+  for (int i = 0; i < 8; ++i)
+    {
+      a[i] = i;
+      b[i] = 3*i;
+      c[i] = 7*i;
+    }
+  check_fmaddsub (a, b, c, 1);
+  const double d[8] = { 0., 22., 82., 192., 332., 530., 750., 1036.};
+  for (int i = 0; i < 8; ++i)
+    if (a[i] != d[i])
+      __builtin_abort ();
+}
+
+/* { dg-final { scan-assembler {(?n)fmaddsub...pd[ \t].*%zmm[0-9]} } } */
diff --git a/gcc/testsuite/gcc.target/i386/avx512f-vect-fmaddsubXXXps.c b/gcc/testsuite/gcc.target/i386/avx512f-vect-fmaddsubXXXps.c
new file mode 100644
index 00000000000..ae196c5ef48
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/avx512f-vect-fmaddsubXXXps.c
@@ -0,0 +1,50 @@
+/* { dg-do run } */
+/* { dg-require-effective-target avx512f } */
+/* { dg-options "-O3 -mavx512f -mprefer-vector-width=512 -save-temps" } */
+
+#include "fma-check.h"
+void __attribute__((noipa))
+check_fmaddsub (float * __restrict a, float *b, float *c, int n)
+{
+  for (int i = 0; i < n; ++i)
+    {
+      a[16*i + 0] = b[16*i + 0] * c[16*i + 0] - a[16*i + 0];
+      a[16*i + 1] = b[16*i + 1] * c[16*i + 1] + a[16*i + 1];
+      a[16*i + 2] = b[16*i + 2] * c[16*i + 2] - a[16*i + 2];
+      a[16*i + 3] = b[16*i + 3] * c[16*i + 3] + a[16*i + 3];
+      a[16*i + 4] = b[16*i + 4] * c[16*i + 4] - a[16*i + 4];
+      a[16*i + 5] = b[16*i + 5] * c[16*i + 5] + a[16*i + 5];
+      a[16*i + 6] = b[16*i + 6] * c[16*i + 6] - a[16*i + 6];
+      a[16*i + 7] = b[16*i + 7] * c[16*i + 7] + a[16*i + 7];
+      a[16*i + 8] = b[16*i + 8] * c[16*i + 8] - a[16*i + 8];
+      a[16*i + 9] = b[16*i + 9] * c[16*i + 9] + a[16*i + 9];
+      a[16*i + 10] = b[16*i + 10] * c[16*i + 10] - a[16*i + 10];
+      a[16*i + 11] = b[16*i + 11] * c[16*i + 11] + a[16*i + 11];
+      a[16*i + 12] = b[16*i + 12] * c[16*i + 12] - a[16*i + 12];
+      a[16*i + 13] = b[16*i + 13] * c[16*i + 13] + a[16*i + 13];
+      a[16*i + 14] = b[16*i + 14] * c[16*i + 14] - a[16*i + 14];
+      a[16*i + 15] = b[16*i + 15] * c[16*i + 15] + a[16*i + 15];
+    }
+}
+
+static void
+fma_test (void)
+{
+  if (!__builtin_cpu_supports ("avx512f"))
+    return;
+  float a[16], b[16], c[16];
+  for (int i = 0; i < 16; ++i)
+    {
+      a[i] = i;
+      b[i] = 3*i;
+      c[i] = 7*i;
+    }
+  check_fmaddsub (a, b, c, 1);
+  const float d[16] = { 0., 22., 82., 192., 332., 530., 750., 1036.,
+			1336, 1710., 2090., 2552., 3012., 3562., 4102., 4740.};
+  for (int i = 0; i < 16; ++i)
+    if (a[i] != d[i])
+      __builtin_abort ();
+}
+
+/* { dg-final { scan-assembler {(?n)fmaddsub...ps[ \t].*%zmm[0-9]} } } */
diff --git a/gcc/testsuite/gcc.target/i386/avx512f-vect-fmsubaddXXXpd.c b/gcc/testsuite/gcc.target/i386/avx512f-vect-fmsubaddXXXpd.c
new file mode 100644
index 00000000000..cde76db1755
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/avx512f-vect-fmsubaddXXXpd.c
@@ -0,0 +1,41 @@
+/* { dg-do run } */
+/* { dg-require-effective-target avx512f } */
+/* { dg-options "-O3 -mavx512f -mprefer-vector-width=512 -save-temps" } */
+
+#include "fma-check.h"
+void __attribute__((noipa))
+check_fmaddsub (double * __restrict a, double *b, double *c, int n)
+{
+  for (int i = 0; i < n; ++i)
+    {
+      a[8*i + 0] = b[8*i + 0] * c[8*i + 0] + a[8*i + 0];
+      a[8*i + 1] = b[8*i + 1] * c[8*i + 1] - a[8*i + 1];
+      a[8*i + 2] = b[8*i + 2] * c[8*i + 2] + a[8*i + 2];
+      a[8*i + 3] = b[8*i + 3] * c[8*i + 3] - a[8*i + 3];
+      a[8*i + 4] = b[8*i + 4] * c[8*i + 4] + a[8*i + 4];
+      a[8*i + 5] = b[8*i + 5] * c[8*i + 5] - a[8*i + 5];
+      a[8*i + 6] = b[8*i + 6] * c[8*i + 6] + a[8*i + 6];
+      a[8*i + 7] = b[8*i + 7] * c[8*i + 7] - a[8*i + 7];
+    }
+}
+
+static void
+fma_test (void)
+{
+  if (!__builtin_cpu_supports ("avx512f"))
+    return;
+  double a[8], b[8], c[8];
+  for (int i = 0; i < 8; ++i)
+    {
+      a[i] = i;
+      b[i] = 3*i;
+      c[i] = 7*i;
+    }
+  check_fmaddsub (a, b, c, 1);
+  const double d[8] = { 0., 20., 86., 186., 340., 520., 762., 1022.};
+  for (int i = 0; i < 8; ++i)
+    if (a[i] != d[i])
+      __builtin_abort ();
+}
+
+/* { dg-final { scan-assembler {(?n)fmsubadd...pd[ \t].*%zmm[0-9]} } } */
diff --git a/gcc/testsuite/gcc.target/i386/avx512f-vect-fmsubaddXXXps.c b/gcc/testsuite/gcc.target/i386/avx512f-vect-fmsubaddXXXps.c
new file mode 100644
index 00000000000..59de39f4112
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/avx512f-vect-fmsubaddXXXps.c
@@ -0,0 +1,50 @@
+/* { dg-do run } */
+/* { dg-require-effective-target avx512f } */
+/* { dg-options "-O3 -mavx512f -mprefer-vector-width=512 -save-temps" } */
+
+#include "fma-check.h"
+void __attribute__((noipa))
+check_fmaddsub (float * __restrict a, float *b, float *c, int n)
+{
+  for (int i = 0; i < n; ++i)
+    {
+      a[16*i + 0] = b[16*i + 0] * c[16*i + 0] + a[16*i + 0];
+      a[16*i + 1] = b[16*i + 1] * c[16*i + 1] - a[16*i + 1];
+      a[16*i + 2] = b[16*i + 2] * c[16*i + 2] + a[16*i + 2];
+      a[16*i + 3] = b[16*i + 3] * c[16*i + 3] - a[16*i + 3];
+      a[16*i + 4] = b[16*i + 4] * c[16*i + 4] + a[16*i + 4];
+      a[16*i + 5] = b[16*i + 5] * c[16*i + 5] - a[16*i + 5];
+      a[16*i + 6] = b[16*i + 6] * c[16*i + 6] + a[16*i + 6];
+      a[16*i + 7] = b[16*i + 7] * c[16*i + 7] - a[16*i + 7];
+      a[16*i + 8] = b[16*i + 8] * c[16*i + 8] + a[16*i + 8];
+      a[16*i + 9] = b[16*i + 9] * c[16*i + 9] - a[16*i + 9];
+      a[16*i + 10] = b[16*i + 10] * c[16*i + 10] + a[16*i + 10];
+      a[16*i + 11] = b[16*i + 11] * c[16*i + 11] - a[16*i + 11];
+      a[16*i + 12] = b[16*i + 12] * c[16*i + 12] + a[16*i + 12];
+      a[16*i + 13] = b[16*i + 13] * c[16*i + 13] - a[16*i + 13];
+      a[16*i + 14] = b[16*i + 14] * c[16*i + 14] + a[16*i + 14];
+      a[16*i + 15] = b[16*i + 15] * c[16*i + 15] - a[16*i + 15];
+    }
+}
+
+static void
+fma_test (void)
+{
+  if (!__builtin_cpu_supports ("avx512f"))
+    return;
+  float a[16], b[16], c[16];
+  for (int i = 0; i < 16; ++i)
+    {
+      a[i] = i;
+      b[i] = 3*i;
+      c[i] = 7*i;
+    }
+  check_fmaddsub (a, b, c, 1);
+  const float d[16] = { 0., 20., 86., 186., 340., 520., 762., 1022.,
+			1352, 1692., 2110., 2530., 3036., 3536., 4130., 4710.};
+  for (int i = 0; i < 16; ++i)
+    if (a[i] != d[i])
+      __builtin_abort ();
+}
+
+/* { dg-final { scan-assembler {(?n)fmsubadd...ps[ \t].*%zmm[0-9]} } } */


^ permalink raw reply	[flat|nested] only message in thread

only message in thread, other threads:[~2021-07-07  7:30 UTC | newest]

Thread overview: (only message) (download: mbox.gz / follow: Atom feed)
-- links below jump to the message on this page --
2021-07-07  7:30 [gcc r12-2096] Add avx512 tests for MADDSUB and FMSUBADD SLP vectorization patterns hongtao Liu

This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for read-only IMAP folder(s) and NNTP newsgroup(s).