public inbox for gcc-patches@gcc.gnu.org
 help / color / mirror / Atom feed
* [PATCH] complex-lowering: Better handling of PAREN_EXPR [PR68855]
@ 2024-06-21  2:34 Andrew Pinski
  2024-06-21  5:18 ` Richard Biener
  0 siblings, 1 reply; 2+ messages in thread
From: Andrew Pinski @ 2024-06-21  2:34 UTC (permalink / raw)
  To: gcc-patches; +Cc: Andrew Pinski

When the PAREN_EXPR tree code was added in r0-85884-gdedd42d511b6e4,
only simplified handling was added to complex lowering, which means
we would get:
```
  _9 = COMPLEX_EXPR <_15, _14>;
  _11 = ((_9));
  _19 = REALPART_EXPR <_11>;
  _20 = IMAGPART_EXPR <_11>;
```

in many cases, instead of simply:
```
  _19 = ((_15));
  _20 = ((_14));
```

So this adds full support for PAREN_EXPR to complex lowering.
It is handled very similarly to NEGATE_EXPR, except that PAREN_EXPR
is created instead of NEGATE_EXPR for the real/imag parts. This allows
for more optimizations, including vectorization, especially with
-ffast-math.
gfortran.dg/vect/pr68855.f90 is an example where this could show up.
It also shows up in SPEC CPU 2006's 465.tonto, though I have not done
any benchmarking there.

Bootstrapped and tested on x86_64-linux-gnu with no regressions.

gcc/ChangeLog:

	PR tree-optimization/68855
	* tree-complex.cc (init_dont_simulate_again): Handle PAREN_EXPR
	like NEGATE_EXPR.
	(complex_propagate::visit_stmt): Likewise.
	(expand_complex_move): Don't handle PAREN_EXPR.
	(expand_complex_paren): New function.
	(expand_complex_operations_1): Handle PAREN_EXPR like
	NEGATE_EXPR and call expand_complex_paren for it.

gcc/testsuite/ChangeLog:

	* gcc.dg/vect/pr68855.c: New test.
	* gfortran.dg/vect/pr68855.f90: New test.

Signed-off-by: Andrew Pinski <quic_apinski@quicinc.com>
---
 gcc/testsuite/gcc.dg/vect/pr68855.c        | 17 +++++++++++++
 gcc/testsuite/gfortran.dg/vect/pr68855.f90 | 16 ++++++++++++
 gcc/tree-complex.cc                        | 29 ++++++++++++++++++++--
 3 files changed, 60 insertions(+), 2 deletions(-)
 create mode 100644 gcc/testsuite/gcc.dg/vect/pr68855.c
 create mode 100644 gcc/testsuite/gfortran.dg/vect/pr68855.f90

diff --git a/gcc/testsuite/gcc.dg/vect/pr68855.c b/gcc/testsuite/gcc.dg/vect/pr68855.c
new file mode 100644
index 00000000000..68a3a1cee36
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/vect/pr68855.c
@@ -0,0 +1,17 @@
+/* { dg-do compile } */
+/* { dg-require-effective-target vect_float } */
+
+/* { dg-final { scan-tree-dump "LOOP VECTORIZED" "vect" } } */
+
+/* PAREN_EXPR should not cause the vectorization of complex float add to be missed. */
+void foo(_Complex float *a, int n)
+{
+  for(int i = 0; i < n; i++)
+  {
+    _Complex float t;
+    t = a[i];
+    t += 6.0;
+    t = __builtin_assoc_barrier(t);
+    a[i] = t;
+  }
+}
diff --git a/gcc/testsuite/gfortran.dg/vect/pr68855.f90 b/gcc/testsuite/gfortran.dg/vect/pr68855.f90
new file mode 100644
index 00000000000..90d444c86bf
--- /dev/null
+++ b/gcc/testsuite/gfortran.dg/vect/pr68855.f90
@@ -0,0 +1,16 @@
+! { dg-do compile }
+! { dg-require-effective-target vect_float }
+
+! { dg-final { scan-tree-dump "LOOP VECTORIZED" "vect" } }
+! PAREN_EXPR should not cause the vectorization of complex float add to be missed.
+
+subroutine foo(a,n)
+
+  complex (kind(1.0)) :: a(*)
+  integer :: i,n
+
+  do i=1,n
+     a(i)=(a(i)+(6.0,1.0))
+  enddo
+  
+end subroutine foo
diff --git a/gcc/tree-complex.cc b/gcc/tree-complex.cc
index 877913972bd..8a879acffca 100644
--- a/gcc/tree-complex.cc
+++ b/gcc/tree-complex.cc
@@ -281,6 +281,7 @@ init_dont_simulate_again (void)
 
 	      case NEGATE_EXPR:
 	      case CONJ_EXPR:
+	      case PAREN_EXPR:
 		if (TREE_CODE (TREE_TYPE (op0)) == COMPLEX_TYPE)
 		  saw_a_complex_op = true;
 		break;
@@ -391,6 +392,7 @@ complex_propagate::visit_stmt (gimple *stmt, edge *taken_edge_p ATTRIBUTE_UNUSED
       break;
 
     case NEGATE_EXPR:
+    case PAREN_EXPR:
     case CONJ_EXPR:
       new_l = find_lattice_value (gimple_assign_rhs1 (stmt));
       break;
@@ -852,8 +854,7 @@ expand_complex_move (gimple_stmt_iterator *gsi, tree type)
 	  update_complex_components_on_edge (e, lhs, r, i);
 	}
       else if (is_gimple_call (stmt)
-	       || gimple_has_side_effects (stmt)
-	       || gimple_assign_rhs_code (stmt) == PAREN_EXPR)
+	       || gimple_has_side_effects (stmt))
 	{
 	  r = build1 (REALPART_EXPR, inner_type, lhs);
 	  i = build1 (IMAGPART_EXPR, inner_type, lhs);
@@ -1545,6 +1546,25 @@ expand_complex_negation (gimple_stmt_iterator *gsi, tree inner_type,
   update_complex_assignment (gsi, rr, ri);
 }
 
+/* Expand complex paren to scalars:
+	((a)) = ((ar)) + i((ai))
+*/
+
+static void
+expand_complex_paren (gimple_stmt_iterator *gsi, tree inner_type,
+		      tree ar, tree ai)
+{
+  tree rr, ri;
+  gimple_seq stmts = NULL;
+  location_t loc = gimple_location (gsi_stmt (*gsi));
+
+  rr = gimple_build (&stmts, loc, PAREN_EXPR, inner_type, ar);
+  ri = gimple_build (&stmts, loc, PAREN_EXPR, inner_type, ai);
+
+  gsi_insert_seq_before (gsi, stmts, GSI_SAME_STMT);
+  update_complex_assignment (gsi, rr, ri);
+}
+
 /* Expand complex conjugate to scalars:
 	~a = (ar) + i(-ai)
 */
@@ -1697,6 +1717,7 @@ expand_complex_operations_1 (gimple_stmt_iterator *gsi)
     case ROUND_DIV_EXPR:
     case RDIV_EXPR:
     case NEGATE_EXPR:
+    case PAREN_EXPR:
     case CONJ_EXPR:
       if (TREE_CODE (type) != COMPLEX_TYPE)
 	return;
@@ -1815,6 +1836,10 @@ expand_complex_operations_1 (gimple_stmt_iterator *gsi)
       expand_complex_comparison (gsi, ar, ai, br, bi, code);
       break;
 
+    case PAREN_EXPR:
+      expand_complex_paren (gsi, inner_type, ar, ai);
+      break;
+
     default:
       gcc_unreachable ();
     }
-- 
2.43.0


^ permalink raw reply	[flat|nested] 2+ messages in thread

* Re: [PATCH] complex-lowering: Better handling of PAREN_EXPR [PR68855]
  2024-06-21  2:34 [PATCH] complex-lowering: Better handling of PAREN_EXPR [PR68855] Andrew Pinski
@ 2024-06-21  5:18 ` Richard Biener
  0 siblings, 0 replies; 2+ messages in thread
From: Richard Biener @ 2024-06-21  5:18 UTC (permalink / raw)
  To: Andrew Pinski; +Cc: gcc-patches



> Am 21.06.2024 um 04:35 schrieb Andrew Pinski <quic_apinski@quicinc.com>:
> 
> When PAREN_EXPR tree code was added in r0-85884-gdedd42d511b6e4,
> a simplified handling was added to complex lowering. Which means
> we would get:
> ```
>  _9 = COMPLEX_EXPR <_15, _14>;
>  _11 = ((_9));
>  _19 = REALPART_EXPR <_11>;
>  _20 = IMAGPART_EXPR <_11>;
> ```
> 
> In many cases instead of just simply:
> ```
>  _19 = ((_15));
>  _20 = ((_14));
> ```
> 
> So this adds full support for PAREN_EXPR to complex lowering.
> It is handled very similar as NEGATE_EXPR; except creating PAREN_EXPR
> instead of NEGATE_EXPR for the real/imag parts. This allows for
> more optimizations including vectorization, especially with
> -ffast-math.
> gfortran.dg/vect/pr68855.f90 is an example where this could show up.
> It also shows up in SPEC CPU 2006's 465.tonto; though I have not done
> any benchmarking there.
> 
> Bootstrapped and tested on x86_64-linux-gnu with no regressions.

Ok

Thanks,
Richard 

> gcc/ChangeLog:
> 
>    PR tree-optimization/68855
>    * tree-complex.cc (init_dont_simulate_again): Handle PAREN_EXPR
>    like NEGATE_EXPR.
>    (complex_propagate::visit_stmt): Likewise.
>    (expand_complex_move): Don't handle PAREN_EXPR.
>    (expand_complex_paren): New function.
>    (expand_complex_operations_1): Handle PAREN_EXPR like
>    NEGATE_EXPR. And call expand_complex_paren for PAREN_EXPR.
> 
> gcc/testsuite/ChangeLog:
> 
>    * gcc.dg/vect/pr68855.c: New test.
>    * gfortran.dg/vect/pr68855.f90: New test.
> 
> Signed-off-by: Andrew Pinski <quic_apinski@quicinc.com>
> ---
> gcc/testsuite/gcc.dg/vect/pr68855.c        | 17 +++++++++++++
> gcc/testsuite/gfortran.dg/vect/pr68855.f90 | 16 ++++++++++++
> gcc/tree-complex.cc                        | 29 ++++++++++++++++++++--
> 3 files changed, 60 insertions(+), 2 deletions(-)
> create mode 100644 gcc/testsuite/gcc.dg/vect/pr68855.c
> create mode 100644 gcc/testsuite/gfortran.dg/vect/pr68855.f90
> 
> diff --git a/gcc/testsuite/gcc.dg/vect/pr68855.c b/gcc/testsuite/gcc.dg/vect/pr68855.c
> new file mode 100644
> index 00000000000..68a3a1cee36
> --- /dev/null
> +++ b/gcc/testsuite/gcc.dg/vect/pr68855.c
> @@ -0,0 +1,17 @@
> +/* { dg-do compile } */
> +/* { dg-require-effective-target vect_float } */
> +
> +/* { dg-final { scan-tree-dump "LOOP VECTORIZED" "vect" } } */
> +
> +/* PAREN_EXPR should not cause the vectorization of complex float add to be missed. */
> +void foo(_Complex float *a, int n)
> +{
> +  for(int i = 0; i < n; i++)
> +  {
> +    _Complex float t;
> +    t = a[i];
> +    t += 6.0;
> +    t = __builtin_assoc_barrier(t);
> +    a[i] = t;
> +  }
> +}
> diff --git a/gcc/testsuite/gfortran.dg/vect/pr68855.f90 b/gcc/testsuite/gfortran.dg/vect/pr68855.f90
> new file mode 100644
> index 00000000000..90d444c86bf
> --- /dev/null
> +++ b/gcc/testsuite/gfortran.dg/vect/pr68855.f90
> @@ -0,0 +1,16 @@
> +! { dg-do compile }
> +! { dg-require-effective-target vect_float }
> +
> +! { dg-final { scan-tree-dump "LOOP VECTORIZED" "vect" } }
> +! PAREN_EXPR should not cause the vectorization of complex float add to be missed.
> +
> +subroutine foo(a,n)
> +
> +  complex (kind(1.0)) :: a(*)
> +  integer :: i,n
> +
> +  do i=1,n
> +     a(i)=(a(i)+(6.0,1.0))
> +  enddo
> +  
> +end subroutine foo
> diff --git a/gcc/tree-complex.cc b/gcc/tree-complex.cc
> index 877913972bd..8a879acffca 100644
> --- a/gcc/tree-complex.cc
> +++ b/gcc/tree-complex.cc
> @@ -281,6 +281,7 @@ init_dont_simulate_again (void)
> 
>          case NEGATE_EXPR:
>          case CONJ_EXPR:
> +          case PAREN_EXPR:
>        if (TREE_CODE (TREE_TYPE (op0)) == COMPLEX_TYPE)
>          saw_a_complex_op = true;
>        break;
> @@ -391,6 +392,7 @@ complex_propagate::visit_stmt (gimple *stmt, edge *taken_edge_p ATTRIBUTE_UNUSED
>       break;
> 
>     case NEGATE_EXPR:
> +    case PAREN_EXPR:
>     case CONJ_EXPR:
>       new_l = find_lattice_value (gimple_assign_rhs1 (stmt));
>       break;
> @@ -852,8 +854,7 @@ expand_complex_move (gimple_stmt_iterator *gsi, tree type)
>      update_complex_components_on_edge (e, lhs, r, i);
>    }
>       else if (is_gimple_call (stmt)
> -           || gimple_has_side_effects (stmt)
> -           || gimple_assign_rhs_code (stmt) == PAREN_EXPR)
> +           || gimple_has_side_effects (stmt))
>    {
>      r = build1 (REALPART_EXPR, inner_type, lhs);
>      i = build1 (IMAGPART_EXPR, inner_type, lhs);
> @@ -1545,6 +1546,25 @@ expand_complex_negation (gimple_stmt_iterator *gsi, tree inner_type,
>   update_complex_assignment (gsi, rr, ri);
> }
> 
> +/* Expand complex paren to scalars:
> +    ((a)) = ((ar)) + i((ai))
> +*/
> +
> +static void
> +expand_complex_paren (gimple_stmt_iterator *gsi, tree inner_type,
> +              tree ar, tree ai)
> +{
> +  tree rr, ri;
> +  gimple_seq stmts = NULL;
> +  location_t loc = gimple_location (gsi_stmt (*gsi));
> +
> +  rr = gimple_build (&stmts, loc, PAREN_EXPR, inner_type, ar);
> +  ri = gimple_build (&stmts, loc, PAREN_EXPR, inner_type, ai);
> +
> +  gsi_insert_seq_before (gsi, stmts, GSI_SAME_STMT);
> +  update_complex_assignment (gsi, rr, ri);
> +}
> +
> /* Expand complex conjugate to scalars:
>    ~a = (ar) + i(-ai)
> */
> @@ -1697,6 +1717,7 @@ expand_complex_operations_1 (gimple_stmt_iterator *gsi)
>     case ROUND_DIV_EXPR:
>     case RDIV_EXPR:
>     case NEGATE_EXPR:
> +    case PAREN_EXPR:
>     case CONJ_EXPR:
>       if (TREE_CODE (type) != COMPLEX_TYPE)
>    return;
> @@ -1815,6 +1836,10 @@ expand_complex_operations_1 (gimple_stmt_iterator *gsi)
>       expand_complex_comparison (gsi, ar, ai, br, bi, code);
>       break;
> 
> +    case PAREN_EXPR:
> +      expand_complex_paren (gsi, inner_type, ar, ai);
> +      break;
> +
>     default:
>       gcc_unreachable ();
>     }
> --
> 2.43.0
> 

^ permalink raw reply	[flat|nested] 2+ messages in thread

end of thread, other threads:[~2024-06-21  5:18 UTC | newest]

Thread overview: 2+ messages (download: mbox.gz / follow: Atom feed)
-- links below jump to the message on this page --
2024-06-21  2:34 [PATCH] complex-lowering: Better handling of PAREN_EXPR [PR68855] Andrew Pinski
2024-06-21  5:18 ` Richard Biener

This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for read-only IMAP folder(s) and NNTP newsgroup(s).