[gcc(refs/users/meissner/heads/work119)] Fold vsx_extract from memory with constant element to floating point.

public inbox for gcc-cvs@sourceware.org
help / color / mirror / Atom feed

* [gcc(refs/users/meissner/heads/work119)] Fold vsx_extract from memory with constant element to floating point.
@ 2023-04-24 19:17 Michael Meissner
  0 siblings, 0 replies; only message in thread
From: Michael Meissner @ 2023-04-24 19:17 UTC (permalink / raw)
  To: gcc-cvs

https://gcc.gnu.org/g:d6b9208d66fd2c1ae26394e6f918c19d83651491

commit d6b9208d66fd2c1ae26394e6f918c19d83651491
Author: Michael Meissner <meissner@linux.ibm.com>
Date:   Mon Apr 24 15:16:44 2023 -0400

    Fold vsx_extract from memory with constant element to floating point.
    
    This patch folds V4SI/V8HI/V16QI vsx_extract from memory where the element
    number is constant and the extracted element is converted to floating point
    (unsigned conversion for all three modes, signed for V4SI and V8HI).
    
    2023-04-21   Michael Meissner  <meissner@linux.ibm.com>
    
    gcc/
    
            * config/rs6000/vsx.md (FL_CONV_REG): New mode attribute.
            (vsx_extract_<VSX_EXTRACT_I:mode>_load_to_u<FL_CONV:mode>): New insn.
            (vsx_extract_v4si_load_to_s<mode>): New insn.
            (vsx_extract_v8hi_load_to_s<mode>): New insn.

Diff:
---
 gcc/config/rs6000/vsx.md | 106 +++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 106 insertions(+)

diff --git a/gcc/config/rs6000/vsx.md b/gcc/config/rs6000/vsx.md
index acda883564d..f90005d4b63 100644
--- a/gcc/config/rs6000/vsx.md
+++ b/gcc/config/rs6000/vsx.md
@@ -247,6 +247,13 @@
 			       (TF "TARGET_FLOAT128_HW
 				    && FLOAT128_IEEE_P (TFmode)")])
 
+;; Mode attribute giving the register constraint to use for a floating point
+;; operand when used with FL_CONV modes ("wa" for SF/DF, "v" for KF/TF).
+(define_mode_attr FL_CONV_REG [(SF "wa")
+			       (DF "wa")
+			       (KF "v")
+			       (TF "v")])
+
 ;; Iterator for the 2 short vector types to do a splat from an integer
 (define_mode_iterator VSX_SPLAT_I [V16QI V8HI])
 
@@ -4061,6 +4068,105 @@
   [(set_attr "type" "load")
    (set_attr "length" "8")])
 
+;; Extract a V4SI/V8HI/V16QI element from memory with a constant element
+;; number and convert it to unsigned float (zero extend to DI, then float).
+(define_insn_and_split "*vsx_extract_<VSX_EXTRACT_I:mode>_load_to_u<FL_CONV:mode>"
+  [(set (match_operand:FL_CONV 0 "register_operand" "=<FL_CONV:FL_CONV_REG>")
+	(unsigned_float:FL_CONV
+	 (vec_select:<VSX_EXTRACT_I:VEC_base>
+	  (match_operand:VSX_EXTRACT_I 1 "memory_operand" "Q")
+	  (parallel [(match_operand:QI 2 "const_int_operand" "n")]))))
+   (clobber (match_scratch:DI 3 "=&b"))
+   (clobber (match_scratch:DI 4 "=<VSX_EX>"))]
+  "VECTOR_MEM_VSX_P (<VSX_EXTRACT_I:MODE>mode) && TARGET_DIRECT_MOVE_64BIT"
+  "#"
+  "&& 1"
+  [(set (match_dup 4)
+	(zero_extend:DI (match_dup 5)))
+   (set (match_dup 0)
+	(float:FL_CONV (match_dup 4)))]
+{
+  machine_mode base_mode = <VSX_EXTRACT_I:VEC_base>mode;
+
+  if (GET_CODE (operands[3]) == SCRATCH)
+    operands[3] = gen_reg_rtx (DImode);
+  if (GET_CODE (operands[4]) == SCRATCH)
+    operands[4] = gen_reg_rtx (DImode);
+
+  operands[5] = rs6000_adjust_vec_address (operands[0], operands[1],
+					   operands[2], operands[3],
+					   base_mode);
+}
+  [(set_attr "type" "fpload")
+   (set_attr "length" "8")])
+
+;; Extract a V4SI element from memory with a constant element number and
+;; convert it to signed float (sign extend to DI, then float).
+(define_insn_and_split "*vsx_extract_v4si_load_to_s<mode>"
+  [(set (match_operand:FL_CONV 0 "register_operand" "=<FL_CONV_REG>")
+	(float:FL_CONV
+	 (vec_select:SI
+	  (match_operand:V4SI 1 "memory_operand" "Q")
+	  (parallel [(match_operand:QI 2 "const_0_to_3_operand" "n")]))))
+   (clobber (match_scratch:DI 3 "=&b"))
+   (clobber (match_scratch:DI 4 "=<FL_CONV_REG>"))]
+  "VECTOR_MEM_VSX_P (V4SImode) && TARGET_DIRECT_MOVE_64BIT"
+  "#"
+  "&& 1"
+  [(set (match_dup 4)
+	(sign_extend:DI (match_dup 5)))
+   (set (match_dup 0)
+	(float:FL_CONV (match_dup 4)))]
+{
+  if (GET_CODE (operands[3]) == SCRATCH)
+    operands[3] = gen_reg_rtx (DImode);
+  if (GET_CODE (operands[4]) == SCRATCH)
+    operands[4] = gen_reg_rtx (DImode);
+
+  operands[5] = rs6000_adjust_vec_address (operands[0], operands[1],
+					   operands[2], operands[3],
+					   SImode);
+}
+  [(set_attr "type" "fpload")
+   (set_attr "length" "8")])
+
+;; Extract a V8HI element from memory with a constant element number and
+;; convert it to signed float.  While we could do this via a LXSIHZX
+;; instruction followed by VEXTSH2D, it is better to do a LHA and MTVSRD
+;; instruction.
+(define_insn_and_split "*vsx_extract_v8hi_load_to_s<mode>"
+  [(set (match_operand:FL_CONV 0 "register_operand" "=<FL_CONV_REG>,<FL_CONV_REG>")
+	(float:FL_CONV
+	 (vec_select:HI
+	  (match_operand:V8HI 1 "memory_operand" "m,Qo")
+	  (parallel [(match_operand:QI 2 "const_0_to_7_operand" "O,n")]))))
+   (clobber (match_scratch:DI 3 "=X,&b"))
+   (clobber (match_scratch:DI 4 "=&r,&r"))
+   (clobber (match_scratch:DI 5 "=<FL_CONV_REG>,<FL_CONV_REG>"))]
+  "VECTOR_MEM_VSX_P (V8HImode) && TARGET_DIRECT_MOVE_64BIT"
+  "#"
+  "&& 1"
+  [(set (match_dup 4)
+	(sign_extend:DI (match_dup 6)))
+   (set (match_dup 5)
+	(match_dup 4))
+   (set (match_dup 0)
+	(float:FL_CONV (match_dup 5)))]
+{
+  if (GET_CODE (operands[3]) == SCRATCH)
+    operands[3] = gen_reg_rtx (DImode);
+  if (GET_CODE (operands[4]) == SCRATCH)
+    operands[4] = gen_reg_rtx (DImode);
+  if (GET_CODE (operands[5]) == SCRATCH)
+    operands[5] = gen_reg_rtx (DImode);
+
+  operands[6] = rs6000_adjust_vec_address (operands[0], operands[1],
+					   operands[2], operands[3],
+					   HImode);
+}
+  [(set_attr "type" "load")
+   (set_attr "length" "12")])
+
 ;; Variable V16QI/V8HI/V4SI extract from a register
 (define_insn_and_split "vsx_extract_<mode>_var"
   [(set (match_operand:<VEC_base> 0 "gpc_reg_operand" "=r,r")

^ permalink raw reply	[flat|nested] only message in thread

only message in thread, other threads:[~2023-04-24 19:17 UTC | newest]

Thread overview: (only message) (download: mbox.gz / follow: Atom feed)
-- links below jump to the message on this page --
2023-04-24 19:17 [gcc(refs/users/meissner/heads/work119)] Fold vsx_extract from memory with constant element to floating point Michael Meissner

This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for read-only IMAP folder(s) and NNTP newsgroup(s).