[gcc(refs/users/meissner/heads/work071)] Rework XXSPLTIDP support.

public inbox for gcc-cvs@sourceware.org
help / color / mirror / Atom feed

* [gcc(refs/users/meissner/heads/work071)] Rework XXSPLTIDP support.
@ 2021-10-13 18:46 Michael Meissner
  0 siblings, 0 replies; only message in thread
From: Michael Meissner @ 2021-10-13 18:46 UTC (permalink / raw)
  To: gcc-cvs

https://gcc.gnu.org/g:db504d15cebeff014c83e93fd903e2caa0357828

commit db504d15cebeff014c83e93fd903e2caa0357828
Author: Michael Meissner <meissner@linux.ibm.com>
Date:   Wed Oct 13 14:46:25 2021 -0400

    Rework XXSPLTIDP support.
    
    This patch rewrites the XXSPLTIDP support to use a new structure
    rs6000_vec_const that holds all of the information for a vector constant.
    
    2021-10-13  Michael Meissner  <meissner@the-meissners.org>
    
    gcc/
    
            * config/rs6000/predicates.md
            (easy_vector_constant_64bit_element): Switch to use
            rs6000_vec_const.
            * config/rs6000/rs6000-protos.h (xxspltidp_constant_immediate):
            Delete.
            (convert_vector_constant_to_bytes): Likewise.
            (convert_scalar_64bit_constant_to_bytes): Likewise.
            (prefixed_xxsplti_p): Likewise.
            (VECTOR_CONST_*): New defines.
            (rs6000_vec_const): New data structure.
            (vec_const_to_bytes): New function.
            (vec_const_use_xxspltidp): New function.
            * config/rs6000/rs6000.c (convert_vector_constant_to_bytes):
            Delete.
            (convert_scalar_64bit_constant_to_bytes): Likewise.
            (xxspltidp_constant_immediate): Likewise.
            (output_vec_const_move): Switch to use rs6000_vec_const.
            (prefixed_xxsplti_p): Likewise.
            (vec_const_integer): New helper function.
            (vec_const_floating_point): New helper function.
            (vec_const_use_xxspltidp): New function.
            (vec_const_to_bytes): New function.
            * config/rs6000/vsx.md (XXSPLTIDP splitters): Switch to use
            rs6000_vec_const.

Diff:
---
 gcc/config/rs6000/predicates.md   |  93 +------
 gcc/config/rs6000/rs6000-protos.h |  30 ++-
 gcc/config/rs6000/rs6000.c        | 520 +++++++++++++++++++++-----------------
 gcc/config/rs6000/vsx.md          |  10 +-
 4 files changed, 326 insertions(+), 327 deletions(-)

diff --git a/gcc/config/rs6000/predicates.md b/gcc/config/rs6000/predicates.md
index 20da6faf6e7..f2ee2bed230 100644
--- a/gcc/config/rs6000/predicates.md
+++ b/gcc/config/rs6000/predicates.md
@@ -620,102 +620,17 @@
 (define_predicate "easy_vector_constant_64bit_element"
   (match_code "const_vector,vec_duplicate,const_int,const_double")
 {
-  unsigned char vector_bytes[16];
+  rs6000_vec_const vec_const;
 
   /* Can we do the XXSPLTIDP instruction?  */
   if (!TARGET_XXSPLTIDP || !TARGET_PREFIXED || !TARGET_VSX)
     return false;
 
-  /* We use DImode for integer constants and DFmode for floating point
-     constants, since SFmode scalars are stored as DFmode in the PowerPC.  */
-  if (CONST_INT_P (op) || CONST_DOUBLE_P (op))
-    {
-      if (!convert_scalar_64bit_constant_to_bytes (op, vector_bytes,
-						   sizeof (vector_bytes)))
-	return false;
-
-      /* Change mode to value in the vector register.  */
-      mode = (CONST_INT_P (op)) ? E_DImode : E_DFmode;
-    }
-
-  /* For vector constants, get the whole vector.  */
-  else if (!convert_vector_constant_to_bytes (op, mode, vector_bytes,
-					      sizeof (vector_bytes)))
-    return false;
-
-  /* The vector_bytes array has the 8 bytes of the upper and lower constants in
-     big endian order. Convert these into 64-bit constants.  */
-  unsigned HOST_WIDE_INT df_upper = 0, df_lower = 0;
-  for (int i = 0; i < 8; i++)
-    {
-      df_upper = (df_upper << 8) | vector_bytes[i];
-      df_lower = (df_lower << 8) | vector_bytes[i+8];
-    }
-
-  /* Make sure that the two 64-bit segments are the same.  */
-  if (df_upper != df_lower)
-    return false;
-  
-  /* Avoid values that are easy to create with other instructions (0.0 for
-     floating point, and values that can be loaded with XXSPLTIB and sign
-     extension for integer.  */
-  if (op == CONST0_RTX (mode))
-    return false;
-
-  if (INTEGRAL_MODE_P (mode) && IN_RANGE (df_upper, -128, 127))
-    return false;
-
-  /* Avoid values that look like DFmode NaN's.  The IEEE 754 64-bit floating
-     format has 1 bit for sign, 11 bits for the exponent, and 52 bits for the
-     mantissa.  NaN values have the exponent set to all 1 bits, and the
-     mantissa non-zero (mantissa == 0 is infinity).  */
-
-  int df_exponent = (df_upper >> 52) & 0x7ff;
-  HOST_WIDE_INT df_mantissa = df_upper & HOST_WIDE_INT_C (0x1fffffffffffff);
-
-  if (df_exponent == 0x7ff && df_mantissa != 0)		/* NaN.  */
-    return false;
-
-  /* Avoid values that are DFmode subnormal values.  Subnormal numbers have
-     the exponent all 0 bits, and the mantissa non-zero.  If the value is
-     subnormal, then the hidden bit in the mantissa is not set.  */
-  if (df_exponent == 0 && df_mantissa != 0)		/* subnormal.  */
-    return false;
-
-  /* Change the representation to DFmode constant.  */
-  long df_words[2];
-  df_words[0] = (df_upper >> 32) & 0xffffffff;
-  df_words[1] = df_upper & 0xffffffff;
-
-  /* real_from_target takes the target words in  target order.  */
-  if (!BYTES_BIG_ENDIAN)
-    std::swap (df_words[0], df_words[1]);
-
-  REAL_VALUE_TYPE rv_type;
-  real_from_target (&rv_type, df_words, DFmode);
-
-  const REAL_VALUE_TYPE *rv = &rv_type;
-
-  /* Validate that the number can be stored as a SFmode value.  */
-  if (!exact_real_truncate (SFmode, rv))
-    return false;
-
-  /* Validate that the number is not a SFmode subnormal value (exponent is 0,
-     mantissa field is non-zero) which is undefined for the XXSPLTIDP
-     instruction.  */
-  long sf_value;
-  real_to_target (&sf_value, rv, SFmode);
-
-  /* IEEE 754 32-bit values have 1 bit for the sign, 8 bits for the exponent,
-     and 23 bits for the mantissa.  Subnormal numbers have the exponent all
-     0 bits, and the mantissa non-zero.  */
-  long sf_exponent = (sf_value >> 23) & 0xFF;
-  long sf_mantissa = sf_value & 0x7FFFFF;
-
-  if (sf_exponent == 0 && sf_mantissa != 0)
+  /* Convert the vector constant to bytes.  */
+  if (!vec_const_to_bytes (op, mode, &vec_const))
     return false;
 
-  return true;
+  return vec_const_use_xxspltidp (&vec_const);
 })
 
 ;; Return 1 if the operand is a constant that can loaded with a XXSPLTIB
diff --git a/gcc/config/rs6000/rs6000-protos.h b/gcc/config/rs6000/rs6000-protos.h
index 574b3d5e17e..da9502bcb33 100644
--- a/gcc/config/rs6000/rs6000-protos.h
+++ b/gcc/config/rs6000/rs6000-protos.h
@@ -32,15 +32,10 @@ extern void init_cumulative_args (CUMULATIVE_ARGS *, tree, rtx, int, int, int,
 
 extern int easy_altivec_constant (rtx, machine_mode);
 extern bool xxspltib_constant_p (rtx, machine_mode, int *, int *);
-extern long xxspltidp_constant_immediate (rtx, machine_mode);
 extern int vspltis_shifted (rtx);
 extern HOST_WIDE_INT const_vector_elt_as_int (rtx, unsigned int);
 extern bool macho_lo_sum_memory_operand (rtx, machine_mode);
 extern int num_insns_constant (rtx, machine_mode);
-extern bool convert_vector_constant_to_bytes (rtx, machine_mode,
-					      unsigned char [], size_t);
-extern bool convert_scalar_64bit_constant_to_bytes (rtx, unsigned char [],
-						    size_t);
 extern int small_data_operand (rtx, machine_mode);
 extern bool mem_operand_gpr (rtx, machine_mode);
 extern bool mem_operand_ds_form (rtx, machine_mode);
@@ -228,6 +223,31 @@ address_is_prefixed (rtx addr,
   return (iform == INSN_FORM_PREFIXED_NUMERIC
 	  || iform == INSN_FORM_PCREL_LOCAL);
 }
+
+/* Functions and data structures relating to 128-bit vector constants.  All
+   fields are kept in big endian order.  */
+#define VECTOR_CONST_BITS	128
+#define VECTOR_CONST_BYTES	(VECTOR_CONST_BITS / 8)
+#define VECTOR_CONST_16BIT	(VECTOR_CONST_BITS / 16)
+#define VECTOR_CONST_32BIT	(VECTOR_CONST_BITS / 32)
+#define VECTOR_CONST_64BIT	(VECTOR_CONST_BITS / 64)
+
+typedef struct {
+  /* Vector constant as various sized items.  */
+  unsigned char bytes[VECTOR_CONST_BYTES];
+  unsigned short h_words[VECTOR_CONST_16BIT];
+  unsigned int words[VECTOR_CONST_32BIT];
+  unsigned HOST_WIDE_INT d_words[VECTOR_CONST_64BIT];
+  machine_mode orig_mode;		/* Original mode.  */
+  enum rtx_code orig_code;		/* Original rtx code.  */
+  bool is_xxspltidp;			/* Use XXSPLTIDP to load constant.  */
+  machine_mode xxspltidp_mode;		/* Mode to use for XXSPLTIDP.  */
+  unsigned int xxspltidp_immediate;	/* Immediate value for XXSPLTIDP.  */
+  bool is_prefixed;			/* Prefixed instruction used.  */
+} rs6000_vec_const;
+
+extern bool vec_const_to_bytes (rtx, machine_mode, rs6000_vec_const *);
+extern bool vec_const_use_xxspltidp (rs6000_vec_const *);
 #endif /* RTX_CODE */
 
 #ifdef TREE_CODE
diff --git a/gcc/config/rs6000/rs6000.c b/gcc/config/rs6000/rs6000.c
index a433c7c9386..35f5cc8f89e 100644
--- a/gcc/config/rs6000/rs6000.c
+++ b/gcc/config/rs6000/rs6000.c
@@ -6502,179 +6502,6 @@ num_insns_constant (rtx op, machine_mode mode)
   return num_insns_constant_multi (val, mode);
 }
 
-/* Convert a constant OP which has mode MODE into into BYTES (which is
-   NUM_BYTES long).  Return false if the we cannot convert the constant to a
-   series of bytes.  This code supports normal constants and vector constants.
-   In addition to CONST_VECTOR, we also support constant vectors formed with
-   VEC_DUPLICATE.  Return false if we don't recognize the constant.  If OP is a
-   scalar, it is assumed to be a vector element.
-
-   We return the bytes in big endian order, i.e. for 128-bit vectors, byte 0 is
-   the most significant byte, and byte 15 is the least significant byte.  */
-
-bool
-convert_vector_constant_to_bytes (rtx op,
-				  machine_mode mode,
-				  unsigned char bytes[],
-				  size_t num_bytes)
-{
-  /* If we don't know the size of the constant, punt.  */
-  if (mode == VOIDmode)
-    return false;
-
-  /* Is the buffer too small?  Punt.  */
-  if (num_bytes < GET_MODE_SIZE (mode))
-    return false;
-
-  switch (GET_CODE (op))
-    {
-      /* Integer constants.  */
-    case CONST_INT:
-      {
-	unsigned bitsize = GET_MODE_BITSIZE (mode);
-	unsigned HOST_WIDE_INT uvalue = UINTVAL (op);
-	size_t byte_num = 0;
-
-	for (int shift = bitsize - 8; shift >= 0; shift -= 8)
-	  bytes[byte_num++] = (uvalue >> shift) & 0xff;
-
-	break;
-      }
-
-      /* Floating point constants.  */
-    case CONST_DOUBLE:
-      {
-	unsigned bitsize = GET_MODE_BITSIZE (mode);
-	unsigned num_words = bitsize / 32;
-	const REAL_VALUE_TYPE *rtype = CONST_DOUBLE_REAL_VALUE (op);
-	size_t byte_num = 0;
-	long real_words[4];
-
-	/* Make sure we don't overflow the real_words array and that it is
-	   filled completely.  */
-	if (bitsize > 128 || (bitsize % 32) != 0)
-	  return false;
-
-	real_to_target (real_words, rtype, mode);
-
-	/* Iterate over each 32-bit word in the floating point constant.  The
-	   real_to_target function puts out words in endian fashion.  We need
-	   to arrange so the bytes are written in big endian order.  */
-	for (unsigned num = 0; num < num_words; num++)
-	  {
-	    unsigned endian_num = (BYTES_BIG_ENDIAN
-				   ? num
-				   : num_words - 1 - num);
-
-	    unsigned uvalue = real_words[endian_num];
-	    for (int shift = 32 - 8; shift >= 0; shift -= 8)
-	      bytes[byte_num++] = (uvalue >> shift) & 0xff;
-	  }
-
-	break;
-      }
-
-      /* Vector constants, iterate each element.  On little endian systems, we
-	 have to reverse the element numbers.  */
-    case CONST_VECTOR:
-      {
-	machine_mode ele_mode = GET_MODE_INNER (mode);
-	size_t nunits = GET_MODE_NUNITS (mode);
-	size_t size = GET_MODE_SIZE (ele_mode);
-
-	for (size_t num = 0; num < nunits; num++)
-	  {
-	    rtx ele = CONST_VECTOR_ELT (op, num);
-	    size_t byte_num = (BYTES_BIG_ENDIAN
-			       ? num
-			       : nunits - 1 - num) * size;
-
-	    if (!convert_vector_constant_to_bytes (ele, ele_mode,
-						   &bytes[byte_num], size))
-	      return false;
-	  }
-
-	break;
-      }
-
-      /* Vector constants, formed with VEC_DUPLICATE of a constant.  */
-    case VEC_DUPLICATE:
-      {
-	machine_mode ele_mode = GET_MODE_INNER (mode);
-	size_t nunits = GET_MODE_NUNITS (mode);
-	size_t size = GET_MODE_SIZE (ele_mode);
-	rtx ele = XEXP (op, 0);
-	size_t byte_num = 0;
-
-	for (size_t num = 0; num < nunits; num++)
-	  {
-	    if (!convert_vector_constant_to_bytes (ele, ele_mode,
-						   &bytes[byte_num], size))
-	      return false;
-
-	    byte_num += size;
-	  }
-
-	break;
-      }
-
-      /* Any thing else, just return failure.  */
-    default:
-      return false;
-    }
-
-  return true;
-}
-
-/* Convert a CONST_INT or CONST_DOUBLE OP which has mode MODE into into BYTES
-   (which is NUM_BYTES long).  Return false if the we cannot convert the
-   constant to a series of bytes.  This function used for the XXSPLTIDP and
-   XXSPLTI32DX instructions that load up a vector register with a value into
-   the upper 64-bits of the vector register and then is splatted to the lower
-   64-bits.
-
-   We return the bytes in big endian order, i.e. for 128-bit vectors, byte 0 is
-   the most significant byte, and byte 15 is the least significant byte.  */
-
-bool
-convert_scalar_64bit_constant_to_bytes (rtx op,
-					unsigned char bytes[],
-					size_t num_bytes)
-{
-  machine_mode mode;
-
-  /* We use DImode for integer constants and DFmode for floating point
-     constants, since SFmode scalars are stored as DFmode in the PowerPC.  */
-  if (CONST_INT_P (op))
-    mode = DImode;
-
-  else if (CONST_DOUBLE_P (op))
-    {
-      if (GET_MODE (op) != SFmode && GET_MODE (op) != DFmode)
-	return false;
-
-      mode = DFmode;
-    }
-
-  else
-    return false;
-
-  /* Verify that the buffer is either scalar sized (64-bits) or vector
-     sized.  */
-  if (num_bytes != 8 && num_bytes != 16)
-    return false;
-
-  if (!convert_vector_constant_to_bytes (op, mode, bytes, 8))
-    return false;
-
-  /* If the caller wanted the bytes in a vector size, duplicate the bytes to
-     mimic the behavior of the XXSPLTIDP and XXSPLTI32DX instructions.  */
-  if (num_bytes == 16)
-    memcpy (&bytes[8], &bytes[0], 8);
-
-  return true;
-}
-
 /* Interpret element ELT of the CONST_VECTOR OP as an integer value.
    If the mode of OP is MODE_VECTOR_INT, this simply returns the
    corresponding element of the vector, but for V4SFmode, the
@@ -7119,58 +6946,6 @@ xxspltib_constant_p (rtx op,
   return true;
 }
 
-/* Return the 32-bit immediate value that is used for the XXSPLTIDP instruction
-   to load a DFmode value that is splatted into a 128-bit vector.  */
-
-long
-xxspltidp_constant_immediate (rtx op, machine_mode mode)
-{
-  long ret;
-  unsigned char vector_bytes[16];
-
-  gcc_assert (easy_vector_constant_64bit_element (op, mode));
-
-  /* We use DImode for integer constants and DFmode for floating point
-     constants, since SFmode scalars are stored as DFmode in the PowerPC.  */
-  if (CONST_INT_P (op) || CONST_DOUBLE_P (op))
-    {
-      if (!convert_scalar_64bit_constant_to_bytes (op, vector_bytes,
-						   sizeof (vector_bytes)))
-	gcc_unreachable ();
-
-      /* Change mode to value in the vector register.  */
-      mode = CONST_INT_P (op) ? E_DImode : E_DFmode;
-    }
-
-  /* For vector constants, get the whole vector.  */
-  else if (!convert_vector_constant_to_bytes (op, mode, vector_bytes,
-					      sizeof (vector_bytes)))
-    gcc_unreachable ();
-
-  /* The vector_bytes array has the 8 bytes of the upper and lower constants in
-     big endian order. Convert the upper 8 bytes into a 64-bit constant.  The
-     64-bit constant is represented by a pair of 32-bit constants.  Then
-     convert it to a DFmode constant.  The real value support functions take
-     things in target endian order, so we will need to swap things on little
-     endian.  */
-  long df_upper = 0, df_lower = 0;
-  for (int i = 0; i < 4; i++)
-    {
-      df_upper = (df_upper << 8) | vector_bytes[i];
-      df_lower = (df_lower << 8) | vector_bytes[i+4];
-    }
-
-  if (!BYTES_BIG_ENDIAN)
-    std::swap (df_upper, df_lower);
-
-  long df_words[2] = { df_upper, df_lower };
-  REAL_VALUE_TYPE r;
-  real_from_target (&r, &df_words[0], DFmode);
-  real_to_target (&ret, &r, SFmode);
-
-  return ret;
-}
-
 const char *
 output_vec_const_move (rtx *operands)
 {
@@ -7215,9 +6990,11 @@ output_vec_const_move (rtx *operands)
 	    gcc_unreachable ();
 	}
 
-      if (easy_vector_constant_64bit_element (vec, mode))
+      rs6000_vec_const vec_const;
+      if (vec_const_to_bytes (vec, mode, &vec_const)
+	  && vec_const_use_xxspltidp (&vec_const))
 	{
-	  operands[2] = GEN_INT (xxspltidp_constant_immediate (vec, mode));
+	  operands[2] = GEN_INT (vec_const.xxspltidp_immediate);
 	  return "xxspltidp %x0,%2";
 	}
 
@@ -26972,10 +26749,20 @@ prefixed_xxsplti_p (rtx_insn *insn)
   if (!REG_P (dest) && !SUBREG_P (dest))
     return false;
 
-  if (easy_vector_constant_64bit_element (src, mode))
-    return true;
+  if (GET_CODE (src) == UNSPEC)
+    {
+      int unspec = XINT (src, 1);
+      return (unspec == UNSPEC_XXSPLTIW
+	      || unspec == UNSPEC_XXSPLTIDP
+	      || unspec == UNSPEC_XXSPLTI32DX);
+    }
 
-  return false;
+  rs6000_vec_const vec_const;
+  if (!vec_const_to_bytes (src, mode, &vec_const))
+    return false;
+
+  return (vec_const.is_prefixed
+	  || vec_const_use_xxspltidp (&vec_const));
 }
 
 /* Whether the next instruction needs a 'p' prefix issued before the
@@ -28841,6 +28628,279 @@ rs6000_output_addr_vec_elt (FILE *file, int value)
   fprintf (file, "\n");
 }
 
+\f
+/* Copy an integer constant to the vector constant structure.  */
+
+static void
+vec_const_integer (rtx op,
+		   machine_mode mode,
+		   size_t byte_num,
+		   rs6000_vec_const *vec_const)
+{
+  unsigned HOST_WIDE_INT uvalue = UINTVAL (op);
+  unsigned bitsize = GET_MODE_BITSIZE (mode);
+
+  for (int shift = bitsize - 8; shift >= 0; shift -= 8)
+    vec_const->bytes[byte_num++] = (uvalue >> shift) & 0xff;
+}
+
+/* Copy an floating point constant to the vector constant structure.  */
+
+static void
+vec_const_floating_point (rtx op,
+			  machine_mode mode,
+			  size_t byte_num,
+			  rs6000_vec_const *vec_const)
+{
+  unsigned bitsize = GET_MODE_BITSIZE (mode);
+  unsigned num_words = bitsize / 32;
+  const REAL_VALUE_TYPE *rtype = CONST_DOUBLE_REAL_VALUE (op);
+  long real_words[VECTOR_CONST_32BIT];
+
+  /* Make sure we don't overflow the real_words array and that it is
+     filled completely.  */
+  gcc_assert (bitsize <= VECTOR_CONST_BITS && (bitsize % 32) == 0);
+
+  real_to_target (real_words, rtype, mode);
+
+  /* Iterate over each 32-bit word in the floating point constant.  The
+     real_to_target function puts out words in endian fashion.  We need
+     to arrange so the words are written in big endian order.  */
+  for (unsigned num = 0; num < num_words; num++)
+    {
+      unsigned endian_num = (BYTES_BIG_ENDIAN
+			     ? num
+			     : num_words - 1 - num);
+
+      unsigned uvalue = real_words[endian_num];
+      for (int shift = 32 - 8; shift >= 0; shift -= 8)
+	vec_const->bytes[byte_num++] = (uvalue >> shift) & 0xff;
+    }
+}
+
+/* Determine if a vector constant can be loaded with XXSPLTIDP.  If so,
+   fill out the fields used to generate the instruction.  */
+
+bool
+vec_const_use_xxspltidp (rs6000_vec_const *vec_const)
+{
+  if (!TARGET_XXSPLTIDP || !TARGET_PREFIXED || !TARGET_VSX)
+    return false;
+
+  /* Make sure that the two 64-bit segments are the same.  */
+  unsigned HOST_WIDE_INT df_upper = vec_const->d_words[0];
+  unsigned HOST_WIDE_INT df_lower = vec_const->d_words[1];
+  if (df_upper != df_lower)
+    return false;
+  
+  /* Avoid values that are easy to create with other instructions (0.0 for
+     floating point, and values that can be loaded with XXSPLTIB and sign
+     extension for integer.  */
+  if (df_upper == 0)
+    return false;
+
+  machine_mode mode = vec_const->orig_mode;
+  if (mode == VOIDmode)
+    mode = DImode;
+
+  if (!FLOAT_MODE_P (mode) && IN_RANGE (df_upper, -128, 127))
+    return false;
+
+  /* Avoid values that look like DFmode NaN's, except for the normal NaN bit
+     pattern and signalling NaN bit pattern.  Recognize infinity and negative
+     infinity.
+
+     The IEEE 754 64-bit floating format has 1 bit for sign, 11 bits for the
+     exponent, and 52 bits for the mantissa (not counting the hidden bit used
+     for normal numbers).  NaN values have the exponent set to all 1 bits, and
+     the mantissa non-zero (mantissa == 0 is infinity).  */
+
+#define VECTOR_CONST_DF_NAN	HOST_WIDE_INT_UC (0x7ff8000000000000)
+#define VECTOR_CONST_DF_NANS	HOST_WIDE_INT_UC (0x7ff4000000000000)
+#define VECTOR_CONST_DF_INF	HOST_WIDE_INT_UC (0x7ff0000000000000)
+#define VECTOR_CONST_DF_NEG_INF	HOST_WIDE_INT_UC (0xfff0000000000000)
+
+  if (df_upper != VECTOR_CONST_DF_NAN
+      && df_upper != VECTOR_CONST_DF_NANS
+      && df_upper != VECTOR_CONST_DF_INF
+      && df_upper != VECTOR_CONST_DF_NEG_INF)
+    {
+      int df_exponent = (df_upper >> 52) & 0x7ff;
+      unsigned HOST_WIDE_INT df_mantissa
+	= df_upper & ((HOST_WIDE_INT_1U << 52) - HOST_WIDE_INT_1U);
+
+      if (df_exponent == 0x7ff && df_mantissa != 0)	/* other NaNs.  */
+	return false;
+
+      /* Avoid values that are DFmode subnormal values.  Subnormal numbers have
+	 the exponent all 0 bits, and the mantissa non-zero.  If the value is
+	 subnormal, then the hidden bit in the mantissa is not set.  */
+      if (df_exponent == 0 && df_mantissa != 0)		/* subnormal.  */
+	return false;
+    }
+
+  /* Change the representation to DFmode constant.  */
+  long df_words[2] = { vec_const->words[0], vec_const->words[1] };
+
+  /* real_from_target takes the target words in  target order.  */
+  if (!BYTES_BIG_ENDIAN)
+    std::swap (df_words[0], df_words[1]);
+
+  REAL_VALUE_TYPE rv_type;
+  real_from_target (&rv_type, df_words, DFmode);
+
+  const REAL_VALUE_TYPE *rv = &rv_type;
+
+  /* Validate that the number can be stored as a SFmode value.  */
+  if (!exact_real_truncate (SFmode, rv))
+    return false;
+
+  /* Validate that the number is not a SFmode subnormal value (exponent is 0,
+     mantissa field is non-zero) which is undefined for the XXSPLTIDP
+     instruction.  */
+  long sf_value;
+  real_to_target (&sf_value, rv, SFmode);
+
+  /* IEEE 754 32-bit values have 1 bit for the sign, 8 bits for the exponent,
+     and 23 bits for the mantissa.  Subnormal numbers have the exponent all
+     0 bits, and the mantissa non-zero.  */
+  long sf_exponent = (sf_value >> 23) & 0xFF;
+  long sf_mantissa = sf_value & 0x7FFFFF;
+
+  if (sf_exponent == 0 && sf_mantissa != 0)
+    return false;
+
+  /* Record the information in the vec_const structure for XXSPLTIDP.  */
+  vec_const->is_xxspltidp = true;
+  vec_const->is_prefixed = true;
+  vec_const->xxspltidp_immediate = sf_value;
+  vec_const->xxspltidp_mode = FLOAT_MODE_P (mode) ? E_DFmode : E_DImode;
+
+  return true;
+}
+
+/* Convert a vector constant to an internal structure, breaking it out to
+   bytes, half words, words, and double words.  Return true if we have
+   successfully broken it out.  */
+
+bool
+vec_const_to_bytes (rtx op,
+		    machine_mode mode,
+		    rs6000_vec_const *vec_const)
+{
+  /* Initialize vec const structure.  */
+  memset ((void *)vec_const, 0, sizeof (rs6000_vec_const));
+
+  /* If we don't know the size of the constant, punt.  */
+  if (mode == VOIDmode)
+    return false;
+
+  switch (GET_CODE (op))
+    {
+      /* Integer constants, default to double word.  */
+    case CONST_INT:
+      {
+	if (mode == VOIDmode)
+	  mode = DImode;
+
+	vec_const_integer (op, mode, 0, vec_const);
+
+	/* Splat the constant to the rest of the vector constant structure.  */
+	unsigned size = GET_MODE_SIZE (mode);
+	gcc_assert (size <= VECTOR_CONST_BYTES);
+	gcc_assert ((VECTOR_CONST_BYTES % size) == 0);
+
+	for (size_t splat = size; splat < VECTOR_CONST_BYTES; splat += size)
+	  memcpy ((void *) &vec_const->bytes[splat],
+		  (void *) &vec_const->bytes[0],
+		  size);
+	break;
+      }
+
+      /* Floating point constants.  */
+    case CONST_DOUBLE:
+      {
+	vec_const_floating_point (op, mode, 0, vec_const);
+
+	/* Splat the constant to the rest of the vector constant structure.  */
+	unsigned size = GET_MODE_SIZE (mode);
+	gcc_assert (size <= VECTOR_CONST_BYTES);
+	gcc_assert ((VECTOR_CONST_BYTES % size) == 0);
+
+	for (size_t splat = size; splat < VECTOR_CONST_BYTES; splat += size)
+	  memcpy ((void *) &vec_const->bytes[splat],
+		  (void *) &vec_const->bytes[0],
+		  size);
+	break;
+      }
+
+      /* Vector constants, iterate each element.  On little endian systems, we
+	 have to reverse the element numbers.  Also handle VEC_DUPLICATE.  */
+    case CONST_VECTOR:
+    case VEC_DUPLICATE:
+      {
+	machine_mode ele_mode = GET_MODE_INNER (mode);
+	size_t nunits = GET_MODE_NUNITS (mode);
+	size_t size = GET_MODE_SIZE (ele_mode);
+
+	for (size_t num = 0; num < nunits; num++)
+	  {
+	    rtx ele = (GET_CODE (op) == VEC_DUPLICATE
+		       ? XEXP (op, 0)
+		       : CONST_VECTOR_ELT (op, num));
+	    size_t byte_num = (BYTES_BIG_ENDIAN
+			       ? num
+			       : nunits - 1 - num) * size;
+
+	    if (CONST_INT_P (ele))
+	      vec_const_integer (ele, ele_mode, byte_num, vec_const);
+	    else if (CONST_DOUBLE_P (ele))
+	      vec_const_floating_point (ele, ele_mode, byte_num, vec_const);
+	    else
+	      return false;
+	  }
+
+	break;
+      }
+
+      /* Any thing else, just return failure.  */
+    default:
+      return false;
+    }
+
+  /* Pack half words together.  */
+  for (size_t i = 0; i <= VECTOR_CONST_16BIT; i++)
+    vec_const->h_words[i] = ((vec_const->bytes[2*i] << 8)
+			     | vec_const->bytes[2*i + 1]);
+
+  /* Pack words together.  */
+  for (size_t i = 0; i <= VECTOR_CONST_32BIT; i++)
+    {
+      unsigned word = 0;
+      for (size_t j = 0; j < 4; j++)
+	word = (word << 8) | vec_const->bytes[(4*i) + j];
+
+      vec_const->words[i] = word;
+    }
+
+  /* Pack double words together.  */
+  for (size_t i = 0; i <= VECTOR_CONST_64BIT; i++)
+    {
+      unsigned HOST_WIDE_INT d_word = 0;
+      for (size_t j = 0; j < 8; j++)
+	d_word = (d_word << 8) | vec_const->bytes[(8*i) + j];
+
+      vec_const->d_words[i] = d_word;
+    }
+
+  /* Remember original mode and code.  */
+  vec_const->orig_mode = mode;
+  vec_const->orig_code = GET_CODE (op);
+
+  return true;
+}
+
+\f
 struct gcc_target targetm = TARGET_INITIALIZER;
 
 #include "gt-rs6000.h"
diff --git a/gcc/config/rs6000/vsx.md b/gcc/config/rs6000/vsx.md
index 48ecb41801c..751a82e7710 100644
--- a/gcc/config/rs6000/vsx.md
+++ b/gcc/config/rs6000/vsx.md
@@ -6480,9 +6480,13 @@
   [(set (match_dup 0)
 	(unspec:XXSPLTIDP [(match_dup 2)] UNSPEC_XXSPLTIDP))]
 {
-  long immediate = xxspltidp_constant_immediate (operands[1], <MODE>mode);
-  operands[2] = GEN_INT (immediate);
-  })
+  rs6000_vec_const vec_const;
+  if (!vec_const_to_bytes (operands[1], <MODE>mode, &vec_const)
+      || !vec_const_use_xxspltidp (&vec_const))
+    gcc_unreachable ();
+
+  operands[2] = GEN_INT (vec_const.xxspltidp_immediate);
+})
 
 ;; XXSPLTI32DX built-in function support
 (define_expand "xxsplti32dx_v4si"


^ permalink raw reply	[flat|nested] only message in thread

only message in thread, other threads:[~2021-10-13 18:46 UTC | newest]

Thread overview: (only message) (download: mbox.gz / follow: Atom feed)
-- links below jump to the message on this page --
2021-10-13 18:46 [gcc(refs/users/meissner/heads/work071)] Rework XXSPLTIDP support Michael Meissner

This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for read-only IMAP folder(s) and NNTP newsgroup(s).