public inbox for gcc-cvs@sourceware.org
help / color / mirror / Atom feed
* [gcc(refs/users/meissner/heads/work086)] Add -mstore-vector-pair and -mno-store-vector-pair.
@ 2022-04-21 18:24 Michael Meissner
0 siblings, 0 replies; only message in thread
From: Michael Meissner @ 2022-04-21 18:24 UTC (permalink / raw)
To: gcc-cvs
https://gcc.gnu.org/g:0a1fcebce6f3c83c8ee6c4ef2f41dc3598812a18
commit 0a1fcebce6f3c83c8ee6c4ef2f41dc3598812a18
Author: Michael Meissner <meissner@linux.ibm.com>
Date: Thu Apr 21 14:24:26 2022 -0400
Add -mstore-vector-pair and -mno-store-vector-pair.
2022-04-21 Michael Meissner <meissner@linux.ibm.com>
gcc/
* config/rs6000/mma.md (movoo): Delete.
(movoo_stxvp): New insn for -mstore-vector-pair.
(movoo_no_stxvp): New insn for -mno-store-vector-pair.
(movxo): Delete.
(movxo_stxvp): New insn for -mstore-vector-pair.
(movxo_no_stxvp): New insn for -mno-store-vector-pair.
* config/rs6000/rs6000.opt (-mstore-vector-pair): New option.
* doc/invoke.texi (RS/6000 & PowerPC Options): Document
-mstore-vector-pair and -mno-store-vector-pair.
gcc/testsuite/
* gcc.target/powerpc/p10-store-vector-pair-1.c: New test.
* gcc.target/powerpc/p10-store-vector-pair-2.c: New test.
Diff:
---
gcc/config/rs6000/mma.md | 53 ++++++++++++--
gcc/config/rs6000/rs6000.opt | 4 ++
gcc/doc/invoke.texi | 8 ++-
.../gcc.target/powerpc/p10-store-vector-pair-1.c | 82 ++++++++++++++++++++++
.../gcc.target/powerpc/p10-store-vector-pair-2.c | 81 +++++++++++++++++++++
5 files changed, 223 insertions(+), 5 deletions(-)
diff --git a/gcc/config/rs6000/mma.md b/gcc/config/rs6000/mma.md
index 907c9d6d516..6715da6226d 100644
--- a/gcc/config/rs6000/mma.md
+++ b/gcc/config/rs6000/mma.md
@@ -274,10 +274,12 @@
DONE;
})
-(define_insn_and_split "*movoo"
+;; Possibly generate store vector pair instructions or split them to two
+;; separate store vector instructions.
+(define_insn_and_split "*movoo_stxvp"
[(set (match_operand:OO 0 "nonimmediate_operand" "=wa,m,wa")
(match_operand:OO 1 "input_operand" "m,wa,wa"))]
- "TARGET_MMA
+ "TARGET_MMA && TARGET_STORE_VECTOR_PAIR
&& (gpc_reg_operand (operands[0], OOmode)
|| gpc_reg_operand (operands[1], OOmode))"
"@
@@ -295,6 +297,27 @@
(set_attr "size" "256")
(set_attr "length" "*,*,8")])
+(define_insn_and_split "*movoo_no_stxvp"
+ [(set (match_operand:OO 0 "nonimmediate_operand" "=wa,oQ,wa")
+ (match_operand:OO 1 "input_operand" "m,wa,wa"))]
+ "TARGET_MMA && !TARGET_STORE_VECTOR_PAIR
+ && (gpc_reg_operand (operands[0], OOmode)
+ || gpc_reg_operand (operands[1], OOmode))"
+ "@
+ lxvp%X1 %x0,%1
+ #
+ #"
+ "&& reload_completed && !MEM_P (operands[1])"
+ [(const_int 0)]
+{
+ rs6000_split_multireg_move (operands[0], operands[1]);
+ DONE;
+}
+ [(set_attr "type" "vecload,vecstore,veclogical")
+ (set_attr "size" "256")
+ (set_attr "length" "*,8,8")
+ (set_attr "max_prefixed_insns" "*,2,*")])
+
\f
;; Vector quad support. XOmode can only live in FPRs.
(define_expand "movxo"
@@ -306,10 +329,12 @@
DONE;
})
-(define_insn_and_split "*movxo"
+;; Possibly generate store vector pair instructions or split them to two
+;; separate store vector instructions.
+(define_insn_and_split "*movxo_stxvp"
[(set (match_operand:XO 0 "nonimmediate_operand" "=d,m,d")
(match_operand:XO 1 "input_operand" "m,d,d"))]
- "TARGET_MMA
+ "TARGET_MMA && TARGET_STORE_VECTOR_PAIR
&& (gpc_reg_operand (operands[0], XOmode)
|| gpc_reg_operand (operands[1], XOmode))"
"@
@@ -326,6 +351,26 @@
(set_attr "length" "*,*,16")
(set_attr "max_prefixed_insns" "2,2,*")])
+(define_insn_and_split "*movxo_no_stxvp"
+ [(set (match_operand:XO 0 "nonimmediate_operand" "=d,m,d")
+ (match_operand:XO 1 "input_operand" "m,d,d"))]
+ "TARGET_MMA && !TARGET_STORE_VECTOR_PAIR
+ && (gpc_reg_operand (operands[0], XOmode)
+ || gpc_reg_operand (operands[1], XOmode))"
+ "@
+ #
+ #
+ #"
+ "&& reload_completed"
+ [(const_int 0)]
+{
+ rs6000_split_multireg_move (operands[0], operands[1]);
+ DONE;
+}
+ [(set_attr "type" "vecload,vecstore,veclogical")
+ (set_attr "length" "*,*,16")
+ (set_attr "max_prefixed_insns" "2,4,*")])
+
(define_expand "vsx_assemble_pair"
[(match_operand:OO 0 "vsx_register_operand")
(match_operand:V16QI 1 "mma_assemble_input_operand")
diff --git a/gcc/config/rs6000/rs6000.opt b/gcc/config/rs6000/rs6000.opt
index 6c4caf4c9ee..0330eb6c60e 100644
--- a/gcc/config/rs6000/rs6000.opt
+++ b/gcc/config/rs6000/rs6000.opt
@@ -624,6 +624,10 @@ mieee128-constant
Target Var(TARGET_IEEE128_CONSTANT) Init(1) Save
Generate (do not generate) code that uses the LXVKQ instruction.
+mstore-vector-pair
+Target Var(TARGET_STORE_VECTOR_PAIR) Init(1) Save
+Generate (do not generate) code that uses the store vector pair instructions.
+
-param=rs6000-density-pct-threshold=
Target Undocumented Joined UInteger Var(rs6000_density_pct_threshold) Init(85) IntegerRange(0, 100) Param
When costing for loop vectorization, we probably need to penalize the loop body
diff --git a/gcc/doc/invoke.texi b/gcc/doc/invoke.texi
index a55bd047509..d7f1caf8fb4 100644
--- a/gcc/doc/invoke.texi
+++ b/gcc/doc/invoke.texi
@@ -1275,7 +1275,7 @@ See RS/6000 and PowerPC Options.
-mstack-protector-guard=@var{guard} -mstack-protector-guard-reg=@var{reg} @gol
-mstack-protector-guard-offset=@var{offset} -mprefixed -mno-prefixed @gol
-mpcrel -mno-pcrel -mmma -mno-mmma -mrop-protect -mno-rop-protect @gol
--mprivileged -mno-privileged}
+-mprivileged -mno-privileged -mstore-vector-pair -mno-store-vector-pair}
@emph{RX Options}
@gccoptlist{-m64bit-doubles -m32bit-doubles -fpu -nofpu@gol
@@ -29359,6 +29359,12 @@ Generate (do not generate) code that will run in privileged state.
@opindex no-block-ops-unaligned-vsx
Generate (do not generate) unaligned vsx loads and stores for
inline expansion of @code{memcpy} and @code{memmove}.
+
+@item -mstore-vector-pair
+@itemx -mno-store-vector-pair
+@opindex mstore-vector-pair
+@opindex mno-store-vector-pair
+Generate (do not generate) code that uses the store vector pair instructions.
@end table
@node RX Options
diff --git a/gcc/testsuite/gcc.target/powerpc/p10-store-vector-pair-1.c b/gcc/testsuite/gcc.target/powerpc/p10-store-vector-pair-1.c
new file mode 100644
index 00000000000..197ec2e058e
--- /dev/null
+++ b/gcc/testsuite/gcc.target/powerpc/p10-store-vector-pair-1.c
@@ -0,0 +1,82 @@
+/* { dg-require-effective-target power10_ok } */
+/* { dg-options "-mdejagnu-cpu=power10 -O2 -mstore-vector-pair -mmma" } */
+
+/* Test if we generate store vector pair instructions if the user uses the
+ -mstore-vector-pair option. */
+static __vector_quad sq;
+static __vector_pair sp;
+
+void
+load_store_pair (__vector_pair *p, __vector_pair *q)
+{
+ *p = *q; /* lxvp, stxvp. */
+}
+
+void
+load_store_pair_1 (__vector_pair *p, __vector_pair *q)
+{
+ p[1] = q[1]; /* lxvp, stxvp. */
+}
+
+void
+load_store_pair_0x10000 (__vector_pair *p, __vector_pair *q)
+{
+ p[0x10000] = q[0x10000]; /* plxvp, pstxvp. */
+}
+
+void
+load_store_pair_n (__vector_pair *p, __vector_pair *q, unsigned long n)
+{
+ p[n] = q[n]; /* lxvpx, 2x stxvp. */
+}
+
+void
+load_pair_static (__vector_pair *p)
+{
+ *p = sp; /* plxvp, stxvp. */
+}
+
+void
+store_pair_static (__vector_pair *p)
+{
+ sp = *p; /* lxvp, pstxvp. */
+}
+
+void
+load_store_quad (__vector_quad *p, __vector_quad *q)
+{
+ *p = *q; /* 2x lxvp, 2x stxvp. */
+}
+
+void
+load_store_quad_1 (__vector_quad *p, __vector_quad *q)
+{
+ p[1] = q[1]; /* 2x lxvp, 2x stxvp. */
+}
+
+void
+load_store_quad_0x10000 (__vector_quad *p, __vector_quad *q)
+{
+ p[0x10000] = q[0x10000]; /* 2x plxvp, 2x pstxvp. */
+}
+
+void
+load_store_quad_n (__vector_quad *p, __vector_quad *q, unsigned long n)
+{
+ p[n] = q[n]; /* 2x lxvp, 2x stxv. */
+}
+
+void
+load_quad_static (__vector_quad *p)
+{
+ *p = sq; /* 2x plxvp, 2x stxvp. */
+}
+
+void
+store_quad_static (__vector_quad *p)
+{
+ sq = *p; /* 2x lxvp, 2x stxvp. */
+}
+
+/* { dg-final { scan-assembler {\mp?vstxvpx?\M} } } */
+
diff --git a/gcc/testsuite/gcc.target/powerpc/p10-store-vector-pair-2.c b/gcc/testsuite/gcc.target/powerpc/p10-store-vector-pair-2.c
new file mode 100644
index 00000000000..b8c3bdbfd89
--- /dev/null
+++ b/gcc/testsuite/gcc.target/powerpc/p10-store-vector-pair-2.c
@@ -0,0 +1,81 @@
+/* { dg-require-effective-target power10_ok } */
+/* { dg-options "-mdejagnu-cpu=power10 -O2 -mno-store-vector-pair -mmma" } */
+
+/* Test if we do not generate store vector pair instructions if the user uses
+ the -mno-store-vector-pair option. */
+static __vector_quad sq;
+static __vector_pair sp;
+
+void
+load_store_pair (__vector_pair *p, __vector_pair *q)
+{
+ *p = *q; /* lxvp, 2x stxv. */
+}
+
+void
+load_store_pair_1 (__vector_pair *p, __vector_pair *q)
+{
+ p[1] = q[1]; /* lxvp, 2x stxv. */
+}
+
+void
+load_store_pair_0x10000 (__vector_pair *p, __vector_pair *q)
+{
+ p[0x10000] = q[0x10000]; /* plxvp, 2x pstxv. */
+}
+
+void
+load_store_pair_n (__vector_pair *p, __vector_pair *q, unsigned long n)
+{
+ p[n] = q[n]; /* lxvpx, 2x stxv. */
+}
+
+void
+load_pair_static (__vector_pair *p)
+{
+ *p = sp; /* plxvp, 2x stxv. */
+}
+
+void
+store_pair_static (__vector_pair *p)
+{
+ sp = *p; /* lxvp, 2x pstxv. */
+}
+
+void
+load_store_quad (__vector_quad *p, __vector_quad *q)
+{
+ *p = *q; /* 2x lxvp, 4x stxv. */
+}
+
+void
+load_store_quad_1 (__vector_quad *p, __vector_quad *q)
+{
+ p[1] = q[1]; /* 2x lxvp, 4x stxv. */
+}
+
+void
+load_store_quad_0x10000 (__vector_quad *p, __vector_quad *q)
+{
+ p[0x10000] = q[0x10000]; /* 2x plxvp, 4x pstxv. */
+}
+
+void
+load_store_quad_n (__vector_quad *p, __vector_quad *q, unsigned long n)
+{
+ p[n] = q[n]; /* 2x lxvp, 4x stxv. */
+}
+
+void
+load_quad_static (__vector_quad *p)
+{
+ *p = sq; /* 2x plxvp, 4x stxv. */
+}
+
+void
+store_quad_static (__vector_quad *p)
+{
+ sq = *p; /* 2x lxvp, 4x pstxv. */
+}
+
+/* { dg-final { scan-assembler-not {\mp?vstxvpx?\M} } } */
^ permalink raw reply [flat|nested] only message in thread
only message in thread, other threads:[~2022-04-21 18:24 UTC | newest]
Thread overview: (only message) (download: mbox.gz / follow: Atom feed)
-- links below jump to the message on this page --
2022-04-21 18:24 [gcc(refs/users/meissner/heads/work086)] Add -mstore-vector-pair and -mno-store-vector-pair Michael Meissner
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for read-only IMAP folder(s) and NNTP newsgroup(s).