public inbox for gcc-patches@gcc.gnu.org
 help / color / mirror / Atom feed
From: Daniel Santos <daniel.santos@pobox.com>
To: Uros Bizjak <ubizjak@gmail.com>
Cc: gcc-patches <gcc-patches@gcc.gnu.org>, Jan Hubicka <hubicka@ucw.cz>
Subject: Re: [PATCH 09/12] [i386] Add patterns and predicates foutline-msabi-xlouges
Date: Tue, 02 May 2017 22:19:00 -0000	[thread overview]
Message-ID: <272376f2-178f-4d42-bc88-1555b54282f0@pobox.com> (raw)
In-Reply-To: <CAFULd4af60fqU-Sjfss5VwC8gcjZin8e_cngMuPk=Ubo1Rggzw@mail.gmail.com>

Thank you for the review.

On 05/01/2017 06:18 AM, Uros Bizjak wrote:
> On Thu, Apr 27, 2017 at 10:09 AM, Daniel Santos <daniel.santos@pobox.com> wrote:
>> Adds the predicates save_multiple and restore_multiple to predicates.md,
>> which are used by following patterns in sse.md:
>>
>> * save_multiple - insn that calls a save stub
>> * restore_multiple - call_insn that calls a save stub and returns to the
>>    function to allow a sibling call (which should typically offer better
>>    optimization than the restore stub as the tail call)
>> * restore_multiple_and_return - a jump_insn that returns from the
>>    function as a tail-call.
>> * restore_multiple_leave_return - like the above, but restores the frame
>>    pointer before returning.
>>
>> Signed-off-by: Daniel Santos <daniel.santos@pobox.com>
>> ---
>>   gcc/config/i386/predicates.md | 155 ++++++++++++++++++++++++++++++++++++++++++
>>   gcc/config/i386/sse.md        |  37 ++++++++++
>>   2 files changed, 192 insertions(+)
>>
>> diff --git a/gcc/config/i386/predicates.md b/gcc/config/i386/predicates.md
>> index 8f250a2e720..36fe8abc3f4 100644
>> --- a/gcc/config/i386/predicates.md
>> +++ b/gcc/config/i386/predicates.md
>> @@ -1657,3 +1657,158 @@
>>     (ior (match_operand 0 "register_operand")
>>          (and (match_code "const_int")
>>              (match_test "op == constm1_rtx"))))
>> +
>> +;; Return true if:
>> +;; 1. first op is a symbol reference,
>> +;; 2. >= 13 operands, and
>> +;; 3. operands 2 to end is one of:
>> +;;   a. save a register to a memory location, or
>> +;;   b. restore stack pointer.
>> +(define_predicate "save_multiple"
>> +  (match_code "parallel")
>> +{
>> +  const unsigned nregs = XVECLEN (op, 0);
>> +  rtx head = XVECEXP (op, 0, 0);
>> +  unsigned i;
>> +
>> +  if (GET_CODE (head) != USE)
>> +    return false;
>> +  else
>> +    {
>> +      rtx op0 = XEXP (head, 0);
>> +      if (op0 == NULL_RTX || GET_CODE (op0) != SYMBOL_REF)
>> +       return false;
>> +    }
>> +
>> +  if (nregs < 13)
>> +    return false;
>> +
>> +  for (i = 2; i < nregs; i++)
>> +    {
>> +      rtx e, src, dest;
>> +
>> +      e = XVECEXP (op, 0, i);
>> +
>> +      switch (GET_CODE (e))
>> +       {
>> +         case SET:
>> +           src  = SET_SRC (e);
>> +           dest = SET_DEST (e);
>> +
>> +           /* storing a register to memory.  */
>> +           if (GET_CODE (src) == REG && GET_CODE (dest) == MEM)
> Please use REG_P (...) and MEM_P (...) - and possible others -
> predicates in the code.
>
>> +             {
>> +               rtx addr = XEXP (dest, 0);
>> +
>> +               /* Good if dest address is in RAX.  */
>> +               if (GET_CODE (addr) == REG
>> +                   && REGNO (addr) == AX_REG)
>> +                 continue;
>> +
>> +               /* Good if dest address is offset of RAX.  */
>> +               if (GET_CODE (addr) == PLUS
>> +                   && GET_CODE (XEXP (addr, 0)) == REG
>> +                   && REGNO (XEXP (addr, 0)) == AX_REG)
>> +                 continue;
>> +             }
>> +           break;
>> +
>> +         default:
>> +           break;
>> +       }
>> +       return false;
>> +    }
>> +  return true;
>> +})
>> +
>> +;; Return true if:
>> +;; * first op is (return) or a a use (symbol reference),
>> +;; * >= 14 operands, and
>> +;; * operands 2 to end are one of:
>> +;;   - restoring a register from a memory location that's an offset of RSI.
>> +;;   - clobbering a reg
>> +;;   - adjusting SP
>> +(define_predicate "restore_multiple"
>> +  (match_code "parallel")
>> +{
>> +  const unsigned nregs = XVECLEN (op, 0);
>> +  rtx head = XVECEXP (op, 0, 0);
>> +  unsigned i;
>> +
>> +  switch (GET_CODE (head))
>> +    {
>> +      case RETURN:
>> +       i = 3;
>> +       break;
>> +
>> +      case USE:
>> +      {
>> +       rtx op0 = XEXP (head, 0);
>> +
>> +       if (op0 == NULL_RTX || GET_CODE (op0) != SYMBOL_REF)
>> +         return false;
>> +
>> +       i = 1;
>> +       break;
>> +      }
>> +
>> +      default:
>> +       return false;
>> +    }
>> +
>> +  if (nregs < i + 12)
>> +    return false;
>> +
>> +  for (; i < nregs; i++)
>> +    {
>> +      rtx e, src, dest;
>> +
>> +      e = XVECEXP (op, 0, i);
>> +
>> +      switch (GET_CODE (e))
>> +       {
>> +         case CLOBBER:
>> +           continue;
> I don't see where CLOBBER is genreated in ix86_emit_outlined_ms2sysv_restore.

I think this is clutter that I didn't remove after changing the stubs.

>> +
>> +         case SET:
>> +           src  = SET_SRC (e);
>> +           dest = SET_DEST (e);
>> +
>> +           /* Restoring a register from memory.  */
>> +           if (GET_CODE (src) == MEM && GET_CODE (dest) == REG)
>> +             {
>> +               rtx addr = XEXP (src, 0);
>> +
>> +               /* Good if src address is in RSI.  */
>> +               if (GET_CODE (addr) == REG
>> +                   && REGNO (addr) == SI_REG)
>> +                 continue;
>> +
>> +               /* Good if src address is offset of RSI.  */
>> +               if (GET_CODE (addr) == PLUS
>> +                   && GET_CODE (XEXP (addr, 0)) == REG
>> +                   && REGNO (XEXP (addr, 0)) == SI_REG)
>> +                 continue;
>> +
>> +               /* Good if adjusting stack pointer.  */
>> +               if (GET_CODE (dest) == REG
>> +                   && REGNO (dest) == SP_REG
>> +                   && GET_CODE (src) == PLUS
>> +                   && GET_CODE (XEXP (src, 0)) == REG
>> +                   && REGNO (XEXP (src, 0)) == SP_REG)
>> +                 continue;
>> +             }
>> +
>> +           /* Restoring stack pointer from another register.  */
>> +           if (GET_CODE (dest) == REG && REGNO (dest) == SP_REG
>> +               && GET_CODE (src) == REG)
>> +             continue;
>> +           break;
>> +
>> +         default:
>> +           break;
>> +       }
>> +       return false;
>> +    }
>> +  return true;
>> +})
> I think that the above functions should check only if the function is
> storing/restoring correct registers, all other RTXes should be
> explicitly written in the insn patterns.
>
>> diff --git a/gcc/config/i386/sse.md b/gcc/config/i386/sse.md
>> index e8ccb1e10c3..c9fe7274def 100644
>> --- a/gcc/config/i386/sse.md
>> +++ b/gcc/config/i386/sse.md
>> @@ -19997,3 +19997,40 @@
>>             (match_operand:VI48_512 1 "nonimmediate_operand" "vm")))]
>>     "TARGET_AVX512VPOPCNTDQ"
>>     "vpopcnt<ssemodesuffix>\t{%1, %0<mask_operand2>|%0<mask_operand2>, %1}")
>> +
>> +;; Save multiple registers out-of-line.
>> +(define_insn "save_multiple<mode>"
>> +  [(match_parallel 0 "save_multiple"
>> +    [(use (match_operand:P 1 "symbol_operand"))
>> +     (const_int 0)
>> +    ])]
>> +  "TARGET_SSE && TARGET_64BIT"
>> +  "call\t%P1")
> You probably don't need a (const_int 0) tag. According to the
> documentation, RTX matching guarantees subexpression match, so in the
> predicate you should check only stores of registers (as suggested
> above).
>
>> +;; Restore multiple registers out-of-line.
>> +(define_insn "restore_multiple<mode>"
>> +  [(match_parallel 0 "restore_multiple"
>> +    [(use (match_operand:P 1 "symbol_operand"))])]
>> +  "TARGET_SSE && TARGET_64BIT"
>> +  "call\t%P1")
>> +
>> +;; Restore multiple registers out-of-line and return.
>> +(define_insn "restore_multiple_and_return<mode>"
>> +  [(match_parallel 0 "restore_multiple"
>> +    [(return)
>> +     (use (match_operand:P 1 "symbol_operand"))
>> +     (const_int 0)
>> +    ])]
>> +  "TARGET_SSE && TARGET_64BIT"
>> +  "jmp\t%P1")
> No need for (const_int 0) tag.
>
>> +;; Restore multiple registers out-of-line when hard frame pointer is used,
>> +;; perform the leave operation prior to returning (from the function).
>> +(define_insn "restore_multiple_leave_return<mode>"
>> +  [(match_parallel 0 "restore_multiple"
>> +    [(return)
>> +     (use (match_operand:P 1 "symbol_operand"))
>> +     (const_int 1)
>> +    ])]
>> +  "TARGET_SSE && TARGET_64BIT"
>> +  "jmp\t%P1")
> You will have to write out all  sub-RTXes of the "leave" pattern,
> including clobber.
>
> I'd recommend that in the predicate, you check match_parallel from the
> bottom up, since subexpressions on the top are already matched, and
> you can have different number of subexpressions at the top.
>
> Uros.

OK, this all makes sense then. I was using const_int tags to 
differentiate the insns, but omitting the insns for the leave (for 
example) are what ambiguates them in the first place.

So one question I never had resolved is rather or not the order the 
insns in a parallel matters.  From your suggestions, I'm guessing that 
it would be perfectly OK for the leave insns to follow use symbol and 
then have the register restores after that, even though that wouldn't 
make sense from an assembly level because we would be writing beyond the 
stack pointer.  Am I reading this correctly?  If so, then putting the 
register save/restore matching in the predicate (checking top down) and 
having all others in the pattern make great sense and should both 
simplify it and make it more clear.

Also, I'm wondering if there's anything wrong with calling 
ix86_gen_leave () and plucking the insns out of the generated parallel 
insn and moving that into my own parallel rather than generating them in 
my own function.  I guess all the matters is what is cleanest.

Thanks,
Daniel


  reply	other threads:[~2017-05-02 22:11 UTC|newest]

Thread overview: 41+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2017-04-27  8:05 [PATCH v4 0/12] [i386] Improve 64-bit Microsoft to System V ABI pro/epilogues Daniel Santos
2017-04-27  8:05 ` [PATCH 01/12] [i386] Re-align stack frame prior to SSE saves Daniel Santos
2017-04-27  8:05 ` [PATCH 08/12] [i386] Modify ix86_compute_frame_layout for -mcall-ms2sysv-xlogues Daniel Santos
2017-04-27  8:05 ` [PATCH 10/12] [i386] Add ms2sysv pro/epilogue stubs to libgcc Daniel Santos
2017-04-27  8:05 ` [PATCH 03/12] [i386] Use re-aligned stack pointer for aligned SSE movs Daniel Santos
2017-04-27  8:05 ` [PATCH 05/12] [i386] Add option -mcall-ms2sysv-xlogues Daniel Santos
2017-04-28  6:00   ` Sandra Loosemore
2017-04-28  7:37     ` [PATCH 05/12 rev 1] " Daniel Santos
2017-04-27  8:05 ` [PATCH 09/12] [i386] Add patterns and predicates foutline-msabi-xlouges Daniel Santos
2017-05-01 11:18   ` Uros Bizjak
2017-05-02 22:19     ` Daniel Santos [this message]
2017-05-03  6:17       ` Uros Bizjak
2017-05-03  7:38         ` Daniel Santos
2017-05-03  8:38           ` Uros Bizjak
2017-05-04 21:35   ` [PATCH 09/12 rev1] [i386] Add patterns and predicates mcall-ms2sysv-xlogues Daniel Santos
2017-04-27  8:05 ` [PATCH 11/12] [i386] Add remainder of -mcall-ms2sysv-xlogues implementation Daniel Santos
2017-05-04 22:11   ` [PATCH 11/12 rev1] " Daniel Santos
2017-04-27  8:05 ` [PATCH 12/12] [i386,testsuite] Test program for ms to sysv abi function calls Daniel Santos
2017-05-17  9:52   ` Thomas Preudhomme
2017-04-27  8:05 ` [PATCH 02/12] [i386] Keep stack pointer valid after after re-alignment Daniel Santos
2017-04-27  8:23 ` [PATCH 04/12] [i386] Minor refactoring Daniel Santos
2017-04-27  8:44 ` [PATCH 07/12] [i386] Modify ix86_save_reg to optionally omit stub-managed registers Daniel Santos
2017-04-27  8:51 ` [PATCH 06/12] [i386] Add class xlogue_layout and new fields to struct machine_function Daniel Santos
2017-04-27 18:32 ` [PATCH v4 0/12 GCC8] [i386] Improve 64-bit Microsoft to System V ABI pro/epilogues Daniel Santos
2017-05-01 11:31 ` [PATCH v4 0/12] " Uros Bizjak
2017-05-02 10:25   ` JonY
2017-05-02 10:45     ` Kai Tietz
2017-05-03  6:01       ` Daniel Santos
2017-05-05  9:05       ` Daniel Santos
2017-05-06 20:41         ` Daniel Santos
2017-05-08 20:07           ` Daniel Santos
2017-05-03  4:32     ` Daniel Santos
2017-05-13  0:01 ` [PING] " Daniel Santos
2017-05-13 18:29   ` Uros Bizjak
2017-05-13 23:43     ` Daniel Santos
2017-05-14 10:25       ` Uros Bizjak
2017-07-26 19:03         ` H.J. Lu
2017-07-27  0:36           ` Daniel Santos
2017-07-28 13:51           ` Daniel Santos
2017-07-28 14:41             ` H.J. Lu
2017-07-31 10:25               ` Daniel Santos

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=272376f2-178f-4d42-bc88-1555b54282f0@pobox.com \
    --to=daniel.santos@pobox.com \
    --cc=gcc-patches@gcc.gnu.org \
    --cc=hubicka@ucw.cz \
    --cc=ubizjak@gmail.com \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for read-only IMAP folder(s) and NNTP newsgroup(s).