public inbox for gcc-patches@gcc.gnu.org
 help / color / mirror / Atom feed
From: Shahab Vahedi <Shahab.Vahedi@synopsys.com>
To: Claudiu Zissulescu Ianculescu <claziss@gmail.com>,
	Shahab Vahedi <Shahab.Vahedi@synopsys.com>
Cc: "gcc-patches@gcc.gnu.org" <gcc-patches@gcc.gnu.org>,
	Francois Bedard <Francois.Bedard@synopsys.com>
Subject: Re: [PATCH 2/2] ARC: Use intrinsics for __builtin_sub_overflow*()
Date: Fri, 19 Apr 2024 07:20:03 +0000	[thread overview]
Message-ID: <dbccee78-62eb-4af9-a3f0-cbb5e37029ab@synopsys.com> (raw)
In-Reply-To: <CAL0iMy2uqa+u8PMbkjYxgu7BO4t9Lv+-CjFaTyGDzdzK00fPUA@mail.gmail.com>

Hi Claudiu,

On 9/7/23 12:15, Claudiu Zissulescu Ianculescu wrote:
> OK,
> 
> Thank you for your contribution,
> Claudiu

Could you commit this patch?

> 
> On Wed, Sep 6, 2023 at 3:50 PM Shahab Vahedi <Shahab.Vahedi@synopsys.com> wrote:
>>
>> This patch covers signed and unsigned subtractions.  The generated code
>> would be something along these lines:
>>
>> signed:
>>   sub.f   r0, r1, r2
>>   b.v     @label
>>
>> unsigned:
>>   sub.f   r0, r1, r2
>>   b.c     @label
>>
>> gcc/ChangeLog:
>>
>>         * config/arc/arc.md (subsi3_v): New insn.
>>         (subvsi4): New expand.
>>         (subsi3_c): New insn.
>>         (usubvsi4): New expand.
>>
>> gcc/testsuite/ChangeLog:
>>
>>         * gcc.target/arc/overflow-2.c: New.
>>
>> Signed-off-by: Shahab Vahedi <shahab@synopsys.com>
>> ---
>>  gcc/config/arc/arc.md                     | 48 +++++++++++
>>  gcc/testsuite/gcc.target/arc/overflow-2.c | 97 +++++++++++++++++++++++
>>  2 files changed, 145 insertions(+)
>>  create mode 100644 gcc/testsuite/gcc.target/arc/overflow-2.c
>>
>> diff --git a/gcc/config/arc/arc.md b/gcc/config/arc/arc.md
>> index 9d011f6b4a9..34e9e1a7f1d 100644
>> --- a/gcc/config/arc/arc.md
>> +++ b/gcc/config/arc/arc.md
>> @@ -2973,6 +2973,54 @@ archs4x, archs4xd"
>>    (set_attr "cpu_facility" "*,cd,*,*,*,*,*,*,*,*")
>>    ])
>>
>> +(define_insn "subsi3_v"
>> +  [(set (match_operand:SI          0 "register_operand"  "=r,r,r,  r")
>> +       (minus:SI (match_operand:SI 1 "register_operand"   "r,r,0,  r")
>> +                 (match_operand:SI 2 "nonmemory_operand"  "r,L,I,C32")))
>> +   (set (reg:CC_V CC_REG)
>> +       (compare:CC_V (sign_extend:DI (minus:SI (match_dup 1)
>> +                                               (match_dup 2)))
>> +                     (minus:DI (sign_extend:DI (match_dup 1))
>> +                               (sign_extend:DI (match_dup 2)))))]
>> +   ""
>> +   "sub.f\\t%0,%1,%2"
>> +   [(set_attr "cond"   "set")
>> +    (set_attr "type"   "compare")
>> +    (set_attr "length" "4,4,4,8")])
>> +
>> +(define_expand "subvsi4"
>> + [(match_operand:SI 0 "register_operand")
>> +  (match_operand:SI 1 "register_operand")
>> +  (match_operand:SI 2 "nonmemory_operand")
>> +  (label_ref (match_operand 3 "" ""))]
>> +  ""
>> +  "emit_insn (gen_subsi3_v (operands[0], operands[1], operands[2]));
>> +   arc_gen_unlikely_cbranch (NE, CC_Vmode, operands[3]);
>> +   DONE;")
>> +
>> +(define_insn "subsi3_c"
>> +  [(set (match_operand:SI          0 "register_operand"  "=r,r,r,  r")
>> +       (minus:SI (match_operand:SI 1 "register_operand"   "r,r,0,  r")
>> +                 (match_operand:SI 2 "nonmemory_operand"  "r,L,I,C32")))
>> +   (set (reg:CC_C CC_REG)
>> +       (compare:CC_C (match_dup 1)
>> +                     (match_dup 2)))]
>> +   ""
>> +   "sub.f\\t%0,%1,%2"
>> +   [(set_attr "cond"   "set")
>> +    (set_attr "type"   "compare")
>> +    (set_attr "length" "4,4,4,8")])
>> +
>> +(define_expand "usubvsi4"
>> +  [(match_operand:SI 0 "register_operand")
>> +   (match_operand:SI 1 "register_operand")
>> +   (match_operand:SI 2 "nonmemory_operand")
>> +   (label_ref (match_operand 3 "" ""))]
>> +   ""
>> +   "emit_insn (gen_subsi3_c (operands[0], operands[1], operands[2]));
>> +    arc_gen_unlikely_cbranch (LTU, CC_Cmode, operands[3]);
>> +    DONE;")
>> +
>>  (define_expand "subdi3"
>>    [(set (match_operand:DI 0 "register_operand" "")
>>         (minus:DI (match_operand:DI 1 "register_operand" "")
>> diff --git a/gcc/testsuite/gcc.target/arc/overflow-2.c b/gcc/testsuite/gcc.target/arc/overflow-2.c
>> new file mode 100644
>> index 00000000000..b4de8c03b22
>> --- /dev/null
>> +++ b/gcc/testsuite/gcc.target/arc/overflow-2.c
>> @@ -0,0 +1,97 @@
>> +/* { dg-do compile } */
>> +/* { dg-options "-O1" } */
>> +
>> +#include <stdbool.h>
>> +#include <stdint.h>
>> +
>> +/*
>> + * sub.f  r0,r0,r1
>> + * st_s   r0,[r2]
>> + * mov_s  r0,1
>> + * j_s.d  [blink]
>> + * mov.nv r0,0
>> + */
>> +bool sub_overflow (int32_t a, int32_t b, int32_t *res)
>> +{
>> +  return __builtin_sub_overflow (a, b, res);
>> +}
>> +
>> +/*
>> + * sub.f  r0,r0,-1234
>> + * st_s   r0,[r1]
>> + * mov_s  r0,1
>> + * j_s.d  [blink]
>> + * mov.nv r0,0
>> + */
>> +bool subi_overflow (int32_t a, int32_t *res)
>> +{
>> +  return __builtin_sub_overflow (a, -1234, res);
>> +}
>> +
>> +/*
>> + * sub.f  r3,r0,r1
>> + * st_s   r3,[r2]
>> + * j_s.d  [blink]
>> + * setlo  r0,r0,r1
>> + */
>> +bool usub_overflow (uint32_t a, uint32_t b, uint32_t *res)
>> +{
>> +  return __builtin_sub_overflow (a, b, res);
>> +}
>> +
>> +/*
>> + * sub.f  r2,r0,4321
>> + * seths  r0,4320,r0
>> + * j_s.d  [blink]
>> + * st_s   r2,[r1]
>> + */
>> +bool usubi_overflow (uint32_t a, uint32_t *res)
>> +{
>> +  return __builtin_sub_overflow (a, 4321, res);
>> +}
>> +
>> +/*
>> + * sub.f  r0,r0,r1
>> + * mov_s  r0,1
>> + * j_s.d  [blink]
>> + * mov.nv r0,0
>> + */
>> +bool sub_overflow_p (int32_t a, int32_t b, int32_t res)
>> +{
>> +  return __builtin_sub_overflow_p (a, b, res);
>> +}
>> +
>> +/*
>> + * sub.f  r0,r0,-1000
>> + * mov_s  r0,1
>> + * j_s.d  [blink]
>> + * mov.nv r0,0
>> + */
>> +bool subi_overflow_p (int32_t a, int32_t res)
>> +{
>> +  return __builtin_sub_overflow_p (a, -1000, res);
>> +}
>> +
>> +/*
>> + * j_s.d  [blink]
>> + * setlo  r0,r0,r1
>> + */
>> +bool usub_overflow_p (uint32_t a, uint32_t b, uint32_t res)
>> +{
>> +  return __builtin_sub_overflow_p (a, b, res);
>> +}
>> +
>> +/*
>> + * seths  r0,1999,r0
>> + * j_s.d  [blink]
>> + */
>> +bool usubi_overflow_p (uint32_t a, uint32_t res)
>> +{
>> +  return __builtin_sub_overflow_p (a, 2000, res);
>> +}
>> +
>> +/* { dg-final { scan-assembler-times "sub.f\\s\+"   6 } } */
>> +/* { dg-final { scan-assembler-times "mov\.nv\\s\+" 4 } } */
>> +/* { dg-final { scan-assembler-times "setlo\\s\+"   2 } } */
>> +/* { dg-final { scan-assembler-times "seths\\s\+"   2 } } */
>> +/* { dg-final { scan-assembler-not   "cmp" } } */
>> --
>> 2.42.0
>>

-- 
Shahab


  reply	other threads:[~2024-04-19  7:20 UTC|newest]

Thread overview: 6+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2023-09-06 12:50 [PATCH 1/2] ARC: Use intrinsics for __builtin_add_overflow*() Shahab Vahedi
2023-09-06 12:50 ` [PATCH 2/2] ARC: Use intrinsics for __builtin_sub_overflow*() Shahab Vahedi
2023-09-07 10:15   ` Claudiu Zissulescu Ianculescu
2024-04-19  7:20     ` Shahab Vahedi [this message]
2023-09-07 10:15 ` [PATCH 1/2] ARC: Use intrinsics for __builtin_add_overflow*() Claudiu Zissulescu Ianculescu
2024-04-19  7:19   ` Shahab Vahedi

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=dbccee78-62eb-4af9-a3f0-cbb5e37029ab@synopsys.com \
    --to=shahab.vahedi@synopsys.com \
    --cc=Francois.Bedard@synopsys.com \
    --cc=claziss@gmail.com \
    --cc=gcc-patches@gcc.gnu.org \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for read-only IMAP folder(s) and NNTP newsgroup(s).