Re: [PATCH v3] LoongArch: Add prefetch instructions.

public inbox for gcc-patches@gcc.gnu.org
 help / color / mirror / Atom feed

From: Lulu Cheng <chenglulu@loongson.cn>
To: WANG Xuerui <i@xen0n.name>, gcc-patches@gcc.gnu.org
Cc: xry111@xry111.site, xuchenghua@loongson.cn,
	xujiahao <xujiahao@loongson.cn>
Subject: Re: [PATCH v3] LoongArch: Add prefetch instructions.
Date: Wed, 16 Nov 2022 11:19:23 +0800	[thread overview]
Message-ID: <05ac7d65-3f1a-92ff-401c-71fcc36dd422@loongson.cn> (raw)
In-Reply-To: <d937c83d-02ab-1985-c4ee-9ac9ec629c57@xen0n.name>

[-- Attachment #1: Type: text/plain, Size: 7005 bytes --]


在 2022/11/16 上午11:06, WANG Xuerui 写道:
>
> On 2022/11/16 10:10, Lulu Cheng wrote:
>> v2 -> v3:
>> 1. Remove preldx support.
>>
>> ---------------------------------------
>> Enable sw prefetching at -O3 and higher.
>>
>> Co-Authored-By: xujiahao <xujiahao@loongson.cn>
>>
>> gcc/ChangeLog:
>>
>>     * config/loongarch/constraints.md (ZD): New constraint.
>>     * config/loongarch/loongarch-def.c: Initial number of parallel 
>> prefetch.
>>     * config/loongarch/loongarch-tune.h (struct loongarch_cache):
>>     Define number of parallel prefetch.
>>     * config/loongarch/loongarch.cc 
>> (loongarch_option_override_internal):
>>     Set up parameters to be used in prefetching algorithm.
>>     * config/loongarch/loongarch.md (prefetch): New template.
>> ---
>>   gcc/config/loongarch/constraints.md   | 10 ++++++++++
>>   gcc/config/loongarch/loongarch-def.c  |  2 ++
>>   gcc/config/loongarch/loongarch-tune.h |  1 +
>>   gcc/config/loongarch/loongarch.cc     | 28 +++++++++++++++++++++++++++
>>   gcc/config/loongarch/loongarch.md     | 14 ++++++++++++++
>>   5 files changed, 55 insertions(+)
>>
>> diff --git a/gcc/config/loongarch/constraints.md 
>> b/gcc/config/loongarch/constraints.md
>> index 43cb7b5f0f5..46f7f63ae31 100644
>> --- a/gcc/config/loongarch/constraints.md
>> +++ b/gcc/config/loongarch/constraints.md
>> @@ -86,6 +86,10 @@
>>   ;;    "ZB"
>>   ;;      "An address that is held in a general-purpose register.
>>   ;;      The offset is zero"
>> +;;    "ZD"
>> +;;    "An address operand whose address is formed by a base register
>> +;;     and offset that is suitable for use in instructions with the 
>> same
>> +;;     addressing mode as @code{preld}."
>>   ;; "<" "Matches a pre-dec or post-dec operand." (Global 
>> non-architectural)
>>   ;; ">" "Matches a pre-inc or post-inc operand." (Global 
>> non-architectural)
>>   @@ -190,3 +194,9 @@ (define_memory_constraint "ZB"
>>     The offset is zero"
>>     (and (match_code "mem")
>>          (match_test "REG_P (XEXP (op, 0))")))
>> +
>> +(define_address_constraint "ZD"
>> +  "An address operand whose address is formed by a base register
>> +   and offset that is suitable for use in instructions with the same
>> +   addressing mode as @code{preld}."
>> +   (match_test "loongarch_12bit_offset_address_p (op, mode)"))
>
> How is this different with the "m" constraint? AFAIK preld and ld 
> share the same addressing mode (i.e. base register + 12-bit signed 
> immediate offset).
The "m" constraint is defined as follows:
(define_memory_constraint "m"
  (and (match_code "mem")
       (match_test "loongarch_12bit_offset_address_p (XEXP (op, 0), mode)")))

Because of the (match_code "mem") test, an operand matching this constraint must be a memory operand.

The "ZD" constraint, by contrast, matches an address operand.

I think the relationship is: (mem:mode (address operand)) = memory operand, i.e. a memory operand is an address operand wrapped in a mem.


>
>> diff --git a/gcc/config/loongarch/loongarch-def.c 
>> b/gcc/config/loongarch/loongarch-def.c
>> index cbf995d81b5..80ab10a52a8 100644
>> --- a/gcc/config/loongarch/loongarch-def.c
>> +++ b/gcc/config/loongarch/loongarch-def.c
>> @@ -62,11 +62,13 @@ loongarch_cpu_cache[N_TUNE_TYPES] = {
>>         .l1d_line_size = 64,
>>         .l1d_size = 64,
>>         .l2d_size = 256,
>> +      .simultaneous_prefetches = 4,
>>     },
>>     [CPU_LA464] = {
>>         .l1d_line_size = 64,
>>         .l1d_size = 64,
>>         .l2d_size = 256,
>> +      .simultaneous_prefetches = 4,
>>     },
>>   };
>>   diff --git a/gcc/config/loongarch/loongarch-tune.h 
>> b/gcc/config/loongarch/loongarch-tune.h
>> index 6f3530f5c02..8e3eb29472b 100644
>> --- a/gcc/config/loongarch/loongarch-tune.h
>> +++ b/gcc/config/loongarch/loongarch-tune.h
>> @@ -45,6 +45,7 @@ struct loongarch_cache {
>>       int l1d_line_size;  /* bytes */
>>       int l1d_size;       /* KiB */
>>       int l2d_size;       /* kiB */
>> +    int simultaneous_prefetches; /* number of parallel prefetch */
> nit: "prefetches" or "prefetch ops" or "int prefetch_width"?
>>   };
>>     #endif /* LOONGARCH_TUNE_H */
>> diff --git a/gcc/config/loongarch/loongarch.cc 
>> b/gcc/config/loongarch/loongarch.cc
>> index 8d5d8d965dd..8ee32c90573 100644
>> --- a/gcc/config/loongarch/loongarch.cc
>> +++ b/gcc/config/loongarch/loongarch.cc
>> @@ -63,6 +63,7 @@ along with GCC; see the file COPYING3.  If not see
>>   #include "context.h"
>>   #include "builtins.h"
>>   #include "rtl-iter.h"
>> +#include "opts.h"
>>     /* This file should be included last.  */
>>   #include "target-def.h"
>> @@ -6100,6 +6101,33 @@ loongarch_option_override_internal (struct 
>> gcc_options *opts)
>>     if (loongarch_branch_cost == 0)
>>       loongarch_branch_cost = loongarch_cost->branch_cost;
>>   +  /* Set up parameters to be used in prefetching algorithm. */
>> +  int simultaneous_prefetches
>> +    = loongarch_cpu_cache[LARCH_ACTUAL_TUNE].simultaneous_prefetches;
>> +
>> +  SET_OPTION_IF_UNSET (opts, &global_options_set,
>> +               param_simultaneous_prefetches,
>> +               simultaneous_prefetches);
>> +
>> +  SET_OPTION_IF_UNSET (opts, &global_options_set,
>> +               param_l1_cache_line_size,
>> + loongarch_cpu_cache[LARCH_ACTUAL_TUNE].l1d_line_size);
>> +
>> +  SET_OPTION_IF_UNSET (opts, &global_options_set,
>> +               param_l1_cache_size,
>> + loongarch_cpu_cache[LARCH_ACTUAL_TUNE].l1d_size);
>> +
>> +  SET_OPTION_IF_UNSET (opts, &global_options_set,
>> +               param_l2_cache_size,
>> + loongarch_cpu_cache[LARCH_ACTUAL_TUNE].l2d_size);
>> +
>> +
>> +  /* Enable sw prefetching at -O3 and higher.  */
>> +  if (opts->x_flag_prefetch_loop_arrays < 0
>> +      && (opts->x_optimize >= 3 || opts->x_flag_profile_use)
>> +      && !opts->x_optimize_size)
>> +    opts->x_flag_prefetch_loop_arrays = 1;
>> +
>>     if (TARGET_DIRECT_EXTERN_ACCESS && flag_shlib)
>>       error ("%qs cannot be used for compiling a shared library",
>>          "-mdirect-extern-access");
>> diff --git a/gcc/config/loongarch/loongarch.md 
>> b/gcc/config/loongarch/loongarch.md
>> index 682ab961741..2fda5381904 100644
>> --- a/gcc/config/loongarch/loongarch.md
>> +++ b/gcc/config/loongarch/loongarch.md
>> @@ -3282,6 +3282,20 @@ (define_expand "untyped_call"
>>   ;;  ....................
>>   ;;
>>   +(define_insn "prefetch"
>> +  [(prefetch (match_operand 0 "address_operand" "ZD")
>> +         (match_operand 1 "const_int_operand" "n")
>> +         (match_operand 2 "const_int_operand" "n"))]
>> +  ""
>> +{
>> +  switch (INTVAL (operands[1]))
>> +  {
>> +    case 0: return "preld\t0,%a0";
>> +    case 1: return "preld\t8,%a0";
>> +    default: gcc_unreachable ();
>> +  }
>> +})
>> +
>>   (define_insn "nop"
>>     [(const_int 0)]
>>     ""

next prev parent reply	other threads:[~2022-11-16  3:19 UTC|newest]

Thread overview: 6+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2022-11-16  2:10 Lulu Cheng
2022-11-16  3:06 ` WANG Xuerui
2022-11-16  3:19   ` Lulu Cheng [this message]
2022-11-16 16:22     ` Xi Ruoyao
2022-11-17  6:28 ` Xi Ruoyao
2022-11-23  3:08 ` [pushed][PATCH " chenglulu

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=05ac7d65-3f1a-92ff-401c-71fcc36dd422@loongson.cn \
    --to=chenglulu@loongson.cn \
    --cc=gcc-patches@gcc.gnu.org \
    --cc=i@xen0n.name \
    --cc=xry111@xry111.site \
    --cc=xuchenghua@loongson.cn \
    --cc=xujiahao@loongson.cn \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link

Be sure your reply has a Subject: header at the top and a blank line before the message body.

This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for read-only IMAP folder(s) and NNTP newsgroup(s).