public inbox for gcc-bugs@sourceware.org
help / color / mirror / Atom feed
From: "hubicka at gcc dot gnu.org" <gcc-bugzilla@gcc.gnu.org>
To: gcc-bugs@gcc.gnu.org
Subject: [Bug tree-optimization/99395] s116 benchmark of TSVC is vectorized by clang and not by gcc
Date: Fri, 05 Mar 2021 15:42:18 +0000	[thread overview]
Message-ID: <bug-99395-4-QqngQmCKlt@http.gcc.gnu.org/bugzilla/> (raw)
In-Reply-To: <bug-99395-4@http.gcc.gnu.org/bugzilla/>

https://gcc.gnu.org/bugzilla/show_bug.cgi?id=99395

--- Comment #3 from Jan Hubicka <hubicka at gcc dot gnu.org> ---
The ICC-compiled version seems to run faster. Its code for s116:
000000000040a050 <s116>:
  40a050:       55                      push   %rbp
  40a051:       48 89 e5                mov    %rsp,%rbp
  40a054:       48 83 e4 e0             and    $0xffffffffffffffe0,%rsp
  40a058:       41 57                   push   %r15
  40a05a:       53                      push   %rbx
  40a05b:       48 83 ec 10             sub    $0x10,%rsp
  40a05f:       48 89 fb                mov    %rdi,%rbx
  40a062:       bf 74 f5 42 00          mov    $0x42f574,%edi
  40a067:       e8 14 cc 00 00          call   416c80 <initialise_arrays>
  40a06c:       48 89 df                mov    %rbx,%rdi
  40a06f:       33 f6                   xor    %esi,%esi
  40a071:       e8 4a 70 ff ff          call   4010c0 <gettimeofday@plt>
  40a076:       33 c0                   xor    %eax,%eax
  40a078:       41 89 c7                mov    %eax,%r15d
  40a07b:       33 d2                   xor    %edx,%edx
  40a07d:       0f 1f 00                nopl   (%rax)
  40a080:       c5 fc 10 04 95 04 9d    vmovups 0x579d04(,%rdx,4),%ymm0
  40a087:       57 00 
  40a089:       c5 fc 10 14 95 24 9d    vmovups 0x579d24(,%rdx,4),%ymm2
  40a090:       57 00 
  40a092:       c5 fc 10 24 95 44 9d    vmovups 0x579d44(,%rdx,4),%ymm4
  40a099:       57 00 
  40a09b:       c5 fc 10 34 95 64 9d    vmovups 0x579d64(,%rdx,4),%ymm6
  40a0a2:       57 00 
  40a0a4:       c5 fc 59 0c 95 00 9d    vmulps 0x579d00(,%rdx,4),%ymm0,%ymm1
  40a0ab:       57 00 
  40a0ad:       c5 ec 59 1c 95 20 9d    vmulps 0x579d20(,%rdx,4),%ymm2,%ymm3
  40a0b4:       57 00 
  40a0b6:       c5 dc 59 2c 95 40 9d    vmulps 0x579d40(,%rdx,4),%ymm4,%ymm5
  40a0bd:       57 00 
  40a0bf:       c5 cc 59 3c 95 60 9d    vmulps 0x579d60(,%rdx,4),%ymm6,%ymm7
  40a0c6:       57 00 
  40a0c8:       c5 fc 11 0c 95 00 9d    vmovups %ymm1,0x579d00(,%rdx,4)
  40a0cf:       57 00 
  40a0d1:       c5 fc 11 1c 95 20 9d    vmovups %ymm3,0x579d20(,%rdx,4)
  40a0d8:       57 00 
  40a0da:       c5 fc 11 2c 95 40 9d    vmovups %ymm5,0x579d40(,%rdx,4)
  40a0e1:       57 00 
  40a0e3:       c5 fc 11 3c 95 60 9d    vmovups %ymm7,0x579d60(,%rdx,4)
  40a0ea:       57 00 
  40a0ec:       48 83 c2 20             add    $0x20,%rdx
  40a0f0:       48 81 fa e0 7c 00 00    cmp    $0x7ce0,%rdx
  40a0f7:       72 87                   jb     40a080 <s116+0x30>
  40a0f9:       33 c9                   xor    %ecx,%ecx
  40a0fb:       ba e1 7c 00 00          mov    $0x7ce1,%edx
  40a100:       c5 fc 10 04 95 00 9d    vmovups 0x579d00(,%rdx,4),%ymm0
  40a107:       57 00 
  40a109:       48 83 c2 08             add    $0x8,%rdx
  40a10d:       c5 fc 59 0c 8d 80 90    vmulps 0x599080(,%rcx,4),%ymm0,%ymm1
  40a114:       59 00 
  40a116:       c5 fc 11 0c 8d 80 90    vmovups %ymm1,0x599080(,%rcx,4)
  40a11d:       59 00 
  40a11f:       48 83 c1 08             add    $0x8,%rcx
  40a123:       48 83 f9 18             cmp    $0x18,%rcx
  40a127:       72 d7                   jb     40a100 <s116+0xb0>
  40a129:       c5 fa 10 0d b3 ef 18    vmovss 0x18efb3(%rip),%xmm1        # 5990e4 <a+0x1f3e4>
  40a130:       00 
  40a131:       bf 00 9d 57 00          mov    $0x579d00,%edi
  40a136:       c5 fa 10 1d aa ef 18    vmovss 0x18efaa(%rip),%xmm3        # 5990e8 <a+0x1f3e8>
  40a13d:       00 
  40a13e:       be 80 d8 45 00          mov    $0x45d880,%esi
  40a143:       c5 f2 59 05 95 ef 18    vmulss 0x18ef95(%rip),%xmm1,%xmm0        # 5990e0 <a+0x1f3e0>
  40a14a:       00 
  40a14b:       ba 00 a9 55 00          mov    $0x55a900,%edx
  40a150:       c5 e2 59 25 94 ef 18    vmulss 0x18ef94(%rip),%xmm3,%xmm4        # 5990ec <a+0x1f3ec>
  40a157:       00 
  40a158:       c5 f2 59 d3             vmulss %xmm3,%xmm1,%xmm2
  40a15c:       c5 fa 11 05 7c ef 18    vmovss %xmm0,0x18ef7c(%rip)        # 5990e0 <a+0x1f3e0>
  40a163:       00 
  40a164:       b9 80 e4 43 00          mov    $0x43e480,%ecx
  40a169:       c5 fa 11 15 73 ef 18    vmovss %xmm2,0x18ef73(%rip)        # 5990e4 <a+0x1f3e4>
  40a170:       00 
  40a171:       41 b8 00 b5 53 00       mov    $0x53b500,%r8d
  40a177:       c5 fa 11 25 69 ef 18    vmovss %xmm4,0x18ef69(%rip)        # 5990e8 <a+0x1f3e8>
  40a17e:       00 
  40a17f:       41 b9 c0 b4 4b 00       mov    $0x4bb4c0,%r9d
  40a185:       68 00 91 59 00          push   $0x599100
  40a18a:       68 00 b5 4f 00          push   $0x4fb500
  40a18f:       c5 f8 77                vzeroupper 
  40a192:       c5 f8 57 c0             vxorps %xmm0,%xmm0,%xmm0
  40a196:       e8 d5 92 00 00          call   413470 <dummy>
  40a19b:       48 83 c4 10             add    $0x10,%rsp
  40a19f:       41 ff c7                inc    %r15d
  40a1a2:       41 81 ff 40 42 0f 00    cmp    $0xf4240,%r15d
  40a1a9:       0f 82 cc fe ff ff       jb     40a07b <s116+0x2b>
  40a1af:       48 83 c3 10             add    $0x10,%rbx
  40a1b3:       33 f6                   xor    %esi,%esi
  40a1b5:       48 89 df                mov    %rbx,%rdi
  40a1b8:       e8 03 6f ff ff          call   4010c0 <gettimeofday@plt>
  40a1bd:       bf 74 f5 42 00          mov    $0x42f574,%edi
  40a1c2:       48 83 c4 10             add    $0x10,%rsp
  40a1c6:       5b                      pop    %rbx
  40a1c7:       41 5f                   pop    %r15
  40a1c9:       48 89 ec                mov    %rbp,%rsp
  40a1cc:       5d                      pop    %rbp
  40a1cd:       e9 de 97 00 00          jmp    4139b0 <calc_checksum>
  40a1d2:       0f 1f 80 00 00 00 00    nopl   0x0(%rax)
  40a1d9:       0f 1f 80 00 00 00 00    nopl   0x0(%rax)

  parent reply	other threads:[~2021-03-05 15:42 UTC|newest]

Thread overview: 21+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2021-03-04 23:01 [Bug middle-end/99395] New: " hubicka at gcc dot gnu.org
2021-03-04 23:24 ` [Bug middle-end/99395] " hubicka at gcc dot gnu.org
2021-03-05  8:27 ` [Bug tree-optimization/99395] " rguenth at gcc dot gnu.org
2021-03-05 15:42 ` hubicka at gcc dot gnu.org [this message]
2022-10-18 10:28 ` rguenth at gcc dot gnu.org
2022-10-18 10:37 ` rguenth at gcc dot gnu.org
2023-10-07  9:10 ` juzhe.zhong at rivai dot ai
2023-10-09  6:30 ` rguenth at gcc dot gnu.org
2024-01-30 11:37 ` juzhe.zhong at rivai dot ai
2024-01-30 12:26 ` rguenth at gcc dot gnu.org
2024-01-31  1:32 ` juzhe.zhong at rivai dot ai
2024-01-31  3:50 ` juzhe.zhong at rivai dot ai
2024-01-31  7:00 ` juzhe.zhong at rivai dot ai
2024-01-31  7:59 ` rguenth at gcc dot gnu.org
2024-01-31  8:09 ` juzhe.zhong at rivai dot ai
2024-01-31  8:18 ` rguenther at suse dot de
2024-01-31  8:27 ` juzhe.zhong at rivai dot ai
2024-01-31  9:08 ` rguenther at suse dot de
2024-01-31  9:19 ` juzhe.zhong at rivai dot ai
2024-01-31  9:56 ` rguenther at suse dot de
2024-04-07 21:33 ` pinskia at gcc dot gnu.org

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=bug-99395-4-QqngQmCKlt@http.gcc.gnu.org/bugzilla/ \
    --to=gcc-bugzilla@gcc.gnu.org \
    --cc=gcc-bugs@gcc.gnu.org \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link

Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for read-only IMAP folder(s) and NNTP newsgroup(s).