From mboxrd@z Thu Jan 1 00:00:00 1970 Return-Path: Received: by sourceware.org (Postfix, from userid 2038) id 91DC13861024; Fri, 30 Jul 2021 21:56:57 +0000 (GMT) DKIM-Filter: OpenDKIM Filter v2.11.0 sourceware.org 91DC13861024 MIME-Version: 1.0 Content-Transfer-Encoding: 7bit Content-Type: text/plain; charset="utf-8" From: Paul Clarke To: gcc-cvs@gcc.gnu.org Subject: [gcc r12-2643] rs6000: Add support for SSE4.1 "ceil" intrinsics X-Act-Checkin: gcc X-Git-Author: Paul A. Clarke X-Git-Refname: refs/heads/master X-Git-Oldrev: ed04cf6d73e233c74c4e55c27f1cbd89ae4710e8 X-Git-Newrev: bd9a8737d478f7f1d01a9d5f1cc4309ffbb53103 Message-Id: <20210730215657.91DC13861024@sourceware.org> Date: Fri, 30 Jul 2021 21:56:57 +0000 (GMT) X-BeenThere: gcc-cvs@gcc.gnu.org X-Mailman-Version: 2.1.29 Precedence: list List-Id: Gcc-cvs mailing list List-Unsubscribe: , List-Archive: List-Help: List-Subscribe: , X-List-Received-Date: Fri, 30 Jul 2021 21:56:57 -0000 https://gcc.gnu.org/g:bd9a8737d478f7f1d01a9d5f1cc4309ffbb53103 commit r12-2643-gbd9a8737d478f7f1d01a9d5f1cc4309ffbb53103 Author: Paul A. Clarke Date: Thu Jul 1 17:04:51 2021 -0500 rs6000: Add support for SSE4.1 "ceil" intrinsics 2021-07-30 Paul A. Clarke gcc * config/rs6000/smmintrin.h (_mm_ceil_pd, _mm_ceil_ps, _mm_ceil_sd, _mm_ceil_ss): New. Diff: --- gcc/config/rs6000/smmintrin.h | 32 ++++++++++++++++++++++++++++++++ 1 file changed, 32 insertions(+) diff --git a/gcc/config/rs6000/smmintrin.h b/gcc/config/rs6000/smmintrin.h index 382f50c90c5..919627b0810 100644 --- a/gcc/config/rs6000/smmintrin.h +++ b/gcc/config/rs6000/smmintrin.h @@ -232,4 +232,36 @@ _mm_test_mix_ones_zeros (__m128i __A, __m128i __mask) return any_ones * any_zeros; } +__inline __m128d +__attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) +_mm_ceil_pd (__m128d __A) +{ + return (__m128d) vec_ceil ((__v2df) __A); +} + +__inline __m128d +__attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) +_mm_ceil_sd (__m128d __A, __m128d __B) +{ + __v2df __r = vec_ceil ((__v2df) __B); + __r[1] = ((__v2df) __A)[1]; + return (__m128d) __r; +} + +__inline __m128 +__attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) +_mm_ceil_ps (__m128 __A) +{ + return (__m128) vec_ceil ((__v4sf) __A); +} + +__inline __m128 +__attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) +_mm_ceil_ss (__m128 __A, __m128 __B) +{ + __v4sf __r = (__v4sf) __A; + __r[0] = __builtin_ceil (((__v4sf) __B)[0]); + return __r; +} + #endif