From mboxrd@z Thu Jan 1 00:00:00 1970 Return-Path: Received: by sourceware.org (Postfix, from userid 7852) id 9643A3857C46; Tue, 8 Mar 2022 05:43:38 +0000 (GMT) DKIM-Filter: OpenDKIM Filter v2.11.0 sourceware.org 9643A3857C46 Content-Type: text/plain; charset="us-ascii" MIME-Version: 1.0 Content-Transfer-Encoding: 7bit From: Sunil Pandey To: glibc-cvs@sourceware.org Subject: [glibc] x86_64: Fix svml_d_acos4_core_avx2.S code formatting X-Act-Checkin: glibc X-Git-Author: Sunil K Pandey X-Git-Refname: refs/heads/master X-Git-Oldrev: 97f84927880317dc11c3b7a0166a044f8787f8cf X-Git-Newrev: 656ff2e94e8440112882fad2f68b75c44ab41abc Message-Id: <20220308054338.9643A3857C46@sourceware.org> Date: Tue, 8 Mar 2022 05:43:38 +0000 (GMT) X-BeenThere: glibc-cvs@sourceware.org X-Mailman-Version: 2.1.29 Precedence: list List-Id: Glibc-cvs mailing list List-Unsubscribe: , List-Archive: List-Help: List-Subscribe: , X-List-Received-Date: Tue, 08 Mar 2022 05:43:38 -0000 https://sourceware.org/git/gitweb.cgi?p=glibc.git;h=656ff2e94e8440112882fad2f68b75c44ab41abc commit 656ff2e94e8440112882fad2f68b75c44ab41abc Author: Sunil K Pandey Date: Mon Mar 7 10:47:08 2022 -0800 x86_64: Fix svml_d_acos4_core_avx2.S code formatting This commit contains the following formatting changes: 1. Instructions preceded by a tab. 2. Instructions less than 8 characters in length have a tab between them and the first operand. 3. Instructions greater than 7 characters in length have a space between them and the first operand. 4. Tabs after `#define`d names and their value. 5. 8 spaces at the beginning of a line replaced by a tab. 6. Indent comments with code. 7. Remove redundant .text section. 8. 1 space between line content and line comment. 9. Space after all commas. 
Reviewed-by: Noah Goldstein Diff: --- .../x86_64/fpu/multiarch/svml_d_acos4_core_avx2.S | 455 ++++++++++----------- 1 file changed, 227 insertions(+), 228 deletions(-) diff --git a/sysdeps/x86_64/fpu/multiarch/svml_d_acos4_core_avx2.S b/sysdeps/x86_64/fpu/multiarch/svml_d_acos4_core_avx2.S index 9efd359bfa..e19bddd2e2 100644 --- a/sysdeps/x86_64/fpu/multiarch/svml_d_acos4_core_avx2.S +++ b/sysdeps/x86_64/fpu/multiarch/svml_d_acos4_core_avx2.S @@ -28,258 +28,257 @@ /* Offsets for data table __svml_dacos_data_internal */ -#define SgnBit 0 -#define OneHalf 32 -#define SmallNorm 64 -#define MOne 96 -#define Two 128 -#define sqrt_coeff 160 -#define poly_coeff 288 -#define PiH 672 -#define Pi2H 704 +#define SgnBit 0 +#define OneHalf 32 +#define SmallNorm 64 +#define MOne 96 +#define Two 128 +#define sqrt_coeff 160 +#define poly_coeff 288 +#define PiH 672 +#define Pi2H 704 #include - .text - .section .text.avx2,"ax",@progbits + .section .text.avx2, "ax", @progbits ENTRY(_ZGVdN4v_acos_avx2) - pushq %rbp - cfi_def_cfa_offset(16) - movq %rsp, %rbp - cfi_def_cfa(6, 16) - cfi_offset(6, -16) - andq $-32, %rsp - subq $96, %rsp - vmovupd __svml_dacos_data_internal(%rip), %ymm6 - vmovupd OneHalf+__svml_dacos_data_internal(%rip), %ymm7 - vmovapd %ymm0, %ymm5 - -/* x = -|arg| */ - vorpd %ymm5, %ymm6, %ymm4 - -/* Y = 0.5 + 0.5*(-x) */ - vfmadd231pd %ymm4, %ymm7, %ymm7 - -/* x^2 */ - vmulpd %ymm4, %ymm4, %ymm8 - -/* S ~ 2*sqrt(Y) */ - vmovupd sqrt_coeff+__svml_dacos_data_internal(%rip), %ymm0 - vcmplt_oqpd SmallNorm+__svml_dacos_data_internal(%rip), %ymm7, %ymm12 - vminpd %ymm7, %ymm8, %ymm2 - -/* NaN processed in special branch (so wind test passed) */ - vcmpnge_uqpd MOne+__svml_dacos_data_internal(%rip), %ymm4, %ymm9 - vcvtpd2ps %ymm7, %xmm10 - vmovupd poly_coeff+64+__svml_dacos_data_internal(%rip), %ymm8 - vcmpnlt_uqpd %ymm7, %ymm2, %ymm1 - vrsqrtps %xmm10, %xmm11 - vfmadd213pd poly_coeff+96+__svml_dacos_data_internal(%rip), %ymm2, %ymm8 - vcvtps2pd %xmm11, %ymm13 - vmovupd 
poly_coeff+128+__svml_dacos_data_internal(%rip), %ymm11 - vandnpd %ymm13, %ymm12, %ymm14 - vmulpd %ymm14, %ymm14, %ymm15 - vfmadd213pd poly_coeff+160+__svml_dacos_data_internal(%rip), %ymm2, %ymm11 - vmulpd %ymm2, %ymm2, %ymm13 - vmovupd poly_coeff+256+__svml_dacos_data_internal(%rip), %ymm12 - vmulpd %ymm13, %ymm13, %ymm10 - vfmadd213pd poly_coeff+288+__svml_dacos_data_internal(%rip), %ymm2, %ymm12 - vandpd %ymm5, %ymm6, %ymm3 - vaddpd %ymm7, %ymm7, %ymm6 - vmulpd %ymm6, %ymm14, %ymm7 - vfmsub213pd Two+__svml_dacos_data_internal(%rip), %ymm15, %ymm6 - vmovupd poly_coeff+320+__svml_dacos_data_internal(%rip), %ymm14 - vfmadd213pd sqrt_coeff+32+__svml_dacos_data_internal(%rip), %ymm6, %ymm0 - vmulpd %ymm6, %ymm7, %ymm15 - vfmadd213pd poly_coeff+352+__svml_dacos_data_internal(%rip), %ymm2, %ymm14 - vfmadd213pd sqrt_coeff+64+__svml_dacos_data_internal(%rip), %ymm6, %ymm0 - vfmadd213pd sqrt_coeff+96+__svml_dacos_data_internal(%rip), %ymm6, %ymm0 - -/* polynomial */ - vmovupd poly_coeff+__svml_dacos_data_internal(%rip), %ymm6 - vfnmadd213pd %ymm7, %ymm15, %ymm0 - vfmadd213pd poly_coeff+32+__svml_dacos_data_internal(%rip), %ymm2, %ymm6 - vblendvpd %ymm1, %ymm0, %ymm4, %ymm0 - vfmadd213pd %ymm8, %ymm13, %ymm6 - vmovmskpd %ymm9, %edx - vmovupd poly_coeff+192+__svml_dacos_data_internal(%rip), %ymm9 - vfmadd213pd poly_coeff+224+__svml_dacos_data_internal(%rip), %ymm2, %ymm9 - vfmadd213pd %ymm9, %ymm13, %ymm11 - vfmadd213pd %ymm11, %ymm10, %ymm6 - vfmadd213pd %ymm12, %ymm13, %ymm6 - vfmadd213pd %ymm14, %ymm13, %ymm6 - vmulpd %ymm6, %ymm2, %ymm9 - -/* X