From 35668c8d9475d7fe061978ce79a286ba972062cc Mon Sep 17 00:00:00 2001 From: Sunil K Pandey Date: Mon, 7 Mar 2022 10:47:08 -0800 Subject: x86_64: Fix svml_s_acosf8_core_avx2.S code formatting This commit contains the following formatting changes: 1. Instructions preceded by a tab. 2. Instructions less than 8 characters in length have a tab between them and the first operand. 3. Instructions greater than 7 characters in length have a space between them and the first operand. 4. Tabs after `#define`d names and their values. 5. 8 spaces at the beginning of a line replaced by a tab. 6. Indent comments with code. 7. Remove redundant .text section. 8. 1 space between line content and line comment. 9. Space after all commas. Reviewed-by: Noah Goldstein --- .../x86_64/fpu/multiarch/svml_s_acosf8_core_avx2.S | 411 ++++++++++----------- 1 file changed, 205 insertions(+), 206 deletions(-) (limited to 'sysdeps') diff --git a/sysdeps/x86_64/fpu/multiarch/svml_s_acosf8_core_avx2.S b/sysdeps/x86_64/fpu/multiarch/svml_s_acosf8_core_avx2.S index 94402554ad..bf28a5dd00 100644 --- a/sysdeps/x86_64/fpu/multiarch/svml_s_acosf8_core_avx2.S +++ b/sysdeps/x86_64/fpu/multiarch/svml_s_acosf8_core_avx2.S @@ -29,236 +29,235 @@ /* Offsets for data table __svml_sacos_data_internal */ -#define SgnBit 0 -#define OneHalf 32 -#define SmallNorm 64 -#define MOne 96 -#define Two 128 -#define sqrt_coeff 160 -#define poly_coeff 224 -#define Pi2H 384 -#define PiH 416 +#define SgnBit 0 +#define OneHalf 32 +#define SmallNorm 64 +#define MOne 96 +#define Two 128 +#define sqrt_coeff 160 +#define poly_coeff 224 +#define Pi2H 384 +#define PiH 416 #include - .text - .section .text.avx2,"ax",@progbits + .section .text.avx2, "ax", @progbits ENTRY(_ZGVdN8v_acosf_avx2) - pushq %rbp - cfi_def_cfa_offset(16) - movq %rsp, %rbp - cfi_def_cfa(6, 16) - cfi_offset(6, -16) - andq $-32, %rsp - subq $96, %rsp - -/* - * 2*sqrt(X) ~ Sh - Sl (to 24+ bits) - * SQ ~ 2*sqrt(X) - */ - vmovups __svml_sacos_data_internal(%rip), %ymm6 - vmovups 
OneHalf+__svml_sacos_data_internal(%rip), %ymm7 - vmovaps %ymm0, %ymm5 - -/* x = -|arg| */ - vorps %ymm5, %ymm6, %ymm4 - -/* Y = 0.5 + 0.5*(-x) */ - vfmadd231ps %ymm4, %ymm7, %ymm7 - -/* x^2 */ - vmulps %ymm4, %ymm4, %ymm8 - -/* SQ ~ 2*sqrt(Y) */ - vmovups sqrt_coeff+__svml_sacos_data_internal(%rip), %ymm0 - vcmpnge_uqps MOne+__svml_sacos_data_internal(%rip), %ymm4, %ymm9 - vcmplt_oqps SmallNorm+__svml_sacos_data_internal(%rip), %ymm7, %ymm10 - vminps %ymm7, %ymm8, %ymm2 - vaddps %ymm7, %ymm7, %ymm14 - vrsqrtps %ymm7, %ymm11 - vmovups poly_coeff+64+__svml_sacos_data_internal(%rip), %ymm8 - vcmpnlt_uqps %ymm7, %ymm2, %ymm1 - vmulps %ymm2, %ymm2, %ymm7 - vfmadd213ps poly_coeff+96+__svml_sacos_data_internal(%rip), %ymm2, %ymm8 - vmovmskps %ymm9, %edx - -/* polynomial */ - vmovups poly_coeff+__svml_sacos_data_internal(%rip), %ymm9 - vandnps %ymm11, %ymm10, %ymm12 - vmulps %ymm12, %ymm12, %ymm13 - vfmadd213ps poly_coeff+32+__svml_sacos_data_internal(%rip), %ymm2, %ymm9 - -/* X