From 3a79c88e7e1ecd21bcd62074c014ba3e84553959 Mon Sep 17 00:00:00 2001 From: Runxi Yu Date: Fri, 19 Dec 2025 23:02:46 +0800 Subject: adler32: More descriptive constants --- internal/adler32/adler32_avx2.s | 28 ++++++++++++++-------------- internal/adler32/adler32_sse3.s | 24 ++++++++++++------------ 2 files changed, 26 insertions(+), 26 deletions(-) (limited to 'internal/adler32') diff --git a/internal/adler32/adler32_avx2.s b/internal/adler32/adler32_avx2.s index ee9cc9b0..1b9a1c50 100644 --- a/internal/adler32/adler32_avx2.s +++ b/internal/adler32/adler32_avx2.s @@ -2,20 +2,20 @@ #include "textflag.h" -DATA LCPI0_0<>+0x00(SB)/8, $0x191a1b1c1d1e1f20 -DATA LCPI0_0<>+0x08(SB)/8, $0x1112131415161718 -DATA LCPI0_0<>+0x10(SB)/8, $0x090a0b0c0d0e0f10 -DATA LCPI0_0<>+0x18(SB)/8, $0x0102030405060708 -GLOBL LCPI0_0<>(SB), (RODATA|NOPTR), $32 +DATA weights_1_32<>+0x00(SB)/8, $0x191a1b1c1d1e1f20 +DATA weights_1_32<>+0x08(SB)/8, $0x1112131415161718 +DATA weights_1_32<>+0x10(SB)/8, $0x090a0b0c0d0e0f10 +DATA weights_1_32<>+0x18(SB)/8, $0x0102030405060708 +GLOBL weights_1_32<>(SB), (RODATA|NOPTR), $32 -DATA LCPI0_1<>+0x00(SB)/8, $0x0001000100010001 -DATA LCPI0_1<>+0x08(SB)/8, $0x0001000100010001 -DATA LCPI0_1<>+0x10(SB)/8, $0x0001000100010001 -DATA LCPI0_1<>+0x18(SB)/8, $0x0001000100010001 -GLOBL LCPI0_1<>(SB), (RODATA|NOPTR), $32 +DATA ones_u16<>+0x00(SB)/8, $0x0001000100010001 +DATA ones_u16<>+0x08(SB)/8, $0x0001000100010001 +DATA ones_u16<>+0x10(SB)/8, $0x0001000100010001 +DATA ones_u16<>+0x18(SB)/8, $0x0001000100010001 +GLOBL ones_u16<>(SB), (RODATA|NOPTR), $32 -DATA LCPI0_2<>+0x00(SB)/2, $0x0001 -GLOBL LCPI0_2<>(SB), (RODATA|NOPTR), $2 +DATA one_u16<>+0x00(SB)/2, $0x0001 +GLOBL one_u16<>(SB), (RODATA|NOPTR), $2 TEXT ·adler32_avx2(SB), NOSPLIT, $0-36 MOVLQZX in+0(FP), DI @@ -37,8 +37,8 @@ TEXT ·adler32_avx2(SB), NOSPLIT, $0-36 JB tail16_check LONG $0x078071bf; BYTE $0x80 LONG $0xc0eff9c5 - VMOVDQA LCPI0_0<>(SB), Y1 - VPBROADCASTW LCPI0_2<>(SB), Y2 + VMOVDQA weights_1_32<>(SB), Y1 + VPBROADCASTW one_u16<>(SB), Y2 JMP block_loop_setup block_accum_init: diff --git a/internal/adler32/adler32_sse3.s b/internal/adler32/adler32_sse3.s index adeb7d2c..5880bab8 100644 --- a/internal/adler32/adler32_sse3.s +++ b/internal/adler32/adler32_sse3.s @@ -2,17 +2,17 @@ #include "textflag.h" -DATA LCPI0_0<>+0x00(SB)/8, $0x191a1b1c1d1e1f20 -DATA LCPI0_0<>+0x08(SB)/8, $0x1112131415161718 -GLOBL LCPI0_0<>(SB), (RODATA|NOPTR), $16 +DATA weights_17_32<>+0x00(SB)/8, $0x191a1b1c1d1e1f20 +DATA weights_17_32<>+0x08(SB)/8, $0x1112131415161718 +GLOBL weights_17_32<>(SB), (RODATA|NOPTR), $16 -DATA LCPI0_1<>+0x00(SB)/8, $0x0001000100010001 -DATA LCPI0_1<>+0x08(SB)/8, $0x0001000100010001 -GLOBL LCPI0_1<>(SB), (RODATA|NOPTR), $16 +DATA ones_u16<>+0x00(SB)/8, $0x0001000100010001 +DATA ones_u16<>+0x08(SB)/8, $0x0001000100010001 +GLOBL ones_u16<>(SB), (RODATA|NOPTR), $16 -DATA LCPI0_2<>+0x00(SB)/8, $0x090a0b0c0d0e0f10 -DATA LCPI0_2<>+0x08(SB)/8, $0x0102030405060708 -GLOBL LCPI0_2<>(SB), (RODATA|NOPTR), $16 +DATA weights_1_16<>+0x00(SB)/8, $0x090a0b0c0d0e0f10 +DATA weights_1_16<>+0x08(SB)/8, $0x0102030405060708 +GLOBL weights_1_16<>(SB), (RODATA|NOPTR), $16 TEXT ·adler32_sse3(SB), NOSPLIT, $0-36 MOVLQZX in+0(FP), DI @@ -35,9 +35,9 @@ TEXT ·adler32_sse3(SB), NOSPLIT, $0-36 block_loop_setup: SHRQ $0x5, DX LONG $0xc0ef0f66 - MOVO LCPI0_0<>(SB), X1 - MOVO LCPI0_1<>(SB), X2 - MOVO LCPI0_2<>(SB), X3 + MOVO weights_17_32<>(SB), X1 + MOVO ones_u16<>(SB), X2 + MOVO weights_1_16<>(SB), X3 LONG $0x8071b841; WORD $0x8007 block_outer_loop: -- cgit v1.3.1-10-gc9f91