shithub: furgit

Download patch

ref: 3a79c88e7e1ecd21bcd62074c014ba3e84553959
parent: 4d930c1478f6b9e4851e84e139b4cdf4450fb963
author: Runxi Yu <me@runxiyu.org>
date: Fri Dec 19 18:02:46 EST 2025

adler32: More descriptive constants

--- a/internal/adler32/adler32_avx2.s
+++ b/internal/adler32/adler32_avx2.s
@@ -2,20 +2,20 @@
 
 #include "textflag.h"
 
-DATA LCPI0_0<>+0x00(SB)/8, $0x191a1b1c1d1e1f20
-DATA LCPI0_0<>+0x08(SB)/8, $0x1112131415161718
-DATA LCPI0_0<>+0x10(SB)/8, $0x090a0b0c0d0e0f10
-DATA LCPI0_0<>+0x18(SB)/8, $0x0102030405060708
-GLOBL LCPI0_0<>(SB), (RODATA|NOPTR), $32
+DATA weights_1_32<>+0x00(SB)/8, $0x191a1b1c1d1e1f20 // bytes in memory (little-endian): 32, 31, ..., 25
+DATA weights_1_32<>+0x08(SB)/8, $0x1112131415161718 // bytes in memory: 24, 23, ..., 17
+DATA weights_1_32<>+0x10(SB)/8, $0x090a0b0c0d0e0f10 // bytes in memory: 16, 15, ..., 9
+DATA weights_1_32<>+0x18(SB)/8, $0x0102030405060708 // bytes in memory: 8, 7, ..., 1
+GLOBL weights_1_32<>(SB), (RODATA|NOPTR), $32 // 32-byte read-only table, loaded whole into Y1 via VMOVDQA; presumably the per-byte Adler-32 position weights - confirm against the loop body
 
-DATA LCPI0_1<>+0x00(SB)/8, $0x0001000100010001
-DATA LCPI0_1<>+0x08(SB)/8, $0x0001000100010001
-DATA LCPI0_1<>+0x10(SB)/8, $0x0001000100010001
-DATA LCPI0_1<>+0x18(SB)/8, $0x0001000100010001
-GLOBL LCPI0_1<>(SB), (RODATA|NOPTR), $32
+DATA ones_u16<>+0x00(SB)/8, $0x0001000100010001 // four 16-bit lanes, each holding 1
+DATA ones_u16<>+0x08(SB)/8, $0x0001000100010001 // four 16-bit lanes, each holding 1
+DATA ones_u16<>+0x10(SB)/8, $0x0001000100010001 // four 16-bit lanes, each holding 1
+DATA ones_u16<>+0x18(SB)/8, $0x0001000100010001 // four 16-bit lanes, each holding 1
+GLOBL ones_u16<>(SB), (RODATA|NOPTR), $32 // sixteen 16-bit ones in total. NOTE(review): no reference is visible in the shown hunks, and VPBROADCASTW of one_u16 builds the same vector - confirm this symbol is still used
 
-DATA LCPI0_2<>+0x00(SB)/2, $0x0001
-GLOBL LCPI0_2<>(SB), (RODATA|NOPTR), $2
+DATA one_u16<>+0x00(SB)/2, $0x0001 // a single 16-bit value of 1
+GLOBL one_u16<>(SB), (RODATA|NOPTR), $2 // 2-byte read-only scalar; VPBROADCASTW replicates it into every 16-bit lane of Y2
 
 TEXT ·adler32_avx2(SB), NOSPLIT, $0-36
 	MOVLQZX      in+0(FP), DI
@@ -37,8 +37,8 @@
 	JB           tail16_check
 	LONG         $0x078071bf; BYTE $0x80
 	LONG         $0xc0eff9c5
-	VMOVDQA      LCPI0_0<>(SB), Y1
-	VPBROADCASTW LCPI0_2<>(SB), Y2
+	VMOVDQA      weights_1_32<>(SB), Y1
+	VPBROADCASTW one_u16<>(SB), Y2
 	JMP          block_loop_setup
 
 block_accum_init:
--- a/internal/adler32/adler32_sse3.s
+++ b/internal/adler32/adler32_sse3.s
@@ -2,17 +2,17 @@
 
 #include "textflag.h"
 
-DATA LCPI0_0<>+0x00(SB)/8, $0x191a1b1c1d1e1f20
-DATA LCPI0_0<>+0x08(SB)/8, $0x1112131415161718
-GLOBL LCPI0_0<>(SB), (RODATA|NOPTR), $16
+DATA weights_17_32<>+0x00(SB)/8, $0x191a1b1c1d1e1f20 // bytes in memory (little-endian): 32, 31, ..., 25
+DATA weights_17_32<>+0x08(SB)/8, $0x1112131415161718 // bytes in memory: 24, 23, ..., 17
+GLOBL weights_17_32<>(SB), (RODATA|NOPTR), $16 // 16-byte read-only table, loaded into X1 via MOVO; presumably the weights for the first 16 bytes of a 32-byte block - confirm against the loop body
 
-DATA LCPI0_1<>+0x00(SB)/8, $0x0001000100010001
-DATA LCPI0_1<>+0x08(SB)/8, $0x0001000100010001
-GLOBL LCPI0_1<>(SB), (RODATA|NOPTR), $16
+DATA ones_u16<>+0x00(SB)/8, $0x0001000100010001 // four 16-bit lanes, each holding 1
+DATA ones_u16<>+0x08(SB)/8, $0x0001000100010001 // four 16-bit lanes, each holding 1
+GLOBL ones_u16<>(SB), (RODATA|NOPTR), $16 // eight 16-bit ones in total, loaded into X2 via MOVO
 
-DATA LCPI0_2<>+0x00(SB)/8, $0x090a0b0c0d0e0f10
-DATA LCPI0_2<>+0x08(SB)/8, $0x0102030405060708
-GLOBL LCPI0_2<>(SB), (RODATA|NOPTR), $16
+DATA weights_1_16<>+0x00(SB)/8, $0x090a0b0c0d0e0f10 // bytes in memory (little-endian): 16, 15, ..., 9
+DATA weights_1_16<>+0x08(SB)/8, $0x0102030405060708 // bytes in memory: 8, 7, ..., 1
+GLOBL weights_1_16<>(SB), (RODATA|NOPTR), $16 // 16-byte read-only table, loaded into X3 via MOVO; presumably the weights for the second 16 bytes of a 32-byte block - confirm against the loop body
 
 TEXT ·adler32_sse3(SB), NOSPLIT, $0-36
 	MOVLQZX in+0(FP), DI
@@ -35,9 +35,9 @@
 block_loop_setup:
 	SHRQ $0x5, DX
 	LONG $0xc0ef0f66
-	MOVO LCPI0_0<>(SB), X1
-	MOVO LCPI0_1<>(SB), X2
-	MOVO LCPI0_2<>(SB), X3
+	MOVO weights_17_32<>(SB), X1
+	MOVO ones_u16<>(SB), X2
+	MOVO weights_1_16<>(SB), X3
 	LONG $0x8071b841; WORD $0x8007
 
 block_outer_loop:
--