git: b49a0db6628e - main - Revert "amd64: implement strlen in assembly"

Mateusz Guzik mjg at FreeBSD.org
Tue Feb 9 15:28:07 UTC 2021


The branch main has been updated by mjg:

URL: https://cgit.FreeBSD.org/src/commit/?id=b49a0db6628e6f953504ebc8712ed582471ccd05

commit b49a0db6628e6f953504ebc8712ed582471ccd05
Author:     Mateusz Guzik <mjg at FreeBSD.org>
AuthorDate: 2021-02-09 15:18:58 +0000
Commit:     Mateusz Guzik <mjg at FreeBSD.org>
CommitDate: 2021-02-09 15:23:18 +0000

    Revert "amd64: implement strlen in assembly"
    
    This reverts commit af366d353b84bdc4e730f0fc563853abc338271c.
    
    Trips over '\xa4' byte and terminates early, as found in
    lib/libc/gen/setdomainname_test:setdomainname_basic testcase
    
    However, keep moving libkern/strlen.c out of conf/files.
    
    Reported by:    lwhsu
---
 sys/amd64/amd64/support.S | 66 -----------------------------------------------
 sys/conf/files.amd64      |  1 +
 2 files changed, 1 insertion(+), 66 deletions(-)

diff --git a/sys/amd64/amd64/support.S b/sys/amd64/amd64/support.S
index a059b520c5d5..b623fba277db 100644
--- a/sys/amd64/amd64/support.S
+++ b/sys/amd64/amd64/support.S
@@ -697,72 +697,6 @@ ENTRY(fillw)
 	ret
 END(fillw)
 
-/*
- * strlen(string)
- *	  %rdi
- *
- * Uses the ((x - 0x01....01) & ~x & 0x80....80) trick.
- *
- * 0x01....01 is replaced with 0x0 - 0x01....01 so that it can be added
- * with leaq.
- *
- * For a description see either:
- * - "Hacker's Delight" by Henry S. Warren, Jr.
- * - "Optimizing subroutines in assembly language: An optimization guide for x86 platforms"
- *   by Agner Fog
- *
- * The latter contains a 32-bit variant of the same algorithm coded in assembly for i386.
- */
-ENTRY(strlen)
-	PUSH_FRAME_POINTER
-	movabsq	$0xfefefefefefefeff,%r8
-	movabsq	$0x8080808080808080,%r9
-
-	movq	%rdi,%r10
-	movq	%rdi,%rcx
-	testb	$7,%dil
-	jz	2f
-
-	/*
-	 * Handle misaligned reads: align to 8 and fill
-	 * the spurious bytes.
-	 */
-	andq	$~7,%rdi
-	movq	(%rdi),%r11
-	shlq	$3,%rcx
-	movq	$-1,%rdx
-	shlq	%cl,%rdx
-	notq	%rdx
-	orq	%rdx,%r11
-
-	leaq	(%r11,%r8),%rcx
-	notq	%r11
-	andq	%r11,%rcx
-	andq	%r9,%rcx
-	jnz	3f
-
-	/*
-	 * Main loop.
-	 */
-	ALIGN_TEXT
-1:
-	leaq	8(%rdi),%rdi
-2:
-	movq	(%rdi),%r11
-	leaq	(%r11,%r8),%rcx
-	notq	%r11
-	andq	%rcx,%r11
-	andq	%r9,%rcx
-	jz	1b
-3:
-	bsfq	%rcx,%rcx
-	shrq	$3,%rcx
-	leaq	(%rcx,%rdi),%rax
-	subq	%r10,%rax
-	POP_FRAME_POINTER
-	ret
-END(strlen)
-
 /*****************************************************************************/
 /* copyout and fubyte family                                                 */
 /*****************************************************************************/
diff --git a/sys/conf/files.amd64 b/sys/conf/files.amd64
index 395f501198f8..98a78a8b1ef9 100644
--- a/sys/conf/files.amd64
+++ b/sys/conf/files.amd64
@@ -390,6 +390,7 @@ isa/syscons_isa.c		optional	sc
 isa/vga_isa.c			optional	vga
 kern/imgact_aout.c		optional compat_aout
 kern/link_elf_obj.c		standard
+libkern/strlen.c		standard
 #
 # IA32 binary support
 #


More information about the dev-commits-src-main mailing list