Forgot some more cleanups for the SSE4.2 strlen on x86-64.

This commit is contained in:
Ulrich Drepper 2009-06-05 11:51:59 -07:00
parent f85a9e72e2
commit 6f9eea15bf
1 changed files with 7 additions and 2 deletions

View File

@ -43,6 +43,8 @@ END(strlen)
.align 16 .align 16
.type __strlen_sse42, @function .type __strlen_sse42, @function
__strlen_sse42: __strlen_sse42:
cfi_startproc
CALL_MCOUNT
pxor %xmm2, %xmm2 pxor %xmm2, %xmm2
movq %rdi, %rcx movq %rdi, %rcx
movq %rdi, %r8 movq %rdi, %r8
@ -68,15 +70,18 @@ __strlen_sse42:
bsfl %edx, %eax bsfl %edx, %eax
addq %rdi, %rax addq %rdi, %rax
ret ret
cfi_endproc
.size __strlen_sse42, .-__strlen_sse42 .size __strlen_sse42, .-__strlen_sse42
# undef ENTRY # undef ENTRY
# define ENTRY(name) \ # define ENTRY(name) \
.type __strlen_sse2, @function; __strlen_sse2: .type __strlen_sse2, @function; \
__strlen_sse2: cfi_startproc; \
CALL_MCOUNT
# undef END # undef END
# define END(name) \ # define END(name) \
.size __strlen_sse2, .-__strlen_sse2 cfi_endproc; .size __strlen_sse2, .-__strlen_sse2
# undef libc_hidden_builtin_def # undef libc_hidden_builtin_def
/* It doesn't make sense to send libc-internal strlen calls through a PLT. /* It doesn't make sense to send libc-internal strlen calls through a PLT.
The speedup we get from using SSE4.2 instruction is likely eaten away The speedup we get from using SSE4.2 instruction is likely eaten away