aboutsummaryrefslogtreecommitdiff
path: root/sysdeps
diff options
context:
space:
mode:
author Ulrich Drepper <drepper@redhat.com> 2009-06-05 11:51:59 -0700
committer Ulrich Drepper <drepper@redhat.com> 2009-06-05 11:51:59 -0700
commit 6f9eea15bf8d49d64ca1f3fd6d1a528c40f658a4 (patch)
tree 33019cc8fcc41f8fbc8bcc4b28c18b288e5fea7c /sysdeps
parent f85a9e72e21c3fc79dbad53c170251a16d1760ab (diff)
download glibc-6f9eea15bf8d49d64ca1f3fd6d1a528c40f658a4.zip
glibc-6f9eea15bf8d49d64ca1f3fd6d1a528c40f658a4.tar.gz
glibc-6f9eea15bf8d49d64ca1f3fd6d1a528c40f658a4.tar.bz2
Forgot some more cleanups for the SSE4.2 strlen on x86-64.
Diffstat (limited to 'sysdeps')
-rw-r--r-- sysdeps/x86_64/multiarch/strlen.S 9
1 files changed, 7 insertions, 2 deletions
diff --git a/sysdeps/x86_64/multiarch/strlen.S b/sysdeps/x86_64/multiarch/strlen.S
index 3f03b69..79e6a97 100644
--- a/sysdeps/x86_64/multiarch/strlen.S
+++ b/sysdeps/x86_64/multiarch/strlen.S
@@ -43,6 +43,8 @@ END(strlen)
.align 16
.type __strlen_sse42, @function
__strlen_sse42:
+ cfi_startproc
+ CALL_MCOUNT
pxor %xmm2, %xmm2
movq %rdi, %rcx
movq %rdi, %r8
@@ -68,15 +70,18 @@ __strlen_sse42:
bsfl %edx, %eax
addq %rdi, %rax
ret
+ cfi_endproc
.size __strlen_sse42, .-__strlen_sse42
# undef ENTRY
# define ENTRY(name) \
- .type __strlen_sse2, @function; __strlen_sse2:
+ .type __strlen_sse2, @function; \
+ __strlen_sse2: cfi_startproc; \
+ CALL_MCOUNT
# undef END
# define END(name) \
- .size __strlen_sse2, .-__strlen_sse2
+ cfi_endproc; .size __strlen_sse2, .-__strlen_sse2
# undef libc_hidden_builtin_def
/* It doesn't make sense to send libc-internal strlen calls through a PLT.
The speedup we get from using SSE4.2 instruction is likely eaten away