From 607b05aca683eee5bcdb7bf9af4ebf02adc635d9 Mon Sep 17 00:00:00 2001 From: Rich Felker Date: Thu, 25 Oct 2012 15:40:58 -0400 Subject: use explicit visibility to optimize a few hot-path function calls on x86 and some other archs, functions which make function calls which might go through a PLT incur a significant overhead cost loading the GOT register prior to making the call. this load is utterly useless in musl, since all calls are bound at library-creation time using -Bsymbolic-functions, but the compiler has no way of knowing this, and attempts to set the default visibility to protected have failed due to bugs in GCC and binutils. this commit simply manually assigns hidden/protected visibility, as appropriate, to a few internal-use-only functions which have many callers, or which have callers that are hot paths like getc/putc. it shaves about 5k off the i386 libc.so with -Os. many of the improvements are in syscall wrappers, where the benefit is just size and performance improvement is unmeasurable noise amid the syscall overhead. however, stdio may be measurably faster. if in the future there are toolchains that can do the same thing globally without introducing linking bugs, it might be worth considering removing these workarounds. 
--- src/internal/syscall.h | 8 +++++--- 1 file changed, 5 insertions(+), 3 deletions(-) (limited to 'src/internal/syscall.h') diff --git a/src/internal/syscall.h b/src/internal/syscall.h index 50409ef8..7381efea 100644 --- a/src/internal/syscall.h +++ b/src/internal/syscall.h @@ -1,9 +1,11 @@ #ifndef _INTERNAL_SYSCALL_H #define _INTERNAL_SYSCALL_H -long __syscall_ret(unsigned long); -long __syscall(long, ...); -long __syscall_cp(long, long, long, long, long, long, long); +#if defined(__PIC__) && (100*__GNUC__+__GNUC_MINOR__ >= 303) +__attribute__((visibility("protected"))) +#endif +long __syscall_ret(unsigned long), __syscall(long, ...), + __syscall_cp(long, long, long, long, long, long, long); #include <sys/syscall.h> #include "syscall_arch.h" -- cgit v1.2.1