diff options
author | Lepton Wu <[email protected]> | 2019-10-21 20:22:18 -0700 |
---|---|---|
committer | Matt Turner <[email protected]> | 2019-10-29 17:18:06 -0700 |
commit | 41407d5e9fcf9b73d402292e64fa9db02c372b5f (patch) | |
tree | a57f966c1363519ef223419515919e32475cfd4c | |
parent | b2b8639d8e901008b4501e35957d27da170de042 (diff) |
mapi: Inline call x86_current_tls.
This saves one return and a simple benchmark which calls glGetString
repeatedly on my desktop shows it improves calls per second from 123M
to 141M.
Closes: https://gitlab.freedesktop.org/mesa/mesa/issues/1997
Reviewed-by: Matt Turner <[email protected]>
Signed-off-by: Lepton Wu <[email protected]>
-rw-r--r-- | src/mapi/entry_x86_tls.h | 12 |
1 files changed, 8 insertions, 4 deletions
diff --git a/src/mapi/entry_x86_tls.h b/src/mapi/entry_x86_tls.h index b9386799792..58a27cef18e 100644 --- a/src/mapi/entry_x86_tls.h +++ b/src/mapi/entry_x86_tls.h @@ -33,7 +33,7 @@ #define HIDDEN #endif -#define X86_ENTRY_SIZE 16 +#define X86_ENTRY_SIZE 32 __asm__(".text"); @@ -58,9 +58,13 @@ __asm__(".balign 16\n" ".balign 16\n" \ func ":" -#define STUB_ASM_CODE(slot) \ - "call x86_current_tls\n\t" \ - "movl %gs:(%eax), %eax\n\t" \ +#define STUB_ASM_CODE(slot) \ + "call 1f\n" \ + "1:\n\t" \ + "popl %eax\n\t" \ + "addl $_GLOBAL_OFFSET_TABLE_+[.-1b], %eax\n\t" \ + "movl " ENTRY_CURRENT_TABLE "@GOTNTPOFF(%eax), %eax\n\t" \ + "movl %gs:(%eax), %eax\n\t" \ "jmp *(4 * " slot ")(%eax)" #define MAPI_TMP_STUB_ASM_GCC |