Skip to content

Commit

Permalink
Extend x86-64 sem_timedwait to use futex syscall with absolute timeout.
Browse files Browse the repository at this point in the history
  • Loading branch information
Ulrich Drepper committed Jul 18, 2009
1 parent 312d667 commit f351f2b
Show file tree
Hide file tree
Showing 2 changed files with 120 additions and 46 deletions.
4 changes: 4 additions & 0 deletions nptl/ChangeLog
Original file line number Diff line number Diff line change
@@ -1,5 +1,9 @@
2009-07-17 Ulrich Drepper <drepper@redhat.com>

* sysdeps/unix/sysv/linux/x86_64/sem_timedwait.S (sem_timedwait):
If possible use FUTEX_WAIT_BITSET|FUTEX_CLOCK_REALTIME to directly
use absolute timeout.

* sysdeps/unix/sysv/linux/x86_64/sem_wait.S (sem_wait): Optimize
handling of uncontested semaphore.

Expand Down
162 changes: 116 additions & 46 deletions nptl/sysdeps/unix/sysv/linux/x86_64/sem_timedwait.S
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,7 @@
02111-1307 USA. */

#include <sysdep.h>
#include <kernel-features.h>
#include <lowlevellock.h>
#include <shlib-compat.h>
#include <pthread-errnos.h>
Expand Down Expand Up @@ -73,8 +74,13 @@ sem_timedwait:
pushq %r14
cfi_adjust_cfa_offset(8)
cfi_rel_offset(%r14, 0)
subq $24, %rsp
cfi_adjust_cfa_offset(24)
#ifdef __ASSUME_FUTEX_CLOCK_REALTIME
# define STACKFRAME 8
#else
# define STACKFRAME 24
#endif
subq $STACKFRAME, %rsp
cfi_adjust_cfa_offset(STACKFRAME)

movq %rdi, %r12
movq %rsi, %r13
Expand All @@ -87,67 +93,50 @@ sem_timedwait:
LOCK
addq $1, NWAITERS(%r12)

7: xorl %esi, %esi
movq %rsp, %rdi
movq $VSYSCALL_ADDR_vgettimeofday, %rax
callq *%rax

/* Compute relative timeout. */
movq 8(%rsp), %rax
movl $1000, %edi
mul %rdi /* Microseconds to nanoseconds. */
movq (%r13), %rdi
movq 8(%r13), %rsi
subq (%rsp), %rdi
subq %rax, %rsi
jns 5f
addq $1000000000, %rsi
decq %rdi
5: testq %rdi, %rdi
movl $ETIMEDOUT, %r14d
js 6f /* Time is already up. */

movq %rdi, (%rsp) /* Store relative timeout. */
movq %rsi, 8(%rsp)
#ifndef __ASSUME_FUTEX_CLOCK_REALTIME
# ifdef PIC
cmpl $0, __have_futex_clock_realtime(%rip)
# else
cmpl $0, __have_futex_clock_realtime
# endif
je .Lreltmo
#endif

.LcleanupSTART:
call __pthread_enable_asynccancel
movl %eax, 16(%rsp)
13: call __pthread_enable_asynccancel
movl %eax, (%rsp)

movq %rsp, %r10
movq %r13, %r10
#if VALUE == 0
movq %r12, %rdi
#else
leaq VALUE(%r12), %rdi
#endif
#if FUTEX_WAIT == 0
movl PRIVATE(%rdi), %esi
#else
movl $FUTEX_WAIT, %esi
movl $0xffffffff, %r9d
movl $FUTEX_WAIT_BITSET|FUTEX_CLOCK_REALTIME, %esi
orl PRIVATE(%rdi), %esi
#endif
movl $SYS_futex, %eax
xorl %edx, %edx
syscall
movq %rax, %r14

movl 16(%rsp), %edi
movl (%rsp), %edi
call __pthread_disable_asynccancel
.LcleanupEND:

testq %r14, %r14
je 9f
je 11f
cmpq $-EWOULDBLOCK, %r14
jne 3f

9:
11:
#if VALUE == 0
movl (%r12), %eax
#else
movl VALUE(%r12), %eax
#endif
8: testl %eax, %eax
je 7b
14: testl %eax, %eax
je 13b

leaq -1(%rax), %rcx
LOCK
Expand All @@ -156,15 +145,15 @@ sem_timedwait:
#else
cmpxchgl %ecx, VALUE(%r12)
#endif
jne 8b
jne 14b

xorl %eax, %eax
10: xorl %eax, %eax

10: LOCK
15: LOCK
subq $1, NWAITERS(%r12)

addq $24, %rsp
cfi_adjust_cfa_offset(-24)
addq $STACKFRAME, %rsp
cfi_adjust_cfa_offset(-STACKFRAME)
popq %r14
cfi_adjust_cfa_offset(-8)
cfi_restore(%r14)
Expand All @@ -176,10 +165,10 @@ sem_timedwait:
cfi_restore(%r12)
retq

cfi_adjust_cfa_offset(3 * 8 + 24)
cfi_rel_offset(%r12, 24 + 2 * 8)
cfi_rel_offset(%r13, 24 + 1 * 8)
cfi_rel_offset(%r14, 24)
cfi_adjust_cfa_offset(STACKFRAME + 3 * 8)
cfi_rel_offset(%r12, STACKFRAME + 2 * 8)
cfi_rel_offset(%r13, STACKFRAME + 1 * 8)
cfi_rel_offset(%r14, STACKFRAME)
3: negq %r14
6:
#if USE___THREAD
Expand All @@ -191,7 +180,82 @@ sem_timedwait:
#endif

orl $-1, %eax
jmp 15b

#ifndef __ASSUME_FUTEX_CLOCK_REALTIME
/* Fallback wait loop using a relative timeout.  It is entered from
   the check of __have_futex_clock_realtime earlier in sem_timedwait
   when that variable is zero.

   Register roles on entry (set up earlier in sem_timedwait):
     %r12 = semaphore pointer
     %r13 = pointer to the caller-supplied absolute timeout

   Stack layout (STACKFRAME is 24 in this configuration):
     0(%rsp), 8(%rsp) = current time, later the relative timeout
     16(%rsp)         = value returned by __pthread_enable_asynccancel  */
.Lreltmo:
/* Get the current time into the buffer at (%rsp); the second
   argument (%rsi) is zero.  */
7: xorl %esi, %esi
movq %rsp, %rdi
movq $VSYSCALL_ADDR_vgettimeofday, %rax
callq *%rax

/* Compute relative timeout. */
movq 8(%rsp), %rax
movl $1000, %edi
mul %rdi /* Microseconds to nanoseconds. */
/* %rdi:%rsi = absolute timeout (sec:nsec) minus current time.  */
movq (%r13), %rdi
movq 8(%r13), %rsi
subq (%rsp), %rdi
subq %rax, %rsi
jns 5f
/* Nanoseconds went negative: borrow one second.  */
addq $1000000000, %rsi
decq %rdi
5: testq %rdi, %rdi
movl $ETIMEDOUT, %r14d
js 6b /* Time is already up. */

movq %rdi, (%rsp) /* Store relative timeout. */
movq %rsi, 8(%rsp)

/* .LcleanupSTART2 to .LcleanupEND2 is the range listed in the unwind
   table with sem_timedwait_cleanup as its handler.  */
.LcleanupSTART2:
call __pthread_enable_asynccancel
movl %eax, 16(%rsp)

/* futex syscall arguments: %rdi = address of the semaphore value,
   %esi = FUTEX_WAIT combined with the PRIVATE field of the semaphore,
   %edx = 0 (the value FUTEX_WAIT compares the futex word against),
   %r10 = pointer to the relative timeout stored at (%rsp).  */
movq %rsp, %r10
# if VALUE == 0
movq %r12, %rdi
# else
leaq VALUE(%r12), %rdi
# endif
# if FUTEX_WAIT == 0
movl PRIVATE(%rdi), %esi
# else
movl $FUTEX_WAIT, %esi
orl PRIVATE(%rdi), %esi
# endif
movl $SYS_futex, %eax
xorl %edx, %edx
syscall
/* Keep the syscall result in %r14 across the call below.  */
movq %rax, %r14

movl 16(%rsp), %edi
call __pthread_disable_asynccancel
.LcleanupEND2:

/* A result of 0 or -EWOULDBLOCK means: try to take the semaphore.
   Any other result goes to label 3, which negates %r14 and falls
   into the common failure path at label 6.
   NOTE(review): the code at label 6 that consumes %r14 is not visible
   here; presumably it stores the value in errno.  */
testq %r14, %r14
je 9f
cmpq $-EWOULDBLOCK, %r14
jne 3b

9:
# if VALUE == 0
movl (%r12), %eax
# else
movl VALUE(%r12), %eax
# endif
/* If the value is zero, recompute the timeout and wait again.  */
8: testl %eax, %eax
je 7b

/* Try to replace the value with value - 1 atomically.  On failure
   cmpxchgl leaves the current value in %eax, so retry from label 8.  */
leaq -1(%rax), %rcx
LOCK
# if VALUE == 0
cmpxchgl %ecx, (%r12)
# else
cmpxchgl %ecx, VALUE(%r12)
# endif
jne 8b
/* Success: label 10 clears %eax and runs the common exit code.  */
jmp 10b
#endif
.size sem_timedwait,.-sem_timedwait


Expand Down Expand Up @@ -219,6 +283,12 @@ sem_timedwait_cleanup:
.uleb128 .LcleanupEND-.LcleanupSTART
.uleb128 sem_timedwait_cleanup-.LSTARTCODE
.uleb128 0
#ifndef __ASSUME_FUTEX_CLOCK_REALTIME
.uleb128 .LcleanupSTART2-.LSTARTCODE
.uleb128 .LcleanupEND2-.LcleanupSTART2
.uleb128 sem_timedwait_cleanup-.LSTARTCODE
.uleb128 0
#endif
.uleb128 .LcallUR-.LSTARTCODE
.uleb128 .LENDCODE-.LcallUR
.uleb128 0
Expand Down

0 comments on commit f351f2b

Please sign in to comment.