mirror of
https://github.com/nginx/nginx.git
synced 2025-06-07 17:52:38 +08:00
optimization
This commit is contained in:
parent
896b5e4a4f
commit
43bb0077d1
@ -24,8 +24,11 @@
|
|||||||
*
|
*
|
||||||
*
|
*
|
||||||
* The "r" is any register, %rax (%r0) - %r15.
|
* The "r" is any register, %rax (%r0) - %r15.
|
||||||
* The "=a" and "a" are the %rax register. Although we can return result
|
* The "=a" and "a" are the %rax register.
|
||||||
* in any register, we use %rax because it is used in cmpxchgq anyway.
|
* Although we can return result in any register, we use "a" because it is
|
||||||
|
* used in cmpxchgq anyway. The result is actually in %al but not in %rax,
|
||||||
|
* however, as the code is inlined gcc can test %al as well as %rax.
|
||||||
|
*
|
||||||
* The "cc" means that flags were changed.
|
* The "cc" means that flags were changed.
|
||||||
*/
|
*/
|
||||||
|
|
||||||
@ -33,14 +36,13 @@ static ngx_inline ngx_atomic_uint_t
|
|||||||
ngx_atomic_cmp_set(ngx_atomic_t *lock, ngx_atomic_uint_t old,
|
ngx_atomic_cmp_set(ngx_atomic_t *lock, ngx_atomic_uint_t old,
|
||||||
ngx_atomic_uint_t set)
|
ngx_atomic_uint_t set)
|
||||||
{
|
{
|
||||||
ngx_atomic_uint_t res;
|
u_char res;
|
||||||
|
|
||||||
__asm__ volatile (
|
__asm__ volatile (
|
||||||
|
|
||||||
NGX_SMP_LOCK
|
NGX_SMP_LOCK
|
||||||
" cmpxchgq %3, %1; "
|
" cmpxchgq %3, %1; "
|
||||||
" setz %b0; "
|
" sete %0; "
|
||||||
" movzbq %b0, %0; "
|
|
||||||
|
|
||||||
: "=a" (res) : "m" (*lock), "a" (old), "r" (set) : "cc", "memory");
|
: "=a" (res) : "m" (*lock), "a" (old), "r" (set) : "cc", "memory");
|
||||||
|
|
||||||
|
@ -23,9 +23,13 @@
|
|||||||
* }
|
* }
|
||||||
*
|
*
|
||||||
*
|
*
|
||||||
* The "q" is any of the %eax, %ebx, %ecx, or %edx registers.
|
* The "r" is any general-purpose register.
|
||||||
* The "=a" and "a" are the %eax register. Although we can return result
|
* The "=a" and "a" are the %eax register.
|
||||||
* in any register, we use %eax because it is used in cmpxchgl anyway.
|
* Although we can return result in any register, we use "a" because it is
|
||||||
|
* used in cmpxchgl anyway. The result is actually in %al but not in %eax,
|
||||||
|
* however, as the code is inlined gcc can test %al as well as %eax,
|
||||||
|
* and icc adds "movzbl %al, %eax" by itself.
|
||||||
|
*
|
||||||
* The "cc" means that flags were changed.
|
* The "cc" means that flags were changed.
|
||||||
*/
|
*/
|
||||||
|
|
||||||
@ -33,16 +37,15 @@ static ngx_inline ngx_atomic_uint_t
|
|||||||
ngx_atomic_cmp_set(ngx_atomic_t *lock, ngx_atomic_uint_t old,
|
ngx_atomic_cmp_set(ngx_atomic_t *lock, ngx_atomic_uint_t old,
|
||||||
ngx_atomic_uint_t set)
|
ngx_atomic_uint_t set)
|
||||||
{
|
{
|
||||||
ngx_atomic_uint_t res;
|
u_char res;
|
||||||
|
|
||||||
__asm__ volatile (
|
__asm__ volatile (
|
||||||
|
|
||||||
NGX_SMP_LOCK
|
NGX_SMP_LOCK
|
||||||
" cmpxchgl %3, %1; "
|
" cmpxchgl %3, %1; "
|
||||||
" setz %b0; "
|
" sete %0; "
|
||||||
" movzbl %b0, %0; "
|
|
||||||
|
|
||||||
: "=a" (res) : "m" (*lock), "a" (old), "q" (set) : "cc", "memory");
|
: "=a" (res) : "m" (*lock), "a" (old), "r" (set) : "cc", "memory");
|
||||||
|
|
||||||
return res;
|
return res;
|
||||||
}
|
}
|
||||||
@ -56,7 +59,7 @@ ngx_atomic_cmp_set(ngx_atomic_t *lock, ngx_atomic_uint_t old,
|
|||||||
* r = temp;
|
* r = temp;
|
||||||
*
|
*
|
||||||
*
|
*
|
||||||
* The "+q" is any of the %eax, %ebx, %ecx, or %edx registers.
|
* The "+r" is any general-purpose register.
|
||||||
* The "cc" means that flags were changed.
|
* The "cc" means that flags were changed.
|
||||||
*/
|
*/
|
||||||
|
|
||||||
@ -80,7 +83,7 @@ ngx_atomic_fetch_add(ngx_atomic_t *value, ngx_atomic_int_t add)
|
|||||||
NGX_SMP_LOCK
|
NGX_SMP_LOCK
|
||||||
" xaddl %0, %1; "
|
" xaddl %0, %1; "
|
||||||
|
|
||||||
: "+q" (add) : "m" (*value) : "cc", "memory");
|
: "+r" (add) : "m" (*value) : "cc", "memory");
|
||||||
|
|
||||||
return add;
|
return add;
|
||||||
}
|
}
|
||||||
@ -89,9 +92,9 @@ ngx_atomic_fetch_add(ngx_atomic_t *value, ngx_atomic_int_t add)
|
|||||||
#else
|
#else
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* gcc 2.7 does not support "+q", so we have to use the fixed %eax ("=a" and
|
* gcc 2.7 does not support "+r", so we have to use the fixed
|
||||||
* "a") and this adds two superfluous instructions in the end of code,
|
* %eax ("=a" and "a") and this adds two superfluous instructions at the end
|
||||||
* something like this: "mov %eax, %edx / mov %edx, %eax".
|
* of the code, something like this: "mov %eax, %edx / mov %edx, %eax".
|
||||||
*/
|
*/
|
||||||
|
|
||||||
static ngx_inline ngx_atomic_int_t
|
static ngx_inline ngx_atomic_int_t
|
||||||
|
Loading…
Reference in New Issue
Block a user