x86/64: Adjust types of temporaries used by ffs()/fls()/fls64()
The 64-bit special cases of the former two (the third one is 64-bit only anyway) don't need to use "long" temporaries, as the result will always fit in a 32-bit variable, and the functions return plain "int". This avoids a few REX prefixes, i.e. minimally reduces code size. Signed-off-by: Jan Beulich <jbeulich@suse.com> Cc: Linus Torvalds <torvalds@linux-foundation.org> Link: http://lkml.kernel.org/r/504DE550020000780009A258@nat28.tlf.novell.com Signed-off-by: Ingo Molnar <mingo@kernel.org>
This commit is contained in:
parent
6eebdda35e
commit
1edfbb4153
1 changed files with 4 additions and 6 deletions
|
@ -417,10 +417,9 @@ static inline int ffs(int x)
|
||||||
* We cannot do this on 32 bits because at the very least some
|
* We cannot do this on 32 bits because at the very least some
|
||||||
* 486 CPUs did not behave this way.
|
* 486 CPUs did not behave this way.
|
||||||
*/
|
*/
|
||||||
long tmp = -1;
|
|
||||||
asm("bsfl %1,%0"
|
asm("bsfl %1,%0"
|
||||||
: "=r" (r)
|
: "=r" (r)
|
||||||
: "rm" (x), "0" (tmp));
|
: "rm" (x), "0" (-1));
|
||||||
#elif defined(CONFIG_X86_CMOV)
|
#elif defined(CONFIG_X86_CMOV)
|
||||||
asm("bsfl %1,%0\n\t"
|
asm("bsfl %1,%0\n\t"
|
||||||
"cmovzl %2,%0"
|
"cmovzl %2,%0"
|
||||||
|
@ -459,10 +458,9 @@ static inline int fls(int x)
|
||||||
* We cannot do this on 32 bits because at the very least some
|
* We cannot do this on 32 bits because at the very least some
|
||||||
* 486 CPUs did not behave this way.
|
* 486 CPUs did not behave this way.
|
||||||
*/
|
*/
|
||||||
long tmp = -1;
|
|
||||||
asm("bsrl %1,%0"
|
asm("bsrl %1,%0"
|
||||||
: "=r" (r)
|
: "=r" (r)
|
||||||
: "rm" (x), "0" (tmp));
|
: "rm" (x), "0" (-1));
|
||||||
#elif defined(CONFIG_X86_CMOV)
|
#elif defined(CONFIG_X86_CMOV)
|
||||||
asm("bsrl %1,%0\n\t"
|
asm("bsrl %1,%0\n\t"
|
||||||
"cmovzl %2,%0"
|
"cmovzl %2,%0"
|
||||||
|
@ -490,13 +488,13 @@ static inline int fls(int x)
|
||||||
#ifdef CONFIG_X86_64
|
#ifdef CONFIG_X86_64
|
||||||
static __always_inline int fls64(__u64 x)
|
static __always_inline int fls64(__u64 x)
|
||||||
{
|
{
|
||||||
long bitpos = -1;
|
int bitpos = -1;
|
||||||
/*
|
/*
|
||||||
* AMD64 says BSRQ won't clobber the dest reg if x==0; Intel64 says the
|
* AMD64 says BSRQ won't clobber the dest reg if x==0; Intel64 says the
|
||||||
* dest reg is undefined if x==0, but their CPU architect says its
|
* dest reg is undefined if x==0, but their CPU architect says its
|
||||||
* value is written to set it to the same as before.
|
* value is written to set it to the same as before.
|
||||||
*/
|
*/
|
||||||
asm("bsrq %1,%0"
|
asm("bsrq %1,%q0"
|
||||||
: "+r" (bitpos)
|
: "+r" (bitpos)
|
||||||
: "rm" (x));
|
: "rm" (x));
|
||||||
return bitpos + 1;
|
return bitpos + 1;
|
||||||
|
|
Loading…
Reference in a new issue