From: Rich Felker <dalias@libc.org>
To: musl@lists.openwall.com
Subject: Re: [PATCH] remove a_ctz_l from atomic_arch.h
Date: Thu, 14 Dec 2017 23:41:22 -0500 [thread overview]
Message-ID: <20171215044122.GK1627@brightrain.aerifal.cx> (raw)
In-Reply-To: <1512439521-12466-1-git-send-email-armccurdy@gmail.com>
On Mon, Dec 04, 2017 at 06:05:21PM -0800, Andre McCurdy wrote:
> Arch specific code should now define only a_ctz_32 and/or a_ctz_64
> and a_ctz_l will always be defined generically.
>
> Provide an ARM specific a_ctz_32 helper function for ARM architecture
> versions for which it can be implemented efficiently via the "rbit"
> instruction (ie all Thumb-2 capable versions of ARM v6 and above).
>
> Provide a more optimal generic a_ctz_32 for targets which support
> a_clz_32 but not a_ctz_32 (e.g. ARMv5) and define generic a_ctz_64 in
> terms of a_ctz_32 to make better use of architure specific a_ctz_32.
>
> Signed-off-by: Andre McCurdy <armccurdy@gmail.com>
> ---
> arch/arm/atomic_arch.h | 12 ++++++++++++
> arch/i386/atomic_arch.h | 6 +++---
> arch/x32/atomic_arch.h | 4 ++--
> src/internal/atomic.h | 42 +++++++++++++++++++++++-------------------
> 4 files changed, 40 insertions(+), 24 deletions(-)
>
> diff --git a/arch/arm/atomic_arch.h b/arch/arm/atomic_arch.h
> index 6e2e3b4..62458b4 100644
> --- a/arch/arm/atomic_arch.h
> +++ b/arch/arm/atomic_arch.h
> @@ -91,4 +91,16 @@ static inline int a_clz_32(uint32_t x)
> return x;
> }
>
> +#if __ARM_ARCH_6T2__ || __ARM_ARCH_7A__ || __ARM_ARCH_7R__ || __ARM_ARCH >= 7
> +
> +#define a_ctz_32 a_ctz_32
> +static inline int a_ctz_32(uint32_t x)
> +{
> + uint32_t xr;
> + __asm__ ("rbit %0, %1" : "=r"(xr) : "r"(x));
> + return a_clz_32(xr);
> +}
> +
> +#endif
> +
> #endif
> diff --git a/arch/i386/atomic_arch.h b/arch/i386/atomic_arch.h
> index 7d2a48a..047fb68 100644
> --- a/arch/i386/atomic_arch.h
> +++ b/arch/i386/atomic_arch.h
> @@ -92,10 +92,10 @@ static inline int a_ctz_64(uint64_t x)
> return r;
> }
>
> -#define a_ctz_l a_ctz_l
> -static inline int a_ctz_l(unsigned long x)
> +#define a_ctz_32 a_ctz_32
> +static inline int a_ctz_32(uint32_t x)
> {
> - long r;
> + int r;
> __asm__( "bsf %1,%0" : "=r"(r) : "r"(x) );
> return r;
> }
> diff --git a/arch/x32/atomic_arch.h b/arch/x32/atomic_arch.h
> index a744c29..918c2d4 100644
> --- a/arch/x32/atomic_arch.h
> +++ b/arch/x32/atomic_arch.h
> @@ -106,8 +106,8 @@ static inline int a_ctz_64(uint64_t x)
> return x;
> }
>
> -#define a_ctz_l a_ctz_l
> -static inline int a_ctz_l(unsigned long x)
> +#define a_ctz_32 a_ctz_32
> +static inline int a_ctz_32(uint32_t x)
> {
> __asm__( "bsf %1,%0" : "=r"(x) : "r"(x) );
> return x;
> diff --git a/src/internal/atomic.h b/src/internal/atomic.h
> index ab473dd..f938879 100644
> --- a/src/internal/atomic.h
> +++ b/src/internal/atomic.h
> @@ -251,6 +251,22 @@ static inline void a_crash()
> }
> #endif
>
> +#ifndef a_ctz_32
> +#define a_ctz_32 a_ctz_32
> +static inline int a_ctz_32(uint32_t x)
> +{
> +#ifdef a_clz_32
> + return 31-a_clz_32(x&-x);
> +#else
> + static const char debruijn32[32] = {
> + 0, 1, 23, 2, 29, 24, 19, 3, 30, 27, 25, 11, 20, 8, 4, 13,
> + 31, 22, 28, 18, 26, 10, 7, 12, 21, 17, 9, 6, 16, 5, 15, 14
> + };
> + return debruijn32[(x&-x)*0x076be629 >> 27];
> +#endif
> +}
> +#endif
> +
> #ifndef a_ctz_64
> #define a_ctz_64 a_ctz_64
> static inline int a_ctz_64(uint64_t x)
> @@ -261,22 +277,23 @@ static inline int a_ctz_64(uint64_t x)
> 63, 52, 6, 26, 37, 40, 33, 47, 61, 45, 43, 21, 23, 58, 17, 10,
> 51, 25, 36, 32, 60, 20, 57, 16, 50, 31, 19, 15, 30, 14, 13, 12
> };
> - static const char debruijn32[32] = {
> - 0, 1, 23, 2, 29, 24, 19, 3, 30, 27, 25, 11, 20, 8, 4, 13,
> - 31, 22, 28, 18, 26, 10, 7, 12, 21, 17, 9, 6, 16, 5, 15, 14
> - };
> if (sizeof(long) < 8) {
> uint32_t y = x;
> if (!y) {
> y = x>>32;
> - return 32 + debruijn32[(y&-y)*0x076be629 >> 27];
> + return 32 + a_ctz_32(y);
> }
> - return debruijn32[(y&-y)*0x076be629 >> 27];
> + return a_ctz_32(y);
> }
> return debruijn64[(x&-x)*0x022fdd63cc95386dull >> 58];
> }
> #endif
>
> +static inline int a_ctz_l(unsigned long x)
> +{
> + return (sizeof(long) < 8) ? a_ctz_32(x) : a_ctz_64(x);
> +}
> +
> #ifndef a_clz_64
> #define a_clz_64 a_clz_64
> static inline int a_clz_64(uint64_t x)
> @@ -298,17 +315,4 @@ static inline int a_clz_64(uint64_t x)
> }
> #endif
>
> -#ifndef a_ctz_l
> -#define a_ctz_l a_ctz_l
> -static inline int a_ctz_l(unsigned long x)
> -{
> - static const char debruijn32[32] = {
> - 0, 1, 23, 2, 29, 24, 19, 3, 30, 27, 25, 11, 20, 8, 4, 13,
> - 31, 22, 28, 18, 26, 10, 7, 12, 21, 17, 9, 6, 16, 5, 15, 14
> - };
> - if (sizeof(long) == 8) return a_ctz_64(x);
> - return debruijn32[(x&-x)*0x076be629 >> 27];
> -}
> -#endif
> -
> #endif
> --
> 1.9.1
Overall I think this looks good. I want to recheck it again before
committing, and I'd like to separate out the ARM rbit addition from
the refactoring as a separate commit, but I can do that when I merge
unless you really want to do it first.
Rich
prev parent reply other threads:[~2017-12-15 4:41 UTC|newest]
Thread overview: 2+ messages / expand[flat|nested] mbox.gz Atom feed top
2017-12-05 2:05 Andre McCurdy
2017-12-15 4:41 ` Rich Felker [this message]
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20171215044122.GK1627@brightrain.aerifal.cx \
--to=dalias@libc.org \
--cc=musl@lists.openwall.com \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
Code repositories for project(s) associated with this public inbox
https://git.vuxu.org/mirror/musl/
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).