1
0
mirror of https://github.com/RIOT-OS/RIOT.git synced 2025-01-18 12:52:44 +01:00
RIOT/core/include/bitarithm.h
Benjamin Valentin 14144030fa core/bitarithm: use __builtin_clz() for bitarithm_msb()
The `clz` instruction pretty much implements getting the most significant bit
in hardware, so use it instead of the software implementation.

This results in both a reduction in code size and a speedup:

master:

  text    data     bss     dec     hex filename
 14816     136    2424   17376    43e0 tests/bitarithm_timings/bin/same54-xpro/tests_bitarithm_timings.elf

 + bitarithm_msb: 3529411 iterations per second

this patch:

  text    data     bss     dec     hex filename
 14768     136    2424   17328    43b0 tests/bitarithm_timings/bin/same54-xpro/tests_bitarithm_timings.elf

 + bitarithm_msb: 9230761 iterations per second
2020-08-04 17:50:09 +02:00

237 lines
5.9 KiB
C

/*
* Copyright (C) 2017 Kaspar Schleiser <kaspar@schleiser.de>
* 2014 Freie Universität Berlin
*
* This file is subject to the terms and conditions of the GNU Lesser
* General Public License v2.1. See the file LICENSE in the top level
* directory for more details.
*/
/**
* @ingroup core_util
* @{
*
* @file
* @brief Helper functions for bit arithmetic
*
* @author Kaspar Schleiser <kaspar@schleiser.de>
* @author Martine Lenders <mlenders@inf.fu-berlin.de>
*/
#ifndef BITARITHM_H
#define BITARITHM_H
#include <stdint.h>
#include "cpu_conf.h"
#ifdef __cplusplus
extern "C" {
#endif
/**
 * @def SETBIT
 * @brief Sets a bitmask for a bitfield
 *
 * Expands to a single, fully parenthesized assignment expression, so the
 * macro can safely be used as a statement or inside a larger expression.
 * @p val is modified in place and must therefore be a modifiable lvalue.
 *
 * @param[in] val The bitfield
 * @param[in] bit Specifies the bits to be set
 *
 * @return The modified bitfield
 */
#define SETBIT(val, bit) ((val) |= (bit))
/**
 * @def CLRBIT
 * @brief Clears bitmask for a bitfield
 *
 * Expands to a single, fully parenthesized assignment expression, so the
 * macro can safely be used as a statement or inside a larger expression.
 * @p val is modified in place and must therefore be a modifiable lvalue.
 *
 * @param[in] val The bitfield
 * @param[in] bit Specifies the bits to be cleared
 *
 * @return The modified bitfield
 */
#define CLRBIT(val, bit) ((val) &= ~(bit))
/**
 * @name Single Bit Defines
 *
 * One mask per bit position, BIT0 (least significant) up to BIT31.
 *
 * The definitions are split into two groups that are each guarded by a single
 * `#ifndef` (on BIT0 and on BIT16 respectively): if the first name of a group
 * is already defined when this header is included, the whole group is skipped.
 * NOTE(review): presumably this avoids clashes with vendor headers that
 * provide the same names - confirm against the affected platforms.
 *
 * The values are unsuffixed hexadecimal constants, so their integer type is
 * chosen by the compiler according to the C rules for such constants and may
 * differ between the individual masks and between platforms.
 * @{
 */
/* Bits 0..15: skipped as a whole if BIT0 is already defined */
#ifndef BIT0
#define BIT0 0x00000001
#define BIT1 0x00000002
#define BIT2 0x00000004
#define BIT3 0x00000008
#define BIT4 0x00000010
#define BIT5 0x00000020
#define BIT6 0x00000040
#define BIT7 0x00000080
#define BIT8 0x00000100
#define BIT9 0x00000200
#define BIT10 0x00000400
#define BIT11 0x00000800
#define BIT12 0x00001000
#define BIT13 0x00002000
#define BIT14 0x00004000
#define BIT15 0x00008000
#endif
/* Bits 16..31: skipped as a whole if BIT16 is already defined */
#ifndef BIT16
#define BIT16 0x00010000
#define BIT17 0x00020000
#define BIT18 0x00040000
#define BIT19 0x00080000
#define BIT20 0x00100000
#define BIT21 0x00200000
#define BIT22 0x00400000
#define BIT23 0x00800000
#define BIT24 0x01000000
#define BIT25 0x02000000
#define BIT26 0x04000000
#define BIT27 0x08000000
#define BIT28 0x10000000
#define BIT29 0x20000000
#define BIT30 0x40000000
#define BIT31 0x80000000
#endif
/** @} */
/**
 * @brief   1 if `int` is 32 bits wide, 0 otherwise
 *
 * The check compares the compiler-provided `__INT_MAX__` against 2^31 - 1, so
 * it reflects the width of `int`, not the width of pointers or registers.
 * This header uses it to select between implementation variants of
 * bitarithm_bits_set_u32() and bitarithm_msb().
 */
#define ARCH_32_BIT (__INT_MAX__ == 2147483647)
/**
 * @brief   Returns the number of the highest '1' bit in a value
 *
 * Depending on the configuration this is implemented with `__builtin_clz()`
 * (if `BITARITHM_HAS_CLZ` is defined), with
 * bitarith_msb_32bit_no_native_clz() (if `ARCH_32_BIT` is true), or with a
 * plain shift loop.
 *
 * @note    Pass a non-zero @p v: the result of `__builtin_clz()` is undefined
 *          for 0. The shift-loop variant returns 0 for an input of 0.
 *
 * @param[in]   v   Input value
 * @return      Bit Number, counted from 0 for the least significant bit
 *
 * Source of the shift-loop variant:
 * http://graphics.stanford.edu/~seander/bithacks.html#IntegerLogObvious
 */
static inline unsigned bitarithm_msb(unsigned v);
/**
 * @brief   Returns the number of the lowest '1' bit in a value
 *
 * The implementation is selected at compile time: `__builtin_ffs()` if
 * `BITARITHM_LSB_BUILTIN` is defined, a De Bruijn lookup table if
 * `BITARITHM_LSB_LOOKUP` is defined, and a plain shift loop otherwise.
 *
 * @param[in]   v   Input value - must be unequal to '0'. With the shift-loop
 *                  implementation a zero input produces an infinite loop;
 *                  the other implementations return a value that does not
 *                  identify any set bit.
 * @return      Bit Number, counted from 0 for the least significant bit
 */
static inline unsigned bitarithm_lsb(unsigned v);
/**
 * @brief   Returns the number of bits set in a value
 *
 * Only declared in this header; the definition is not part of it.
 *
 * @param[in]   v   Input value with platform-dependent word size
 *                  (`unsigned`)
 * @return      Number of set bits
 */
unsigned bitarithm_bits_set(unsigned v);
/**
 * @brief   Counts the set bits of a 32 bit wide value
 *
 * Where `ARCH_32_BIT` is true the call is forwarded inline to
 * bitarithm_bits_set(); otherwise only the prototype is provided here and the
 * function is defined outside this header.
 *
 * @param[in]   v   Input value with 32 bit size
 * @return      Number of set bits
 */
#if ARCH_32_BIT
static inline uint8_t bitarithm_bits_set_u32(uint32_t v)
{
    const unsigned count = bitarithm_bits_set(v);

    return count;
}
#else
uint8_t bitarithm_bits_set_u32(uint32_t v);
#endif
/**
 * @brief   Returns the number of the highest '1' bit in a value
 *
 * Internal software implementation for 32 bit platforms. bitarithm_msb()
 * calls it when `BITARITHM_HAS_CLZ` is not defined and `ARCH_32_BIT` is true.
 * Application code should use bitarithm_msb() instead.
 *
 * @see bitarithm_msb
 *
 * @param[in]   v   Input value
 * @return      Bit Number
 */
unsigned bitarith_msb_32bit_no_native_clz(unsigned v);
/* implementations */
static inline unsigned bitarithm_msb(unsigned v)
{
#if defined(BITARITHM_HAS_CLZ)
    /* index of the top bit minus the number of leading zeros */
    return (8 * sizeof(v) - 1) - __builtin_clz(v);
#elif ARCH_32_BIT
    /* 32 bit platform without a usable clz: out-of-line software version */
    return bitarith_msb_32bit_no_native_clz(v);
#else
    /* generic fallback: count how many right shifts empty the value */
    unsigned pos = 0;

    for (v >>= 1; v != 0; v >>= 1) {
        pos++;
    }
    return pos;
#endif
}
static inline unsigned bitarithm_lsb(unsigned v)
{
#if defined(BITARITHM_LSB_BUILTIN)
    /* ffs() counts bit positions starting at 1 */
    const int one_based = __builtin_ffs(v);

    return one_based - 1;
#elif defined(BITARITHM_LSB_LOOKUP)
    /* Source: http://graphics.stanford.edu/~seander/bithacks.html#ZerosOnRightMultLookup */
    extern const uint8_t MultiplyDeBruijnBitPosition[32];
    /* isolate the lowest set bit and hash it into a 5 bit table index */
    const uint32_t hashed = (uint32_t)((v & -v) * 0x077CB531U);

    return MultiplyDeBruijnBitPosition[hashed >> 27];
#else
    /* Source: http://graphics.stanford.edu/~seander/bithacks.html#IntegerLogObvious */
    unsigned pos;

    /* shift right until the lowest set bit arrives at position 0 */
    for (pos = 0; (v & 0x01) == 0; pos++) {
        v >>= 1;
    }
    return pos;
#endif
}
/**
 * @brief   Used for iterating over the bits in @p state.
 *          Returns the index of a set bit in @p state, returns @p state with that bit cleared.
 *
 * @warning This is a low-level helper function, arguments are not checked.
 *          It is intended to iterate over a bit map until all bits are cleared.
 *          Whether it starts with the highest or lowest bit will depend on what is fastest
 *          on the given hardware.
 *
 * @warning @p state must not be zero.
 *
 * Three variants exist, selected at compile time:
 *  - `BITARITHM_HAS_CLZ`: reports the highest set bit via `__builtin_clz()`.
 *  - `BITARITHM_LSB_LOOKUP`: reports the lowest set bit via a De Bruijn
 *    lookup table.
 *  - otherwise: shifts @p state right until a set bit reaches position 0 and
 *    adds the number of shifts to @p index. The returned state is therefore
 *    shifted relative to the original bit map, and @p index carries the
 *    running position from one call to the next.
 *
 * @param[in]  state    Bit Map with at least one bit set
 * @param[out] index    Index of the first set bit. Must be initialized with 0 before the
 *                      first call to this function, must not be modified between subsequent
 *                      calls.
 *
 * @return      new state value - must be treated as opaque value
 *
 */
static inline unsigned bitarithm_test_and_clear(unsigned state, uint8_t *index)
{
#if defined(BITARITHM_HAS_CLZ)
    *index = 8 * sizeof(state) - __builtin_clz(state) - 1;
    /* unsigned one: shifting a signed 1 into the sign bit is undefined */
    return state & ~(1U << *index);
#elif defined(BITARITHM_LSB_LOOKUP)
    /* Source: http://graphics.stanford.edu/~seander/bithacks.html#ZerosOnRightMultLookup */
    extern const uint8_t MultiplyDeBruijnBitPosition[32];
    /* isolate the lowest set bit */
    uint32_t least_bit = state & -state;
    *index = MultiplyDeBruijnBitPosition[(least_bit * 0x077CB531U) >> 27];
    return state & ~least_bit;
#else
    /* advance to the next set bit, tracking its absolute position in *index */
    while ((state & 1) == 0) {
        *index += 1;
        state >>= 1;
    }
    /* clear the bit just reported; the state stays shifted for the next call */
    return state & ~1U;
#endif
}
#ifdef __cplusplus
}
#endif
#endif /* BITARITHM_H */
/** @} */