[qemu.git] / include / qemu / host-utils.h

/*
 * Utility compute operations used by translated code.
 *
 * Copyright (c) 2007 Thiemo Seufer
 * Copyright (c) 2007 Jocelyn Mayer
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */

#ifndef HOST_UTILS_H
#define HOST_UTILS_H

#include "qemu/bswap.h"

#ifdef CONFIG_INT128
/**
 * mulu64 - unsigned 64 x 64 -> 128-bit multiplication.
 * @plow: out - receives the low 64 bits of the product
 * @phigh: out - receives the high 64 bits of the product
 * @a: first factor
 * @b: second factor
 */
static inline void mulu64(uint64_t *plow, uint64_t *phigh,
                          uint64_t a, uint64_t b)
{
    const __uint128_t product = (__uint128_t)a * b;
    const uint64_t low_half = (uint64_t)product;
    const uint64_t high_half = (uint64_t)(product >> 64);

    /* Store order is low first, then high. */
    *plow = low_half;
    *phigh = high_half;
}

/**
 * muls64 - signed 64 x 64 -> 128-bit multiplication.
 * @plow: out - receives the low 64 bits of the product
 * @phigh: out - receives the high 64 bits of the product
 * @a: first factor
 * @b: second factor
 *
 * Both halves are stored as raw 64-bit patterns of the signed product.
 */
static inline void muls64(uint64_t *plow, uint64_t *phigh,
                          int64_t a, int64_t b)
{
    const __int128_t product = (__int128_t)a * b;
    const uint64_t low_half = (uint64_t)product;
    const uint64_t high_half = (uint64_t)(product >> 64);

    /* Store order is low first, then high. */
    *plow = low_half;
    *phigh = high_half;
}

/*
 * Compute (a * b) / c.  The product of a 64-bit and a 32-bit value needs
 * up to 96 bits, so it is formed in a 128-bit temporary before dividing.
 * The quotient is truncated to 64 bits on return.
 */
static inline uint64_t muldiv64(uint64_t a, uint32_t b, uint32_t c)
{
    const __int128_t product = (__int128_t)a * b;
    const __int128_t quotient = product / c;

    return quotient;
}

/**
 * divu128 - divide an unsigned 128-bit value by a 64-bit divisor.
 * @plow: in - low 64 bits of the dividend; out - low 64 bits of the quotient
 * @phigh: in - high 64 bits of the dividend; out - the remainder
 * @divisor: value to divide by
 *
 * Returns 1 when @divisor is zero (nothing is written) or when the
 * quotient does not fit in 64 bits; returns 0 otherwise.
 */
static inline int divu128(uint64_t *plow, uint64_t *phigh, uint64_t divisor)
{
    __uint128_t numerator, quotient;

    if (divisor == 0) {
        return 1;
    }

    numerator = (__uint128_t)*phigh << 64;
    numerator |= *plow;
    quotient = numerator / divisor;

    *plow = quotient;
    *phigh = numerator % divisor;

    /* Any bit above the low 64 means the quotient overflowed. */
    return (quotient >> 64) != 0;
}

/**
 * divs128 - divide a signed 128-bit value by a signed 64-bit divisor.
 * @plow: in - low 64 bits of the dividend; out - low 64 bits of the quotient
 * @phigh: in - high 64 bits of the dividend; out - the remainder
 * @divisor: value to divide by
 *
 * Returns 1 when @divisor is zero (nothing is written) or when the
 * quotient does not fit in a signed 64-bit integer; returns 0 otherwise.
 */
static inline int divs128(int64_t *plow, int64_t *phigh, int64_t divisor)
{
    __uint128_t raw;
    __int128_t dividend, result;

    if (divisor == 0) {
        return 1;
    }

    /*
     * Assemble the dividend from the raw bit patterns of both halves.
     * The low word must be zero-extended: letting the int64_t promote
     * directly would sign-extend it and overwrite the high word with
     * ones whenever bit 63 of *plow is set.  Doing the shift on an
     * unsigned type also avoids left-shifting a negative value.
     */
    raw = ((__uint128_t)(uint64_t)*phigh << 64) | (uint64_t)*plow;
    dividend = (__int128_t)raw;

    result = dividend / divisor;
    *plow = result;
    *phigh = dividend % divisor;

    /* Overflow if the truncated quotient does not round-trip. */
    return result != *plow;
}
#else
/*
 * Out-of-line versions used when the compiler has no 128-bit integer type.
 * Parameter names follow the inline CONFIG_INT128 variants in this header:
 * the first pointer is the low half, the second the high half.  Callers are
 * shared between both configurations, so the order must be the same.
 * NOTE(review): confirm against the definitions in the corresponding .c file.
 */
void muls64(uint64_t *plow, uint64_t *phigh, int64_t a, int64_t b);
void mulu64(uint64_t *plow, uint64_t *phigh, uint64_t a, uint64_t b);
int divu128(uint64_t *plow, uint64_t *phigh, uint64_t divisor);
int divs128(int64_t *plow, int64_t *phigh, int64_t divisor);

/*
 * Compute (a * b) / c without a 128-bit type.
 *
 * @a is split into 32-bit halves and each is multiplied by @b, giving the
 * (up to 96-bit) product as prod_hi * 2^32 + low 32 bits of prod_lo.  The
 * quotient is then produced 32 bits at a time by schoolbook long division.
 * Each quotient half is truncated to 32 bits.
 */
static inline uint64_t muldiv64(uint64_t a, uint32_t b, uint32_t c)
{
    const uint64_t a_lo = (uint32_t)a;
    const uint64_t a_hi = a >> 32;
    uint64_t prod_lo, prod_hi;
    uint32_t quot_hi, quot_lo;

    prod_lo = a_lo * (uint64_t)b;
    prod_hi = a_hi * (uint64_t)b;
    /* Carry the upper part of the low partial product into the high one. */
    prod_hi += (prod_lo >> 32);

    quot_hi = prod_hi / c;
    /* Bring the remainder down next to the low 32 product bits. */
    quot_lo = (((prod_hi % c) << 32) + (prod_lo & 0xffffffff)) / c;

    return ((uint64_t)quot_hi << 32) | quot_lo;
}
#endif

/**
 * clz32 - number of zero bits above the highest set bit of a 32-bit value.
 * @val: The value to inspect
 *
 * A zero input yields 32.  That case is tested explicitly because the
 * GCC builtin is undefined for zero.
 */
static inline int clz32(uint32_t val)
{
    if (val == 0) {
        return 32;
    }
    return __builtin_clz(val);
}

/**
 * clo32 - number of one bits above the highest clear bit of a 32-bit value.
 * @val: The value to inspect
 *
 * An all-ones input (-1) yields 32.
 */
static inline int clo32(uint32_t val)
{
    /* Leading ones of @val are leading zeros of its complement. */
    const uint32_t flipped = ~val;

    return flipped ? __builtin_clz(flipped) : 32;
}

/**
 * clz64 - number of zero bits above the highest set bit of a 64-bit value.
 * @val: The value to inspect
 *
 * A zero input yields 64.  That case is tested explicitly because the
 * GCC builtin is undefined for zero.
 */
static inline int clz64(uint64_t val)
{
    if (val == 0) {
        return 64;
    }
    return __builtin_clzll(val);
}

/**
 * clo64 - number of one bits above the highest clear bit of a 64-bit value.
 * @val: The value to inspect
 *
 * An all-ones input (-1) yields 64.
 */
static inline int clo64(uint64_t val)
{
    /* Leading ones of @val are leading zeros of its complement. */
    const uint64_t flipped = ~val;

    return flipped ? __builtin_clzll(flipped) : 64;
}

/**
 * ctz32 - number of zero bits below the lowest set bit of a 32-bit value.
 * @val: The value to inspect
 *
 * A zero input yields 32.  That case is tested explicitly because the
 * GCC builtin is undefined for zero.
 */
static inline int ctz32(uint32_t val)
{
    if (val == 0) {
        return 32;
    }
    return __builtin_ctz(val);
}

/**
 * cto32 - number of one bits below the lowest clear bit of a 32-bit value.
 * @val: The value to inspect
 *
 * An all-ones input (-1) yields 32.
 */
static inline int cto32(uint32_t val)
{
    /* Trailing ones of @val are trailing zeros of its complement. */
    const uint32_t flipped = ~val;

    return flipped ? __builtin_ctz(flipped) : 32;
}

/**
 * ctz64 - number of zero bits below the lowest set bit of a 64-bit value.
 * @val: The value to inspect
 *
 * A zero input yields 64.  That case is tested explicitly because the
 * GCC builtin is undefined for zero.
 */
static inline int ctz64(uint64_t val)
{
    if (val == 0) {
        return 64;
    }
    return __builtin_ctzll(val);
}

/**
 * cto64 - number of one bits below the lowest clear bit of a 64-bit value.
 * @val: The value to inspect
 *
 * An all-ones input (-1) yields 64.
 */
static inline int cto64(uint64_t val)
{
    /* Trailing ones of @val are trailing zeros of its complement. */
    const uint64_t flipped = ~val;

    return flipped ? __builtin_ctzll(flipped) : 64;
}

/**
 * clrsb32 - count the redundant sign bits at the top of a 32-bit value.
 * @val: The value to inspect
 *
 * The result is how many bits directly below the sign bit are copies of
 * it.  There are no special cases; the result lies in [0-31].
 */
static inline int clrsb32(uint32_t val)
{
#if !__has_builtin(__builtin_clrsb) && defined(__clang__)
    /*
     * XOR with the arithmetically shifted value marks each position where
     * a bit differs from its upper neighbour.  The leading zeros of that
     * pattern, minus the always-clear top bit, are the redundant sign bits.
     */
    const uint32_t changes = val ^ ((int32_t)val >> 1);

    return (changes ? __builtin_clz(changes) : 32) - 1;
#else
    return __builtin_clrsb(val);
#endif
}

/**
 * clrsb64 - count the redundant sign bits at the top of a 64-bit value.
 * @val: The value to inspect
 *
 * The result is how many bits directly below the sign bit are copies of
 * it.  There are no special cases; the result lies in [0-63].
 */
static inline int clrsb64(uint64_t val)
{
#if !__has_builtin(__builtin_clrsbll) && defined(__clang__)
    /*
     * XOR with the arithmetically shifted value marks each position where
     * a bit differs from its upper neighbour.  The leading zeros of that
     * pattern, minus the always-clear top bit, are the redundant sign bits.
     */
    const uint64_t changes = val ^ ((int64_t)val >> 1);

    return (changes ? __builtin_clzll(changes) : 64) - 1;
#else
    return __builtin_clrsbll(val);
#endif
}

/**
 * ctpop8 - number of bits set to one in an 8-bit value.
 * @val: The value to inspect
 */
static inline int ctpop8(uint8_t val)
{
    const unsigned int widened = val;

    return __builtin_popcount(widened);
}

/**
 * ctpop16 - number of bits set to one in a 16-bit value.
 * @val: The value to inspect
 */
static inline int ctpop16(uint16_t val)
{
    const unsigned int widened = val;

    return __builtin_popcount(widened);
}

/**
 * ctpop32 - number of bits set to one in a 32-bit value.
 * @val: The value to inspect
 */
static inline int ctpop32(uint32_t val)
{
    const int ones = __builtin_popcount(val);

    return ones;
}

/**
 * ctpop64 - number of bits set to one in a 64-bit value.
 * @val: The value to inspect
 */
static inline int ctpop64(uint64_t val)
{
    const int ones = __builtin_popcountll(val);

    return ones;
}

/**
 * revbit8 - mirror the bit order of an 8-bit value.
 * @x: The value to reverse.
 *
 * Bit 0 trades places with bit 7, bit 1 with bit 6, and so on.
 */
static inline uint8_t revbit8(uint8_t x)
{
    /* Exchange the two nibbles. */
    x = (uint8_t)(((x & 0xf0) >> 4) | ((x & 0x0f) << 4));
    /* Exchange the two bit pairs inside each nibble. */
    x = (uint8_t)(((x & 0xcc) >> 2) | ((x & 0x33) << 2));
    /* Exchange the two bits inside each pair. */
    x = (uint8_t)(((x & 0xaa) >> 1) | ((x & 0x55) << 1));
    return x;
}

/**
 * revbit16 - mirror the bit order of a 16-bit value.
 * @x: The value to reverse.
 *
 * Bytes are put in place with bswap16(); the bits inside every byte are
 * then reversed with three mask-and-shift exchanges.
 */
static inline uint16_t revbit16(uint16_t x)
{
    /* Put each byte in its final position. */
    x = bswap16(x);
    /* Exchange the two nibbles of every byte. */
    x = (uint16_t)(((x & 0xf0f0) >> 4) | ((x & 0x0f0f) << 4));
    /* Exchange the two bit pairs inside each nibble. */
    x = (uint16_t)(((x & 0xcccc) >> 2) | ((x & 0x3333) << 2));
    /* Exchange the two bits inside each pair. */
    x = (uint16_t)(((x & 0xaaaa) >> 1) | ((x & 0x5555) << 1));
    return x;
}

/**
 * revbit32 - mirror the bit order of a 32-bit value.
 * @x: The value to reverse.
 *
 * Bytes are put in place with bswap32(); the bits inside every byte are
 * then reversed with three mask-and-shift exchanges.
 */
static inline uint32_t revbit32(uint32_t x)
{
    /* Put each byte in its final position. */
    x = bswap32(x);
    /* Exchange the two nibbles of every byte. */
    x = ((x & 0xf0f0f0f0u) >> 4) | ((x & 0x0f0f0f0fu) << 4);
    /* Exchange the two bit pairs inside each nibble. */
    x = ((x & 0xccccccccu) >> 2) | ((x & 0x33333333u) << 2);
    /* Exchange the two bits inside each pair. */
    x = ((x & 0xaaaaaaaau) >> 1) | ((x & 0x55555555u) << 1);
    return x;
}

/**
 * revbit64 - mirror the bit order of a 64-bit value.
 * @x: The value to reverse.
 *
 * Bytes are put in place with bswap64(); the bits inside every byte are
 * then reversed with three mask-and-shift exchanges.
 */
static inline uint64_t revbit64(uint64_t x)
{
    /* Put each byte in its final position. */
    x = bswap64(x);
    /* Exchange the two nibbles of every byte. */
    x = ((x & 0xf0f0f0f0f0f0f0f0ull) >> 4) | ((x & 0x0f0f0f0f0f0f0f0full) << 4);
    /* Exchange the two bit pairs inside each nibble. */
    x = ((x & 0xccccccccccccccccull) >> 2) | ((x & 0x3333333333333333ull) << 2);
    /* Exchange the two bits inside each pair. */
    x = ((x & 0xaaaaaaaaaaaaaaaaull) >> 1) | ((x & 0x5555555555555555ull) << 1);
    return x;
}

/*
 * Host type specific sizes of these routines.
 *
 * Each "l"-suffixed name aliases the 32-bit or 64-bit helper that matches
 * the width of the host's unsigned long, chosen by comparing ULONG_MAX
 * with UINT32_MAX and then UINT64_MAX.  Any other width is a build error.
 */

#if ULONG_MAX == UINT32_MAX
# define clzl   clz32
# define ctzl   ctz32
# define clol   clo32
# define ctol   cto32
# define ctpopl ctpop32
# define revbitl revbit32
#elif ULONG_MAX == UINT64_MAX
# define clzl   clz64
# define ctzl   ctz64
# define clol   clo64
# define ctol   cto64
# define ctpopl ctpop64
# define revbitl revbit64
#else
# error Unknown sizeof long
#endif

/**
 * is_power_of_2 - test whether exactly one bit of a value is set.
 * @value: The value to test
 *
 * Returns true for 1, 2, 4, ... and false for zero and everything else.
 */
static inline bool is_power_of_2(uint64_t value)
{
    /* value & (value - 1) clears the lowest set bit. */
    return value != 0 && (value & (value - 1)) == 0;
}

/**
 * Return the largest power of two that does not exceed @value,
 * or zero when @value is zero.
 */
static inline uint64_t pow2floor(uint64_t value)
{
    int top_bit;

    if (value == 0) {
        /* No set bit to keep; also avoids the builtin's undefined case. */
        return 0;
    }

    /* Index of the highest set bit, counted from bit 0. */
    top_bit = 63 - __builtin_clzll(value);
    return UINT64_C(1) << top_bit;
}

/*
 * Return the smallest power of two that is not less than @value,
 * reduced modulo 2^64.
 * Beware: the result is *zero* for @value > 2^63, and 1 for @value == 0.
 */
static inline uint64_t pow2ceil(uint64_t value)
{
    const uint64_t below = value - 1;
    /* Leading zeros of @value - 1; 64 when @value is 1. */
    const int lead = below ? __builtin_clzll(below) : 64;

    if (lead == 0) {
        /*
         * Bit 63 of @value - 1 is set, so @value - 1 >= 2^63.  That
         * happens only for @value == 0 (wrap-around) or @value > 2^63.
         * The former gives 1, the latter gives 0.
         */
        return value == 0;
    }
    return UINT64_C(1) << (64 - lead);
}

/**
 * pow2roundup32 - next power of two strictly above a 32-bit value.
 * @x: The value to round
 *
 * Every bit below the highest set bit is filled in and one is added, so
 * the result is always greater than @x: an exact power of two is doubled
 * and zero gives 1.  Inputs of 2^31 or more wrap around to zero.
 */
static inline uint32_t pow2roundup32(uint32_t x)
{
    unsigned int dist;

    /* Smear the top set bit downwards: distances 1, 2, 4, 8, 16. */
    for (dist = 1; dist < 32; dist <<= 1) {
        x |= x >> dist;
    }
    return x + 1;
}

/**
 * urshift - 128-bit Unsigned Right Shift.
 * @plow: in/out - lower 64-bit integer.
 * @phigh: in/out - higher 64-bit integer.
 * @shift: in - number of bits to shift, between 0 and 127.
 *
 * The result is zero-extended and stored back in plow/phigh, which are
 * input/output variables. Shift counts outside the range are reduced
 * modulo 128, so the caller is responsible for verifying/asserting both
 * the shift range and the plow/phigh pointers.
 */
void urshift(uint64_t *plow, uint64_t *phigh, int32_t shift);

/**
 * ulshift - 128-bit Unsigned Left Shift.
 * @plow: in/out - lower 64-bit integer.
 * @phigh: in/out - higher 64-bit integer.
 * @shift: in - number of bits to shift, between 0 and 127.
 * @overflow: out - true if any 1-bit is shifted out.
 *
 * The result is zero-extended and stored back in plow/phigh, which are
 * input/output variables. Shift counts outside the range are reduced
 * modulo 128, so the caller is responsible for verifying/asserting both
 * the shift range and the plow/phigh pointers.
 */
void ulshift(uint64_t *plow, uint64_t *phigh, int32_t shift, bool *overflow);

#endif
Commit	Line	Data
05f778c8 TS	1	/*
	2	* Utility compute operations used by translated code.
	3	*
	4	* Copyright (c) 2007 Thiemo Seufer
	5	* Copyright (c) 2007 Jocelyn Mayer
	6	*
	7	* Permission is hereby granted, free of charge, to any person obtaining a copy
	8	* of this software and associated documentation files (the "Software"), to deal
	9	* in the Software without restriction, including without limitation the rights
	10	* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
	11	* copies of the Software, and to permit persons to whom the Software is
	12	* furnished to do so, subject to the following conditions:
	13	*
	14	* The above copyright notice and this permission notice shall be included in
	15	* all copies or substantial portions of the Software.
	16	*
	17	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
	18	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
	19	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
	20	* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
	21	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
	22	* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
	23	* THE SOFTWARE.
	24	*/
175de524	25
cb9c377f	26	#ifndef HOST_UTILS_H
175de524	27	#define HOST_UTILS_H
05f778c8	28
652a4b7e	29	#include "qemu/bswap.h"
cebdff77	30
f540166b	31	#ifdef CONFIG_INT128
facd2857 BS	32	static inline void mulu64(uint64_t plow, uint64_t phigh,
facd2857 BS	33	uint64_t a, uint64_t b)
7a51ad82	34	{
f540166b RH	35	__uint128_t r = (__uint128_t)a * b;
	36	*plow = r;
	37	*phigh = r >> 64;
7a51ad82	38	}
f540166b	39
facd2857 BS	40	static inline void muls64(uint64_t plow, uint64_t phigh,
facd2857 BS	41	int64_t a, int64_t b)
7a51ad82	42	{
f540166b RH	43	__int128_t r = (__int128_t)a * b;
	44	*plow = r;
	45	*phigh = r >> 64;
7a51ad82	46	}
98d1eb27	47
49caffe0 PM	48	/* compute with 96 bit intermediate result: (ab)/c /
	49	static inline uint64_t muldiv64(uint64_t a, uint32_t b, uint32_t c)
	50	{
	51	return (__int128_t)a * b / c;
	52	}
	53
98d1eb27 TM	54	static inline int divu128(uint64_t plow, uint64_t phigh, uint64_t divisor)
	55	{
	56	if (divisor == 0) {
	57	return 1;
	58	} else {
	59	__uint128_t dividend = ((__uint128_t)phigh << 64) \| plow;
	60	__uint128_t result = dividend / divisor;
	61	*plow = result;
	62	*phigh = dividend % divisor;
	63	return result > UINT64_MAX;
	64	}
	65	}
e44259b6 TM	66
	67	static inline int divs128(int64_t plow, int64_t phigh, int64_t divisor)
	68	{
	69	if (divisor == 0) {
	70	return 1;
	71	} else {
	72	__int128_t dividend = ((__int128_t)phigh << 64) \| plow;
	73	__int128_t result = dividend / divisor;
	74	*plow = result;
	75	*phigh = dividend % divisor;
	76	return result != *plow;
	77	}
	78	}
7a51ad82	79	#else
05e1d830	80	void muls64(uint64_t phigh, uint64_t plow, int64_t a, int64_t b);
7a51ad82	81	void mulu64(uint64_t phigh, uint64_t plow, uint64_t a, uint64_t b);
98d1eb27	82	int divu128(uint64_t plow, uint64_t phigh, uint64_t divisor);
e44259b6	83	int divs128(int64_t plow, int64_t phigh, int64_t divisor);
49caffe0 PM	84
	85	static inline uint64_t muldiv64(uint64_t a, uint32_t b, uint32_t c)
	86	{
	87	union {
	88	uint64_t ll;
	89	struct {
	90	#ifdef HOST_WORDS_BIGENDIAN
	91	uint32_t high, low;
	92	#else
	93	uint32_t low, high;
	94	#endif
	95	} l;
	96	} u, res;
	97	uint64_t rl, rh;
	98
	99	u.ll = a;
	100	rl = (uint64_t)u.l.low * (uint64_t)b;
	101	rh = (uint64_t)u.l.high * (uint64_t)b;
	102	rh += (rl >> 32);
	103	res.l.high = rh / c;
	104	res.l.low = (((rh % c) << 32) + (rl & 0xffffffff)) / c;
	105	return res.ll;
	106	}
7a51ad82 JM	107	#endif
7a51ad82 JM	108
72d81155 RH	109	/**
	110	* clz32 - count leading zeros in a 32-bit value.
	111	* @val: The value to search
	112	*
	113	* Returns 32 if the value is zero. Note that the GCC builtin is
	114	* undefined if the value is zero.
	115	*/
facd2857	116	static inline int clz32(uint32_t val)
05f778c8	117	{
72d81155	118	return val ? __builtin_clz(val) : 32;
05f778c8 TS	119	}
05f778c8 TS	120
72d81155 RH	121	/**
	122	* clo32 - count leading ones in a 32-bit value.
	123	* @val: The value to search
	124	*
	125	* Returns 32 if the value is -1.
	126	*/
facd2857	127	static inline int clo32(uint32_t val)
05f778c8 TS	128	{
	129	return clz32(~val);
	130	}
	131
72d81155 RH	132	/**
	133	* clz64 - count leading zeros in a 64-bit value.
	134	* @val: The value to search
	135	*
	136	* Returns 64 if the value is zero. Note that the GCC builtin is
	137	* undefined if the value is zero.
	138	*/
facd2857	139	static inline int clz64(uint64_t val)
05f778c8	140	{
72d81155	141	return val ? __builtin_clzll(val) : 64;
05f778c8 TS	142	}
05f778c8 TS	143
72d81155 RH	144	/**
	145	* clo64 - count leading ones in a 64-bit value.
	146	* @val: The value to search
	147	*
	148	* Returns 64 if the value is -1.
	149	*/
facd2857	150	static inline int clo64(uint64_t val)
05f778c8 TS	151	{
	152	return clz64(~val);
	153	}
b9ef45ff	154
72d81155 RH	155	/**
	156	* ctz32 - count trailing zeros in a 32-bit value.
	157	* @val: The value to search
	158	*
	159	* Returns 32 if the value is zero. Note that the GCC builtin is
	160	* undefined if the value is zero.
	161	*/
facd2857	162	static inline int ctz32(uint32_t val)
b9ef45ff	163	{
72d81155	164	return val ? __builtin_ctz(val) : 32;
c8906845 AZ	165	}
c8906845 AZ	166
72d81155 RH	167	/**
	168	* cto32 - count trailing ones in a 32-bit value.
	169	* @val: The value to search
	170	*
	171	* Returns 32 if the value is -1.
	172	*/
facd2857	173	static inline int cto32(uint32_t val)
c8906845	174	{
b9ef45ff JM	175	return ctz32(~val);
	176	}
	177
72d81155 RH	178	/**
	179	* ctz64 - count trailing zeros in a 64-bit value.
	180	* @val: The value to search
	181	*
	182	* Returns 64 if the value is zero. Note that the GCC builtin is
	183	* undefined if the value is zero.
	184	*/
facd2857	185	static inline int ctz64(uint64_t val)
b9ef45ff	186	{
72d81155	187	return val ? __builtin_ctzll(val) : 64;
b9ef45ff JM	188	}
b9ef45ff JM	189
72d81155	190	/**
1c884abe	191	* cto64 - count trailing ones in a 64-bit value.
72d81155 RH	192	* @val: The value to search
	193	*
	194	* Returns 64 if the value is -1.
	195	*/
facd2857	196	static inline int cto64(uint64_t val)
b9ef45ff JM	197	{
	198	return ctz64(~val);
	199	}
	200
afd3fe4c CF	201	/**
	202	* clrsb32 - count leading redundant sign bits in a 32-bit value.
	203	* @val: The value to search
	204	*
	205	* Returns the number of bits following the sign bit that are equal to it.
	206	* No special cases; output range is [0-31].
	207	*/
	208	static inline int clrsb32(uint32_t val)
	209	{
f773b423	210	#if __has_builtin(__builtin_clrsb) \|\| !defined(__clang__)
afd3fe4c CF	211	return __builtin_clrsb(val);
	212	#else
	213	return clz32(val ^ ((int32_t)val >> 1)) - 1;
	214	#endif
	215	}
	216
	217	/**
	218	* clrsb64 - count leading redundant sign bits in a 64-bit value.
	219	* @val: The value to search
	220	*
	221	* Returns the number of bits following the sign bit that are equal to it.
	222	* No special cases; output range is [0-63].
	223	*/
	224	static inline int clrsb64(uint64_t val)
	225	{
f773b423	226	#if __has_builtin(__builtin_clrsbll) \|\| !defined(__clang__)
afd3fe4c CF	227	return __builtin_clrsbll(val);
	228	#else
	229	return clz64(val ^ ((int64_t)val >> 1)) - 1;
	230	#endif
	231	}
	232
72d81155 RH	233	/**
	234	* ctpop8 - count the population of one bits in an 8-bit value.
	235	* @val: The value to search
	236	*/
facd2857	237	static inline int ctpop8(uint8_t val)
b9ef45ff	238	{
72d81155	239	return __builtin_popcount(val);
b9ef45ff JM	240	}
b9ef45ff JM	241
72d81155 RH	242	/**
	243	* ctpop16 - count the population of one bits in a 16-bit value.
	244	* @val: The value to search
	245	*/
facd2857	246	static inline int ctpop16(uint16_t val)
b9ef45ff	247	{
72d81155	248	return __builtin_popcount(val);
b9ef45ff JM	249	}
b9ef45ff JM	250
72d81155 RH	251	/**
	252	* ctpop32 - count the population of one bits in a 32-bit value.
	253	* @val: The value to search
	254	*/
facd2857	255	static inline int ctpop32(uint32_t val)
b9ef45ff	256	{
7d019980	257	return __builtin_popcount(val);
b9ef45ff JM	258	}
b9ef45ff JM	259
72d81155 RH	260	/**
	261	* ctpop64 - count the population of one bits in a 64-bit value.
	262	* @val: The value to search
	263	*/
facd2857	264	static inline int ctpop64(uint64_t val)
b9ef45ff	265	{
7d019980	266	return __builtin_popcountll(val);
3800af9e	267	}
cb9c377f	268
652a4b7e RH	269	/**
	270	* revbit8 - reverse the bits in an 8-bit value.
	271	* @x: The value to modify.
	272	*/
	273	static inline uint8_t revbit8(uint8_t x)
	274	{
	275	/* Assign the correct nibble position. */
	276	x = ((x & 0xf0) >> 4)
	277	\| ((x & 0x0f) << 4);
	278	/* Assign the correct bit position. */
	279	x = ((x & 0x88) >> 3)
	280	\| ((x & 0x44) >> 1)
	281	\| ((x & 0x22) << 1)
	282	\| ((x & 0x11) << 3);
	283	return x;
	284	}
	285
	286	/**
	287	* revbit16 - reverse the bits in a 16-bit value.
	288	* @x: The value to modify.
	289	*/
	290	static inline uint16_t revbit16(uint16_t x)
	291	{
	292	/* Assign the correct byte position. */
	293	x = bswap16(x);
	294	/* Assign the correct nibble position. */
	295	x = ((x & 0xf0f0) >> 4)
	296	\| ((x & 0x0f0f) << 4);
	297	/* Assign the correct bit position. */
	298	x = ((x & 0x8888) >> 3)
	299	\| ((x & 0x4444) >> 1)
	300	\| ((x & 0x2222) << 1)
	301	\| ((x & 0x1111) << 3);
	302	return x;
	303	}
	304
	305	/**
	306	* revbit32 - reverse the bits in a 32-bit value.
	307	* @x: The value to modify.
	308	*/
	309	static inline uint32_t revbit32(uint32_t x)
	310	{
	311	/* Assign the correct byte position. */
	312	x = bswap32(x);
	313	/* Assign the correct nibble position. */
	314	x = ((x & 0xf0f0f0f0u) >> 4)
	315	\| ((x & 0x0f0f0f0fu) << 4);
	316	/* Assign the correct bit position. */
	317	x = ((x & 0x88888888u) >> 3)
	318	\| ((x & 0x44444444u) >> 1)
	319	\| ((x & 0x22222222u) << 1)
	320	\| ((x & 0x11111111u) << 3);
	321	return x;
	322	}
	323
	324	/**
	325	* revbit64 - reverse the bits in a 64-bit value.
	326	* @x: The value to modify.
	327	*/
	328	static inline uint64_t revbit64(uint64_t x)
	329	{
	330	/* Assign the correct byte position. */
	331	x = bswap64(x);
	332	/* Assign the correct nibble position. */
333	x = ((x & 0xf0f0f0f0f0f0f0f0ull) >> 4)
334	\| ((x & 0x0f0f0f0f0f0f0f0full) << 4);
335	/* Assign the correct bit position. */
336	x = ((x & 0x8888888888888888ull) >> 3)
337	\| ((x & 0x4444444444444444ull) >> 1)
338	\| ((x & 0x2222222222222222ull) << 1)
339	\| ((x & 0x1111111111111111ull) << 3);
340	return x;
341	}
342
01654373 RH	343	/* Host type specific sizes of these routines. */
	344
	345	#if ULONG_MAX == UINT32_MAX
	346	# define clzl clz32
	347	# define ctzl ctz32
	348	# define clol clo32
	349	# define ctol cto32
	350	# define ctpopl ctpop32
652a4b7e	351	# define revbitl revbit32
01654373 RH	352	#elif ULONG_MAX == UINT64_MAX
	353	# define clzl clz64
	354	# define ctzl ctz64
	355	# define clol clo64
	356	# define ctol cto64
	357	# define ctpopl ctpop64
652a4b7e	358	# define revbitl revbit64
01654373 RH	359	#else
	360	# error Unknown sizeof long
	361	#endif
	362
8f1ed5f5 PM	363	static inline bool is_power_of_2(uint64_t value)
	364	{
	365	if (!value) {
e52eeb46	366	return false;
8f1ed5f5 PM	367	}
	368
	369	return !(value & (value - 1));
	370	}
	371
43c64a09 MA	372	/**
	373	* Return @value rounded down to the nearest power of two or zero.
	374	*/
	375	static inline uint64_t pow2floor(uint64_t value)
8f1ed5f5	376	{
43c64a09 MA	377	if (!value) {
	378	/* Avoid undefined shift by 64 */
	379	return 0;
8f1ed5f5	380	}
43c64a09	381	return 0x8000000000000000ull >> clz64(value);
8f1ed5f5 PM	382	}
8f1ed5f5 PM	383
362aaf14 MA	384	/*
	385	* Return @value rounded up to the nearest power of two modulo 2^64.
	386	* This is zero for @value > 2^63, so be careful.
	387	*/
8f1ed5f5 PM	388	static inline uint64_t pow2ceil(uint64_t value)
8f1ed5f5 PM	389	{
362aaf14 MA	390	int n = clz64(value - 1);
	391
	392	if (!n) {
	393	/*
	394	* @value - 1 has no leading zeroes, thus @value - 1 >= 2^63
	395	* Therefore, either @value == 0 or @value > 2^63.
	396	* If it's 0, return 1, else return 0.
	397	*/
	398	return !value;
8f1ed5f5	399	}
362aaf14	400	return 0x8000000000000000ull >> (n - 1);
8f1ed5f5 PM	401	}
8f1ed5f5 PM	402
37e626ce YS	403	static inline uint32_t pow2roundup32(uint32_t x)
	404	{
	405	x \|= (x >> 1);
	406	x \|= (x >> 2);
	407	x \|= (x >> 4);
	408	x \|= (x >> 8);
	409	x \|= (x >> 16);
	410	return x + 1;
	411	}
	412
f539fbe3 JRZ	413	/**
	414	* urshift - 128-bit Unsigned Right Shift.
	415	* @plow: in/out - lower 64-bit integer.
	416	* @phigh: in/out - higher 64-bit integer.
	417	* @shift: in - bytes to shift, between 0 and 127.
	418	*
	419	* Result is zero-extended and stored in plow/phigh, which are
	420	* input/output variables. Shift values outside the range will
	421	* be mod to 128. In other words, the caller is responsible to
	422	* verify/assert both the shift range and plow/phigh pointers.
	423	*/
	424	void urshift(uint64_t plow, uint64_t phigh, int32_t shift);
	425
	426	/**
	427	* ulshift - 128-bit Unsigned Left Shift.
	428	* @plow: in/out - lower 64-bit integer.
	429	* @phigh: in/out - higher 64-bit integer.
	430	* @shift: in - bytes to shift, between 0 and 127.
	431	* @overflow: out - true if any 1-bit is shifted out.
	432	*
	433	* Result is zero-extended and stored in plow/phigh, which are
	434	* input/output variables. Shift values outside the range will
	435	* be mod to 128. In other words, the caller is responsible to
	436	* verify/assert both the shift range and plow/phigh pointers.
	437	*/
	438	void ulshift(uint64_t plow, uint64_t phigh, int32_t shift, bool *overflow);
	439
cb9c377f	440	#endif