Blame jemalloc/include/jemalloc/internal/prng.h

Packit 345191
#ifndef JEMALLOC_INTERNAL_PRNG_H
Packit 345191
#define JEMALLOC_INTERNAL_PRNG_H
Packit 345191
Packit 345191
#include "jemalloc/internal/atomic.h"
Packit 345191
#include "jemalloc/internal/bit_util.h"
Packit 345191
Packit 345191
/*
Packit 345191
 * Simple linear congruential pseudo-random number generator:
Packit 345191
 *
Packit 345191
 *   prng(x) = (a*x + c) % m
Packit 345191
 *
Packit 345191
 * where the following constants ensure maximal period:
Packit 345191
 *
Packit 345191
 *   a == Odd number (relatively prime to 2^n), and (a-1) is a multiple of 4.
Packit 345191
 *   c == Odd number (relatively prime to 2^n).
Packit 345191
 *   m == 2^n (n == 32 or 64, the bit width of the state)
Packit 345191
 *
Packit 345191
 * See Knuth's TAOCP 3rd Ed., Vol. 2, pg. 17 for details on these constraints.
Packit 345191
 *
Packit 345191
 * This choice of m has the disadvantage that the quality of the bits is
Packit 345191
 * proportional to bit position.  For example, the lowest bit has a cycle of 2,
Packit 345191
 * the next has a cycle of 4, etc.  For this reason, we prefer to use the upper
Packit 345191
 * bits.
Packit 345191
 */
Packit 345191
Packit 345191
/******************************************************************************/
Packit 345191
/* INTERNAL DEFINITIONS -- IGNORE */
Packit 345191
/******************************************************************************/
Packit 345191
/*
 * Multiplier (a) and increment (c) applied to 32-bit state, as
 * state * PRNG_A_32 + PRNG_C_32.  Both are odd, and (PRNG_A_32 - 1) is a
 * multiple of 4.
 */
#define PRNG_A_32	UINT32_C(1103515241)
Packit 345191
#define PRNG_C_32	UINT32_C(12347)
Packit 345191
Packit 345191
/*
 * Multiplier (a) and increment (c) applied to 64-bit state, as
 * state * PRNG_A_64 + PRNG_C_64.  Both are odd, and (PRNG_A_64 - 1) is a
 * multiple of 4.
 */
#define PRNG_A_64	UINT64_C(6364136223846793005)
Packit 345191
#define PRNG_C_64	UINT64_C(1442695040888963407)
Packit 345191
Packit 345191
JEMALLOC_ALWAYS_INLINE uint32_t
Packit 345191
prng_state_next_u32(uint32_t state) {
Packit 345191
	return (state * PRNG_A_32) + PRNG_C_32;
Packit 345191
}
Packit 345191
Packit 345191
JEMALLOC_ALWAYS_INLINE uint64_t
Packit 345191
prng_state_next_u64(uint64_t state) {
Packit 345191
	return (state * PRNG_A_64) + PRNG_C_64;
Packit 345191
}
Packit 345191
Packit 345191
JEMALLOC_ALWAYS_INLINE size_t
Packit 345191
prng_state_next_zu(size_t state) {
Packit 345191
#if LG_SIZEOF_PTR == 2
Packit 345191
	return (state * PRNG_A_32) + PRNG_C_32;
Packit 345191
#elif LG_SIZEOF_PTR == 3
Packit 345191
	return (state * PRNG_A_64) + PRNG_C_64;
Packit 345191
#else
Packit 345191
#error Unsupported pointer size
Packit 345191
#endif
Packit 345191
}
Packit 345191
Packit 345191
/******************************************************************************/
Packit 345191
/* BEGIN PUBLIC API */
Packit 345191
/******************************************************************************/
Packit 345191
Packit 345191
/*
Packit 345191
 * The prng_lg_range functions give a uniform int in the half-open range [0,
Packit 345191
 * 2**lg_range).  If atomic is true, they do so safely from multiple threads.
Packit 345191
 * Multithreaded 64-bit prngs aren't supported.
Packit 345191
 */
Packit 345191
Packit 345191
JEMALLOC_ALWAYS_INLINE uint32_t
Packit 345191
prng_lg_range_u32(atomic_u32_t *state, unsigned lg_range, bool atomic) {
Packit 345191
	uint32_t ret, state0, state1;
Packit 345191
Packit 345191
	assert(lg_range > 0);
Packit 345191
	assert(lg_range <= 32);
Packit 345191
Packit 345191
	state0 = atomic_load_u32(state, ATOMIC_RELAXED);
Packit 345191
Packit 345191
	if (atomic) {
Packit 345191
		do {
Packit 345191
			state1 = prng_state_next_u32(state0);
Packit 345191
		} while (!atomic_compare_exchange_weak_u32(state, &state0,
Packit 345191
		    state1, ATOMIC_RELAXED, ATOMIC_RELAXED));
Packit 345191
	} else {
Packit 345191
		state1 = prng_state_next_u32(state0);
Packit 345191
		atomic_store_u32(state, state1, ATOMIC_RELAXED);
Packit 345191
	}
Packit 345191
	ret = state1 >> (32 - lg_range);
Packit 345191
Packit 345191
	return ret;
Packit 345191
}
Packit 345191
Packit 345191
JEMALLOC_ALWAYS_INLINE uint64_t
Packit 345191
prng_lg_range_u64(uint64_t *state, unsigned lg_range) {
Packit 345191
	uint64_t ret, state1;
Packit 345191
Packit 345191
	assert(lg_range > 0);
Packit 345191
	assert(lg_range <= 64);
Packit 345191
Packit 345191
	state1 = prng_state_next_u64(*state);
Packit 345191
	*state = state1;
Packit 345191
	ret = state1 >> (64 - lg_range);
Packit 345191
Packit 345191
	return ret;
Packit 345191
}
Packit 345191
Packit 345191
JEMALLOC_ALWAYS_INLINE size_t
Packit 345191
prng_lg_range_zu(atomic_zu_t *state, unsigned lg_range, bool atomic) {
Packit 345191
	size_t ret, state0, state1;
Packit 345191
Packit 345191
	assert(lg_range > 0);
Packit 345191
	assert(lg_range <= ZU(1) << (3 + LG_SIZEOF_PTR));
Packit 345191
Packit 345191
	state0 = atomic_load_zu(state, ATOMIC_RELAXED);
Packit 345191
Packit 345191
	if (atomic) {
Packit 345191
		do {
Packit 345191
			state1 = prng_state_next_zu(state0);
Packit 345191
		} while (atomic_compare_exchange_weak_zu(state, &state0,
Packit 345191
		    state1, ATOMIC_RELAXED, ATOMIC_RELAXED));
Packit 345191
	} else {
Packit 345191
		state1 = prng_state_next_zu(state0);
Packit 345191
		atomic_store_zu(state, state1, ATOMIC_RELAXED);
Packit 345191
	}
Packit 345191
	ret = state1 >> ((ZU(1) << (3 + LG_SIZEOF_PTR)) - lg_range);
Packit 345191
Packit 345191
	return ret;
Packit 345191
}
Packit 345191
Packit 345191
/*
Packit 345191
 * The prng_range functions behave like the prng_lg_range, but return a result
Packit 345191
 * in [0, range) instead of [0, 2**lg_range).
Packit 345191
 */
Packit 345191
Packit 345191
JEMALLOC_ALWAYS_INLINE uint32_t
Packit 345191
prng_range_u32(atomic_u32_t *state, uint32_t range, bool atomic) {
Packit 345191
	uint32_t ret;
Packit 345191
	unsigned lg_range;
Packit 345191
Packit 345191
	assert(range > 1);
Packit 345191
Packit 345191
	/* Compute the ceiling of lg(range). */
Packit 345191
	lg_range = ffs_u32(pow2_ceil_u32(range)) - 1;
Packit 345191
Packit 345191
	/* Generate a result in [0..range) via repeated trial. */
Packit 345191
	do {
Packit 345191
		ret = prng_lg_range_u32(state, lg_range, atomic);
Packit 345191
	} while (ret >= range);
Packit 345191
Packit 345191
	return ret;
Packit 345191
}
Packit 345191
Packit 345191
JEMALLOC_ALWAYS_INLINE uint64_t
Packit 345191
prng_range_u64(uint64_t *state, uint64_t range) {
Packit 345191
	uint64_t ret;
Packit 345191
	unsigned lg_range;
Packit 345191
Packit 345191
	assert(range > 1);
Packit 345191
Packit 345191
	/* Compute the ceiling of lg(range). */
Packit 345191
	lg_range = ffs_u64(pow2_ceil_u64(range)) - 1;
Packit 345191
Packit 345191
	/* Generate a result in [0..range) via repeated trial. */
Packit 345191
	do {
Packit 345191
		ret = prng_lg_range_u64(state, lg_range);
Packit 345191
	} while (ret >= range);
Packit 345191
Packit 345191
	return ret;
Packit 345191
}
Packit 345191
Packit 345191
JEMALLOC_ALWAYS_INLINE size_t
Packit 345191
prng_range_zu(atomic_zu_t *state, size_t range, bool atomic) {
Packit 345191
	size_t ret;
Packit 345191
	unsigned lg_range;
Packit 345191
Packit 345191
	assert(range > 1);
Packit 345191
Packit 345191
	/* Compute the ceiling of lg(range). */
Packit 345191
	lg_range = ffs_u64(pow2_ceil_u64(range)) - 1;
Packit 345191
Packit 345191
	/* Generate a result in [0..range) via repeated trial. */
Packit 345191
	do {
Packit 345191
		ret = prng_lg_range_zu(state, lg_range, atomic);
Packit 345191
	} while (ret >= range);
Packit 345191
Packit 345191
	return ret;
Packit 345191
}
Packit 345191
Packit 345191
#endif /* JEMALLOC_INTERNAL_PRNG_H */