xref: /aosp_15_r20/external/jemalloc_new/include/jemalloc/internal/prng.h (revision 1208bc7e437ced7eb82efac44ba17e3beba411da)
1*1208bc7eSAndroid Build Coastguard Worker #ifndef JEMALLOC_INTERNAL_PRNG_H
2*1208bc7eSAndroid Build Coastguard Worker #define JEMALLOC_INTERNAL_PRNG_H
3*1208bc7eSAndroid Build Coastguard Worker 
4*1208bc7eSAndroid Build Coastguard Worker #include "jemalloc/internal/atomic.h"
5*1208bc7eSAndroid Build Coastguard Worker #include "jemalloc/internal/bit_util.h"
6*1208bc7eSAndroid Build Coastguard Worker 
/*
 * Simple linear congruential pseudo-random number generator:
 *
 *   x' = (a*x + c) % m
 *
 * where x is the current state, x' is the next state, and the following
 * constants ensure maximal period:
 *
 *   a == Odd number (relatively prime to 2^n), and (a-1) is a multiple of 4.
 *   c == Odd number (relatively prime to 2^n).
 *   m == 2^n, where n is the width of the state in bits (32 or 64).
 *
 * See Knuth's TAOCP 3rd Ed., Vol. 2, pg. 17 for details on these constraints.
 *
 * This choice of m has the disadvantage that the quality of the bits is
 * proportional to bit position.  For example, the lowest bit has a cycle of 2,
 * the next has a cycle of 4, etc.  For this reason, we prefer to use the upper
 * bits.
 */
25*1208bc7eSAndroid Build Coastguard Worker 
26*1208bc7eSAndroid Build Coastguard Worker /******************************************************************************/
27*1208bc7eSAndroid Build Coastguard Worker /* INTERNAL DEFINITIONS -- IGNORE */
28*1208bc7eSAndroid Build Coastguard Worker /******************************************************************************/
/* Multiplier (a) and increment (c) used by the 32-bit state step. */
29*1208bc7eSAndroid Build Coastguard Worker #define PRNG_A_32	UINT32_C(1103515241)
30*1208bc7eSAndroid Build Coastguard Worker #define PRNG_C_32	UINT32_C(12347)
31*1208bc7eSAndroid Build Coastguard Worker 
/* Multiplier (a) and increment (c) used by the 64-bit state step. */
32*1208bc7eSAndroid Build Coastguard Worker #define PRNG_A_64	UINT64_C(6364136223846793005)
33*1208bc7eSAndroid Build Coastguard Worker #define PRNG_C_64	UINT64_C(1442695040888963407)
34*1208bc7eSAndroid Build Coastguard Worker 
35*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE uint32_t
prng_state_next_u32(uint32_t state)36*1208bc7eSAndroid Build Coastguard Worker prng_state_next_u32(uint32_t state) {
37*1208bc7eSAndroid Build Coastguard Worker 	return (state * PRNG_A_32) + PRNG_C_32;
38*1208bc7eSAndroid Build Coastguard Worker }
39*1208bc7eSAndroid Build Coastguard Worker 
40*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE uint64_t
prng_state_next_u64(uint64_t state)41*1208bc7eSAndroid Build Coastguard Worker prng_state_next_u64(uint64_t state) {
42*1208bc7eSAndroid Build Coastguard Worker 	return (state * PRNG_A_64) + PRNG_C_64;
43*1208bc7eSAndroid Build Coastguard Worker }
44*1208bc7eSAndroid Build Coastguard Worker 
45*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE size_t
prng_state_next_zu(size_t state)46*1208bc7eSAndroid Build Coastguard Worker prng_state_next_zu(size_t state) {
47*1208bc7eSAndroid Build Coastguard Worker #if LG_SIZEOF_PTR == 2
48*1208bc7eSAndroid Build Coastguard Worker 	return (state * PRNG_A_32) + PRNG_C_32;
49*1208bc7eSAndroid Build Coastguard Worker #elif LG_SIZEOF_PTR == 3
50*1208bc7eSAndroid Build Coastguard Worker 	return (state * PRNG_A_64) + PRNG_C_64;
51*1208bc7eSAndroid Build Coastguard Worker #else
52*1208bc7eSAndroid Build Coastguard Worker #error Unsupported pointer size
53*1208bc7eSAndroid Build Coastguard Worker #endif
54*1208bc7eSAndroid Build Coastguard Worker }
55*1208bc7eSAndroid Build Coastguard Worker 
56*1208bc7eSAndroid Build Coastguard Worker /******************************************************************************/
57*1208bc7eSAndroid Build Coastguard Worker /* BEGIN PUBLIC API */
58*1208bc7eSAndroid Build Coastguard Worker /******************************************************************************/
59*1208bc7eSAndroid Build Coastguard Worker 
/*
 * The prng_lg_range functions return a uniform integer in the half-open range
 * [0, 2**lg_range).  If atomic is true, they do so safely from multiple
 * threads.  The 64-bit variant takes no atomic argument: multithreaded 64-bit
 * prngs aren't supported.
 */
65*1208bc7eSAndroid Build Coastguard Worker 
66*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE uint32_t
prng_lg_range_u32(atomic_u32_t * state,unsigned lg_range,bool atomic)67*1208bc7eSAndroid Build Coastguard Worker prng_lg_range_u32(atomic_u32_t *state, unsigned lg_range, bool atomic) {
68*1208bc7eSAndroid Build Coastguard Worker 	uint32_t ret, state0, state1;
69*1208bc7eSAndroid Build Coastguard Worker 
70*1208bc7eSAndroid Build Coastguard Worker 	assert(lg_range > 0);
71*1208bc7eSAndroid Build Coastguard Worker 	assert(lg_range <= 32);
72*1208bc7eSAndroid Build Coastguard Worker 
73*1208bc7eSAndroid Build Coastguard Worker 	state0 = atomic_load_u32(state, ATOMIC_RELAXED);
74*1208bc7eSAndroid Build Coastguard Worker 
75*1208bc7eSAndroid Build Coastguard Worker 	if (atomic) {
76*1208bc7eSAndroid Build Coastguard Worker 		do {
77*1208bc7eSAndroid Build Coastguard Worker 			state1 = prng_state_next_u32(state0);
78*1208bc7eSAndroid Build Coastguard Worker 		} while (!atomic_compare_exchange_weak_u32(state, &state0,
79*1208bc7eSAndroid Build Coastguard Worker 		    state1, ATOMIC_RELAXED, ATOMIC_RELAXED));
80*1208bc7eSAndroid Build Coastguard Worker 	} else {
81*1208bc7eSAndroid Build Coastguard Worker 		state1 = prng_state_next_u32(state0);
82*1208bc7eSAndroid Build Coastguard Worker 		atomic_store_u32(state, state1, ATOMIC_RELAXED);
83*1208bc7eSAndroid Build Coastguard Worker 	}
84*1208bc7eSAndroid Build Coastguard Worker 	ret = state1 >> (32 - lg_range);
85*1208bc7eSAndroid Build Coastguard Worker 
86*1208bc7eSAndroid Build Coastguard Worker 	return ret;
87*1208bc7eSAndroid Build Coastguard Worker }
88*1208bc7eSAndroid Build Coastguard Worker 
89*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE uint64_t
prng_lg_range_u64(uint64_t * state,unsigned lg_range)90*1208bc7eSAndroid Build Coastguard Worker prng_lg_range_u64(uint64_t *state, unsigned lg_range) {
91*1208bc7eSAndroid Build Coastguard Worker 	uint64_t ret, state1;
92*1208bc7eSAndroid Build Coastguard Worker 
93*1208bc7eSAndroid Build Coastguard Worker 	assert(lg_range > 0);
94*1208bc7eSAndroid Build Coastguard Worker 	assert(lg_range <= 64);
95*1208bc7eSAndroid Build Coastguard Worker 
96*1208bc7eSAndroid Build Coastguard Worker 	state1 = prng_state_next_u64(*state);
97*1208bc7eSAndroid Build Coastguard Worker 	*state = state1;
98*1208bc7eSAndroid Build Coastguard Worker 	ret = state1 >> (64 - lg_range);
99*1208bc7eSAndroid Build Coastguard Worker 
100*1208bc7eSAndroid Build Coastguard Worker 	return ret;
101*1208bc7eSAndroid Build Coastguard Worker }
102*1208bc7eSAndroid Build Coastguard Worker 
103*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE size_t
prng_lg_range_zu(atomic_zu_t * state,unsigned lg_range,bool atomic)104*1208bc7eSAndroid Build Coastguard Worker prng_lg_range_zu(atomic_zu_t *state, unsigned lg_range, bool atomic) {
105*1208bc7eSAndroid Build Coastguard Worker 	size_t ret, state0, state1;
106*1208bc7eSAndroid Build Coastguard Worker 
107*1208bc7eSAndroid Build Coastguard Worker 	assert(lg_range > 0);
108*1208bc7eSAndroid Build Coastguard Worker 	assert(lg_range <= ZU(1) << (3 + LG_SIZEOF_PTR));
109*1208bc7eSAndroid Build Coastguard Worker 
110*1208bc7eSAndroid Build Coastguard Worker 	state0 = atomic_load_zu(state, ATOMIC_RELAXED);
111*1208bc7eSAndroid Build Coastguard Worker 
112*1208bc7eSAndroid Build Coastguard Worker 	if (atomic) {
113*1208bc7eSAndroid Build Coastguard Worker 		do {
114*1208bc7eSAndroid Build Coastguard Worker 			state1 = prng_state_next_zu(state0);
115*1208bc7eSAndroid Build Coastguard Worker 		} while (atomic_compare_exchange_weak_zu(state, &state0,
116*1208bc7eSAndroid Build Coastguard Worker 		    state1, ATOMIC_RELAXED, ATOMIC_RELAXED));
117*1208bc7eSAndroid Build Coastguard Worker 	} else {
118*1208bc7eSAndroid Build Coastguard Worker 		state1 = prng_state_next_zu(state0);
119*1208bc7eSAndroid Build Coastguard Worker 		atomic_store_zu(state, state1, ATOMIC_RELAXED);
120*1208bc7eSAndroid Build Coastguard Worker 	}
121*1208bc7eSAndroid Build Coastguard Worker 	ret = state1 >> ((ZU(1) << (3 + LG_SIZEOF_PTR)) - lg_range);
122*1208bc7eSAndroid Build Coastguard Worker 
123*1208bc7eSAndroid Build Coastguard Worker 	return ret;
124*1208bc7eSAndroid Build Coastguard Worker }
125*1208bc7eSAndroid Build Coastguard Worker 
/*
 * The prng_range functions behave like the prng_lg_range functions, but
 * return a result in [0, range) instead of [0, 2**lg_range).
 */
130*1208bc7eSAndroid Build Coastguard Worker 
131*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE uint32_t
prng_range_u32(atomic_u32_t * state,uint32_t range,bool atomic)132*1208bc7eSAndroid Build Coastguard Worker prng_range_u32(atomic_u32_t *state, uint32_t range, bool atomic) {
133*1208bc7eSAndroid Build Coastguard Worker 	uint32_t ret;
134*1208bc7eSAndroid Build Coastguard Worker 	unsigned lg_range;
135*1208bc7eSAndroid Build Coastguard Worker 
136*1208bc7eSAndroid Build Coastguard Worker 	assert(range > 1);
137*1208bc7eSAndroid Build Coastguard Worker 
138*1208bc7eSAndroid Build Coastguard Worker 	/* Compute the ceiling of lg(range). */
139*1208bc7eSAndroid Build Coastguard Worker 	lg_range = ffs_u32(pow2_ceil_u32(range)) - 1;
140*1208bc7eSAndroid Build Coastguard Worker 
141*1208bc7eSAndroid Build Coastguard Worker 	/* Generate a result in [0..range) via repeated trial. */
142*1208bc7eSAndroid Build Coastguard Worker 	do {
143*1208bc7eSAndroid Build Coastguard Worker 		ret = prng_lg_range_u32(state, lg_range, atomic);
144*1208bc7eSAndroid Build Coastguard Worker 	} while (ret >= range);
145*1208bc7eSAndroid Build Coastguard Worker 
146*1208bc7eSAndroid Build Coastguard Worker 	return ret;
147*1208bc7eSAndroid Build Coastguard Worker }
148*1208bc7eSAndroid Build Coastguard Worker 
149*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE uint64_t
prng_range_u64(uint64_t * state,uint64_t range)150*1208bc7eSAndroid Build Coastguard Worker prng_range_u64(uint64_t *state, uint64_t range) {
151*1208bc7eSAndroid Build Coastguard Worker 	uint64_t ret;
152*1208bc7eSAndroid Build Coastguard Worker 	unsigned lg_range;
153*1208bc7eSAndroid Build Coastguard Worker 
154*1208bc7eSAndroid Build Coastguard Worker 	assert(range > 1);
155*1208bc7eSAndroid Build Coastguard Worker 
156*1208bc7eSAndroid Build Coastguard Worker 	/* Compute the ceiling of lg(range). */
157*1208bc7eSAndroid Build Coastguard Worker 	lg_range = ffs_u64(pow2_ceil_u64(range)) - 1;
158*1208bc7eSAndroid Build Coastguard Worker 
159*1208bc7eSAndroid Build Coastguard Worker 	/* Generate a result in [0..range) via repeated trial. */
160*1208bc7eSAndroid Build Coastguard Worker 	do {
161*1208bc7eSAndroid Build Coastguard Worker 		ret = prng_lg_range_u64(state, lg_range);
162*1208bc7eSAndroid Build Coastguard Worker 	} while (ret >= range);
163*1208bc7eSAndroid Build Coastguard Worker 
164*1208bc7eSAndroid Build Coastguard Worker 	return ret;
165*1208bc7eSAndroid Build Coastguard Worker }
166*1208bc7eSAndroid Build Coastguard Worker 
167*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE size_t
prng_range_zu(atomic_zu_t * state,size_t range,bool atomic)168*1208bc7eSAndroid Build Coastguard Worker prng_range_zu(atomic_zu_t *state, size_t range, bool atomic) {
169*1208bc7eSAndroid Build Coastguard Worker 	size_t ret;
170*1208bc7eSAndroid Build Coastguard Worker 	unsigned lg_range;
171*1208bc7eSAndroid Build Coastguard Worker 
172*1208bc7eSAndroid Build Coastguard Worker 	assert(range > 1);
173*1208bc7eSAndroid Build Coastguard Worker 
174*1208bc7eSAndroid Build Coastguard Worker 	/* Compute the ceiling of lg(range). */
175*1208bc7eSAndroid Build Coastguard Worker 	lg_range = ffs_u64(pow2_ceil_u64(range)) - 1;
176*1208bc7eSAndroid Build Coastguard Worker 
177*1208bc7eSAndroid Build Coastguard Worker 	/* Generate a result in [0..range) via repeated trial. */
178*1208bc7eSAndroid Build Coastguard Worker 	do {
179*1208bc7eSAndroid Build Coastguard Worker 		ret = prng_lg_range_zu(state, lg_range, atomic);
180*1208bc7eSAndroid Build Coastguard Worker 	} while (ret >= range);
181*1208bc7eSAndroid Build Coastguard Worker 
182*1208bc7eSAndroid Build Coastguard Worker 	return ret;
183*1208bc7eSAndroid Build Coastguard Worker }
184*1208bc7eSAndroid Build Coastguard Worker 
185*1208bc7eSAndroid Build Coastguard Worker #endif /* JEMALLOC_INTERNAL_PRNG_H */
186