1*1208bc7eSAndroid Build Coastguard Worker #ifndef JEMALLOC_INTERNAL_PRNG_H
2*1208bc7eSAndroid Build Coastguard Worker #define JEMALLOC_INTERNAL_PRNG_H
3*1208bc7eSAndroid Build Coastguard Worker
4*1208bc7eSAndroid Build Coastguard Worker #include "jemalloc/internal/atomic.h"
5*1208bc7eSAndroid Build Coastguard Worker #include "jemalloc/internal/bit_util.h"
6*1208bc7eSAndroid Build Coastguard Worker
/*
 * Simple linear congruential pseudo-random number generator:
 *
 *   prng(x) = (a*x + c) % m
 *
 * where the following constants ensure maximal period:
 *
 *   a == Odd number (relatively prime to 2^n), and (a-1) is a multiple of 4.
 *   c == Odd number (relatively prime to 2^n).
 *   m == 2^n, where n is the width of the state in bits (32 or 64).
 *
 * See Knuth's TAOCP 3rd Ed., Vol. 2, pg. 17 for details on these constraints.
 *
 * This choice of m has the disadvantage that the quality of the bits is
 * proportional to bit position.  For example, the lowest bit has a cycle of 2,
 * the next has a cycle of 4, etc.  For this reason, we prefer to use the upper
 * bits.
 */
25*1208bc7eSAndroid Build Coastguard Worker
26*1208bc7eSAndroid Build Coastguard Worker /******************************************************************************/
27*1208bc7eSAndroid Build Coastguard Worker /* INTERNAL DEFINITIONS -- IGNORE */
28*1208bc7eSAndroid Build Coastguard Worker /******************************************************************************/
/*
 * LCG multipliers ("a").  Each is odd and (a - 1) is a multiple of 4.
 */
#define PRNG_A_32	UINT32_C(1103515241)
#define PRNG_A_64	UINT64_C(6364136223846793005)

/*
 * LCG increments ("c").  Each is odd.
 */
#define PRNG_C_32	UINT32_C(12347)
#define PRNG_C_64	UINT64_C(1442695040888963407)
34*1208bc7eSAndroid Build Coastguard Worker
35*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE uint32_t
prng_state_next_u32(uint32_t state)36*1208bc7eSAndroid Build Coastguard Worker prng_state_next_u32(uint32_t state) {
37*1208bc7eSAndroid Build Coastguard Worker return (state * PRNG_A_32) + PRNG_C_32;
38*1208bc7eSAndroid Build Coastguard Worker }
39*1208bc7eSAndroid Build Coastguard Worker
40*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE uint64_t
prng_state_next_u64(uint64_t state)41*1208bc7eSAndroid Build Coastguard Worker prng_state_next_u64(uint64_t state) {
42*1208bc7eSAndroid Build Coastguard Worker return (state * PRNG_A_64) + PRNG_C_64;
43*1208bc7eSAndroid Build Coastguard Worker }
44*1208bc7eSAndroid Build Coastguard Worker
45*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE size_t
prng_state_next_zu(size_t state)46*1208bc7eSAndroid Build Coastguard Worker prng_state_next_zu(size_t state) {
47*1208bc7eSAndroid Build Coastguard Worker #if LG_SIZEOF_PTR == 2
48*1208bc7eSAndroid Build Coastguard Worker return (state * PRNG_A_32) + PRNG_C_32;
49*1208bc7eSAndroid Build Coastguard Worker #elif LG_SIZEOF_PTR == 3
50*1208bc7eSAndroid Build Coastguard Worker return (state * PRNG_A_64) + PRNG_C_64;
51*1208bc7eSAndroid Build Coastguard Worker #else
52*1208bc7eSAndroid Build Coastguard Worker #error Unsupported pointer size
53*1208bc7eSAndroid Build Coastguard Worker #endif
54*1208bc7eSAndroid Build Coastguard Worker }
55*1208bc7eSAndroid Build Coastguard Worker
56*1208bc7eSAndroid Build Coastguard Worker /******************************************************************************/
57*1208bc7eSAndroid Build Coastguard Worker /* BEGIN PUBLIC API */
58*1208bc7eSAndroid Build Coastguard Worker /******************************************************************************/
59*1208bc7eSAndroid Build Coastguard Worker
60*1208bc7eSAndroid Build Coastguard Worker /*
61*1208bc7eSAndroid Build Coastguard Worker * The prng_lg_range functions give a uniform int in the half-open range [0,
62*1208bc7eSAndroid Build Coastguard Worker * 2**lg_range). If atomic is true, they do so safely from multiple threads.
63*1208bc7eSAndroid Build Coastguard Worker * Multithreaded 64-bit prngs aren't supported.
64*1208bc7eSAndroid Build Coastguard Worker */
65*1208bc7eSAndroid Build Coastguard Worker
66*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE uint32_t
prng_lg_range_u32(atomic_u32_t * state,unsigned lg_range,bool atomic)67*1208bc7eSAndroid Build Coastguard Worker prng_lg_range_u32(atomic_u32_t *state, unsigned lg_range, bool atomic) {
68*1208bc7eSAndroid Build Coastguard Worker uint32_t ret, state0, state1;
69*1208bc7eSAndroid Build Coastguard Worker
70*1208bc7eSAndroid Build Coastguard Worker assert(lg_range > 0);
71*1208bc7eSAndroid Build Coastguard Worker assert(lg_range <= 32);
72*1208bc7eSAndroid Build Coastguard Worker
73*1208bc7eSAndroid Build Coastguard Worker state0 = atomic_load_u32(state, ATOMIC_RELAXED);
74*1208bc7eSAndroid Build Coastguard Worker
75*1208bc7eSAndroid Build Coastguard Worker if (atomic) {
76*1208bc7eSAndroid Build Coastguard Worker do {
77*1208bc7eSAndroid Build Coastguard Worker state1 = prng_state_next_u32(state0);
78*1208bc7eSAndroid Build Coastguard Worker } while (!atomic_compare_exchange_weak_u32(state, &state0,
79*1208bc7eSAndroid Build Coastguard Worker state1, ATOMIC_RELAXED, ATOMIC_RELAXED));
80*1208bc7eSAndroid Build Coastguard Worker } else {
81*1208bc7eSAndroid Build Coastguard Worker state1 = prng_state_next_u32(state0);
82*1208bc7eSAndroid Build Coastguard Worker atomic_store_u32(state, state1, ATOMIC_RELAXED);
83*1208bc7eSAndroid Build Coastguard Worker }
84*1208bc7eSAndroid Build Coastguard Worker ret = state1 >> (32 - lg_range);
85*1208bc7eSAndroid Build Coastguard Worker
86*1208bc7eSAndroid Build Coastguard Worker return ret;
87*1208bc7eSAndroid Build Coastguard Worker }
88*1208bc7eSAndroid Build Coastguard Worker
89*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE uint64_t
prng_lg_range_u64(uint64_t * state,unsigned lg_range)90*1208bc7eSAndroid Build Coastguard Worker prng_lg_range_u64(uint64_t *state, unsigned lg_range) {
91*1208bc7eSAndroid Build Coastguard Worker uint64_t ret, state1;
92*1208bc7eSAndroid Build Coastguard Worker
93*1208bc7eSAndroid Build Coastguard Worker assert(lg_range > 0);
94*1208bc7eSAndroid Build Coastguard Worker assert(lg_range <= 64);
95*1208bc7eSAndroid Build Coastguard Worker
96*1208bc7eSAndroid Build Coastguard Worker state1 = prng_state_next_u64(*state);
97*1208bc7eSAndroid Build Coastguard Worker *state = state1;
98*1208bc7eSAndroid Build Coastguard Worker ret = state1 >> (64 - lg_range);
99*1208bc7eSAndroid Build Coastguard Worker
100*1208bc7eSAndroid Build Coastguard Worker return ret;
101*1208bc7eSAndroid Build Coastguard Worker }
102*1208bc7eSAndroid Build Coastguard Worker
103*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE size_t
prng_lg_range_zu(atomic_zu_t * state,unsigned lg_range,bool atomic)104*1208bc7eSAndroid Build Coastguard Worker prng_lg_range_zu(atomic_zu_t *state, unsigned lg_range, bool atomic) {
105*1208bc7eSAndroid Build Coastguard Worker size_t ret, state0, state1;
106*1208bc7eSAndroid Build Coastguard Worker
107*1208bc7eSAndroid Build Coastguard Worker assert(lg_range > 0);
108*1208bc7eSAndroid Build Coastguard Worker assert(lg_range <= ZU(1) << (3 + LG_SIZEOF_PTR));
109*1208bc7eSAndroid Build Coastguard Worker
110*1208bc7eSAndroid Build Coastguard Worker state0 = atomic_load_zu(state, ATOMIC_RELAXED);
111*1208bc7eSAndroid Build Coastguard Worker
112*1208bc7eSAndroid Build Coastguard Worker if (atomic) {
113*1208bc7eSAndroid Build Coastguard Worker do {
114*1208bc7eSAndroid Build Coastguard Worker state1 = prng_state_next_zu(state0);
115*1208bc7eSAndroid Build Coastguard Worker } while (atomic_compare_exchange_weak_zu(state, &state0,
116*1208bc7eSAndroid Build Coastguard Worker state1, ATOMIC_RELAXED, ATOMIC_RELAXED));
117*1208bc7eSAndroid Build Coastguard Worker } else {
118*1208bc7eSAndroid Build Coastguard Worker state1 = prng_state_next_zu(state0);
119*1208bc7eSAndroid Build Coastguard Worker atomic_store_zu(state, state1, ATOMIC_RELAXED);
120*1208bc7eSAndroid Build Coastguard Worker }
121*1208bc7eSAndroid Build Coastguard Worker ret = state1 >> ((ZU(1) << (3 + LG_SIZEOF_PTR)) - lg_range);
122*1208bc7eSAndroid Build Coastguard Worker
123*1208bc7eSAndroid Build Coastguard Worker return ret;
124*1208bc7eSAndroid Build Coastguard Worker }
125*1208bc7eSAndroid Build Coastguard Worker
126*1208bc7eSAndroid Build Coastguard Worker /*
127*1208bc7eSAndroid Build Coastguard Worker * The prng_range functions behave like the prng_lg_range, but return a result
128*1208bc7eSAndroid Build Coastguard Worker * in [0, range) instead of [0, 2**lg_range).
129*1208bc7eSAndroid Build Coastguard Worker */
130*1208bc7eSAndroid Build Coastguard Worker
131*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE uint32_t
prng_range_u32(atomic_u32_t * state,uint32_t range,bool atomic)132*1208bc7eSAndroid Build Coastguard Worker prng_range_u32(atomic_u32_t *state, uint32_t range, bool atomic) {
133*1208bc7eSAndroid Build Coastguard Worker uint32_t ret;
134*1208bc7eSAndroid Build Coastguard Worker unsigned lg_range;
135*1208bc7eSAndroid Build Coastguard Worker
136*1208bc7eSAndroid Build Coastguard Worker assert(range > 1);
137*1208bc7eSAndroid Build Coastguard Worker
138*1208bc7eSAndroid Build Coastguard Worker /* Compute the ceiling of lg(range). */
139*1208bc7eSAndroid Build Coastguard Worker lg_range = ffs_u32(pow2_ceil_u32(range)) - 1;
140*1208bc7eSAndroid Build Coastguard Worker
141*1208bc7eSAndroid Build Coastguard Worker /* Generate a result in [0..range) via repeated trial. */
142*1208bc7eSAndroid Build Coastguard Worker do {
143*1208bc7eSAndroid Build Coastguard Worker ret = prng_lg_range_u32(state, lg_range, atomic);
144*1208bc7eSAndroid Build Coastguard Worker } while (ret >= range);
145*1208bc7eSAndroid Build Coastguard Worker
146*1208bc7eSAndroid Build Coastguard Worker return ret;
147*1208bc7eSAndroid Build Coastguard Worker }
148*1208bc7eSAndroid Build Coastguard Worker
149*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE uint64_t
prng_range_u64(uint64_t * state,uint64_t range)150*1208bc7eSAndroid Build Coastguard Worker prng_range_u64(uint64_t *state, uint64_t range) {
151*1208bc7eSAndroid Build Coastguard Worker uint64_t ret;
152*1208bc7eSAndroid Build Coastguard Worker unsigned lg_range;
153*1208bc7eSAndroid Build Coastguard Worker
154*1208bc7eSAndroid Build Coastguard Worker assert(range > 1);
155*1208bc7eSAndroid Build Coastguard Worker
156*1208bc7eSAndroid Build Coastguard Worker /* Compute the ceiling of lg(range). */
157*1208bc7eSAndroid Build Coastguard Worker lg_range = ffs_u64(pow2_ceil_u64(range)) - 1;
158*1208bc7eSAndroid Build Coastguard Worker
159*1208bc7eSAndroid Build Coastguard Worker /* Generate a result in [0..range) via repeated trial. */
160*1208bc7eSAndroid Build Coastguard Worker do {
161*1208bc7eSAndroid Build Coastguard Worker ret = prng_lg_range_u64(state, lg_range);
162*1208bc7eSAndroid Build Coastguard Worker } while (ret >= range);
163*1208bc7eSAndroid Build Coastguard Worker
164*1208bc7eSAndroid Build Coastguard Worker return ret;
165*1208bc7eSAndroid Build Coastguard Worker }
166*1208bc7eSAndroid Build Coastguard Worker
167*1208bc7eSAndroid Build Coastguard Worker JEMALLOC_ALWAYS_INLINE size_t
prng_range_zu(atomic_zu_t * state,size_t range,bool atomic)168*1208bc7eSAndroid Build Coastguard Worker prng_range_zu(atomic_zu_t *state, size_t range, bool atomic) {
169*1208bc7eSAndroid Build Coastguard Worker size_t ret;
170*1208bc7eSAndroid Build Coastguard Worker unsigned lg_range;
171*1208bc7eSAndroid Build Coastguard Worker
172*1208bc7eSAndroid Build Coastguard Worker assert(range > 1);
173*1208bc7eSAndroid Build Coastguard Worker
174*1208bc7eSAndroid Build Coastguard Worker /* Compute the ceiling of lg(range). */
175*1208bc7eSAndroid Build Coastguard Worker lg_range = ffs_u64(pow2_ceil_u64(range)) - 1;
176*1208bc7eSAndroid Build Coastguard Worker
177*1208bc7eSAndroid Build Coastguard Worker /* Generate a result in [0..range) via repeated trial. */
178*1208bc7eSAndroid Build Coastguard Worker do {
179*1208bc7eSAndroid Build Coastguard Worker ret = prng_lg_range_zu(state, lg_range, atomic);
180*1208bc7eSAndroid Build Coastguard Worker } while (ret >= range);
181*1208bc7eSAndroid Build Coastguard Worker
182*1208bc7eSAndroid Build Coastguard Worker return ret;
183*1208bc7eSAndroid Build Coastguard Worker }
184*1208bc7eSAndroid Build Coastguard Worker
185*1208bc7eSAndroid Build Coastguard Worker #endif /* JEMALLOC_INTERNAL_PRNG_H */
186