doxygen/c22.00/ran_8h_source.html

 /* This file is part of Cloudy and is copyright (C)1978-2022 by Gary J. Ferland and

  * others.  For conditions of distribution and use see copyright notice in license.txt */


 #ifndef RAN_H

 #define RAN_H


 class t_ran;

 // t_ran_fun: pointer to a t_ran member function taking a raw buffer pointer and a size;
 // ran_pool stores one of these to refill its pool
 // background on the syntax: https://isocpp.org/wiki/faq/pointers-to-members
 using t_ran_fun = void (t_ran::*)(void* p, size_t s);


 //

 // ran_pool holds a pool of PRNG variates, thus allowing efficient initialization using vectorization

 //

 // init()           sets the size of the pool and the method for filling the pool

 // reset()          invalidates the remaining variates in the pool, thus forcing a reinitialization

 //                  the next time next() is called; useful when the random seed is changed

 // lgInitialized()  true if init() was called

 // next()           returns the next variate; this routine is CPU time critical

 // p_alloc()        allocates the pool, making sure it is correctly aligned for SIMD access

 // p_update_pool()  (re)fill the pool with new random variates

 // ~ran_pool()      frees the pool

 //

 template<class T>

 class ran_pool

 {

         void* p_pool;     // start of the pool, correctly aligned for SIMD

         T* p_next;        // pointer to next data item that can be returned

         T* p_end;         // points just beyond the end of the pool

         size_t p_size;    // number of elements in the pool

         size_t p_squad;   // size of the pool in quadwords

         t_ran* p_rc;      // pointer to the instantiation of the random number class

         t_ran_fun p_fill; // fills pool, member function of t_ran class


         void p_alloc()

         {

                 // make sure the memory is correctly aligned for SIMD instructions

                 if( posix_memalign(&p_pool, CD_ALIGN, p_size*sizeof(T)) != 0 )

                         throw bad_alloc();

                 p_next = p_end = (T*)p_pool + p_size;

         }

         void p_update_pool()

         {

                 ASSERT( lgInitialized() );

                 if( p_pool == NULL )

                         p_alloc();

                 (p_rc->*p_fill)(p_pool, p_squad);

                 p_next = (T*)p_pool;

         }

 public:

         void init(size_t s, t_ran* rc, t_ran_fun f)

         {

                 ASSERT( !lgInitialized() );

                 ASSERT( s > 0 );

                 p_size = s;

                 p_squad = (s*sizeof(T))/8;

                 // make sure size is multiple of 8 bytes

                 ASSERT( p_squad*8 == s*sizeof(T) );

                 p_rc = rc;

                 p_fill = f;

         }

         void reset()

         {

                 p_next = p_end;

         }

         bool lgInitialized() const

         {

                 return ( p_size > 0 );

         }

         T next()

         {

                 if( UNLIKELY(p_next == p_end) )

                         p_update_pool();

                 return *p_next++;

         }


         ran_pool()

         {

                 p_pool = p_next = p_end = NULL;

                 p_size = p_squad = 0;

                 p_rc = NULL;

                 p_fill = NULL;

         }

         ran_pool(const ran_pool&) = delete;

         ran_pool& operator= (const ran_pool&) = delete;

         ~ran_pool()

         {

                 posix_memalign_free(p_pool);

         }

 };


 //

 // Two algorithms are supported here: xoroshiro128+ (v1.0) and xoshiro256** (v1.0)

 //

 // The 2016 version of xoroshiro128+ was the first to be added, and has since been upgraded to v1.0.

 // The xoshiro256** algorithm was added later, and is described as an "all-purpose, rock-solid

 // generator" with no known deficiencies. This is the default generator in Cloudy, with xoroshiro128+

 // being kept as a backup. The latter has the advantage that it is somewhat faster, but has some mild

 // deficiencies. To switch, simply change the instantiation of ran at the top of ran.cpp.

 //

 // For more information see: http://xoshiro.di.unimi.it/

 //


 // selects the underlying PRNG algorithm used by t_ran
 enum algo_prng
 {
         // xoroshiro128+ : somewhat faster, but has some mild deficiencies; kept as a backup
         PRNG_XOROSHIRO128PLUS = 0,
         // xoshiro256** : the default generator in Cloudy
         PRNG_XOSHIRO256STARSTAR = 1
 };


 //

 // t_ran is a global class for efficiently generating pseudo-random numbers. It can generate integer

 //       as well as floating point variates (the latter with a uniform or normal distribution)

 //

 // The variates are stored in pools to allow efficient computation using SIMD instructions. The

 // underlying PRNG algorithm to generate the random bits can be freely chosen. Currently supported

 // are xoshiro256** and xoroshiro128+. Each quadword in a SIMD register should generate a different,

 // non-overlapping stream of random numbers and therefore needs a different state. This is done

 // automatically in the seeding process. The algorithm also takes care that each rank in an MPI run

 // gets a different, non-overlapping stream of random numbers. The algorithm is not thread-safe in

 // openMP runs.

 //

 //   ND -- size of the pool of variates in quadwords

 //   p_algo -- which algorithm should be used as the underlying PRNG

 //   p_sq -- size of the state for the underlying PRNG algorithm in quadwords

 //   p_npack -- number of quadwords packed into a single SIMD register

 //   p_ns -- size of the state for a full SIMD register in quadwords (= p_sq*p_npack)

 //   p_s -- the seed that was used to generate the initial state

 //   p_state[p_ns] -- the state of the PRNG (needs to be correctly aligned for SIMD access).

 //

 // i7(), u8(), i15(), u16(), i31(), u32(), i63(), u64() -- return signed or unsigned integer variates

 // dbl(), rnm() -- return uniformly distributed floating point variates on (0,1)

 // normal() -- return normally distributed floating point variates (double precision only)

 //             these numbers are generated using the Ziggurat algorithm

 // init() -- does a one time initialization using a randomly generated seed. Subsequent calls will

 //           be ignored. There is also a version with a fixed seed.

 // new_rank() -- jump ahead in random number sequence for a different rank number. Mainly useful for

 //               forked threads.

 // get_seed() -- return the seed that was used.

 // print_seed() -- return the seed that was used as a string for printing.

 //

 class t_ran
 {
         // pool size in quadwords
         static const size_t ND = 2048;
         // size of the state in quadwords for a single xoroshiro128+ PRNG stream
         static const size_t SQ_XOROSHIRO128 = 2;
         // size of the state in quadwords for a single xoshiro256** PRNG stream
         static const size_t SQ_XOSHIRO256 = 4;

         bool p_lgInitialized; // checked by new_rank() before reseeding
         algo_prng p_algo;     // which algorithm is used as the underlying PRNG
         size_t p_sq;          // size of the state for the underlying PRNG in quadwords
         size_t p_npack;       // number of quadwords packed into a single SIMD register
         size_t p_ns;          // size of the state for a full SIMD register in quadwords
         uint64 p_s;           // the seed, as reported by get_seed() and print_seed()
         uint64* p_state;      // the state of the PRNG, released in the destructor

         // lookup tables used by normal(), indexed by an 8-bit random variate
         // they are not set up in this header
         const double* p_zigxd;
         const double* p_zigrd;
         const double* p_zige2d;

         // the routines below are implemented outside this header
         void p_init(uint64 s, int nRANK);
         void p_seed(uint64 s, int nRANK);
         uint64 p_generate_random_seed();
         uint64 p_random_seed();
         void p_xoroshiro128plus(uint64* pool, size_t size);
         void p_xoshiro256starstar(uint64* pool, size_t size);
         double p_ZigTailNormal(bool lgNegative);

         // fill arrays with random variates
         // NB NB -- the pool needs to be correctly aligned for SIMD access
         // NB NB -- the size needs to be a multiple of the SIMD vector size
         void p_u64(void* pool, size_t size);
         void p_dbl(void* pool, size_t size);
         void p_flt(void* pool, size_t size);
         void p_zig(void* pool, size_t size);

         ran_pool<uint8> p_pc;     // source for i7() and u8()
         ran_pool<uint16> p_ps;    // source for i15() and u16()
         ran_pool<uint32> p_pi;    // source for i31() and u32()
         ran_pool<uint64> p_pl;    // source for i63() and u64()
         ran_pool<double> p_pd;    // source for dbl(), and for rnm() if FLT_IS_DBL is defined
         ran_pool<sys_float> p_pf; // source for rnm() if FLT_IS_DBL is not defined
         ran_pool<double> p_zd;    // source for the first variate drawn in normal()
 public:
         // the signed variants below drop the lowest bit of the unsigned variate,
         // so the result is never negative

         /* integer random variate on the [0,0x7f] interval */
         int8 i7() { return int8(p_pc.next() >> 1); }
         /* integer random variate on the [0,0xff] interval */
         uint8 u8() { return p_pc.next(); }
         /* integer random variate on the [0,0x7fff] interval */
         int16 i15() { return int16(p_ps.next() >> 1); }
         /* integer random variate on the [0,0xffff] interval */
         uint16 u16() { return p_ps.next(); }
         /* integer random variate on the [0,0x7fffffff] interval */
         int32 i31() { return int32(p_pi.next() >> 1); }
         /* integer random variate on the [0,0xffffffff] interval */
         uint32 u32() { return p_pi.next(); }
         /* integer random variate on the [0,0x7fffffffffffffff] interval */
         int64 i63() { return int64(p_pl.next() >> 1); }
         /* integer random variate on the [0,0xffffffffffffffff] interval */
         uint64 u64() { return p_pl.next(); }
         /* double precision uniform random variate on the (0,1) interval */
         double dbl() { return p_pd.next(); }
         /* single precision uniform random variate on the (0,1) interval */
         realnum rnm()
         {
                 // draw from the pool whose element type matches the build's precision setting
 #ifdef FLT_IS_DBL
                 return p_pd.next();
 #else
                 return p_pf.next();
 #endif
         }
         /* generates a random number with normal distribution and unit standard deviation using Ziggurat */
         double normal()
         {
                 // rejection loop: keep drawing until one of the three exits below accepts
                 while( true )
                 {
                         double u = p_zd.next();
                         uint8 i = u8();
                         // common case: accept immediately when |u| is below the threshold for entry i
                         if( LIKELY(fabs(u) < p_zigrd[i]) )
                                 return u*p_zigxd[i];
                         // entry 0 is delegated to p_ZigTailNormal(), passing on the sign of u
                         if( UNLIKELY(i == 0) )
                                 return p_ZigTailNormal( u < 0. );
                         double x = u*p_zigxd[i];
                         // deliberately not called e2, that would shadow the function e2(double)
                         double gauss = exp( -0.5*pow2(x) );
                         // accept x if a uniform point between p_zige2d[i+1] and p_zige2d[i]
                         // falls below exp(-x^2/2), otherwise start over
                         if( p_zige2d[i+1] + dbl()*(p_zige2d[i]-p_zige2d[i+1]) < gauss )
                                 return x;
                 }
         }

         // initialize using a randomly generated seed and rank 0
         void init()
         {
                 uint64 s = p_generate_random_seed();
                 p_init(s, 0);
         }
         // initialize using the fixed seed s for rank nRANK
         void init(uint64 s, int nRANK)
         {
                 p_init(s, nRANK);
         }
         // reseed for a different rank number using the stored seed; init() must have been called
         void new_rank(int nRANK)
         {
                 ASSERT( p_lgInitialized );
                 p_seed(p_s, nRANK);
         }
         // return the stored seed
         uint64 get_seed() const { return p_s; }
         // return the stored seed as a string for printing: "PRNG seed: 0x" followed by
         // the seed as 16 zero-padded hexadecimal digits
         string print_seed() const
         {
                 ostringstream oss;
                 oss << "PRNG seed: 0x" << setw(16) << setfill('0') << hex << p_s;
                 return oss.str();
         }

         // algo selects the underlying PRNG; the constructor is implemented outside this header
         explicit t_ran(algo_prng algo);
         // the object owns p_state, so copying is disabled
         t_ran(const t_ran&) = delete;
         t_ran& operator= (const t_ran&) = delete;
         // release the PRNG state
         ~t_ran()
         {
                 posix_memalign_free(p_state);
         }
 };


 // the global PRNG object used throughout the code; it is instantiated in ran.cpp,
 // which is also where the underlying algorithm is chosen
 extern t_ran ran;


 #endif

t_ran::i31
int32 i31()
Definition: ran.h:190

t_ran::operator=
t_ran & operator=(const t_ran &)=delete

t_ran::p_zigrd
const double * p_zigrd
Definition: ran.h:154

ran_pool::p_pool
void * p_pool
Definition: ran.h:27

t_ran::i63
int64 i63()
Definition: ran.h:194

t_ran::p_npack
size_t p_npack
Definition: ran.h:148

LIKELY
#define LIKELY(x)
Definition: cpu.h:479

ran_pool::ran_pool
ran_pool()
Definition: ran.h:77

t_ran::p_pf
ran_pool< sys_float > p_pf
Definition: ran.h:178

algo_prng
algo_prng
Definition: ran.h:104

t_ran::p_xoshiro256starstar
void p_xoshiro256starstar(uint64 *pool, size_t size)
Definition: ran.cpp:294

PRNG_XOROSHIRO128PLUS
Definition: ran.h:104

t_ran::p_dbl
void p_dbl(void *pool, size_t size)
Definition: ran.cpp:315

t_ran::p_init
void p_init(uint64 s, int nRANK)
Definition: ran.cpp:586

ran_pool::~ran_pool
~ran_pool()
Definition: ran.h:86

t_ran::p_zigxd
const double * p_zigxd
Definition: ran.h:153

t_ran::rnm
realnum rnm()
Definition: ran.h:200

ran_pool::reset
void reset()
Definition: ran.h:62

t_ran::p_lgInitialized
bool p_lgInitialized
Definition: ran.h:145

t_ran::p_state
uint64 * p_state
Definition: ran.h:151

t_ran::ND
static const size_t ND
Definition: ran.h:140

t_ran::p_zige2d
const double * p_zige2d
Definition: ran.h:155

t_ran::p_pi
ran_pool< uint32 > p_pi
Definition: ran.h:175

ran
t_ran ran

ran_pool::p_rc
t_ran * p_rc
Definition: ran.h:32

t_ran::u8
uint8 u8()
Definition: ran.h:184

ran_pool::operator=
ran_pool & operator=(const ran_pool &)=delete

t_ran::~t_ran
~t_ran()
Definition: ran.h:251

t_ran::init
void init()
Definition: ran.h:226

t_ran::u32
uint32 u32()
Definition: ran.h:192

t_ran::p_xoroshiro128plus
void p_xoroshiro128plus(uint64 *pool, size_t size)
Definition: ran.cpp:289

ran_pool::p_next
T * p_next
Definition: ran.h:28

t_ran::print_seed
string print_seed() const
Definition: ran.h:241

realnum
float realnum
Definition: cddefines.h:127

t_ran::p_pc
ran_pool< uint8 > p_pc
Definition: ran.h:173

ran_pool
Definition: ran.h:25

t_ran::p_random_seed
uint64 p_random_seed()

t_ran::p_generate_random_seed
uint64 p_generate_random_seed()
Definition: ran.cpp:625

t_ran::p_u64
void p_u64(void *pool, size_t size)
Definition: ran.cpp:302

t_ran::p_flt
void p_flt(void *pool, size_t size)
Definition: ran.cpp:327

NULL
#define NULL
Definition: cddefines.h:115

t_ran::SQ_XOSHIRO256
static const size_t SQ_XOSHIRO256
Definition: ran.h:143

t_ran::p_pl
ran_pool< uint64 > p_pl
Definition: ran.h:176

t_ran::t_ran
t_ran(algo_prng algo)
Definition: ran.cpp:653

PRNG_XOSHIRO256STARSTAR
Definition: ran.h:104

t_ran::p_algo
algo_prng p_algo
Definition: ran.h:146

t_ran::u64
uint64 u64()
Definition: ran.h:196

posix_memalign_free
void posix_memalign_free(void *p)
Definition: cpu.h:143

t_ran::u16
uint16 u16()
Definition: ran.h:188

ran_pool::p_squad
size_t p_squad
Definition: ran.h:31

t_ran::normal
double normal()
Definition: ran.h:209

ASSERT
#define ASSERT(exp)
Definition: cddefines.h:637

t_ran::p_s
uint64 p_s
Definition: ran.h:150

t_ran::p_pd
ran_pool< double > p_pd
Definition: ran.h:177

pow2
T pow2(T a)
Definition: cddefines.h:987

ran_pool::init
void init(size_t s, t_ran *rc, t_ran_fun f)
Definition: ran.h:51

ran_pool::p_alloc
void p_alloc()
Definition: ran.h:35

t_ran::p_ZigTailNormal
double p_ZigTailNormal(bool lgNegative)
Definition: ran.cpp:571

t_ran::dbl
double dbl()
Definition: ran.h:198

UNLIKELY
#define UNLIKELY(x)
Definition: cpu.h:490

ran_pool::p_end
T * p_end
Definition: ran.h:29

ran_pool::p_size
size_t p_size
Definition: ran.h:30

t_ran::p_seed
void p_seed(uint64 s, int nRANK)
Definition: ran.cpp:609

t_ran::init
void init(uint64 s, int nRANK)
Definition: ran.h:231

t_ran::p_zig
void p_zig(void *pool, size_t size)
Definition: ran.cpp:339

e2
double e2(double x)
Definition: thirdparty.cpp:3100

t_ran::p_sq
size_t p_sq
Definition: ran.h:147

ran_pool::lgInitialized
bool lgInitialized() const
Definition: ran.h:66

t_ran
Definition: ran.h:137

ran_pool::p_update_pool
void p_update_pool()
Definition: ran.h:42

t_ran::i15
int16 i15()
Definition: ran.h:186

CD_ALIGN
#define CD_ALIGN
Definition: cpu.h:127

t_ran::p_zd
ran_pool< double > p_zd
Definition: ran.h:179

ran_pool::next
T next()
Definition: ran.h:70

t_ran::new_rank
void new_rank(int nRANK)
Definition: ran.h:235

t_ran::i7
int8 i7()
Definition: ran.h:182

ran_pool::p_fill
t_ran_fun p_fill
Definition: ran.h:33

t_ran::p_ps
ran_pool< uint16 > p_ps
Definition: ran.h:174

t_ran::p_ns
size_t p_ns
Definition: ran.h:149

t_ran::get_seed
uint64 get_seed() const
Definition: ran.h:240

t_ran::SQ_XOROSHIRO128
static const size_t SQ_XOROSHIRO128
Definition: ran.h:142

t_ran_fun
void(t_ran::* t_ran_fun)(void *p, size_t s)
Definition: ran.h:10