[Teem-commit] SF.net SVN: teem:[7147] teem/trunk/src/air

SourceForge Headquarters 1320 Columbia Street Suite 310 San Diego, CA 92101 +1 (858) 422-6466

Revision: 7147
          http://sourceforge.net/p/teem/code/7147
Author:   kindlmann
Date:     2023-08-04 17:18:29 +0000 (Fri, 04 Aug 2023)
Log Message:
-----------
starting BUT NOT YET TESTED Jenkins Small Fast JSF RNG

Modified Paths:
--------------
    teem/trunk/src/air/CMakeLists.txt
    teem/trunk/src/air/GNUmakefile
    teem/trunk/src/air/air.h

Added Paths:
-----------
    teem/trunk/src/air/randJSF.c

Modified: teem/trunk/src/air/CMakeLists.txt
===================================================================

--- teem/trunk/src/air/CMakeLists.txt	2023-08-04 16:52:19 UTC (rev 7146)
+++ teem/trunk/src/air/CMakeLists.txt	2023-08-04 17:18:29 UTC (rev 7147)
@@ -14,6 +14,7 @@
   parseAir.c
   privateAir.h
   randMT.c
+  randJSF.c
   sane.c
   string.c
   threadAir.c

Modified: teem/trunk/src/air/GNUmakefile
===================================================================
--- teem/trunk/src/air/GNUmakefile	2023-08-04 16:52:19 UTC (rev 7146)
+++ teem/trunk/src/air/GNUmakefile	2023-08-04 17:18:29 UTC (rev 7147)
@@ -47,11 +47,11 @@
 $(L).NEED =
 $(L).PUBLIC_HEADERS = air.h
 $(L).PRIVATE_HEADERS = privateAir.h
-$(L).OBJS = 754.o randMT.o array.o miscAir.o parseAir.o math.o \
+$(L).OBJS = 754.o randMT.o randJSF.o array.o miscAir.o parseAir.o math.o \
 	endianAir.o dio.o mop.o enum.o sane.o string.o threadAir.o heap.o
 $(L).TESTS = test/floatprint test/doubleprint test/tok \
-	test/tmop test/tline test/fp test/trand test/tmisc test/tdio \
-        test/bessy test/tarr test/texp test/logrice test/tprint
+	test/tmop test/tline test/fp test/trand test/trandJSF test/tmisc test/tdio \
+  test/bessy test/tarr test/texp test/logrice test/tprint
 
 $(L).NEED_QNANHIBIT = true
 $(L).NEED_DIO = true

Modified: teem/trunk/src/air/air.h
===================================================================
--- teem/trunk/src/air/air.h	2023-08-04 16:52:19 UTC (rev 7146)
+++ teem/trunk/src/air/air.h	2023-08-04 17:18:29 UTC (rev 7147)
@@ -440,6 +440,23 @@
 AIR_EXPORT double airDrandMT(void);
 AIR_EXPORT int airRandMTSanity(void);
 
+/* "Jenkins Small Fast" (psuedo)random number generator */
+typedef struct {
+  unsigned int a, b, c, d;
+} airJSFRand;
+/* randJSF.c */
+AIR_EXPORT airJSFRand *airJSFRandNew(unsigned int seed);
+AIR_EXPORT airJSFRand *airJSFRandNix(airJSFRand *jsf);
+AIR_EXPORT void airJSFRandSeed(airJSFRand *jsf, unsigned int seed);
+AIR_EXPORT unsigned int airJSFRandVal(airJSFRand *jsf);
+AIR_EXPORT unsigned int airJSFRandValMod(airJSFRand *jsf, unsigned int N);
+AIR_EXPORT float airJSFRandUni_f(airJSFRand *jsf);   /* [0,1) */
+AIR_EXPORT double airJSFRandUni_d(airJSFRand *jsf);  /* [0,1) */
+AIR_EXPORT float airJSFRandBiUni_f(airJSFRand *jsf); /* (-1,1) */
+AIR_EXPORT float airJSFRandNormal_f(airJSFRand *jsf);
+AIR_EXPORT void airJSFRandNormal2_f(airJSFRand *jsf, float val[2]);
+AIR_EXPORT int airJSFRandSanity(void);
+
 /* ---- END non-NrrdIO */
 
 /*

Added: teem/trunk/src/air/randJSF.c
===================================================================
--- teem/trunk/src/air/randJSF.c	                        (rev 0)
+++ teem/trunk/src/air/randJSF.c	2023-08-04 17:18:29 UTC (rev 7147)
@@ -0,0 +1,386 @@
+/*
+  Teem: Tools to process and visualize scientific data and images
+  Copyright (C) 2009--2023  University of Chicago
+  Copyright (C) 2005--2008  Gordon Kindlmann
+  Copyright (C) 1998--2004  University of Utah
+
+  This library is free software; you can redistribute it and/or modify it under the terms
+  of the GNU Lesser General Public License (LGPL) as published by the Free Software
+  Foundation; either version 2.1 of the License, or (at your option) any later version.
+  The terms of redistributing and/or modifying this software also include exceptions to
+  the LGPL that facilitate static linking.
+
+  This library is distributed in the hope that it will be useful, but WITHOUT ANY
+  WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A
+  PARTICULAR PURPOSE.  See the GNU Lesser General Public License for more details.
+
+  You should have received a copy of the GNU Lesser General Public License along with
+  this library; if not, write to Free Software Foundation, Inc., 51 Franklin Street,
+  Fifth Floor, Boston, MA 02110-1301 USA
+*/
+#include "air.h"
+#include "privateAir.h"
+
+/*
+The "Jenkins Small Fast" (JSF) pseudo-random number generator is from Bob Jenkins,
+http://burtleburtle.net/bob/rand/smallprng.html  (circa 2009 ?)
+who called it "A small noncryptographic PRNG", but didn't provide a tidier name.
+GLK learned about this from Melissa O'Neill's 2018 writing here
+https://www.pcg-random.org/posts/bob-jenkins-small-prng-passes-practrand.html
+where she notes how other have identified it as "JSF" in another RNG library.
+The JSF name is used by others as well, e.g.
+https://en.wikipedia.org/wiki/List_of_random_number_generators
+*/
+
+/*
+These #defines allow the (following) original code for "ranval" and "raninit" to BE the
+definition of Teem's airJSFRandVal and airJSFRandSeed, respectively, and for "randctx" to
+refer to the airJSFRand struct which has been already and identically defined in air.h
+*/
+#define ranval  airJSFRandVal
+#define raninit airJSFRandSeed
+#define ranctx  airJSFRand
+
+/* the following (public-domain) code is copied verbatim from Jenkins' web page,
+except for two changes:
+1) "typedef unsigned long int u4;" --> "typedef unsigned int u4;"
+   airRandJSFSanity() ensures that sizeof(unsigned int) == 4
+2) commenting out the ranctx == airJSFRand struct definition */
+
+/* clang-format off */
+typedef unsigned int u4;
+/* typedef struct ranctx { u4 a; u4 b; u4 c; u4 d; } ranctx; */
+
+#define rot(x,k) (((x)<<(k))|((x)>>(32-(k))))
+u4 ranval( ranctx *x ) {
+    u4 e = x->a - rot(x->b, 27);
+    x->a = x->b ^ rot(x->c, 17);
+    x->b = x->c + x->d;
+    x->c = x->d + e;
+    x->d = e + x->a;
+    return x->d;
+}
+
+void raninit( ranctx *x, u4 seed ) {
+    u4 i;
+    x->a = 0xf1ea5eed, x->b = x->c = x->d = seed;
+    for (i=0; i<20; ++i) {
+        (void)ranval(x);
+    }
+}
+/* clang-format on */
+#undef rot
+
+airJSFRand *
+airJSFRandNew(unsigned int seed) {
+  airJSFRand *jsf;
+  jsf = malloc(sizeof(airJSFRand));
+  airJSFRandSeed(jsf, seed); /* == "raninit" above */
+  return jsf;
+}
+
+airJSFRand *
+airJSFRandNix(airJSFRand *jsf) {
+  return airFree(jsf);
+}
+
+unsigned int
+airJSFRandValMod(airJSFRand *jsf, unsigned int N) {
+  unsigned int cap, val;
+  if (!N) {
+    /* no specific range requested; so provide val in range [0, UINT_MAX] */
+    return ranval(jsf);
+  }
+  /* else want values in range [0, N-1].
+     Set cap to biggest multiple of N that fits in a uint32 */
+  cap = 0xffffffff;
+  cap -= cap % N;
+  /* uniformly sample the remainders mod N by generating uints until less than cap */
+  do {
+    val = ranval(jsf);
+  } while (val >= cap);
+  /* return result mod N */
+  return val % N;
+}
+
+int
+airJSFRandSanity(void) {
+  int sane = 0;
+  airJSFRand jsf;
+  if (4 != sizeof(unsigned int)) {
+    return 0;
+  }
+  airJSFRandSeed(&jsf, 2600);
+  sane = (3114645624 == airJSFRandVal(&jsf) && /* */
+          580265137 == airJSFRandVal(&jsf) &&  /* */
+          3377642734 == airJSFRandVal(&jsf) && /* */
+          630323219 == airJSFRandVal(&jsf) &&  /* */
+          3984528821 == airJSFRandVal(&jsf) && /* */
+          849682424 == airJSFRandVal(&jsf) &&  /* */
+          3735540612 == airJSFRandVal(&jsf) && /* */
+          2696920995 == airJSFRandVal(&jsf) && /* */
+          155857509 == airJSFRandVal(&jsf) &&  /* */
+          1578235471 == airJSFRandVal(&jsf));
+  return sane;
+}
+
+/******************************************************************************
+ ******************************************************************************
+ End of basic random number generation, start of floating-point specific stuff
+ ******************************************************************************
+ ******************************************************************************/
+
+/* airJSFRandUni_f,airJSFRandUni_d functions are for accurately sampling floats,doubles
+between 0 and 1, making sure that it is possible for all finite values in that range to
+be generated, which is NOT true of the naive approach of dividing some int in [0,N-1] by
+N. Random values really close to 0 turn into (via the RandNormal functions below) samples
+far into the tails of the Gaussian.
+
+The idea for these is described in Section 3.1 of:
+
+    David B. Thomas, Wayne Luk, Philip H.W. Leong, and John D. Villasenor.
+    Gaussian random number generators. ACM Comput. Surv. 39, 4, Article 11
+    (November 2007). DOI=http://dx.doi.org/10.1145/1287620.1287622
+
+  which is also the same basic idea as Taylor Campbell describes here:
+
+    http://mumble.net/~campbell/2014/04/28/uniform-random-float
+    http://mumble.net/~campbell/2014/04/28/random_real.c
+
+Essentially: the probability of returning a float X should be proportional to the width
+of the interval containing all the reals closer to X than any other float, which is
+(except when the fraction field is all zeros) simply the ulp(X), or the distance to the
+next representable float.  In IEEE754 the value of the exponent field determines the ulp,
+and the ulp is halved by decrementing the exponent.  Starting with the highest possible
+exponent for values below 1 (that is, the bias minus 1), a stream of random bits
+determines whether to decrement the exponent, stopping when a 1 bit is seen. The ulp
+within the denormals is the same as for the lowest normal.
+*/
+
+/* https://en.wikipedia.org/wiki/Find_first_set */
+static unsigned int
+uint32_clz(unsigned int nn) {
+  /* HEY should figure out a configure-time test for having __builtin_clz */
+#if 0
+  return __builtin_clz(nn);
+#else
+  unsigned int ret = 0;
+  if (!(nn & 0xFFFF0000)) {
+    ret += 16;
+    nn <<= 16;
+  }
+  if (!(nn & 0xFF000000)) {
+    ret += 8;
+    nn <<= 8;
+  }
+  if (!(nn & 0xF0000000)) {
+    ret += 4;
+    nn <<= 4;
+  }
+  if (!(nn & 0xC0000000)) {
+    ret += 2;
+    nn <<= 2;
+  }
+  if (!(nn & 0x80000000)) {
+    ret += 1;
+  }
+  return ret;
+#endif
+}
+
+#if 0
+static unsigned int
+uint64_clz(airULLong nn) {
+#  if 0
+  /* HEY should figure out a configure-time test for having __builtin_clz */
+  return __builtin_clzll(nn);
+#  else
+  unsigned int ret = 0;
+  if (!(nn & 0xFFFFFFFF00000000)) {
+    ret += 32;
+    nn <<= 32;
+  }
+  if (!(nn & 0xFFFF000000000000)) {
+    ret += 16;
+    nn <<= 16;
+  }
+  if (!(nn & 0xFF00000000000000)) {
+    ret += 8;
+    nn <<= 8;
+  }
+  if (!(nn & 0xF000000000000000)) {
+    ret += 4;
+    nn <<= 4;
+  }
+  if (!(nn & 0xC000000000000000)) {
+    ret += 2;
+    nn <<= 2;
+  }
+  if (!(nn & 0x8000000000000000)) {
+    ret += 1;
+  }
+  return ret;
+#  endif
+}
+#endif
+
+float
+airJSFRandUni_f(airJSFRand *rng) {
+  unsigned int expo = 126; /* one less than bias => values in [0.5,1) */
+  unsigned int nz;         /* number of leading zeros seen */
+  unsigned int rnd;
+  airFloat ret;
+
+  rnd = airJSFRandVal(rng);
+  while (!rnd && expo > 32) {
+    /* got 32 bits of zeros (!) and can decrement expo by 32; try again */
+    expo -= 32;
+    rnd = airJSFRandVal(rng);
+  }
+  /* possible (though unlikely) to leave loop with expo <= 32 and rnd == 0,
+     and builtin clz(0) is undefined, so need extra "rnd ?" check here */
+  nz = rnd ? uint32_clz(rnd) : 32;
+  /* either we saw a 1 before expo hits zero, or not, in which case
+     we're into the denormals (expo == 0), which is fine */
+  expo = nz > expo ? 0 : expo - nz;
+  /* # zero bits has determined expo; now determine frac */
+  if (nz > 8) {
+    /* there are less then 32 - 1 - 8 = 23 random bits remaining (the
+       first 1 after the leading 0s does not get to be in fraction)
+       so need to get more random bits for fraction */
+    rnd = airJSFRandVal(rng);
+  }
+  ret.i = (expo << 23) | (rnd & 0x7fffff);
+  return ret.f;
+}
+
+float
+airJSFRandBiUni_f(airJSFRand *rng) {
+  /* HEY copy-pasta (minus comments) from above,
+  but now we use more bit of randomness to set the sign */
+  unsigned int expo = 126;
+  unsigned int nz;
+  unsigned int rnd;
+  airFloat ret;
+
+  rnd = airJSFRandVal(rng);
+  while (!rnd && expo > 32) {
+    expo -= 32;
+    rnd = airJSFRandVal(rng);
+  }
+  nz = rnd ? uint32_clz(rnd) : 32;
+  expo = nz > expo ? 0 : expo - nz;
+  if (nz > 7) { /* vs 8 above */
+    rnd = airJSFRandVal(rng);
+  }
+  ret.i = ((rnd & 0x800000) << 8) | (expo << 23) | (rnd & 0x7fffff);
+  return ret.f;
+}
+
+#if 0
+/* for accessing bits of a IEEE754 double
+ 1-bit sign, 11-bit expo with bias=1023, 52-bit frac
+ 6666555555555544444444443333333333222222222211111111110000000000
+ 3210987654321098765432109876543210987654321098765432109876543210
+ seeeeeeeeeeeffffffffffffffffffffffffffffffffffffffffffffffffffff
+*/
+typedef union {
+  uint64_t ii;
+  double dd;
+} empcg_double;
+
+double
+empcg64_urand(empcg64_state_t *rng) {
+  unsigned int expo = 1022u; /* one less than bias */
+  uint64_t rnd = empcg64_random(rng);
+  while (!rnd && expo > 64u) {
+    expo -= 64u;
+    rnd = empcg64_random(rng);
+  }
+  unsigned int nz = rnd ? empcg64_clz(rnd) : 64u;
+  expo = nz > expo ? 0 : expo - nz;
+  if (nz > 11u) {
+    /* there are less then 64 - 1 - 11 = 52 random bits remaining */
+    rnd = empcg64_random(rng);
+  }
+  empcg_double ret = {.ii = (((uint64_t)expo) << 52) | (rnd & 0xfffffffffffff)};
+  return ret.dd;
+}
+
+double
+empcg64_sgn_urand(empcg64_state_t *rng) {
+  unsigned int expo = 1022;
+  uint64_t rnd = empcg64_random(rng);
+  while (!rnd && expo > 64u) {
+    expo -= 64u;
+    rnd = empcg64_random(rng);
+  }
+  unsigned int nz = rnd ? empcg64_clz(rnd) : 64u;
+  expo = nz > expo ? 0 : expo - nz;
+  if (nz > 10u) {
+    rnd = empcg64_random(rng);
+  }
+  empcg_double ret = {.ii = ((rnd & 0x10000000000000) << 11) | (((uint64_t)expo) << 52)
+                          | (rnd & 0xfffffffffffff)};
+  return ret.dd;
+}
+#endif
+
+/* Polar Box–Muller
+https://en.wikipedia.org/wiki/Box%E2%80%93Muller_transform#Polar_form
+which generates two values at once */
+void
+airJSFRandNormal2_f(airJSFRand *rng, float val[2]) {
+  float xx, yy, rr;
+  do {
+    xx = airJSFRandBiUni_f(rng);
+    yy = airJSFRandBiUni_f(rng);
+    rr = xx * xx + yy * yy;
+  } while (!rr || rr >= 1);
+  rr = sqrtf((-2 * logf(rr)) / rr);
+  val[0] = xx * rr;
+  val[1] = yy * rr;
+  return;
+}
+
+/* If you really only want one value */
+float
+airJSFRandNormal_f(airJSFRand *rng) {
+  float xx, yy, rr;
+  do {
+    xx = airJSFRandBiUni_f(rng);
+    yy = airJSFRandBiUni_f(rng);
+    rr = xx * xx + yy * yy;
+  } while (!rr || rr >= 1);
+  rr = sqrtf((-2 * logf(rr)) / rr);
+  /* sum of two normals has variance 2 or stdv sqrt(2) */
+  return rr * (xx + yy) * 0.7071067811865475244f;
+}
+
+#if 0
+double
+empcg64_nrand(empcg64_state_t *rng) {
+  double xx, yy, rr;
+  do {
+    xx = empcg64_sgn_urand(rng);
+    yy = empcg64_sgn_urand(rng);
+    rr = xx * xx + yy * yy;
+  } while (!rr || rr >= 1);
+  rr = sqrt((-2 * log(rr)) / rr);
+  return rr * (xx + yy) * 0.7071067811865475244008;
+}
+
+void
+empcg64_nrand2(empcg64_state_t *rng, double *vv) {
+  double xx, yy, rr;
+  do {
+    xx = empcg64_sgn_urand(rng);
+    yy = empcg64_sgn_urand(rng);
+    rr = xx * xx + yy * yy;
+  } while (!rr || rr >= 1);
+  rr = sqrt((-2 * log(rr)) / rr);
+  vv[0] = xx * rr;
+  vv[1] = yy * rr;
+  return;
+}
+#endif

This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site.