mattip
diff --git a/‎_randomgen/benchmark.py
Lines changed: 65 additions & 108 deletions b/‎_randomgen/benchmark.py
Lines changed: 65 additions & 108 deletions
diff --git a/‎_randomgen/doc/source/conf.py
Lines changed: 0 additions & 2 deletions b/‎_randomgen/doc/source/conf.py
Lines changed: 0 additions & 2 deletions
diff --git a/‎_randomgen/doc/source/performance.py
Lines changed: 8 additions & 8 deletions b/‎_randomgen/doc/source/performance.py
Lines changed: 8 additions & 8 deletions
diff --git a/‎_randomgen/randomgen/tests/test_numpy_mt19937.py
Lines changed: 10 additions & 6 deletions b/‎_randomgen/randomgen/tests/test_numpy_mt19937.py
Lines changed: 10 additions & 6 deletions
@@ -84,122 +84,67 @@ def timer_uniform():
     run_timer(dist, command, None, SETUP, 'Uniforms')
 
 
-def timer_8bit_bounded(max=95, use_masked=True):
-    min = 0
+def timer_bounded(bits=8, max=95, use_masked=True):
+    """
+    Timer for bounded unsigned integer values of a given bit width.
+
+    Parameters
+    ----------
+    bits : {8, 16, 32, 64}
+        Bit width of unsigned output type
+    max : int
+        Inclusive upper bound for range. Lower is always 0.  Must be < 2**bits.
+    use_masked : bool
+        If True, masking and rejection sampling is used to generate a random
+        number in an interval. If False, Lemire's algorithm is used if
+        available to generate a random number in an interval.
+
+    Notes
+    -----
+    Lemire's algorithm has improved performance when ``max + 1`` is not a
+    power of two.
+    """
+    if bits not in (8, 16, 32, 64):
+        raise ValueError('bits must be one of 8, 16, 32, 64.')
+    minimum = 0
 
     dist = 'random_uintegers'
 
-    # Note on performance of generating random numbers in an interval:
-    # use_masked=True : masking and rejection sampling is used to generate a random number in an interval.
-    # use_masked=False : Lemire's algorithm is used if available to generate a random number in an interval.
-    # Lemire's algorithm has improved performance when {max}+1 is not a power of two.
+    if use_masked:  # Use masking & rejection.
+        command = 'rg.randint({min}, {max}+1, 1000000, dtype=np.uint{bits}, use_masked=True)'
+    else:  # Use Lemire's algo.
+        command = 'rg.randint({min}, {max}+1, 1000000, dtype=np.uint{bits}, use_masked=False)'
 
-    if use_masked:
-        command = 'rg.randint({min}, {max}+1, 1000000, dtype=np.uint8, use_masked=True)'  # Use masking & rejection.
-    else:
-        command = 'rg.randint({min}, {max}+1, 1000000, dtype=np.uint8, use_masked=False)'  # Use Lemire's algo.
+    command = command.format(min=minimum, max=max, bits=bits)
 
-    command = command.format(min=min, max=max)
-
-    command_numpy = 'rg.randint({min}, {max}+1, 1000000, dtype=np.uint8)'
-    command_numpy = command_numpy.format(min=min, max=max)
+    command_numpy = 'rg.randint({min}, {max}+1, 1000000, dtype=np.uint{bits})'
+    command_numpy = command_numpy.format(min=minimum, max=max, bits=bits)
 
     run_timer(dist, command, command_numpy, SETUP,
-              '8-bit bounded unsigned integers (max={max}, use_masked={use_masked})'.format(max=max, use_masked=use_masked))
-
-
-def timer_16bit_bounded(max=1535, use_masked=True):
-    min = 0
-
-    dist = 'random_uintegers'
-
-    # Note on performance of generating random numbers in an interval:
-    # use_masked=True : masking and rejection sampling is used to generate a random number in an interval.
-    # use_masked=False : Lemire's algorithm is used if available to generate a random number in an interval.
-    # Lemire's algorithm has improved performance when {max}+1 is not a power of two.
-
-    if use_masked:
-        command = 'rg.randint({min}, {max}+1, 1000000, dtype=np.uint16, use_masked=True)'  # Use masking & rejection.
-    else:
-        command = 'rg.randint({min}, {max}+1, 1000000, dtype=np.uint16, use_masked=False)'  # Use Lemire's algo.
-
-    command = command.format(min=min, max=max)
-
-    command_numpy = 'rg.randint({min}, {max}+1, 1000000, dtype=np.uint16)'
-    command_numpy = command_numpy.format(min=min, max=max)
-
-    run_timer(dist, command, command_numpy, SETUP,
-              '16-bit bounded unsigned integers (max={max}, use_masked={use_masked})'.format(max=max, use_masked=use_masked))
+              '{bits}-bit bounded unsigned integers (max={max}, '
+              'use_masked={use_masked})'.format(max=max, use_masked=use_masked, bits=bits))
 
 
 def timer_32bit():
     info = np.iinfo(np.uint32)
-    min, max = info.min, info.max
+    minimum, maximum = info.min, info.max
     dist = 'random_uintegers'
     command = 'rg.random_uintegers(1000000, 32)'
     command_numpy = 'rg.randint({min}, {max}+1, 1000000, dtype=np.uint32)'
-    command_numpy = command_numpy.format(min=min, max=max)
+    command_numpy = command_numpy.format(min=minimum, max=maximum)
     run_timer(dist, command, command_numpy, SETUP, '32-bit unsigned integers')
 
 
-def timer_32bit_bounded(max=1535, use_masked=True):
-    min = 0
-
-    dist = 'random_uintegers'
-
-    # Note on performance of generating random numbers in an interval:
-    # use_masked=True : masking and rejection sampling is used to generate a random number in an interval.
-    # use_masked=False : Lemire's algorithm is used if available to generate a random number in an interval.
-    # Lemire's algorithm has improved performance when {max}+1 is not a power of two.
-
-    if use_masked:
-        command = 'rg.randint({min}, {max}+1, 1000000, dtype=np.uint32, use_masked=True)'  # Use masking & rejection.
-    else:
-        command = 'rg.randint({min}, {max}+1, 1000000, dtype=np.uint32, use_masked=False)'  # Use Lemire's algo.
-
-    command = command.format(min=min, max=max)
-
-    command_numpy = 'rg.randint({min}, {max}+1, 1000000, dtype=np.uint32)'
-    command_numpy = command_numpy.format(min=min, max=max)
-
-    run_timer(dist, command, command_numpy, SETUP,
-              '32-bit bounded unsigned integers (max={max}, use_masked={use_masked})'.format(max=max, use_masked=use_masked))
-
-
 def timer_64bit():
     info = np.iinfo(np.uint64)
-    min, max = info.min, info.max
+    minimum, maximum = info.min, info.max
     dist = 'random_uintegers'
     command = 'rg.random_uintegers(1000000)'
     command_numpy = 'rg.randint({min}, {max}+1, 1000000, dtype=np.uint64)'
-    command_numpy = command_numpy.format(min=min, max=max)
+    command_numpy = command_numpy.format(min=minimum, max=maximum)
     run_timer(dist, command, command_numpy, SETUP, '64-bit unsigned integers')
 
 
-def timer_64bit_bounded(max=1535, use_masked=True):
-    min = 0
-
-    dist = 'random_uintegers'
-
-    # Note on performance of generating random numbers in an interval:
-    # use_masked=True : masking and rejection sampling is used to generate a random number in an interval.
-    # use_masked=False : Lemire's algorithm is used if available to generate a random number in an interval.
-    # Lemire's algorithm has improved performance when {max}+1 is not a power of two.
-
-    if use_masked:
-        command = 'rg.randint({min}, {max}+1, 1000000, dtype=np.uint64, use_masked=True)'  # Use masking & rejection.
-    else:
-        command = 'rg.randint({min}, {max}+1, 1000000, dtype=np.uint64, use_masked=False)'  # Use Lemire's algo.
-
-    command = command.format(min=min, max=max)
-
-    command_numpy = 'rg.randint({min}, {max}+1, 1000000, dtype=np.uint64)'
-    command_numpy = command_numpy.format(min=min, max=max)
-
-    run_timer(dist, command, command_numpy, SETUP,
-              '64-bit bounded unsigned integers (max={max}, use_masked={use_masked})'.format(max=max, use_masked=use_masked))
-
-
 def timer_normal_zig():
     dist = 'standard_normal'
     command = 'rg.standard_normal(1000000)'
@@ -210,35 +155,47 @@ def timer_normal_zig():
 
 if __name__ == '__main__':
     import argparse
+
     parser = argparse.ArgumentParser()
-    parser.add_argument('--full', dest='full', action='store_true')
+    parser.add_argument('-f', '--full',
+                        help='Run benchmarks for a wide range of distributions.'
+                             ' If not provided, only tests the production of '
+                             'uniform values.',
+                        dest='full', action='store_true')
+    parser.add_argument('-bi', '--bounded-ints',
+                        help='Include benchmark coverage of the bounded '
+                             'integer generators in a full run.',
+                        dest='bounded_ints', action='store_true')
     args = parser.parse_args()
 
     timer_uniform()
     if args.full:
         timer_raw()
-        timer_8bit_bounded(use_masked=True)
-        timer_8bit_bounded(max=64, use_masked=False)  # Worst case for Numpy.
-        timer_8bit_bounded(max=95, use_masked=False)  # Typ. avrg. case for Numpy.
-        timer_8bit_bounded(max=127, use_masked=False)  # Best case for Numpy.
+        if args.bounded_ints:
+            timer_bounded(use_masked=True)
+            timer_bounded(max=64, use_masked=False)  # Worst case for Numpy.
+            timer_bounded(max=95, use_masked=False)  # Typ. avrg. case for Numpy.
+            timer_bounded(max=127, use_masked=False)  # Best case for Numpy.
 
-        timer_16bit_bounded(use_masked=True)
-        timer_16bit_bounded(max=1024, use_masked=False)  # Worst case for Numpy.
-        timer_16bit_bounded(max=1535, use_masked=False)  # Typ. avrg. case for Numpy.
-        timer_16bit_bounded(max=2047, use_masked=False)  # Best case for Numpy.
+            timer_bounded(16, use_masked=True)
+            timer_bounded(16, max=1024, use_masked=False)  # Worst case for Numpy.
+            timer_bounded(16, max=1535, use_masked=False)  # Typ. avrg. case for Numpy.
+            timer_bounded(16, max=2047, use_masked=False)  # Best case for Numpy.
 
         timer_32bit()
 
-        timer_32bit_bounded(use_masked=True)
-        timer_32bit_bounded(max=1024, use_masked=False)  # Worst case for Numpy.
-        timer_32bit_bounded(max=1535, use_masked=False)  # Typ. avrg. case for Numpy.
-        timer_32bit_bounded(max=2047, use_masked=False)  # Best case for Numpy.
+        if args.bounded_ints:
+            timer_bounded(32, use_masked=True)
+            timer_bounded(32, max=1024, use_masked=False)  # Worst case for Numpy.
+            timer_bounded(32, max=1535, use_masked=False)  # Typ. avrg. case for Numpy.
+            timer_bounded(32, max=2047, use_masked=False)  # Best case for Numpy.
 
         timer_64bit()
 
-        timer_64bit_bounded(use_masked=True)
-        timer_64bit_bounded(max=1024, use_masked=False)  # Worst case for Numpy.
-        timer_64bit_bounded(max=1535, use_masked=False)  # Typ. avrg. case for Numpy.
-        timer_64bit_bounded(max=2047, use_masked=False)  # Best case for Numpy.
+        if args.bounded_ints:
+            timer_bounded(64, use_masked=True)
+            timer_bounded(64, max=1024, use_masked=False)  # Worst case for Numpy.
+            timer_bounded(64, max=1535, use_masked=False)  # Typ. avrg. case for Numpy.
+            timer_bounded(64, max=2047, use_masked=False)  # Best case for Numpy.
 
         timer_normal_zig()
@@ -15,9 +15,7 @@
 # import os
 # import sys
 # sys.path.insert(0, os.path.abspath('.'))
-from distutils.version import LooseVersion
 import guzzle_sphinx_theme
-# import sphinx_rtd_theme
 import randomgen
 
 # -- Project information -----------------------------------------------------
 
@@ -1,11 +1,13 @@
+from timeit import repeat
+
 import numpy as np
-from timeit import timeit, repeat
 import pandas as pd
 
 from randomgen import MT19937, DSFMT, ThreeFry, PCG64, Xoroshiro128, \
-    Xorshift1024, Philox
+    Xorshift1024, Philox, Xoshiro256StarStar, Xoshiro512StarStar
 
-PRNGS = [DSFMT, MT19937, Philox, PCG64, ThreeFry, Xoroshiro128, Xorshift1024]
+PRNGS = [DSFMT, MT19937, Philox, PCG64, ThreeFry, Xoroshiro128, Xorshift1024,
+         Xoshiro256StarStar, Xoshiro512StarStar]
 
 funcs = {'32-bit Unsigned Ints': 'random_uintegers(size=1000000,bits=32)',
          '64-bit Unsigned Ints': 'random_uintegers(size=1000000,bits=32)',
@@ -32,11 +34,10 @@
         t = repeat(test.format(func=funcs[key]),
                    setup.format(prng=prng().__class__.__name__),
                    number=1, repeat=3)
-        col[key]= 1000 * min(t)
+        col[key] = 1000 * min(t)
     col = pd.Series(col)
     table[prng().__class__.__name__] = col
 
-
 npfuncs = {}
 npfuncs.update(funcs)
 npfuncs['32-bit Unsigned Ints'] = 'randint(2**32,dtype="uint32",size=1000000)'
@@ -54,7 +55,6 @@
     col[key] = 1000 * min(t)
 table['NumPy'] = pd.Series(col)
 
-
 table = pd.DataFrame(table)
 table = table.reindex(table.mean(1).sort_values().index)
 order = np.log(table).mean().sort_values().index
@@ -63,11 +63,11 @@
 table = table.T
 print(table.to_csv(float_format='%0.1f'))
 
-rel = table / (table.iloc[:,[0]].values @ np.ones((1,8)))
+rel = table / (table.iloc[:, [0]].values @ np.ones((1, 8)))
 rel.pop(rel.columns[0])
 rel = rel.T
 rel['Overall'] = np.exp(np.log(rel).mean(1))
 rel *= 100
 rel = np.round(rel)
 rel = rel.T
-print(rel.to_csv(float_format='%0d'))
+print(rel.to_csv(float_format='%0d'))
@@ -437,27 +437,31 @@ def test_randint(self):
         assert_array_equal(actual, desired)
 
     def test_randint_masked(self):
-        """ Test masked rejection sampling algorithm to generate array of uint32 in an interval. """
+        # Test masked rejection sampling algorithm to generate array of
+        # uint32 in an interval.
         mt19937.seed(self.seed)
-        actual = mt19937.randint(0, 99, size=(3, 2), dtype=np.uint32, use_masked=True)
+        actual = mt19937.randint(0, 99, size=(3, 2), dtype=np.uint32,
+                                 use_masked=True)
         desired = np.array([[2, 47],
                             [12, 51],
                             [33, 43]], dtype=np.uint32)
         assert_array_equal(actual, desired)
 
     def test_randint_lemire_32(self):
-        """ Test lemire algorithm to generate array of uint32 in an interval. """
+        # Test lemire algorithm to generate array of uint32 in an interval.
         mt19937.seed(self.seed)
-        actual = mt19937.randint(0, 99, size=(3, 2), dtype=np.uint32, use_masked=False)
+        actual = mt19937.randint(0, 99, size=(3, 2), dtype=np.uint32,
+                                 use_masked=False)
         desired = np.array([[61, 33],
                             [58, 14],
                             [87, 23]], dtype=np.uint32)
         assert_array_equal(actual, desired)
 
     def test_randint_lemire_64(self):
-        """ Test lemire algorithm to generate array of uint64 in an interval. """
+        # Test lemire algorithm to generate array of uint64 in an interval.
         mt19937.seed(self.seed)
-        actual = mt19937.randint(0, 99 + 0xFFFFFFFFF, size=(3, 2), dtype=np.uint64, use_masked=False)
+        actual = mt19937.randint(0, 99 + 0xFFFFFFFFF, size=(3, 2),
+                                 dtype=np.uint64, use_masked=False)
         desired = np.array([[42523252834, 40656066204],
                             [61069871386, 61274051182],
                             [31443797706, 53476677934]], dtype=np.uint64)