/*
 * Copyright © 2012 Siarhei Siamashka <siarhei.siamashka@gmail.com>
 *
 * Based on the public domain implementation of small noncryptographic PRNG
 * authored by Bob Jenkins: http://burtleburtle.net/bob/rand/smallprng.html
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 * DEALINGS IN THE SOFTWARE.
 */
2614b11b2bSmrg
2714b11b2bSmrg#ifndef __UTILS_PRNG_H__
2814b11b2bSmrg#define __UTILS_PRNG_H__
2914b11b2bSmrg
/*
 * This file provides a fast SIMD-optimized noncryptographic PRNG (pseudorandom
 * number generator), with the output good enough to pass "Big Crush" tests
 * from TestU01 (http://en.wikipedia.org/wiki/TestU01).
 *
 * SIMD code uses http://gcc.gnu.org/onlinedocs/gcc/Vector-Extensions.html
 * which is a GCC specific extension. There is also a slower alternative
 * code path, which should work with any C compiler.
 *
 * The "prng_t" structure keeps the internal state of the random number
 * generator. It is possible to have multiple instances of the random number
 * generator active at the same time; in this case each of them needs to have
 * its own "prng_t". All the functions take a pointer to "prng_t"
 * as the first argument.
 *
 * Functions:
 *
 * ----------------------------------------------------------------------------
 * void prng_srand_r (prng_t *prng, uint32_t seed);
 *
 * Initialize the pseudorandom number generator. The sequence of pseudorandom
 * numbers is deterministic and only depends on "seed". Any two generators
 * initialized with the same seed will produce exactly the same sequence.
 *
 * ----------------------------------------------------------------------------
 * uint32_t prng_rand_r (prng_t *prng);
 *
 * Generate a single uniformly distributed 32-bit pseudorandom value.
 *
 * ----------------------------------------------------------------------------
 * void prng_randmemset_r (prng_t                  *prng,
 *                         void                    *buffer,
 *                         size_t                   size,
 *                         prng_randmemset_flags_t  flags);
 *
 * Fills the memory buffer "buffer" with "size" bytes of pseudorandom data.
 * The "flags" argument may be used to tweak some statistical properties:
 *    RANDMEMSET_MORE_00       - set ~25% of bytes to 0x00
 *    RANDMEMSET_MORE_FF       - set ~25% of bytes to 0xFF
 *    RANDMEMSET_MORE_00000000 - ~25% chance for 0x00000000 clusters
 *    RANDMEMSET_MORE_FFFFFFFF - ~25% chance for 0xFFFFFFFF clusters
 * The flags can be combined. This allows a bit better simulation of typical
 * pixel data, which normally contains a lot of fully transparent or fully
 * opaque pixels.
 */
7314b11b2bSmrg
7414b11b2bSmrg#ifdef HAVE_CONFIG_H
7514b11b2bSmrg#include <pixman-config.h>
7614b11b2bSmrg#endif
7714b11b2bSmrg
7814b11b2bSmrg#include "pixman-private.h"
7914b11b2bSmrg
8014b11b2bSmrg/*****************************************************************************/
8114b11b2bSmrg
#ifdef HAVE_GCC_VECTOR_EXTENSIONS
/*
 * 16-byte vector types based on the GCC vector extension:
 * uint32x4 holds four 32-bit lanes, uint8x16 holds sixteen 8-bit lanes.
 */
typedef uint32_t uint32x4 __attribute__ ((vector_size(16)));
typedef uint8_t  uint8x16 __attribute__ ((vector_size(16)));
#endif
8614b11b2bSmrg
/*
 * State of one scalar generator: four 32-bit words which are all updated
 * on every step performed by smallprng_rand_r().
 */
typedef struct
{
    uint32_t a, b, c, d;
} smallprng_t;
9114b11b2bSmrg
9214b11b2bSmrgtypedef struct
9314b11b2bSmrg{
9414b11b2bSmrg#ifdef HAVE_GCC_VECTOR_EXTENSIONS
9514b11b2bSmrg    uint32x4 a, b, c, d;
9614b11b2bSmrg#else
9714b11b2bSmrg    smallprng_t p1, p2, p3, p4;
9814b11b2bSmrg#endif
9914b11b2bSmrg    smallprng_t p0;
10014b11b2bSmrg} prng_t;
10114b11b2bSmrg
/*
 * 16 bytes of generator output, accessible as bytes (b) or as 32-bit
 * words (w). When HAVE_GCC_VECTOR_EXTENSIONS is defined the same storage
 * can also be accessed through the vector views vb and vw.
 */
typedef union
{
    uint8_t  b[16];
    uint32_t w[4];
#ifdef HAVE_GCC_VECTOR_EXTENSIONS
    uint8x16 vb;
    uint32x4 vw;
#endif
} prng_rand_128_data_t;
11114b11b2bSmrg
11214b11b2bSmrg/*****************************************************************************/
11314b11b2bSmrg
11414b11b2bSmrgstatic force_inline uint32_t
11514b11b2bSmrgsmallprng_rand_r (smallprng_t *x)
11614b11b2bSmrg{
11714b11b2bSmrg    uint32_t e = x->a - ((x->b << 27) + (x->b >> (32 - 27)));
11814b11b2bSmrg    x->a = x->b ^ ((x->c << 17) ^ (x->c >> (32 - 17)));
11914b11b2bSmrg    x->b = x->c + x->d;
12014b11b2bSmrg    x->c = x->d + e;
12114b11b2bSmrg    x->d = e + x->a;
12214b11b2bSmrg    return x->d;
12314b11b2bSmrg}
12414b11b2bSmrg
12514b11b2bSmrg/* Generate 4 bytes (32-bits) of random data */
12614b11b2bSmrgstatic force_inline uint32_t
12714b11b2bSmrgprng_rand_r (prng_t *x)
12814b11b2bSmrg{
12914b11b2bSmrg    return smallprng_rand_r (&x->p0);
13014b11b2bSmrg}
13114b11b2bSmrg
13214b11b2bSmrg/* Generate 16 bytes (128-bits) of random data */
13314b11b2bSmrgstatic force_inline void
13414b11b2bSmrgprng_rand_128_r (prng_t *x, prng_rand_128_data_t *data)
13514b11b2bSmrg{
13614b11b2bSmrg#ifdef HAVE_GCC_VECTOR_EXTENSIONS
13714b11b2bSmrg    uint32x4 e = x->a - ((x->b << 27) + (x->b >> (32 - 27)));
13814b11b2bSmrg    x->a = x->b ^ ((x->c << 17) ^ (x->c >> (32 - 17)));
13914b11b2bSmrg    x->b = x->c + x->d;
14014b11b2bSmrg    x->c = x->d + e;
14114b11b2bSmrg    x->d = e + x->a;
14214b11b2bSmrg    data->vw = x->d;
14314b11b2bSmrg#else
14414b11b2bSmrg    data->w[0] = smallprng_rand_r (&x->p1);
14514b11b2bSmrg    data->w[1] = smallprng_rand_r (&x->p2);
14614b11b2bSmrg    data->w[2] = smallprng_rand_r (&x->p3);
14714b11b2bSmrg    data->w[3] = smallprng_rand_r (&x->p4);
14814b11b2bSmrg#endif
14914b11b2bSmrg}
15014b11b2bSmrg
/*
 * Flags for prng_randmemset_r(). Each flag is a distinct bit, so the flags
 * can be combined with '|'; RANDMEMSET_MORE_00_AND_FF is all four together.
 */
typedef enum
{
    RANDMEMSET_MORE_00        = 1, /* ~25% chance for 0x00 bytes */
    RANDMEMSET_MORE_FF        = 2, /* ~25% chance for 0xFF bytes */
    RANDMEMSET_MORE_00000000  = 4, /* ~25% chance for 0x00000000 clusters */
    RANDMEMSET_MORE_FFFFFFFF  = 8, /* ~25% chance for 0xFFFFFFFF clusters */
    RANDMEMSET_MORE_00_AND_FF = (RANDMEMSET_MORE_00 | RANDMEMSET_MORE_00000000 |
                                 RANDMEMSET_MORE_FF | RANDMEMSET_MORE_FFFFFFFF)
} prng_randmemset_flags_t;
16014b11b2bSmrg
16114b11b2bSmrg/* Set the 32-bit seed for PRNG */
16214b11b2bSmrgvoid prng_srand_r (prng_t *prng, uint32_t seed);
16314b11b2bSmrg
16414b11b2bSmrg/* Fill memory buffer with random data */
16514b11b2bSmrgvoid prng_randmemset_r (prng_t                  *prng,
16614b11b2bSmrg                        void                    *buffer,
16714b11b2bSmrg                        size_t                   size,
16814b11b2bSmrg                        prng_randmemset_flags_t  flags);
16914b11b2bSmrg
17014b11b2bSmrg#endif
171