123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634 |
- #include <stdio.h>
- #include <string.h>
- #include <stdlib.h>
- #include "dSFMT-params.h"
- #include "dSFMT-common.h"
- #if defined(__cplusplus)
- extern "C" {
- #endif
- dsfmt_t dsfmt_global_data;
- static const int dsfmt_mexp = DSFMT_MEXP;
- inline static uint32_t ini_func1(uint32_t x);
- inline static uint32_t ini_func2(uint32_t x);
- inline static void gen_rand_array_c1o2(dsfmt_t *dsfmt, w128_t *array,
- int size);
- inline static void gen_rand_array_c0o1(dsfmt_t *dsfmt, w128_t *array,
- int size);
- inline static void gen_rand_array_o0c1(dsfmt_t *dsfmt, w128_t *array,
- int size);
- inline static void gen_rand_array_o0o1(dsfmt_t *dsfmt, w128_t *array,
- int size);
- inline static int idxof(int i);
- static void initial_mask(dsfmt_t *dsfmt);
- static void period_certification(dsfmt_t *dsfmt);
- #if defined(HAVE_SSE2)
- static const union X128I_T sse2_int_one = {{1, 1}};
- static const union X128D_T sse2_double_two = {{2.0, 2.0}};
- static const union X128D_T sse2_double_m_one = {{-1.0, -1.0}};
- #endif
- #if defined(DSFMT_BIG_ENDIAN)
- inline static int idxof(int i) {
- return i ^ 1;
- }
- #else
- inline static int idxof(int i) {
- return i;
- }
- #endif
- #if defined(HAVE_SSE2)
- inline static void convert_c0o1(w128_t *w) {
- w->sd = _mm_add_pd(w->sd, sse2_double_m_one.d128);
- }
- inline static void convert_o0c1(w128_t *w) {
- w->sd = _mm_sub_pd(sse2_double_two.d128, w->sd);
- }
- inline static void convert_o0o1(w128_t *w) {
- w->si = _mm_or_si128(w->si, sse2_int_one.i128);
- w->sd = _mm_add_pd(w->sd, sse2_double_m_one.d128);
- }
- #else
- inline static void convert_c0o1(w128_t *w) {
- w->d[0] -= 1.0;
- w->d[1] -= 1.0;
- }
- inline static void convert_o0c1(w128_t *w) {
- w->d[0] = 2.0 - w->d[0];
- w->d[1] = 2.0 - w->d[1];
- }
- inline static void convert_o0o1(w128_t *w) {
- w->u[0] |= 1;
- w->u[1] |= 1;
- w->d[0] -= 1.0;
- w->d[1] -= 1.0;
- }
- #endif
- inline static void gen_rand_array_c1o2(dsfmt_t *dsfmt, w128_t *array,
- int size) {
- int i, j;
- w128_t lung;
- lung = dsfmt->status[DSFMT_N];
- do_recursion(&array[0], &dsfmt->status[0], &dsfmt->status[DSFMT_POS1],
- &lung);
- for (i = 1; i < DSFMT_N - DSFMT_POS1; i++) {
- do_recursion(&array[i], &dsfmt->status[i],
- &dsfmt->status[i + DSFMT_POS1], &lung);
- }
- for (; i < DSFMT_N; i++) {
- do_recursion(&array[i], &dsfmt->status[i],
- &array[i + DSFMT_POS1 - DSFMT_N], &lung);
- }
- for (; i < size - DSFMT_N; i++) {
- do_recursion(&array[i], &array[i - DSFMT_N],
- &array[i + DSFMT_POS1 - DSFMT_N], &lung);
- }
- for (j = 0; j < 2 * DSFMT_N - size; j++) {
- dsfmt->status[j] = array[j + size - DSFMT_N];
- }
- for (; i < size; i++, j++) {
- do_recursion(&array[i], &array[i - DSFMT_N],
- &array[i + DSFMT_POS1 - DSFMT_N], &lung);
- dsfmt->status[j] = array[i];
- }
- dsfmt->status[DSFMT_N] = lung;
- }
- inline static void gen_rand_array_c0o1(dsfmt_t *dsfmt, w128_t *array,
- int size) {
- int i, j;
- w128_t lung;
- lung = dsfmt->status[DSFMT_N];
- do_recursion(&array[0], &dsfmt->status[0], &dsfmt->status[DSFMT_POS1],
- &lung);
- for (i = 1; i < DSFMT_N - DSFMT_POS1; i++) {
- do_recursion(&array[i], &dsfmt->status[i],
- &dsfmt->status[i + DSFMT_POS1], &lung);
- }
- for (; i < DSFMT_N; i++) {
- do_recursion(&array[i], &dsfmt->status[i],
- &array[i + DSFMT_POS1 - DSFMT_N], &lung);
- }
- for (; i < size - DSFMT_N; i++) {
- do_recursion(&array[i], &array[i - DSFMT_N],
- &array[i + DSFMT_POS1 - DSFMT_N], &lung);
- convert_c0o1(&array[i - DSFMT_N]);
- }
- for (j = 0; j < 2 * DSFMT_N - size; j++) {
- dsfmt->status[j] = array[j + size - DSFMT_N];
- }
- for (; i < size; i++, j++) {
- do_recursion(&array[i], &array[i - DSFMT_N],
- &array[i + DSFMT_POS1 - DSFMT_N], &lung);
- dsfmt->status[j] = array[i];
- convert_c0o1(&array[i - DSFMT_N]);
- }
- for (i = size - DSFMT_N; i < size; i++) {
- convert_c0o1(&array[i]);
- }
- dsfmt->status[DSFMT_N] = lung;
- }
- inline static void gen_rand_array_o0o1(dsfmt_t *dsfmt, w128_t *array,
- int size) {
- int i, j;
- w128_t lung;
- lung = dsfmt->status[DSFMT_N];
- do_recursion(&array[0], &dsfmt->status[0], &dsfmt->status[DSFMT_POS1],
- &lung);
- for (i = 1; i < DSFMT_N - DSFMT_POS1; i++) {
- do_recursion(&array[i], &dsfmt->status[i],
- &dsfmt->status[i + DSFMT_POS1], &lung);
- }
- for (; i < DSFMT_N; i++) {
- do_recursion(&array[i], &dsfmt->status[i],
- &array[i + DSFMT_POS1 - DSFMT_N], &lung);
- }
- for (; i < size - DSFMT_N; i++) {
- do_recursion(&array[i], &array[i - DSFMT_N],
- &array[i + DSFMT_POS1 - DSFMT_N], &lung);
- convert_o0o1(&array[i - DSFMT_N]);
- }
- for (j = 0; j < 2 * DSFMT_N - size; j++) {
- dsfmt->status[j] = array[j + size - DSFMT_N];
- }
- for (; i < size; i++, j++) {
- do_recursion(&array[i], &array[i - DSFMT_N],
- &array[i + DSFMT_POS1 - DSFMT_N], &lung);
- dsfmt->status[j] = array[i];
- convert_o0o1(&array[i - DSFMT_N]);
- }
- for (i = size - DSFMT_N; i < size; i++) {
- convert_o0o1(&array[i]);
- }
- dsfmt->status[DSFMT_N] = lung;
- }
- inline static void gen_rand_array_o0c1(dsfmt_t *dsfmt, w128_t *array,
- int size) {
- int i, j;
- w128_t lung;
- lung = dsfmt->status[DSFMT_N];
- do_recursion(&array[0], &dsfmt->status[0], &dsfmt->status[DSFMT_POS1],
- &lung);
- for (i = 1; i < DSFMT_N - DSFMT_POS1; i++) {
- do_recursion(&array[i], &dsfmt->status[i],
- &dsfmt->status[i + DSFMT_POS1], &lung);
- }
- for (; i < DSFMT_N; i++) {
- do_recursion(&array[i], &dsfmt->status[i],
- &array[i + DSFMT_POS1 - DSFMT_N], &lung);
- }
- for (; i < size - DSFMT_N; i++) {
- do_recursion(&array[i], &array[i - DSFMT_N],
- &array[i + DSFMT_POS1 - DSFMT_N], &lung);
- convert_o0c1(&array[i - DSFMT_N]);
- }
- for (j = 0; j < 2 * DSFMT_N - size; j++) {
- dsfmt->status[j] = array[j + size - DSFMT_N];
- }
- for (; i < size; i++, j++) {
- do_recursion(&array[i], &array[i - DSFMT_N],
- &array[i + DSFMT_POS1 - DSFMT_N], &lung);
- dsfmt->status[j] = array[i];
- convert_o0c1(&array[i - DSFMT_N]);
- }
- for (i = size - DSFMT_N; i < size; i++) {
- convert_o0c1(&array[i]);
- }
- dsfmt->status[DSFMT_N] = lung;
- }
- static uint32_t ini_func1(uint32_t x) {
- return (x ^ (x >> 27)) * (uint32_t)1664525UL;
- }
- static uint32_t ini_func2(uint32_t x) {
- return (x ^ (x >> 27)) * (uint32_t)1566083941UL;
- }
- static void initial_mask(dsfmt_t *dsfmt) {
- int i;
- uint64_t *psfmt;
- psfmt = &dsfmt->status[0].u[0];
- for (i = 0; i < DSFMT_N * 2; i++) {
- psfmt[i] = (psfmt[i] & DSFMT_LOW_MASK) | DSFMT_HIGH_CONST;
- }
- }
- static void period_certification(dsfmt_t *dsfmt) {
- uint64_t pcv[2] = {DSFMT_PCV1, DSFMT_PCV2};
- uint64_t tmp[2];
- uint64_t inner;
- int i;
- #if (DSFMT_PCV2 & 1) != 1
- int j;
- uint64_t work;
- #endif
- tmp[0] = (dsfmt->status[DSFMT_N].u[0] ^ DSFMT_FIX1);
- tmp[1] = (dsfmt->status[DSFMT_N].u[1] ^ DSFMT_FIX2);
- inner = tmp[0] & pcv[0];
- inner ^= tmp[1] & pcv[1];
- for (i = 32; i > 0; i >>= 1) {
- inner ^= inner >> i;
- }
- inner &= 1;
-
- if (inner == 1) {
- return;
- }
-
- #if (DSFMT_PCV2 & 1) == 1
- dsfmt->status[DSFMT_N].u[1] ^= 1;
- #else
- for (i = 1; i >= 0; i--) {
- work = 1;
- for (j = 0; j < 64; j++) {
- if ((work & pcv[i]) != 0) {
- dsfmt->status[DSFMT_N].u[i] ^= work;
- return;
- }
- work = work << 1;
- }
- }
- #endif
- return;
- }
- const char *dsfmt_get_idstring(void) {
- return DSFMT_IDSTR;
- }
- int dsfmt_get_min_array_size(void) {
- return DSFMT_N64;
- }
- void dsfmt_gen_rand_all(dsfmt_t *dsfmt) {
- int i;
- w128_t lung;
- lung = dsfmt->status[DSFMT_N];
- do_recursion(&dsfmt->status[0], &dsfmt->status[0],
- &dsfmt->status[DSFMT_POS1], &lung);
- for (i = 1; i < DSFMT_N - DSFMT_POS1; i++) {
- do_recursion(&dsfmt->status[i], &dsfmt->status[i],
- &dsfmt->status[i + DSFMT_POS1], &lung);
- }
- for (; i < DSFMT_N; i++) {
- do_recursion(&dsfmt->status[i], &dsfmt->status[i],
- &dsfmt->status[i + DSFMT_POS1 - DSFMT_N], &lung);
- }
- dsfmt->status[DSFMT_N] = lung;
- }
- void dsfmt_fill_array_close1_open2(dsfmt_t *dsfmt, double array[], int size) {
- assert(size % 2 == 0);
- assert(size >= DSFMT_N64);
- gen_rand_array_c1o2(dsfmt, (w128_t *)array, size / 2);
- }
- void dsfmt_fill_array_open_close(dsfmt_t *dsfmt, double array[], int size) {
- assert(size % 2 == 0);
- assert(size >= DSFMT_N64);
- gen_rand_array_o0c1(dsfmt, (w128_t *)array, size / 2);
- }
- void dsfmt_fill_array_close_open(dsfmt_t *dsfmt, double array[], int size) {
- assert(size % 2 == 0);
- assert(size >= DSFMT_N64);
- gen_rand_array_c0o1(dsfmt, (w128_t *)array, size / 2);
- }
- void dsfmt_fill_array_open_open(dsfmt_t *dsfmt, double array[], int size) {
- assert(size % 2 == 0);
- assert(size >= DSFMT_N64);
- gen_rand_array_o0o1(dsfmt, (w128_t *)array, size / 2);
- }
- #if defined(__INTEL_COMPILER)
- # pragma warning(disable:981)
- #endif
- void dsfmt_chk_init_gen_rand(dsfmt_t *dsfmt, uint32_t seed, int mexp) {
- int i;
- uint32_t *psfmt;
-
- if (mexp != dsfmt_mexp) {
- fprintf(stderr, "DSFMT_MEXP doesn't match with dSFMT.c\n");
- exit(1);
- }
- psfmt = &dsfmt->status[0].u32[0];
- psfmt[idxof(0)] = seed;
- for (i = 1; i < (DSFMT_N + 1) * 4; i++) {
- psfmt[idxof(i)] = 1812433253UL
- * (psfmt[idxof(i - 1)] ^ (psfmt[idxof(i - 1)] >> 30)) + i;
- }
- initial_mask(dsfmt);
- period_certification(dsfmt);
- dsfmt->idx = DSFMT_N64;
- }
- void dsfmt_chk_init_by_array(dsfmt_t *dsfmt, uint32_t init_key[],
- int key_length, int mexp) {
- int i, j, count;
- uint32_t r;
- uint32_t *psfmt32;
- int lag;
- int mid;
- int size = (DSFMT_N + 1) * 4;
-
- if (mexp != dsfmt_mexp) {
- fprintf(stderr, "DSFMT_MEXP doesn't match with dSFMT.c\n");
- exit(1);
- }
- if (size >= 623) {
- lag = 11;
- } else if (size >= 68) {
- lag = 7;
- } else if (size >= 39) {
- lag = 5;
- } else {
- lag = 3;
- }
- mid = (size - lag) / 2;
- psfmt32 = &dsfmt->status[0].u32[0];
- memset(dsfmt->status, 0x8b, sizeof(dsfmt->status));
- if (key_length + 1 > size) {
- count = key_length + 1;
- } else {
- count = size;
- }
- r = ini_func1(psfmt32[idxof(0)] ^ psfmt32[idxof(mid % size)]
- ^ psfmt32[idxof((size - 1) % size)]);
- psfmt32[idxof(mid % size)] += r;
- r += key_length;
- psfmt32[idxof((mid + lag) % size)] += r;
- psfmt32[idxof(0)] = r;
- count--;
- for (i = 1, j = 0; (j < count) && (j < key_length); j++) {
- r = ini_func1(psfmt32[idxof(i)]
- ^ psfmt32[idxof((i + mid) % size)]
- ^ psfmt32[idxof((i + size - 1) % size)]);
- psfmt32[idxof((i + mid) % size)] += r;
- r += init_key[j] + i;
- psfmt32[idxof((i + mid + lag) % size)] += r;
- psfmt32[idxof(i)] = r;
- i = (i + 1) % size;
- }
- for (; j < count; j++) {
- r = ini_func1(psfmt32[idxof(i)]
- ^ psfmt32[idxof((i + mid) % size)]
- ^ psfmt32[idxof((i + size - 1) % size)]);
- psfmt32[idxof((i + mid) % size)] += r;
- r += i;
- psfmt32[idxof((i + mid + lag) % size)] += r;
- psfmt32[idxof(i)] = r;
- i = (i + 1) % size;
- }
- for (j = 0; j < size; j++) {
- r = ini_func2(psfmt32[idxof(i)]
- + psfmt32[idxof((i + mid) % size)]
- + psfmt32[idxof((i + size - 1) % size)]);
- psfmt32[idxof((i + mid) % size)] ^= r;
- r -= i;
- psfmt32[idxof((i + mid + lag) % size)] ^= r;
- psfmt32[idxof(i)] = r;
- i = (i + 1) % size;
- }
- initial_mask(dsfmt);
- period_certification(dsfmt);
- dsfmt->idx = DSFMT_N64;
- }
- #if defined(__INTEL_COMPILER)
- # pragma warning(default:981)
- #endif
- #if defined(__cplusplus)
- }
- #endif
|