Context Navigation

← Previous Revision
Latest Revision
Next Revision →
Blame
Revision Log

dSFMT.c@ 3891

Visit:

Last change on this file since 3891 was 3602, checked in by cmv, 17 years ago
RandomGeneratorInterface + dSFMT etc..., cmv 28/04/2009
File size: 22.5 KB

Line
1	/**
2	* @file dSFMT.c
3	* @brief double precision SIMD-oriented Fast Mersenne Twister (dSFMT)
4	* based on IEEE 754 format.
5	*
6	* @author Mutsuo Saito (Hiroshima University)
7	* @author Makoto Matsumoto (Hiroshima University)
8	*
9	* Copyright (C) 2007,2008 Mutsuo Saito, Makoto Matsumoto and Hiroshima
10	* University. All rights reserved.
11	*
12	* The new BSD License is applied to this software, see LICENSE.txt
13	*/
14	#include <stdio.h>
15	#include <string.h>
16	#include <stdlib.h>
17	#include "dsfmtflags.h"
18	#include "dSFMT-params.h"
19
20	/** dsfmt internal state vector */
21	dsfmt_t dsfmt_global_data;
22	/** dsfmt mexp for check */
23	static const int dsfmt_mexp = DSFMT_MEXP;
24
25	/*----------------
26	STATIC FUNCTIONS
27	----------------*/
28	inline static uint32_t ini_func1(uint32_t x);
29	inline static uint32_t ini_func2(uint32_t x);
30	inline static void gen_rand_array_c1o2(dsfmt_t dsfmt, w128_t array,
31	int size);
32	inline static void gen_rand_array_c0o1(dsfmt_t dsfmt, w128_t array,
33	int size);
34	inline static void gen_rand_array_o0c1(dsfmt_t dsfmt, w128_t array,
35	int size);
36	inline static void gen_rand_array_o0o1(dsfmt_t dsfmt, w128_t array,
37	int size);
38	inline static int idxof(int i);
39	static void initial_mask(dsfmt_t *dsfmt);
40	static void period_certification(dsfmt_t *dsfmt);
41
#if defined(HAVE_SSE2)
#  include <emmintrin.h>
/* File-scope SSE2 constants; they are filled in by setup_const(). */
/** mask data for sse2 */
static __m128i sse2_param_mask;
/** 1 in 64bit for sse2 */
static __m128i sse2_int_one;
/** 2.0 double for sse2 */
static __m128d sse2_double_two;
/** -1.0 double for sse2 */
static __m128d sse2_double_m_one;

static void setup_const(void);
#endif
55
56	/**
57	* This function simulate a 32-bit array index overlapped to 64-bit
58	* array of LITTLE ENDIAN in BIG ENDIAN machine.
59	*/
60	#if defined(DSFMT_BIG_ENDIAN)
/* Big-endian variant: flip the lowest bit of the 32-bit index so that a
 * 32-bit view of the state addresses the same halves of each 64-bit word
 * as it would on a little-endian machine. */
inline static int idxof(int i) {
    return i ^ 1;
}
64	#else
/* Little-endian variant: the 32-bit index is used unchanged. */
inline static int idxof(int i) {
    return i;
}
68	#endif
69
70	/**
71	* This function represents the recursion formula.
72	* @param r output
73	* @param a a 128-bit part of the internal state array
74	* @param b a 128-bit part of the internal state array
75	* @param lung a 128-bit part of the internal state array
76	*/
77	#if defined(HAVE_ALTIVEC)
78	inline static void do_recursion(w128_t r, w128_t a, w128_t * b,
79	w128_t *lung) {
80	const vector unsigned char sl1 = ALTI_SL1;
81	const vector unsigned char sl1_perm = ALTI_SL1_PERM;
82	const vector unsigned int sl1_msk = ALTI_SL1_MSK;
83	const vector unsigned char sr1 = ALTI_SR;
84	const vector unsigned char sr1_perm = ALTI_SR_PERM;
85	const vector unsigned int sr1_msk = ALTI_SR_MSK;
86	const vector unsigned char perm = ALTI_PERM;
87	const vector unsigned int msk1 = ALTI_MSK;
88	vector unsigned int w, x, y, z;
89
90	z = a->s;
91	w = lung->s;
92	x = vec_perm(w, (vector unsigned int)perm, perm);
93	y = vec_perm(z, sl1_perm, sl1_perm);
94	y = vec_sll(y, sl1);
95	y = vec_and(y, sl1_msk);
96	w = vec_xor(x, b->s);
97	w = vec_xor(w, y);
98	x = vec_perm(w, (vector unsigned int)sr1_perm, sr1_perm);
99	x = vec_srl(x, sr1);
100	x = vec_and(x, sr1_msk);
101	y = vec_and(w, msk1);
102	z = vec_xor(z, y);
103	r->s = vec_xor(z, x);
104	lung->s = w;
105	}
106	#elif defined(HAVE_SSE2)
107	/**
108	* This function setup some constant variables for SSE2.
109	*/
110	static void setup_const(void) {
111	static int first = 1;
112	if (!first) {
113	return;
114	}
115	sse2_param_mask = _mm_set_epi32(DSFMT_MSK32_3, DSFMT_MSK32_4,
116	DSFMT_MSK32_1, DSFMT_MSK32_2);
117	sse2_int_one = _mm_set_epi32(0, 1, 0, 1);
118	sse2_double_two = _mm_set_pd(2.0, 2.0);
119	sse2_double_m_one = _mm_set_pd(-1.0, -1.0);
120	first = 0;
121	}
122
123	/**
124	* This function represents the recursion formula.
125	* @param r output 128-bit
126	* @param a a 128-bit part of the internal state array
127	* @param b a 128-bit part of the internal state array
128	* @param d a 128-bit part of the internal state array (I/O)
129	*/
130	inline static void do_recursion(w128_t r, w128_t a, w128_t b, w128_t u) {
131	__m128i v, w, x, y, z;
132
133	x = a->si;
134	z = _mm_slli_epi64(x, DSFMT_SL1);
135	y = _mm_shuffle_epi32(u->si, SSE2_SHUFF);
136	z = _mm_xor_si128(z, b->si);
137	y = _mm_xor_si128(y, z);
138
139	v = _mm_srli_epi64(y, DSFMT_SR);
140	w = _mm_and_si128(y, sse2_param_mask);
141	v = _mm_xor_si128(v, x);
142	v = _mm_xor_si128(v, w);
143	r->si = v;
144	u->si = y;
145	}
146	#else /* standard C */
147	/**
148	* This function represents the recursion formula.
149	* @param r output 128-bit
150	* @param a a 128-bit part of the internal state array
151	* @param b a 128-bit part of the internal state array
152	* @param lung a 128-bit part of the internal state array (I/O)
153	*/
154	inline static void do_recursion(w128_t r, w128_t a, w128_t * b,
155	w128_t *lung) {
156	uint64_t t0, t1, L0, L1;
157
158	t0 = a->u[0];
159	t1 = a->u[1];
160	L0 = lung->u[0];
161	L1 = lung->u[1];
162	lung->u[0] = (t0 << DSFMT_SL1) ^ (L1 >> 32) ^ (L1 << 32) ^ b->u[0];
163	lung->u[1] = (t1 << DSFMT_SL1) ^ (L0 >> 32) ^ (L0 << 32) ^ b->u[1];
164	r->u[0] = (lung->u[0] >> DSFMT_SR) ^ (lung->u[0] & DSFMT_MSK1) ^ t0;
165	r->u[1] = (lung->u[1] >> DSFMT_SR) ^ (lung->u[1] & DSFMT_MSK2) ^ t1;
166	}
167	#endif
168
169	#if defined(HAVE_SSE2)
170	/**
171	* This function converts the double precision floating point numbers which
172	* distribute uniformly in the range [1, 2) to those which distribute uniformly
173	* in the range [0, 1).
174	* @param w 128bit stracture of double precision floating point numbers (I/O)
175	*/
176	inline static void convert_c0o1(w128_t *w) {
177	w->sd = _mm_add_pd(w->sd, sse2_double_m_one);
178	}
179
180	/**
181	* This function converts the double precision floating point numbers which
182	* distribute uniformly in the range [1, 2) to those which distribute uniformly
183	* in the range (0, 1].
184	* @param w 128bit stracture of double precision floating point numbers (I/O)
185	*/
186	inline static void convert_o0c1(w128_t *w) {
187	w->sd = _mm_sub_pd(sse2_double_two, w->sd);
188	}
189
190	/**
191	* This function converts the double precision floating point numbers which
192	* distribute uniformly in the range [1, 2) to those which distribute uniformly
193	* in the range (0, 1).
194	* @param w 128bit stracture of double precision floating point numbers (I/O)
195	*/
196	inline static void convert_o0o1(w128_t *w) {
197	w->si = _mm_or_si128(w->si, sse2_int_one);
198	w->sd = _mm_add_pd(w->sd, sse2_double_m_one);
199	}
200	#else /* standard C and altivec */
201	/**
202	* This function converts the double precision floating point numbers which
203	* distribute uniformly in the range [1, 2) to those which distribute uniformly
204	* in the range [0, 1).
205	* @param w 128bit stracture of double precision floating point numbers (I/O)
206	*/
207	inline static void convert_c0o1(w128_t *w) {
208	w->d[0] -= 1.0;
209	w->d[1] -= 1.0;
210	}
211
212	/**
213	* This function converts the double precision floating point numbers which
214	* distribute uniformly in the range [1, 2) to those which distribute uniformly
215	* in the range (0, 1].
216	* @param w 128bit stracture of double precision floating point numbers (I/O)
217	*/
218	inline static void convert_o0c1(w128_t *w) {
219	w->d[0] = 2.0 - w->d[0];
220	w->d[1] = 2.0 - w->d[1];
221	}
222
223	/**
224	* This function converts the double precision floating point numbers which
225	* distribute uniformly in the range [1, 2) to those which distribute uniformly
226	* in the range (0, 1).
227	* @param w 128bit stracture of double precision floating point numbers (I/O)
228	*/
229	inline static void convert_o0o1(w128_t *w) {
230	w->u[0] \|= 1;
231	w->u[1] \|= 1;
232	w->d[0] -= 1.0;
233	w->d[1] -= 1.0;
234	}
235	#endif
236
237	/**
238	* This function fills the user-specified array with double precision
239	* floating point pseudorandom numbers of the IEEE 754 format.
240	* @param dsfmt dsfmt state vector.
241	* @param array an 128-bit array to be filled by pseudorandom numbers.
242	* @param size number of 128-bit pseudorandom numbers to be generated.
243	*/
244	inline static void gen_rand_array_c1o2(dsfmt_t dsfmt, w128_t array,
245	int size) {
246	int i, j;
247	w128_t lung;
248
249	lung = dsfmt->status[DSFMT_N];
250	do_recursion(&array[0], &dsfmt->status[0], &dsfmt->status[DSFMT_POS1],
251	&lung);
252	for (i = 1; i < DSFMT_N - DSFMT_POS1; i++) {
253	do_recursion(&array[i], &dsfmt->status[i],
254	&dsfmt->status[i + DSFMT_POS1], &lung);
255	}
256	for (; i < DSFMT_N; i++) {
257	do_recursion(&array[i], &dsfmt->status[i],
258	&array[i + DSFMT_POS1 - DSFMT_N], &lung);
259	}
260	for (; i < size - DSFMT_N; i++) {
261	do_recursion(&array[i], &array[i - DSFMT_N],
262	&array[i + DSFMT_POS1 - DSFMT_N], &lung);
263	}
264	for (j = 0; j < 2 * DSFMT_N - size; j++) {
265	dsfmt->status[j] = array[j + size - DSFMT_N];
266	}
267	for (; i < size; i++, j++) {
268	do_recursion(&array[i], &array[i - DSFMT_N],
269	&array[i + DSFMT_POS1 - DSFMT_N], &lung);
270	dsfmt->status[j] = array[i];
271	}
272	dsfmt->status[DSFMT_N] = lung;
273	}
274
275	/**
276	* This function fills the user-specified array with double precision
277	* floating point pseudorandom numbers of the IEEE 754 format.
278	* @param dsfmt dsfmt state vector.
279	* @param array an 128-bit array to be filled by pseudorandom numbers.
280	* @param size number of 128-bit pseudorandom numbers to be generated.
281	*/
282	inline static void gen_rand_array_c0o1(dsfmt_t dsfmt, w128_t array,
283	int size) {
284	int i, j;
285	w128_t lung;
286
287	lung = dsfmt->status[DSFMT_N];
288	do_recursion(&array[0], &dsfmt->status[0], &dsfmt->status[DSFMT_POS1],
289	&lung);
290	for (i = 1; i < DSFMT_N - DSFMT_POS1; i++) {
291	do_recursion(&array[i], &dsfmt->status[i],
292	&dsfmt->status[i + DSFMT_POS1], &lung);
293	}
294	for (; i < DSFMT_N; i++) {
295	do_recursion(&array[i], &dsfmt->status[i],
296	&array[i + DSFMT_POS1 - DSFMT_N], &lung);
297	}
298	for (; i < size - DSFMT_N; i++) {
299	do_recursion(&array[i], &array[i - DSFMT_N],
300	&array[i + DSFMT_POS1 - DSFMT_N], &lung);
301	convert_c0o1(&array[i - DSFMT_N]);
302	}
303	for (j = 0; j < 2 * DSFMT_N - size; j++) {
304	dsfmt->status[j] = array[j + size - DSFMT_N];
305	}
306	for (; i < size; i++, j++) {
307	do_recursion(&array[i], &array[i - DSFMT_N],
308	&array[i + DSFMT_POS1 - DSFMT_N], &lung);
309	dsfmt->status[j] = array[i];
310	convert_c0o1(&array[i - DSFMT_N]);
311	}
312	for (i = size - DSFMT_N; i < size; i++) {
313	convert_c0o1(&array[i]);
314	}
315	dsfmt->status[DSFMT_N] = lung;
316	}
317
318	/**
319	* This function fills the user-specified array with double precision
320	* floating point pseudorandom numbers of the IEEE 754 format.
321	* @param dsfmt dsfmt state vector.
322	* @param array an 128-bit array to be filled by pseudorandom numbers.
323	* @param size number of 128-bit pseudorandom numbers to be generated.
324	*/
325	inline static void gen_rand_array_o0o1(dsfmt_t dsfmt, w128_t array,
326	int size) {
327	int i, j;
328	w128_t lung;
329
330	lung = dsfmt->status[DSFMT_N];
331	do_recursion(&array[0], &dsfmt->status[0], &dsfmt->status[DSFMT_POS1],
332	&lung);
333	for (i = 1; i < DSFMT_N - DSFMT_POS1; i++) {
334	do_recursion(&array[i], &dsfmt->status[i],
335	&dsfmt->status[i + DSFMT_POS1], &lung);
336	}
337	for (; i < DSFMT_N; i++) {
338	do_recursion(&array[i], &dsfmt->status[i],
339	&array[i + DSFMT_POS1 - DSFMT_N], &lung);
340	}
341	for (; i < size - DSFMT_N; i++) {
342	do_recursion(&array[i], &array[i - DSFMT_N],
343	&array[i + DSFMT_POS1 - DSFMT_N], &lung);
344	convert_o0o1(&array[i - DSFMT_N]);
345	}
346	for (j = 0; j < 2 * DSFMT_N - size; j++) {
347	dsfmt->status[j] = array[j + size - DSFMT_N];
348	}
349	for (; i < size; i++, j++) {
350	do_recursion(&array[i], &array[i - DSFMT_N],
351	&array[i + DSFMT_POS1 - DSFMT_N], &lung);
352	dsfmt->status[j] = array[i];
353	convert_o0o1(&array[i - DSFMT_N]);
354	}
355	for (i = size - DSFMT_N; i < size; i++) {
356	convert_o0o1(&array[i]);
357	}
358	dsfmt->status[DSFMT_N] = lung;
359	}
360
361	/**
362	* This function fills the user-specified array with double precision
363	* floating point pseudorandom numbers of the IEEE 754 format.
364	* @param dsfmt dsfmt state vector.
365	* @param array an 128-bit array to be filled by pseudorandom numbers.
366	* @param size number of 128-bit pseudorandom numbers to be generated.
367	*/
368	inline static void gen_rand_array_o0c1(dsfmt_t dsfmt, w128_t array,
369	int size) {
370	int i, j;
371	w128_t lung;
372
373	lung = dsfmt->status[DSFMT_N];
374	do_recursion(&array[0], &dsfmt->status[0], &dsfmt->status[DSFMT_POS1],
375	&lung);
376	for (i = 1; i < DSFMT_N - DSFMT_POS1; i++) {
377	do_recursion(&array[i], &dsfmt->status[i],
378	&dsfmt->status[i + DSFMT_POS1], &lung);
379	}
380	for (; i < DSFMT_N; i++) {
381	do_recursion(&array[i], &dsfmt->status[i],
382	&array[i + DSFMT_POS1 - DSFMT_N], &lung);
383	}
384	for (; i < size - DSFMT_N; i++) {
385	do_recursion(&array[i], &array[i - DSFMT_N],
386	&array[i + DSFMT_POS1 - DSFMT_N], &lung);
387	convert_o0c1(&array[i - DSFMT_N]);
388	}
389	for (j = 0; j < 2 * DSFMT_N - size; j++) {
390	dsfmt->status[j] = array[j + size - DSFMT_N];
391	}
392	for (; i < size; i++, j++) {
393	do_recursion(&array[i], &array[i - DSFMT_N],
394	&array[i + DSFMT_POS1 - DSFMT_N], &lung);
395	dsfmt->status[j] = array[i];
396	convert_o0c1(&array[i - DSFMT_N]);
397	}
398	for (i = size - DSFMT_N; i < size; i++) {
399	convert_o0c1(&array[i]);
400	}
401	dsfmt->status[DSFMT_N] = lung;
402	}
403
/**
 * Mixing function used by the array-based initialization: XORs x with
 * itself shifted right by 27 bits and multiplies by 1664525, with the
 * result wrapping to 32 bits.
 * @param x 32-bit integer
 * @return 32-bit integer
 */
static uint32_t ini_func1(uint32_t x) {
    return (x ^ (x >> 27)) * (uint32_t)1664525UL;
}
413
/**
 * Mixing function used by the array-based initialization: XORs x with
 * itself shifted right by 27 bits and multiplies by 1566083941, with the
 * result wrapping to 32 bits.
 * @param x 32-bit integer
 * @return 32-bit integer
 */
static uint32_t ini_func2(uint32_t x) {
    return (x ^ (x >> 27)) * (uint32_t)1566083941UL;
}
423
424	/**
425	* This function initializes the internal state array to fit the IEEE
426	* 754 format.
427	* @param dsfmt dsfmt state vector.
428	*/
429	static void initial_mask(dsfmt_t *dsfmt) {
430	int i;
431	uint64_t *psfmt;
432
433	psfmt = &dsfmt->status[0].u[0];
434	for (i = 0; i < DSFMT_N * 2; i++) {
435	psfmt[i] = (psfmt[i] & DSFMT_LOW_MASK) \| DSFMT_HIGH_CONST;
436	}
437	}
438
439	/**
440	* This function certificate the period of 2^{SFMT_MEXP}-1.
441	* @param dsfmt dsfmt state vector.
442	*/
443	static void period_certification(dsfmt_t *dsfmt) {
444	uint64_t pcv[2] = {DSFMT_PCV1, DSFMT_PCV2};
445	uint64_t tmp[2];
446	uint64_t inner;
447	int i;
448	#if (DSFMT_PCV2 & 1) != 1
449	int j;
450	uint64_t work;
451	#endif
452
453	tmp[0] = (dsfmt->status[DSFMT_N].u[0] ^ DSFMT_FIX1);
454	tmp[1] = (dsfmt->status[DSFMT_N].u[1] ^ DSFMT_FIX2);
455
456	inner = tmp[0] & pcv[0];
457	inner ^= tmp[1] & pcv[1];
458	for (i = 32; i > 0; i >>= 1) {
459	inner ^= inner >> i;
460	}
461	inner &= 1;
462	/* check OK */
463	if (inner == 1) {
464	return;
465	}
466	/* check NG, and modification */
467	#if (DSFMT_PCV2 & 1) == 1
468	dsfmt->status[DSFMT_N].u[1] ^= 1;
469	#else
470	for (i = 1; i >= 0; i--) {
471	work = 1;
472	for (j = 0; j < 64; j++) {
473	if ((work & pcv[i]) != 0) {
474	dsfmt->status[DSFMT_N].u[i] ^= work;
475	return;
476	}
477	work = work << 1;
478	}
479	}
480	#endif
481	return;
482	}
483
484	/*----------------
485	PUBLIC FUNCTIONS
486	----------------*/
487	/**
488	* This function returns the identification string. The string shows
489	* the Mersenne exponent, and all parameters of this generator.
490	* @return id string.
491	*/
492	const char *dsfmt_get_idstring(void) {
493	return DSFMT_IDSTR;
494	}
495
496	/**
497	* This function returns the minimum size of array used for \b
498	* fill_array functions.
499	* @return minimum size of array used for fill_array functions.
500	*/
501	int dsfmt_get_min_array_size(void) {
502	return DSFMT_N64;
503	}
504
505	/**
506	* This function fills the internal state array with double precision
507	* floating point pseudorandom numbers of the IEEE 754 format.
508	* @param dsfmt dsfmt state vector.
509	*/
510	void dsfmt_gen_rand_all(dsfmt_t *dsfmt) {
511	int i;
512	w128_t lung;
513
514	lung = dsfmt->status[DSFMT_N];
515	do_recursion(&dsfmt->status[0], &dsfmt->status[0],
516	&dsfmt->status[DSFMT_POS1], &lung);
517	for (i = 1; i < DSFMT_N - DSFMT_POS1; i++) {
518	do_recursion(&dsfmt->status[i], &dsfmt->status[i],
519	&dsfmt->status[i + DSFMT_POS1], &lung);
520	}
521	for (; i < DSFMT_N; i++) {
522	do_recursion(&dsfmt->status[i], &dsfmt->status[i],
523	&dsfmt->status[i + DSFMT_POS1 - DSFMT_N], &lung);
524	}
525	dsfmt->status[DSFMT_N] = lung;
526	}
527
528	/**
529	* This function generates double precision floating point
530	* pseudorandom numbers which distribute in the range [1, 2) to the
531	* specified array[] by one call. The number of pseudorandom numbers
532	* is specified by the argument \b size, which must be at least (SFMT_MEXP
533	* / 128) * 2 and a multiple of two. The function
534	* get_min_array_size() returns this minimum size. The generation by
535	* this function is much faster than the following fill_array_xxx functions.
536	*
537	* For initialization, init_gen_rand() or init_by_array() must be called
538	* before the first call of this function. This function can not be
539	* used after calling genrand_xxx functions, without initialization.
540	*
541	* @param dsfmt dsfmt state vector.
542	* @param array an array where pseudorandom numbers are filled
543	* by this function. The pointer to the array must be "aligned"
544	* (namely, must be a multiple of 16) in the SIMD version, since it
545	* refers to the address of a 128-bit integer. In the standard C
546	* version, the pointer is arbitrary.
547	*
548	* @param size the number of 64-bit pseudorandom integers to be
549	* generated. size must be a multiple of 2, and greater than or equal
550	* to (SFMT_MEXP / 128) * 2.
551	*
552	* @note \b memalign or \b posix_memalign is available to get aligned
553	* memory. Mac OSX doesn't have these functions, but \b malloc of OSX
554	* returns the pointer to the aligned memory block.
555	*/
556	void dsfmt_fill_array_close1_open2(dsfmt_t *dsfmt, double array[], int size) {
557	assert(size % 2 == 0);
558	assert(size >= DSFMT_N64);
559	gen_rand_array_c1o2(dsfmt, (w128_t *)array, size / 2);
560	}
561
562	/**
563	* This function generates double precision floating point
564	* pseudorandom numbers which distribute in the range (0, 1] to the
565	* specified array[] by one call. This function is the same as
566	* fill_array_close1_open2() except the distribution range.
567	*
568	* @param dsfmt dsfmt state vector.
569	* @param array an array where pseudorandom numbers are filled
570	* by this function.
571	* @param size the number of pseudorandom numbers to be generated.
572	* see also \sa fill_array_close1_open2()
573	*/
574	void dsfmt_fill_array_open_close(dsfmt_t *dsfmt, double array[], int size) {
575	assert(size % 2 == 0);
576	assert(size >= DSFMT_N64);
577	gen_rand_array_o0c1(dsfmt, (w128_t *)array, size / 2);
578	}
579
580	/**
581	* This function generates double precision floating point
582	* pseudorandom numbers which distribute in the range [0, 1) to the
583	* specified array[] by one call. This function is the same as
584	* fill_array_close1_open2() except the distribution range.
585	*
586	* @param array an array where pseudorandom numbers are filled
587	* by this function.
588	* @param dsfmt dsfmt state vector.
589	* @param size the number of pseudorandom numbers to be generated.
590	* see also \sa fill_array_close1_open2()
591	*/
592	void dsfmt_fill_array_close_open(dsfmt_t *dsfmt, double array[], int size) {
593	assert(size % 2 == 0);
594	assert(size >= DSFMT_N64);
595	gen_rand_array_c0o1(dsfmt, (w128_t *)array, size / 2);
596	}
597
598	/**
599	* This function generates double precision floating point
600	* pseudorandom numbers which distribute in the range (0, 1) to the
601	* specified array[] by one call. This function is the same as
602	* fill_array_close1_open2() except the distribution range.
603	*
604	* @param dsfmt dsfmt state vector.
605	* @param array an array where pseudorandom numbers are filled
606	* by this function.
607	* @param size the number of pseudorandom numbers to be generated.
608	* see also \sa fill_array_close1_open2()
609	*/
610	void dsfmt_fill_array_open_open(dsfmt_t *dsfmt, double array[], int size) {
611	assert(size % 2 == 0);
612	assert(size >= DSFMT_N64);
613	gen_rand_array_o0o1(dsfmt, (w128_t *)array, size / 2);
614	}
615
616	#if defined(__INTEL_COMPILER)
617	# pragma warning(disable:981)
618	#endif
619	/**
620	* This function initializes the internal state array with a 32-bit
621	* integer seed.
622	* @param dsfmt dsfmt state vector.
623	* @param seed a 32-bit integer used as the seed.
624	* @param mexp caller's mersenne expornent
625	*/
626	void dsfmt_chk_init_gen_rand(dsfmt_t *dsfmt, uint32_t seed, int mexp) {
627	int i;
628	uint32_t *psfmt;
629
630	/* make sure caller program is compiled with the same MEXP */
631	if (mexp != dsfmt_mexp) {
632	fprintf(stderr, "DSFMT_MEXP doesn't match with dSFMT.c\n");
633	exit(1);
634	}
635	psfmt = &dsfmt->status[0].u32[0];
636	psfmt[idxof(0)] = seed;
637	for (i = 1; i < (DSFMT_N + 1) * 4; i++) {
638	psfmt[idxof(i)] = 1812433253UL
639	* (psfmt[idxof(i - 1)] ^ (psfmt[idxof(i - 1)] >> 30)) + i;
640	}
641	initial_mask(dsfmt);
642	period_certification(dsfmt);
643	dsfmt->idx = DSFMT_N64;
644	#if defined(HAVE_SSE2)
645	setup_const();
646	#endif
647	}
648
649	/**
650	* This function initializes the internal state array,
651	* with an array of 32-bit integers used as the seeds
652	* @param dsfmt dsfmt state vector.
653	* @param init_key the array of 32-bit integers, used as a seed.
654	* @param key_length the length of init_key.
655	* @param mexp caller's mersenne expornent
656	*/
657	void dsfmt_chk_init_by_array(dsfmt_t *dsfmt, uint32_t init_key[],
658	int key_length, int mexp) {
659	int i, j, count;
660	uint32_t r;
661	uint32_t *psfmt32;
662	int lag;
663	int mid;
664	int size = (DSFMT_N + 1) * 4; /* pulmonary */
665
666	/* make sure caller program is compiled with the same MEXP */
667	if (mexp != dsfmt_mexp) {
668	fprintf(stderr, "DSFMT_MEXP doesn't match with dSFMT.c\n");
669	exit(1);
670	}
671	if (size >= 623) {
672	lag = 11;
673	} else if (size >= 68) {
674	lag = 7;
675	} else if (size >= 39) {
676	lag = 5;
677	} else {
678	lag = 3;
679	}
680	mid = (size - lag) / 2;
681
682	psfmt32 = &dsfmt->status[0].u32[0];
683	memset(dsfmt->status, 0x8b, sizeof(dsfmt->status));
684	if (key_length + 1 > size) {
685	count = key_length + 1;
686	} else {
687	count = size;
688	}
689	r = ini_func1(psfmt32[idxof(0)] ^ psfmt32[idxof(mid % size)]
690	^ psfmt32[idxof((size - 1) % size)]);
691	psfmt32[idxof(mid % size)] += r;
692	r += key_length;
693	psfmt32[idxof((mid + lag) % size)] += r;
694	psfmt32[idxof(0)] = r;
695	count--;
696	for (i = 1, j = 0; (j < count) && (j < key_length); j++) {
697	r = ini_func1(psfmt32[idxof(i)]
698	^ psfmt32[idxof((i + mid) % size)]
699	^ psfmt32[idxof((i + size - 1) % size)]);
700	psfmt32[idxof((i + mid) % size)] += r;
701	r += init_key[j] + i;
702	psfmt32[idxof((i + mid + lag) % size)] += r;
703	psfmt32[idxof(i)] = r;
704	i = (i + 1) % size;
705	}
706	for (; j < count; j++) {
707	r = ini_func1(psfmt32[idxof(i)]
708	^ psfmt32[idxof((i + mid) % size)]
709	^ psfmt32[idxof((i + size - 1) % size)]);
710	psfmt32[idxof((i + mid) % size)] += r;
711	r += i;
712	psfmt32[idxof((i + mid + lag) % size)] += r;
713	psfmt32[idxof(i)] = r;
714	i = (i + 1) % size;
715	}
716	for (j = 0; j < size; j++) {
717	r = ini_func2(psfmt32[idxof(i)]
718	+ psfmt32[idxof((i + mid) % size)]
719	+ psfmt32[idxof((i + size - 1) % size)]);
720	psfmt32[idxof((i + mid) % size)] ^= r;
721	r -= i;
722	psfmt32[idxof((i + mid + lag) % size)] ^= r;
723	psfmt32[idxof(i)] = r;
724	i = (i + 1) % size;
725	}
726	initial_mask(dsfmt);
727	period_certification(dsfmt);
728	dsfmt->idx = DSFMT_N64;
729	#if defined(HAVE_SSE2)
730	setup_const();
731	#endif
732	}
733	#if defined(__INTEL_COMPILER)
734	# pragma warning(default:981)
735	#endif

Note: See TracBrowser for help on using the repository browser.

Context Navigation

source: Sophya/trunk/SophyaLib/BaseTools/dSFMT.c@ 3891

Download in other formats: