forked from databricks/tpch-dbgen
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathspeed_seed.c
261 lines (226 loc) · 6.47 KB
/
speed_seed.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
/*
* $Id: speed_seed.c,v 1.9 2009/06/28 14:01:08 jms Exp $
*
* Revision History
* ===================
* $Log: speed_seed.c,v $
* Revision 1.9 2009/06/28 14:01:08 jms
* bug fix for DOP
*
* Revision 1.8 2006/08/01 04:13:17 jms
* fix parallel generation
*
* Revision 1.7 2006/07/31 17:23:09 jms
* fix to parallelism problem
*
* Revision 1.6 2006/05/16 16:26:51 jms
* remove calls to FAKE_V_STR
*
* Revision 1.5 2006/04/26 23:14:28 jms
* Declaration cleanup of fakeVStr()
*
* Revision 1.4 2006/04/26 23:01:10 jms
* address update generation problems
*
* Revision 1.3 2005/10/25 17:26:38 jms
* check in integration between microsoft changes and baseline code
*
* Revision 1.2 2005/01/03 20:08:59 jms
* change line terminations
*
* Revision 1.1.1.1 2004/11/24 23:31:47 jms
* re-establish external server
*
* Revision 1.2 2004/01/22 03:54:12 jms
* 64 bit support changes for customer address
*
* Revision 1.1.1.1 2003/08/08 22:37:36 jms
* recreation after CVS crash
*
* Revision 1.3 2003/08/08 22:37:36 jms
* first integration of rng64 for o_custkey and l_partkey
*
* Revision 1.2 2003/08/07 17:58:34 jms
* Convert RNG to 64bit space as preparation for new large scale RNG
*
* Revision 1.1.1.1 2003/04/03 18:54:21 jms
* initial checkin
*
*
*/
#include <stdio.h>
#include <stdlib.h>
#include "dss.h"
#include "rng64.h"
#include "dss.h"
/* _tal long RandSeed = "Random^SeedFromTimestamp" (void); */
/*
 * Shorthands for advanceStream(). The last argument is its bUse64Bit flag:
 * ADVANCE_STREAM passes 0 (the NthElement() path) and ADVANCE_STREAM64
 * passes 1 (the AdvanceRand64() path).
 */
#define ADVANCE_STREAM(stream_id, num_calls) \
advanceStream(stream_id, num_calls, 0)
#define ADVANCE_STREAM64(stream_id, num_calls) \
advanceStream(stream_id, num_calls, 1)
/* Sizes name_bits below. */
#define MAX_COLOR 92
/*
 * NOTE(review): the integer division rounds down, so if this array is meant
 * to hold one bit per color it is too short whenever BITS_PER_LONG does not
 * divide MAX_COLOR evenly -- confirm against the users of name_bits.
 */
long name_bits[MAX_COLOR / BITS_PER_LONG];
/* Per-stream generator state; defined outside this file. */
extern seed_t Seed[];
/* Prototype only; no definition of fakeVStr() appears in this part of the file. */
void fakeVStr(int nAvg, long nSeed, DSS_HUGE nCount);
/* Forward declaration; advanceStream() calls it before its definition below. */
void NthElement (DSS_HUGE N, DSS_HUGE *StartSeed);
/*
 * advanceStream -- move one random number stream ahead by nCalls draws.
 *
 * nStream:   index into Seed[] of the stream to advance
 * nCalls:    number of generator applications to skip
 * bUse64Bit: non-zero replaces the stream value with the result of
 *            AdvanceRand64(); zero lets NthElement() update it in place
 *
 * When RNG_TEST is defined, the stream's nCalls tally also grows by nCalls.
 */
void
advanceStream(int nStream, DSS_HUGE nCalls, int bUse64Bit)
{
    if (!bUse64Bit)
    {
        NthElement(nCalls, &Seed[nStream].value);
    }
    else
    {
        Seed[nStream].value = AdvanceRand64(Seed[nStream].value, nCalls);
    }

#ifdef RNG_TEST
    Seed[nStream].nCalls += nCalls;
#endif
}
/* WARNING! This routine assumes the existence of 64-bit */
/* integers. The notation used here- "HUGE" is *not* ANSI standard. */
/* Hopefully, you have this extension as well. If not, use whatever */
/* nonstandard trick you need to in order to get 64 bit integers. */
/* The book says that this will work if MAXINT for the type you choose */
/* is at least 2**46 - 1, so 64 bits is more than you *really* need */
/*
 * Parameters of the generator X_n = (Multiplier * X_(n-1)) mod Modulus used
 * by NthElement(): 16807 is 7**5 and 2147483647 is 2**31 - 1, the constants
 * of the Park-Miller "minimal standard" generator.
 */
static DSS_HUGE Multiplier = 16807; /* or whatever nonstandard */
static DSS_HUGE Modulus = 2147483647; /* trick you use to get 64 bit int */
/* Advances value of Seed after N applications of the random number generator
with multiplier Mult and given Modulus.
Usage: NthElement(count, &Seed[stream].value);
Theory: We are using a generator of the form
X_n = [Mult * X_(n-1)] mod Modulus. It turns out that
X_n = [(Mult ** n) X_0] mod Modulus.
This can be computed using a divide-and-conquer technique, see
the code below.
In words, this means that if you want the value of the Seed after n
applications of the generator, you multiply the initial value of the
Seed by the "super multiplier" which is the basic multiplier raised
to the nth power, and then take mod Modulus.
*/
/*
 * NthElement -- advance a seed by N applications of the generator
 *
 *     X_n = (Multiplier * X_(n-1)) mod Modulus
 *
 * using X_n = (Multiplier**N * X_0) mod Modulus. The power is built by
 * repeated squaring, so the loop runs once per binary digit of N.
 *
 * N:         number of generator applications to skip; a value <= 0 leaves
 *            the seed unchanged
 * StartSeed: in/out -- read as the starting seed, overwritten with the
 *            advanced seed
 *
 * When verbose > 0, every 1000th call (starting with the first) writes one
 * progress character followed by a backspace to stderr.
 */
void NthElement (DSS_HUGE N, DSS_HUGE *StartSeed)
{
    DSS_HUGE Z;
    DSS_HUGE Mult;
    /*
     * Calls seen while verbose, kept in [0, 1000 * LN_CNT). Wrapping at a
     * multiple of 1000 keeps the "every 1000th call" cadence while making
     * sure the counter can never overflow or go negative (which would be
     * undefined behaviour and could index lnoise[] out of bounds).
     */
    static int ln = -1;

    if (verbose > 0)
    {
        ln = (ln + 1) % (1000 * LN_CNT);
        if (ln % 1000 == 0)
        {
            /*
             * Step one frame per report. Indexing with ln % LN_CNT here
             * would pick the same frame every time whenever LN_CNT divides
             * 1000, because ln is always a multiple of 1000 at this point.
             */
            fprintf(stderr, "%c\b", lnoise[ln / 1000]);
        }
    }

    Mult = Multiplier;
    Z = *StartSeed;
    while (N > 0)
    {
        if (N % 2 != 0)   /* low bit set: fold the current power into Z */
        {
            Z = (Mult * Z) % Modulus;
        }
        N = N / 2;        /* integer division, truncates */
        Mult = (Mult * Mult) % Modulus;
    }
    *StartSeed = Z;
}
/*
 * fake_a_rnd -- draw a length through RANDOM() on stream `column`, then skip
 * generator steps for it: len / 5 steps, plus one more when len is not a
 * multiple of 5.
 *
 * min, max: bounds handed to RANDOM() for the length draw
 * column:   index into Seed[]; also the stream RANDOM() draws from
 *
 * When RNG_TEST is defined, Seed[column].nCalls grows by the step count.
 *
 * NOTE(review): the skip is applied to Seed[column].usage, whereas
 * advanceStream() hands NthElement() the .value field -- confirm that
 * .usage is really the intended target.
 */
void
fake_a_rnd(int min, int max, int column)
{
    DSS_HUGE drawn;
    DSS_HUGE steps;

    RANDOM(drawn, min, max, column);

    steps = drawn / 5;
    if (drawn % 5L != 0)
    {
        steps += 1L;
    }

    NthElement(steps, &Seed[column].usage);
#ifdef RNG_TEST
    Seed[column].nCalls += steps;
#endif
}
/*
 * sd_part -- skip the part streams ahead.
 *
 * Every stream id from P_MFG_SD through P_CNTR_SD is advanced by skip_count,
 * P_CMNT_SD by 2 * skip_count and P_NAME_SD by 92 * skip_count, all through
 * ADVANCE_STREAM.
 *
 * child:      not referenced by this function
 * skip_count: base number of draws to skip on each stream
 *
 * Returns 0L.
 *
 * NOTE(review): 92 equals MAX_COLOR as defined earlier in this file --
 * confirm whether the two are meant to be the same quantity.
 */
long
sd_part(int child, DSS_HUGE skip_count)
{
    int stream = P_MFG_SD;

    while (stream <= P_CNTR_SD)
    {
        ADVANCE_STREAM(stream, skip_count);
        stream++;
    }

    ADVANCE_STREAM(P_CMNT_SD, skip_count * 2);
    ADVANCE_STREAM(P_NAME_SD, skip_count * 92);

    return 0L;
}
/*
 * sd_line -- skip the lineitem streams ahead.
 *
 * Repeats O_LCNT_MAX times: every stream id from L_QTY_SD through L_RFLG_SD
 * is advanced by skip_count and L_CMNT_SD by 2 * skip_count. When child is
 * exactly 1, O_ODATE_SD and O_LCNT_SD are advanced by skip_count as well.
 *
 * child:      1 selects the extra order-stream advance; any other value
 *             skips it
 * skip_count: base number of draws to skip on each stream
 *
 * Returns 0L.
 */
long
sd_line(int child, DSS_HUGE skip_count)
{
    int pass;
    int stream;

    for (pass = 0; pass < O_LCNT_MAX; pass++)
    {
        /*
         * A 64-bit advance (ADVANCE_STREAM64) for L_PKEY_SD at
         * scale >= 30000 used to be sketched here; it is disabled and
         * every stream takes the ADVANCE_STREAM path.
         */
        stream = L_QTY_SD;
        while (stream <= L_RFLG_SD)
        {
            ADVANCE_STREAM(stream, skip_count);
            stream++;
        }
        ADVANCE_STREAM(L_CMNT_SD, skip_count * 2);
    }

    if (child != 1)
    {
        return 0L;
    }

    /* need to special case this as the link between master and detail */
    ADVANCE_STREAM(O_ODATE_SD, skip_count);
    ADVANCE_STREAM(O_LCNT_SD, skip_count);
    return 0L;
}
/*
 * sd_order -- skip the order streams ahead.
 *
 * Streams are advanced through ADVANCE_STREAM in the order listed in the
 * table below; each entry gives the stream id and the multiple of
 * skip_count it is advanced by.
 *
 * child:      not referenced by this function
 * skip_count: base number of draws to skip on each stream
 *
 * Returns 0L.
 */
long
sd_order(int child, DSS_HUGE skip_count)
{
    /*
     * A 64-bit advance (ADVANCE_STREAM64) for O_CKEY_SD at scale >= 30000
     * used to be sketched here; it is disabled and O_CKEY_SD takes the
     * ADVANCE_STREAM path like the rest.
     */
    const struct { int stream; int factor; } plan[] = {
        { O_LCNT_SD,  1 },
        { O_CKEY_SD,  1 },
        { O_CMNT_SD,  2 },
        { O_SUPP_SD,  1 },
        { O_CLRK_SD,  1 },
        { O_PRIO_SD,  1 },
        { O_ODATE_SD, 1 }
    };
    const int entries = (int)(sizeof plan / sizeof plan[0]);
    int k;

    for (k = 0; k < entries; k++)
    {
        ADVANCE_STREAM(plan[k].stream, skip_count * plan[k].factor);
    }

    return 0L;
}
/*
 * sd_psupp -- skip the partsupp streams ahead.
 *
 * Repeats SUPP_PER_PART times: PS_QTY_SD and PS_SCST_SD are advanced by
 * skip_count and PS_CMNT_SD by 2 * skip_count, all through ADVANCE_STREAM.
 *
 * child:      not referenced by this function
 * skip_count: base number of draws to skip on each stream
 *
 * Returns 0L.
 */
long
sd_psupp(int child, DSS_HUGE skip_count)
{
    const DSS_HUGE comment_skip = skip_count * 2;
    int pass = 0;

    while (pass < SUPP_PER_PART)
    {
        ADVANCE_STREAM(PS_QTY_SD, skip_count);
        ADVANCE_STREAM(PS_SCST_SD, skip_count);
        ADVANCE_STREAM(PS_CMNT_SD, comment_skip);
        pass++;
    }

    return 0L;
}
/*
 * sd_cust -- skip the customer streams ahead.
 *
 * Through ADVANCE_STREAM, in this order: C_ADDR_SD by 9 * skip_count,
 * C_CMNT_SD by 2 * skip_count, C_NTRG_SD by skip_count, C_PHNE_SD by
 * 3 * skip_count, then C_ABAL_SD and C_MSEG_SD by skip_count each.
 *
 * child:      not referenced by this function
 * skip_count: base number of draws to skip on each stream
 *
 * Returns 0L.
 */
long
sd_cust(int child, DSS_HUGE skip_count)
{
    const DSS_HUGE address_skip = skip_count * 9;
    const DSS_HUGE comment_skip = skip_count * 2;
    const DSS_HUGE phone_skip = 3L * skip_count;

    ADVANCE_STREAM(C_ADDR_SD, address_skip);
    ADVANCE_STREAM(C_CMNT_SD, comment_skip);
    ADVANCE_STREAM(C_NTRG_SD, skip_count);
    ADVANCE_STREAM(C_PHNE_SD, phone_skip);
    ADVANCE_STREAM(C_ABAL_SD, skip_count);
    ADVANCE_STREAM(C_MSEG_SD, skip_count);

    return 0L;
}
/*
 * sd_supp -- skip the supplier streams ahead.
 *
 * Streams are advanced through ADVANCE_STREAM in the order listed in the
 * table below; each entry gives the stream id and the multiple of
 * skip_count it is advanced by.
 *
 * child:      not referenced by this function
 * skip_count: base number of draws to skip on each stream
 *
 * Returns 0L.
 */
long
sd_supp(int child, DSS_HUGE skip_count)
{
    const struct { int stream; int factor; } plan[] = {
        { S_NTRG_SD,     1 },
        { S_PHNE_SD,     3 },
        { S_ABAL_SD,     1 },
        { S_ADDR_SD,     9 },
        { S_CMNT_SD,     2 },
        { BBB_CMNT_SD,   1 },
        { BBB_JNK_SD,    1 },
        { BBB_OFFSET_SD, 1 },
        { BBB_TYPE_SD,   1 }   /* avoid one trudge */
    };
    const int entries = (int)(sizeof plan / sizeof plan[0]);
    int k;

    for (k = 0; k < entries; k++)
    {
        ADVANCE_STREAM(plan[k].stream, skip_count * plan[k].factor);
    }

    return 0L;
}