505 lines
14 KiB
C
505 lines
14 KiB
C
/* Sccsid: @(#)build.c 9.1.1.17 11/15/95 12:52:28 */
|
|
/* stuff related to the customer table */
|
|
#include <stdio.h>
|
|
#include <string.h>
|
|
#ifndef VMS
|
|
#include <sys/types.h>
|
|
#endif
|
|
#if defined(SUN)
|
|
#include <unistd.h>
|
|
#endif
|
|
#include <math.h>
|
|
|
|
#include "dss.h"
|
|
#include "dsstypes.h"
|
|
|
|
#define LEAP_ADJ(yr, mnth) \
|
|
((LEAP(yr) && (mnth) >= 2) ? 1 : 0)
|
|
#define JDAY_BASE 8035 /* start from 1/1/70 a la unix */
|
|
#define JMNTH_BASE (-70 * 12) /* start from 1/1/70 a la unix */
|
|
#define JDAY(date) ((date) - STARTDATE + JDAY_BASE + 1)
|
|
#define PART_SUPP_BRIDGE(tgt, p, s) \
|
|
{ \
|
|
long tot_scnt = tdefs[SUPP].base * scale; \
|
|
tgt = (p + s * (tot_scnt / SUPP_PER_PART + \
|
|
(long) ((p - 1) / tot_scnt))) % tot_scnt + 1; \
|
|
}
|
|
#define RPRICE_BRIDGE(tgt, p) tgt = rpb_routine(p)
|
|
#define V_STR(avg, sd, tgt) a_rnd((int)(avg * V_STR_LOW), \
|
|
(int)(avg * V_STR_HGH), sd, tgt)
|
|
static void gen_phone PROTO((long ind, char *target, long seed));
|
|
|
|
|
|
/*
|
|
* Extensions to dbgen for generation of skewed data.
|
|
* Surajit Chaudhuri, Vivek Narasayya.
|
|
* (Jan '99)
|
|
*/
|
|
extern double skew;
|
|
long NumLineitemsGenerated;
|
|
extern long SkewInt(long nLow, long nHigh, long nStream, double skew, long n);
|
|
long SkewIntCount(long nStream, int skewVal, long n);
|
|
extern long upd_num;
|
|
|
|
|
|
long
|
|
rpb_routine(long p)
|
|
{
|
|
long price;
|
|
|
|
price = 90000;
|
|
price += (p/10) % 20001; /* limit contribution to $200 */
|
|
price += (p % 1000) * 100;
|
|
|
|
return(price);
|
|
}
|
|
|
|
static void
|
|
gen_phone(long ind, char *target, long seed)
|
|
{
|
|
long acode,
|
|
exchg,
|
|
number;
|
|
|
|
RANDOM(acode, 100, 999, seed, skew, 900);
|
|
RANDOM(exchg, 100, 999, seed, skew, 900);
|
|
RANDOM(number, 1000, 9999, seed, skew, 9000);
|
|
|
|
sprintf(target, "%02d", 10 + (ind % NATIONS_MAX));
|
|
sprintf(target + 3, "%03d", acode);
|
|
sprintf(target + 7, "%03d", exchg);
|
|
sprintf(target + 11, "%04d", number);
|
|
target[2] = target[6] = target[10] = '-';
|
|
|
|
return;
|
|
}
|
|
|
|
|
|
|
|
long
|
|
mk_cust(long n_cust, customer_t *c)
|
|
{
|
|
long i;
|
|
|
|
c->custkey = n_cust;
|
|
sprintf(c->name, C_NAME_FMT, C_NAME_TAG, n_cust);
|
|
c->alen = V_STR(C_ADDR_LEN, C_ADDR_SD, c->address);
|
|
RANDOM(i, 0, (nations.count - 1), C_NTRG_SD, skew, O_CKEY_MAX);
|
|
c->nation_code = i;
|
|
gen_phone(i, c->phone, (long)C_PHNE_SD);
|
|
RANDOM(c->acctbal, C_ABAL_MIN, C_ABAL_MAX, C_ABAL_SD, skew, O_CKEY_MAX);
|
|
pick_str(&c_mseg_set, C_MSEG_SD, c->mktsegment);
|
|
c->clen = V_STR(C_CMNT_LEN, C_CMNT_SD, c->comment);
|
|
|
|
return (0);
|
|
}
|
|
|
|
|
|
/*
|
|
* generate the numbered order and its associated lineitems
|
|
*/
|
|
long
|
|
#ifdef SUPPORT_64BITS
|
|
mk_order(DSS_HUGE index, order_t *o)
|
|
#else
|
|
mk_order(long index[], order_t *o)
|
|
#endif /* SUPPORT_64BITS */
|
|
{
|
|
long lcnt;
|
|
long rprice;
|
|
long ocnt;
|
|
long tmp_date;
|
|
long s_date;
|
|
long r_date;
|
|
long c_date;
|
|
long clk_num;
|
|
long supp_num;
|
|
static char **asc_date = NULL;
|
|
char tmp_str[2];
|
|
char **mk_ascdate PROTO((void));
|
|
|
|
long numBatches;
|
|
long lastBatchSize;
|
|
long i;
|
|
long count;
|
|
long numLines;
|
|
|
|
|
|
if (asc_date == NULL)
|
|
asc_date = mk_ascdate();
|
|
|
|
HUGE_SET(index, o->okey);
|
|
do
|
|
{
|
|
RANDOM(o->custkey, O_CKEY_MIN, O_CKEY_MAX, O_CKEY_SD, skew, O_CKEY_MAX);
|
|
} while (o->custkey % CUST_MORTALITY == 0);
|
|
|
|
|
|
RANDOM(tmp_date, O_ODATE_MIN, O_ODATE_MAX, O_ODATE_SD, skew, O_OKEY_MAX);
|
|
|
|
if (oldtime)
|
|
sprintf(o->odate,"%ld", JDAY(tmp_date));
|
|
else
|
|
strcpy(o->odate, asc_date[tmp_date - STARTDATE]);
|
|
|
|
pick_str(&o_priority_set, O_PRIO_SD, o->opriority);
|
|
RANDOM(clk_num, 1, MAX((scale * O_CLRK_SCL), O_CLRK_SCL), O_CLRK_SD, skew, O_OKEY_MAX);
|
|
sprintf(o->clerk, O_CLRK_FMT,
|
|
O_CLRK_TAG,
|
|
clk_num);
|
|
o->clen = V_STR(O_CMNT_LEN, O_CMNT_SD, o->comment);
|
|
o->spriority = 0;
|
|
|
|
o->totalprice = 0;
|
|
o->orderstatus = 'O';
|
|
ocnt = 0;
|
|
|
|
#ifdef OLD_MAKE_ORDER_LINE
|
|
|
|
RANDOM(o->lines, O_LCNT_MIN, O_LCNT_MAX, O_LCNT_SD, 0, (O_LCNT_MAX-O_LCNT_MIN+1));
|
|
for (lcnt = 0; lcnt < o->lines; lcnt++)
|
|
{
|
|
HUGE_SET(o->okey, o->l[lcnt].okey);
|
|
o->l[lcnt].lcnt = lcnt + 1;
|
|
RANDOM(o->l[lcnt].quantity, L_QTY_MIN, L_QTY_MAX, L_QTY_SD, skew, L_LCNT_MAX);
|
|
RANDOM(o->l[lcnt].discount, L_DCNT_MIN, L_DCNT_MAX, L_DCNT_SD, skew, L_LCNT_MAX);
|
|
RANDOM(o->l[lcnt].tax, L_TAX_MIN, L_TAX_MAX, L_TAX_SD, skew, L_LCNT_MAX);
|
|
pick_str(&l_instruct_set, L_SHIP_SD, o->l[lcnt].shipinstruct);
|
|
pick_str(&l_smode_set, L_SMODE_SD, o->l[lcnt].shipmode);
|
|
o->l[lcnt].clen = V_STR(L_CMNT_LEN, L_CMNT_SD,
|
|
o->l[lcnt].comment);
|
|
RANDOM(o->l[lcnt].partkey, L_PKEY_MIN, L_PKEY_MAX, L_PKEY_SD, skew, L_PKEY_MAX);
|
|
RPRICE_BRIDGE( rprice, o->l[lcnt].partkey);
|
|
RANDOM(supp_num, 0, 3, L_SKEY_SD, skew, 4);
|
|
PART_SUPP_BRIDGE( o->l[lcnt].suppkey, o->l[lcnt].partkey, supp_num);
|
|
o->l[lcnt].eprice = rprice * o->l[lcnt].quantity;
|
|
|
|
o->totalprice +=
|
|
((o->l[lcnt].eprice *
|
|
((long)100 - o->l[lcnt].discount)) / (long)PENNIES ) *
|
|
((long)100 + o->l[lcnt].tax)
|
|
/ (long)PENNIES;
|
|
|
|
RANDOM(s_date, L_SDTE_MIN, L_SDTE_MAX, L_SDTE_SD, skew, L_LCNT_MAX);
|
|
s_date += tmp_date;
|
|
RANDOM(c_date, L_CDTE_MIN, L_CDTE_MAX, L_CDTE_SD, skew, L_LCNT_MAX);
|
|
c_date += tmp_date;
|
|
RANDOM(r_date, L_RDTE_MIN, L_RDTE_MAX, L_RDTE_SD, skew, L_LCNT_MAX);
|
|
r_date += s_date;
|
|
|
|
if (oldtime)
|
|
{
|
|
sprintf(o->l[lcnt].sdate, "%ld", JDAY(s_date));
|
|
sprintf(o->l[lcnt].cdate, "%ld", JDAY(c_date));
|
|
sprintf(o->l[lcnt].rdate, "%ld", JDAY(r_date));
|
|
}
|
|
else
|
|
{
|
|
strcpy(o->l[lcnt].sdate, asc_date[s_date - STARTDATE]);
|
|
strcpy(o->l[lcnt].cdate, asc_date[c_date - STARTDATE]);
|
|
strcpy(o->l[lcnt].rdate, asc_date[r_date - STARTDATE]);
|
|
}
|
|
|
|
if (julian(r_date) <= CURRENTDATE)
|
|
{
|
|
pick_str(&l_rflag_set, L_RFLG_SD, tmp_str);
|
|
o->l[lcnt].rflag[0] = *tmp_str;
|
|
}
|
|
else
|
|
o->l[lcnt].rflag[0] = 'N';
|
|
|
|
if (julian(s_date) <= CURRENTDATE)
|
|
{
|
|
ocnt++;
|
|
o->l[lcnt].lstatus[0] = 'F';
|
|
}
|
|
else
|
|
o->l[lcnt].lstatus[0] = 'O';
|
|
}
|
|
if (ocnt > 0)
|
|
o->orderstatus = 'P';
|
|
if (ocnt == o->lines)
|
|
o->orderstatus = 'F';
|
|
#else /* New method for generating skewed data for ORDERS & LINEITEM */
|
|
|
|
numLines = SkewIntCount (L_OKEY_SD, skew, L_LINE_SIZE);
|
|
|
|
/* make sure that we get enough rows for lineitem */
|
|
if(numLines < O_LCNT_MAX)
|
|
{
|
|
/* numLines = a uniform random number between 1 and O_LCNT_MAX */
|
|
numLines = (numLines) ? (numLines) : 1;
|
|
RANDOM(numLines, O_LCNT_MIN, O_LCNT_MAX, O_LCNT_SD, 0, (O_LCNT_MAX-O_LCNT_MIN+1));
|
|
}
|
|
|
|
/* In each batch we can generate at most O_LCNT_MAX copies of lineitem rows */
|
|
/* compute number of batches necessary for this particular value of o_orderkey */
|
|
numBatches = numLines / (O_LCNT_MAX);
|
|
lastBatchSize = numLines % (O_LCNT_MAX);
|
|
|
|
if(lastBatchSize)
|
|
numBatches++;
|
|
|
|
for(i = 0; i < numBatches; i++)
|
|
{
|
|
if((i==0) && (numLines==O_LCNT_MAX))
|
|
{
|
|
/* special case - one batch with O_LCNT_MAX rows */
|
|
count = numLines;
|
|
}
|
|
else
|
|
{
|
|
count = (i==(numBatches-1)) ? lastBatchSize : O_LCNT_MAX;
|
|
}
|
|
o->lines = count;
|
|
for (lcnt = 0; lcnt < count ; lcnt++)
|
|
{
|
|
HUGE_SET(o->okey, o->l[lcnt].okey);
|
|
o->l[lcnt].lcnt = (i*O_LCNT_MAX) + lcnt + 1;
|
|
RANDOM(o->l[lcnt].quantity, L_QTY_MIN, L_QTY_MAX, L_QTY_SD, skew, L_LINE_SIZE);
|
|
RANDOM(o->l[lcnt].discount, L_DCNT_MIN, L_DCNT_MAX, L_DCNT_SD, skew, L_LINE_SIZE);
|
|
RANDOM(o->l[lcnt].tax, L_TAX_MIN, L_TAX_MAX, L_TAX_SD, skew, L_LINE_SIZE);
|
|
pick_str(&l_instruct_set, L_SHIP_SD, o->l[lcnt].shipinstruct);
|
|
pick_str(&l_smode_set, L_SMODE_SD, o->l[lcnt].shipmode);
|
|
o->l[lcnt].clen = V_STR(L_CMNT_LEN, L_CMNT_SD,
|
|
o->l[lcnt].comment);
|
|
RANDOM(o->l[lcnt].partkey, L_PKEY_MIN, L_PKEY_MAX, L_PKEY_SD, skew, L_LINE_SIZE);
|
|
RPRICE_BRIDGE( rprice, o->l[lcnt].partkey);
|
|
RANDOM(supp_num, 0, 3, L_SKEY_SD, skew, 4);
|
|
PART_SUPP_BRIDGE( o->l[lcnt].suppkey, o->l[lcnt].partkey, supp_num);
|
|
o->l[lcnt].eprice = rprice * o->l[lcnt].quantity;
|
|
|
|
o->totalprice +=
|
|
((o->l[lcnt].eprice *
|
|
((long)100 - o->l[lcnt].discount)) / (long)PENNIES ) *
|
|
((long)100 + o->l[lcnt].tax)
|
|
/ (long)PENNIES;
|
|
|
|
RANDOM(s_date, L_SDTE_MIN, L_SDTE_MAX, L_SDTE_SD, skew, L_LINE_SIZE);
|
|
s_date += tmp_date;
|
|
RANDOM(c_date, L_CDTE_MIN, L_CDTE_MAX, L_CDTE_SD, skew, L_LINE_SIZE);
|
|
c_date += tmp_date;
|
|
RANDOM(r_date, L_RDTE_MIN, L_RDTE_MAX, L_RDTE_SD, skew, L_LINE_SIZE);
|
|
r_date += s_date;
|
|
|
|
if (oldtime)
|
|
{
|
|
sprintf(o->l[lcnt].sdate, "%ld", JDAY(s_date));
|
|
sprintf(o->l[lcnt].cdate, "%ld", JDAY(c_date));
|
|
sprintf(o->l[lcnt].rdate, "%ld", JDAY(r_date));
|
|
}
|
|
else
|
|
{
|
|
strcpy(o->l[lcnt].sdate, asc_date[s_date - STARTDATE]);
|
|
strcpy(o->l[lcnt].cdate, asc_date[c_date - STARTDATE]);
|
|
strcpy(o->l[lcnt].rdate, asc_date[r_date - STARTDATE]);
|
|
}
|
|
|
|
if (julian(r_date) <= CURRENTDATE)
|
|
{
|
|
pick_str(&l_rflag_set, L_RFLG_SD, tmp_str);
|
|
o->l[lcnt].rflag[0] = *tmp_str;
|
|
}
|
|
else
|
|
o->l[lcnt].rflag[0] = 'N';
|
|
|
|
if (julian(s_date) <= CURRENTDATE)
|
|
{
|
|
ocnt++;
|
|
o->l[lcnt].lstatus[0] = 'F';
|
|
}
|
|
else
|
|
o->l[lcnt].lstatus[0] = 'O';
|
|
}
|
|
if (ocnt > 0)
|
|
o->orderstatus = 'P';
|
|
if (ocnt == o->lines)
|
|
o->orderstatus = 'F';
|
|
/*
|
|
* Print the batch now.
|
|
* Note that if number of rows printed for LINEITEM
|
|
* has already exceeded L_LINE_SIZE, then they are not printed.
|
|
* However, exactly (tdefs[ORDER].base * scale) rows
|
|
* in ORDERS will always be filled.
|
|
*/
|
|
if(i==0)
|
|
{
|
|
tdefs[ORDER].loader[direct] (o, upd_num);
|
|
tdefs[LINE].loader[direct] (o, upd_num);
|
|
}
|
|
else
|
|
tdefs[LINE].loader[direct] (o, upd_num);
|
|
|
|
NumLineitemsGenerated += count;
|
|
}
|
|
#endif
|
|
|
|
return (0);
|
|
}
|
|
|
|
long
|
|
mk_part(long index, part_t *p)
|
|
{
|
|
long temp;
|
|
long snum;
|
|
long brnd;
|
|
|
|
p->partkey = index;
|
|
agg_str(&colors, (long)P_NAME_SCL, (long)P_NAME_SD, p->name);
|
|
RANDOM(temp, P_MFG_MIN, P_MFG_MAX, P_MFG_SD, skew, L_PKEY_MAX);
|
|
sprintf(p->mfgr, P_MFG_FMT, P_MFG_TAG, temp);
|
|
RANDOM(brnd, P_BRND_MIN, P_BRND_MAX, P_BRND_SD, skew, L_PKEY_MAX);
|
|
sprintf(p->brand, P_BRND_FMT,
|
|
P_BRND_TAG,
|
|
(temp * 10 + brnd));
|
|
p->tlen = pick_str(&p_types_set, P_TYPE_SD, p->type);
|
|
p->tlen = strlen(p_types_set.list[p->tlen].text);
|
|
RANDOM(p->size, P_SIZE_MIN, P_SIZE_MAX, P_SIZE_SD, skew, L_PKEY_MAX);
|
|
pick_str(&p_cntr_set, P_CNTR_SD, p->container);
|
|
RPRICE_BRIDGE( p->retailprice, index);
|
|
p->clen = V_STR(P_CMNT_LEN, P_CMNT_SD, p->comment);
|
|
|
|
for (snum = 0; snum < SUPP_PER_PART; snum++)
|
|
{
|
|
p->s[snum].partkey = p->partkey;
|
|
PART_SUPP_BRIDGE( p->s[snum].suppkey, index, snum);
|
|
RANDOM(p->s[snum].qty, PS_QTY_MIN, PS_QTY_MAX, PS_QTY_SD, skew, L_PKEY_MAX);
|
|
RANDOM(p->s[snum].scost, PS_SCST_MIN, PS_SCST_MAX, PS_SCST_SD, skew, L_PKEY_MAX);
|
|
p->s[snum].clen = V_STR(PS_CMNT_LEN, PS_CMNT_SD, p->s[snum].comment);
|
|
}
|
|
return (0);
|
|
}
|
|
|
|
long
|
|
mk_supp(long index, supplier_t *s)
|
|
{
|
|
long i,
|
|
bad_press;
|
|
int noise,
|
|
offset,
|
|
type;
|
|
|
|
s->suppkey = index;
|
|
sprintf(s->name, S_NAME_FMT, S_NAME_TAG, index);
|
|
s->alen = V_STR(S_ADDR_LEN, S_ADDR_SD, s->address);
|
|
RANDOM(i, 0, nations.count - 1, S_NTRG_SD, skew, PS_SKEY_MAX);
|
|
s->nation_code= i;
|
|
gen_phone(i, s->phone, S_PHNE_SD);
|
|
RANDOM(s->acctbal, S_ABAL_MIN, S_ABAL_MAX, S_ABAL_SD, skew, PS_SKEY_MAX);
|
|
RANDOM(bad_press, 1, 10000, BBB_CMNT_SD, skew, PS_SKEY_MAX);
|
|
if (bad_press <= S_CMNT_BBB)
|
|
{
|
|
RANDOM(noise, 0, (S_CMNT_MAX - BBB_CMNT_LEN), BBB_JNK_SD, skew, (S_CMNT_MAX - BBB_CMNT_LEN)+1);
|
|
RANDOM(offset, 0, (S_CMNT_MAX - (BBB_CMNT_LEN + noise)),
|
|
BBB_OFFSET_SD, skew, (S_CMNT_MAX - (BBB_CMNT_LEN + noise))+1);
|
|
RANDOM(type, 0, 100, BBB_TYPE_SD, skew, 101);
|
|
type = (type < BBB_DEADBEATS) ?0:1;
|
|
s->clen =
|
|
a_rnd(BBB_CMNT_LEN + noise + offset,
|
|
S_CMNT_MAX, S_CMNT_SD, s->comment);
|
|
memcpy(s->comment + offset, BBB_BASE, BBB_BASE_LEN);
|
|
if (type == 0)
|
|
memcpy(s->comment + BBB_BASE_LEN + offset + noise,
|
|
BBB_COMPLAIN, BBB_TYPE_LEN);
|
|
else
|
|
memcpy(s->comment + BBB_BASE_LEN + offset + noise,
|
|
BBB_COMMEND, BBB_TYPE_LEN);
|
|
}
|
|
else
|
|
s->clen = V_STR(S_CMNT_LEN, S_CMNT_SD, s->comment);
|
|
|
|
return (0);
|
|
}
|
|
|
|
struct
|
|
{
|
|
char *mdes;
|
|
long days;
|
|
long dcnt;
|
|
} months[] =
|
|
|
|
{
|
|
{
|
|
NULL, 0, 0
|
|
},
|
|
{
|
|
"JAN", 31, 31
|
|
},
|
|
{
|
|
"FEB", 28, 59
|
|
},
|
|
{
|
|
"MAR", 31, 90
|
|
},
|
|
{
|
|
"APR", 30, 120
|
|
},
|
|
{
|
|
"MAY", 31, 151
|
|
},
|
|
{
|
|
"JUN", 30, 181
|
|
},
|
|
{
|
|
"JUL", 31, 212
|
|
},
|
|
{
|
|
"AUG", 31, 243
|
|
},
|
|
{
|
|
"SEP", 30, 273
|
|
},
|
|
{
|
|
"OCT", 31, 304
|
|
},
|
|
{
|
|
"NOV", 30, 334
|
|
},
|
|
{
|
|
"DEC", 31, 365
|
|
}
|
|
};
|
|
|
|
long
|
|
mk_time(long index, dss_time_t *t)
|
|
{
|
|
long m = 0;
|
|
long y;
|
|
long d;
|
|
|
|
t->timekey = index + JDAY_BASE;
|
|
y = julian(index + STARTDATE - 1) / 1000;
|
|
d = julian(index + STARTDATE - 1) % 1000;
|
|
while (d > months[m].dcnt + LEAP_ADJ(y, m))
|
|
m++;
|
|
PR_DATE(t->alpha, y, m,
|
|
d - months[m - 1].dcnt - ((LEAP(y) && m > 2) ? 1 : 0));
|
|
t->year = 1900 + y;
|
|
t->month = m + 12 * y + JMNTH_BASE;
|
|
t->week = (d + T_START_DAY - 1) / 7 + 1;
|
|
t->day = d - months[m - 1].dcnt - LEAP_ADJ(y, m-1);
|
|
|
|
return (0);
|
|
}
|
|
|
|
int
|
|
mk_nation(long index, code_t *c)
|
|
{
|
|
c->code = index - 1;
|
|
c->text = nations.list[index - 1].text;
|
|
c->join = nations.list[index - 1].weight;
|
|
c->clen = V_STR(N_CMNT_LEN, N_CMNT_SD, c->comment);
|
|
return(0);
|
|
}
|
|
|
|
int
|
|
mk_region(long index, code_t *c)
|
|
{
|
|
|
|
c->code = index - 1;
|
|
c->text = regions.list[index - 1].text;
|
|
c->join = 0; /* for completeness */
|
|
c->clen = V_STR(R_CMNT_LEN, R_CMNT_SD, c->comment);
|
|
return(0);
|
|
}
|