-
Notifications
You must be signed in to change notification settings - Fork 42
/
Copy path300-PopulateSnowflake.sh
executable file
·531 lines (504 loc) · 22.6 KB
/
300-PopulateSnowflake.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
set -e
export LOCATION=gcs://fivetran-benchmark/tpcds_1000_dat
cat <<EOF
drop database if exists tpcds;
create database tpcds;
use tpcds;
create table call_center(
cc_call_center_sk bigint
, cc_call_center_id varchar
, cc_rec_start_date varchar
, cc_rec_end_date varchar
, cc_closed_date_sk bigint
, cc_open_date_sk bigint
, cc_name varchar
, cc_class varchar
, cc_employees int
, cc_sq_ft int
, cc_hours varchar
, cc_manager varchar
, cc_mkt_id int
, cc_mkt_class varchar
, cc_mkt_desc varchar
, cc_market_manager varchar
, cc_division int
, cc_division_name varchar
, cc_company int
, cc_company_name varchar
, cc_street_number varchar
, cc_street_name varchar
, cc_street_type varchar
, cc_suite_number varchar
, cc_city varchar
, cc_county varchar
, cc_state varchar
, cc_zip varchar
, cc_country varchar
, cc_gmt_offset double precision
, cc_tax_percentage double precision
);
create table catalog_page(
cp_catalog_page_sk bigint
, cp_catalog_page_id varchar
, cp_start_date_sk bigint
, cp_end_date_sk bigint
, cp_department varchar
, cp_catalog_number int
, cp_catalog_page_number int
, cp_description varchar
, cp_type varchar
);
create table catalog_returns(
cr_returned_date_sk bigint,
cr_returned_time_sk bigint,
cr_item_sk bigint,
cr_refunded_customer_sk bigint,
cr_refunded_cdemo_sk bigint,
cr_refunded_hdemo_sk bigint,
cr_refunded_addr_sk bigint,
cr_returning_customer_sk bigint,
cr_returning_cdemo_sk bigint,
cr_returning_hdemo_sk bigint,
cr_returning_addr_sk bigint,
cr_call_center_sk bigint,
cr_catalog_page_sk bigint,
cr_ship_mode_sk bigint,
cr_warehouse_sk bigint,
cr_reason_sk bigint,
cr_order_number bigint,
cr_return_quantity int,
cr_return_amount double precision,
cr_return_tax double precision,
cr_return_amt_inc_tax double precision,
cr_fee double precision,
cr_return_ship_cost double precision,
cr_refunded_cash double precision,
cr_reversed_charge double precision,
cr_store_credit double precision,
cr_net_loss double precision
);
create table catalog_sales (
cs_sold_date_sk bigint,
cs_sold_time_sk bigint,
cs_ship_date_sk bigint,
cs_bill_customer_sk bigint,
cs_bill_cdemo_sk bigint,
cs_bill_hdemo_sk bigint,
cs_bill_addr_sk bigint,
cs_ship_customer_sk bigint,
cs_ship_cdemo_sk bigint,
cs_ship_hdemo_sk bigint,
cs_ship_addr_sk bigint,
cs_call_center_sk bigint,
cs_catalog_page_sk bigint,
cs_ship_mode_sk bigint,
cs_warehouse_sk bigint,
cs_item_sk bigint,
cs_promo_sk bigint,
cs_order_number bigint,
cs_quantity int,
cs_wholesale_cost double precision,
cs_list_price double precision,
cs_sales_price double precision,
cs_ext_discount_amt double precision,
cs_ext_sales_price double precision,
cs_ext_wholesale_cost double precision,
cs_ext_list_price double precision,
cs_ext_tax double precision,
cs_coupon_amt double precision,
cs_ext_ship_cost double precision,
cs_net_paid double precision,
cs_net_paid_inc_tax double precision,
cs_net_paid_inc_ship double precision,
cs_net_paid_inc_ship_tax double precision,
cs_net_profit double precision
);
create table customer_address (
ca_address_sk bigint,
ca_address_id varchar,
ca_street_number varchar,
ca_street_name varchar,
ca_street_type varchar,
ca_suite_number varchar,
ca_city varchar,
ca_county varchar,
ca_state varchar,
ca_zip varchar,
ca_country varchar,
ca_gmt_offset double precision,
ca_location_type varchar
);
create table customer_demographics (
cd_demo_sk bigint,
cd_gender varchar,
cd_marital_status varchar,
cd_education_status varchar,
cd_purchase_estimate int,
cd_credit_rating varchar,
cd_dep_count int,
cd_dep_employed_count int,
cd_dep_college_count int
);
create table customer (
c_customer_sk bigint,
c_customer_id varchar,
c_current_cdemo_sk bigint,
c_current_hdemo_sk bigint,
c_current_addr_sk bigint,
c_first_shipto_date_sk bigint,
c_first_sales_date_sk bigint,
c_salutation varchar,
c_first_name varchar,
c_last_name varchar,
c_preferred_cust_flag varchar,
c_birth_day int,
c_birth_month int,
c_birth_year int,
c_birth_country varchar,
c_login varchar,
c_email_address varchar,
c_last_review_date varchar
);
create table date_dim (
d_date_sk bigint,
d_date_id varchar,
d_date varchar,
d_month_seq int,
d_week_seq int,
d_quarter_seq int,
d_year int,
d_dow int,
d_moy int,
d_dom int,
d_qoy int,
d_fy_year int,
d_fy_quarter_seq int,
d_fy_week_seq int,
d_day_name varchar,
d_quarter_name varchar,
d_holiday varchar,
d_weekend varchar,
d_following_holiday varchar,
d_first_dom int,
d_last_dom int,
d_same_day_ly int,
d_same_day_lq int,
d_current_day varchar,
d_current_week varchar,
d_current_month varchar,
d_current_quarter varchar,
d_current_year varchar
);
create table household_demographics (
hd_demo_sk bigint,
hd_income_band_sk bigint,
hd_buy_potential varchar,
hd_dep_count int,
hd_vehicle_count int
);
create table income_band(
ib_income_band_sk bigint
, ib_lower_bound int
, ib_upper_bound int
);
create table inventory (
inv_date_sk bigint,
inv_item_sk bigint,
inv_warehouse_sk bigint,
inv_quantity_on_hand int
);
create table item (
i_item_sk bigint,
i_item_id varchar,
i_rec_start_date varchar,
i_rec_end_date varchar,
i_item_desc varchar,
i_current_price double precision,
i_wholesale_cost double precision,
i_brand_id int,
i_brand varchar,
i_class_id int,
i_class varchar,
i_category_id int,
i_category varchar,
i_manufact_id int,
i_manufact varchar,
i_size varchar,
i_formulation varchar,
i_color varchar,
i_units varchar,
i_container varchar,
i_manager_id int,
i_product_name varchar
);
create table promotion (
p_promo_sk bigint,
p_promo_id varchar,
p_start_date_sk bigint,
p_end_date_sk bigint,
p_item_sk bigint,
p_cost double precision,
p_response_target int,
p_promo_name varchar,
p_channel_dmail varchar,
p_channel_email varchar,
p_channel_catalog varchar,
p_channel_tv varchar,
p_channel_radio varchar,
p_channel_press varchar,
p_channel_event varchar,
p_channel_demo varchar,
p_channel_details varchar,
p_purpose varchar,
p_discount_active varchar
);
create table reason(
r_reason_sk bigint
, r_reason_id varchar
, r_reason_desc varchar
);
create table ship_mode(
sm_ship_mode_sk bigint
, sm_ship_mode_id varchar
, sm_type varchar
, sm_code varchar
, sm_carrier varchar
, sm_contract varchar
);
create table store_returns (
sr_returned_date_sk bigint,
sr_return_time_sk bigint,
sr_item_sk bigint,
sr_customer_sk bigint,
sr_cdemo_sk bigint,
sr_hdemo_sk bigint,
sr_addr_sk bigint,
sr_store_sk bigint,
sr_reason_sk bigint,
sr_ticket_number bigint,
sr_return_quantity int,
sr_return_amt double precision,
sr_return_tax double precision,
sr_return_amt_inc_tax double precision,
sr_fee double precision,
sr_return_ship_cost double precision,
sr_refunded_cash double precision,
sr_reversed_charge double precision,
sr_store_credit double precision,
sr_net_loss double precision
);
create table store_sales (
ss_sold_date_sk bigint,
ss_sold_time_sk bigint,
ss_item_sk bigint,
ss_customer_sk bigint,
ss_cdemo_sk bigint,
ss_hdemo_sk bigint,
ss_addr_sk bigint,
ss_store_sk bigint,
ss_promo_sk bigint,
ss_ticket_number bigint,
ss_quantity int,
ss_wholesale_cost double precision,
ss_list_price double precision,
ss_sales_price double precision,
ss_ext_discount_amt double precision,
ss_ext_sales_price double precision,
ss_ext_wholesale_cost double precision,
ss_ext_list_price double precision,
ss_ext_tax double precision,
ss_coupon_amt double precision,
ss_net_paid double precision,
ss_net_paid_inc_tax double precision,
ss_net_profit double precision
);
create table store (
s_store_sk bigint,
s_store_id varchar,
s_rec_start_date varchar,
s_rec_end_date varchar,
s_closed_date_sk bigint,
s_store_name varchar,
s_number_employees int,
s_floor_space int,
s_hours varchar,
s_manager varchar,
s_market_id int,
s_geography_class varchar,
s_market_desc varchar,
s_market_manager varchar,
s_division_id int,
s_division_name varchar,
s_company_id int,
s_company_name varchar,
s_street_number varchar,
s_street_name varchar,
s_street_type varchar,
s_suite_number varchar,
s_city varchar,
s_county varchar,
s_state varchar,
s_zip varchar,
s_country varchar,
s_gmt_offset double precision,
s_tax_precentage double precision
);
create table time_dim (
t_time_sk bigint,
t_time_id varchar,
t_time int,
t_hour int,
t_minute int,
t_second int,
t_am_pm varchar,
t_shift varchar,
t_sub_shift varchar,
t_meal_time varchar
);
create table warehouse(
w_warehouse_sk bigint
, w_warehouse_id varchar
, w_warehouse_name varchar
, w_warehouse_sq_ft int
, w_street_number varchar
, w_street_name varchar
, w_street_type varchar
, w_suite_number varchar
, w_city varchar
, w_county varchar
, w_state varchar
, w_zip varchar
, w_country varchar
, w_gmt_offset double precision
);
create table web_page(
wp_web_page_sk bigint
, wp_web_page_id varchar
, wp_rec_start_date varchar
, wp_rec_end_date varchar
, wp_creation_date_sk bigint
, wp_access_date_sk bigint
, wp_autogen_flag varchar
, wp_customer_sk bigint
, wp_url varchar
, wp_type varchar
, wp_char_count int
, wp_link_count int
, wp_image_count int
, wp_max_ad_count int
);
create table web_returns (
wr_returned_date_sk bigint,
wr_returned_time_sk bigint,
wr_item_sk bigint,
wr_refunded_customer_sk bigint,
wr_refunded_cdemo_sk bigint,
wr_refunded_hdemo_sk bigint,
wr_refunded_addr_sk bigint,
wr_returning_customer_sk bigint,
wr_returning_cdemo_sk bigint,
wr_returning_hdemo_sk bigint,
wr_returning_addr_sk bigint,
wr_web_page_sk bigint,
wr_reason_sk bigint,
wr_order_number bigint,
wr_return_quantity int,
wr_return_amt double precision,
wr_return_tax double precision,
wr_return_amt_inc_tax double precision,
wr_fee double precision,
wr_return_ship_cost double precision,
wr_refunded_cash double precision,
wr_reversed_charge double precision,
wr_account_credit double precision,
wr_net_loss double precision
);
create table web_sales (
ws_sold_date_sk bigint,
ws_sold_time_sk bigint,
ws_ship_date_sk bigint,
ws_item_sk bigint,
ws_bill_customer_sk bigint,
ws_bill_cdemo_sk bigint,
ws_bill_hdemo_sk bigint,
ws_bill_addr_sk bigint,
ws_ship_customer_sk bigint,
ws_ship_cdemo_sk bigint,
ws_ship_hdemo_sk bigint,
ws_ship_addr_sk bigint,
ws_web_page_sk bigint,
ws_web_site_sk bigint,
ws_ship_mode_sk bigint,
ws_warehouse_sk bigint,
ws_promo_sk bigint,
ws_order_number bigint,
ws_quantity int,
ws_wholesale_cost double precision,
ws_list_price double precision,
ws_sales_price double precision,
ws_ext_discount_amt double precision,
ws_ext_sales_price double precision,
ws_ext_wholesale_cost double precision,
ws_ext_list_price double precision,
ws_ext_tax double precision,
ws_coupon_amt double precision,
ws_ext_ship_cost double precision,
ws_net_paid double precision,
ws_net_paid_inc_tax double precision,
ws_net_paid_inc_ship double precision,
ws_net_paid_inc_ship_tax double precision,
ws_net_profit double precision
);
create table web_site (
web_site_sk bigint,
web_site_id varchar,
web_rec_start_date varchar,
web_rec_end_date varchar,
web_name varchar,
web_open_date_sk bigint,
web_close_date_sk bigint,
web_class varchar,
web_manager varchar,
web_mkt_id int,
web_mkt_class varchar,
web_mkt_desc varchar,
web_market_manager varchar,
web_company_id int,
web_company_name varchar,
web_street_number varchar,
web_street_name varchar,
web_street_type varchar,
web_suite_number varchar,
web_city varchar,
web_county varchar,
web_state varchar,
web_zip varchar,
web_country varchar,
web_gmt_offset double precision,
web_tax_percentage double precision
);
copy into call_center from '${LOCATION}/call_center/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into catalog_page from '${LOCATION}/catalog_page/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into catalog_returns from '${LOCATION}/catalog_returns/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into catalog_sales from '${LOCATION}/catalog_sales/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into customer from '${LOCATION}/customer/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into customer_address from '${LOCATION}/customer_address/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into customer_demographics from '${LOCATION}/customer_demographics/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into date_dim from '${LOCATION}/date_dim/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into household_demographics from '${LOCATION}/household_demographics/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into income_band from '${LOCATION}/income_band/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into inventory from '${LOCATION}/inventory/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into item from '${LOCATION}/item/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into promotion from '${LOCATION}/promotion/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into reason from '${LOCATION}/reason/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into ship_mode from '${LOCATION}/ship_mode/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into store from '${LOCATION}/store/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into store_returns from '${LOCATION}/store_returns/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into store_sales from '${LOCATION}/store_sales/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into time_dim from '${LOCATION}/time_dim/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into warehouse from '${LOCATION}/warehouse/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into web_page from '${LOCATION}/web_page/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into web_returns from '${LOCATION}/web_returns/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into web_sales from '${LOCATION}/web_sales/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
copy into web_site from '${LOCATION}/web_site/' file_format = (type = csv field_delimiter='|' error_on_column_count_mismatch=false VALIDATE_UTF8=false );
EOF