Skip to content

Commit

Permalink
[opt](tools) update tools schema (#41335)
Browse files Browse the repository at this point in the history
Optimize the bucket numbers in the TPC-DS SF1000 schema and remove the use of
colocation groups.

Co-authored-by: zhongjian.xzj <[email protected]>
  • Loading branch information
2 people authored and dataroaring committed Oct 5, 2024
1 parent af8bc63 commit 3107130
Showing 1 changed file with 20 additions and 26 deletions.
46 changes: 20 additions & 26 deletions tools/tpcds-tools/ddl/create-tpcds-tables-sf1000.sql
Original file line number Diff line number Diff line change
Expand Up @@ -27,7 +27,7 @@ CREATE TABLE IF NOT EXISTS customer_demographics (
cd_dep_college_count integer
)
DUPLICATE KEY(cd_demo_sk)
-DISTRIBUTED BY HASH(cd_demo_sk) BUCKETS 12
+DISTRIBUTED BY HASH(cd_demo_sk) BUCKETS 9
PROPERTIES (
"replication_num" = "1"
);
Expand Down Expand Up @@ -74,7 +74,7 @@ CREATE TABLE IF NOT EXISTS date_dim (
d_current_year char(1)
)
DUPLICATE KEY(d_date_sk)
-DISTRIBUTED BY HASH(d_date_sk) BUCKETS 12
+DISTRIBUTED BY HASH(d_date_sk) BUCKETS 9
PROPERTIES (
"replication_num" = "1"
);
Expand Down Expand Up @@ -213,10 +213,9 @@ PARTITION `p70` VALUES LESS THAN ("2452945"),
PARTITION `p71` VALUES LESS THAN ("2452975"),
PARTITION `p72` VALUES LESS THAN (MAXVALUE)
)
-DISTRIBUTED BY HASH(cs_item_sk, cs_order_number) BUCKETS 32
+DISTRIBUTED BY HASH(cs_item_sk, cs_order_number) BUCKETS 3
PROPERTIES (
-"replication_num" = "1",
-"colocate_with" = "catalog"
+"replication_num" = "1"
);
drop table if exists call_center;
CREATE TABLE IF NOT EXISTS call_center (
Expand Down Expand Up @@ -340,7 +339,7 @@ PARTITION `p70` VALUES LESS THAN ("2452945"),
PARTITION `p71` VALUES LESS THAN ("2452975"),
PARTITION `p72` VALUES LESS THAN (MAXVALUE)
)
-DISTRIBUTED BY HASH(inv_item_sk, inv_warehouse_sk) BUCKETS 32
+DISTRIBUTED BY HASH(inv_item_sk, inv_warehouse_sk) BUCKETS 1
PROPERTIES (
"replication_num" = "1"
);
Expand Down Expand Up @@ -450,10 +449,9 @@ PARTITION `p70` VALUES LESS THAN ("2452945"),
PARTITION `p71` VALUES LESS THAN ("2452975"),
PARTITION `p72` VALUES LESS THAN (MAXVALUE)
)
-DISTRIBUTED BY HASH(cr_item_sk, cr_order_number) BUCKETS 32
+DISTRIBUTED BY HASH(cr_item_sk, cr_order_number) BUCKETS 1
PROPERTIES (
-"replication_num" = "1",
-"colocate_with" = "catalog"
+"replication_num" = "1"
);
drop table if exists household_demographics;
CREATE TABLE IF NOT EXISTS household_demographics (
Expand All @@ -464,7 +462,7 @@ CREATE TABLE IF NOT EXISTS household_demographics (
hd_vehicle_count integer
)
DUPLICATE KEY(hd_demo_sk)
-DISTRIBUTED BY HASH(hd_demo_sk) BUCKETS 3
+DISTRIBUTED BY HASH(hd_demo_sk) BUCKETS 1
PROPERTIES (
"replication_num" = "1"
);
Expand All @@ -485,7 +483,7 @@ CREATE TABLE IF NOT EXISTS customer_address (
ca_location_type char(20)
)
DUPLICATE KEY(ca_address_sk)
-DISTRIBUTED BY HASH(ca_address_sk) BUCKETS 32
+DISTRIBUTED BY HASH(ca_address_sk) BUCKETS 18
PROPERTIES (
"replication_num" = "1"
);
Expand Down Expand Up @@ -543,7 +541,7 @@ CREATE TABLE IF NOT EXISTS item (
i_product_name char(50)
)
DUPLICATE KEY(i_item_sk)
-DISTRIBUTED BY HASH(i_item_sk) BUCKETS 32
+DISTRIBUTED BY HASH(i_item_sk) BUCKETS 9
PROPERTIES (
"replication_num" = "1"
);
Expand Down Expand Up @@ -650,10 +648,9 @@ PARTITION `p70` VALUES LESS THAN ("2452945"),
PARTITION `p71` VALUES LESS THAN ("2452975"),
PARTITION `p72` VALUES LESS THAN (MAXVALUE)
)
-DISTRIBUTED BY HASH(wr_item_sk, wr_order_number) BUCKETS 32
+DISTRIBUTED BY HASH(wr_item_sk, wr_order_number) BUCKETS 1
PROPERTIES (
-"replication_num" = "1",
-"colocate_with" = "web"
+"replication_num" = "1"
);
drop table if exists web_site;
CREATE TABLE IF NOT EXISTS web_site (
Expand Down Expand Up @@ -829,10 +826,9 @@ PARTITION `p70` VALUES LESS THAN ("2452945"),
PARTITION `p71` VALUES LESS THAN ("2452975"),
PARTITION `p72` VALUES LESS THAN (MAXVALUE)
)
-DISTRIBUTED BY HASH(ws_item_sk, ws_order_number) BUCKETS 32
+DISTRIBUTED BY HASH(ws_item_sk, ws_order_number) BUCKETS 3
PROPERTIES (
-"replication_num" = "1",
-"colocate_with" = "web"
+"replication_num" = "1"
);
drop table if exists store;
CREATE TABLE IF NOT EXISTS store (
Expand Down Expand Up @@ -885,7 +881,7 @@ CREATE TABLE IF NOT EXISTS time_dim (
t_meal_time char(20)
)
DUPLICATE KEY(t_time_sk)
-DISTRIBUTED BY HASH(t_time_sk) BUCKETS 12
+DISTRIBUTED BY HASH(t_time_sk) BUCKETS 9
PROPERTIES (
"replication_num" = "1"
);
Expand Down Expand Up @@ -1010,10 +1006,9 @@ PARTITION `p70` VALUES LESS THAN ("2452945"),
PARTITION `p71` VALUES LESS THAN ("2452975"),
PARTITION `p72` VALUES LESS THAN (MAXVALUE)
)
-DISTRIBUTED BY HASH(sr_item_sk, sr_ticket_number) BUCKETS 32
+DISTRIBUTED BY HASH(sr_item_sk, sr_ticket_number) BUCKETS 1
PROPERTIES (
-"replication_num" = "1",
-"colocate_with" = "store"
+"replication_num" = "1"
);
drop table if exists store_sales;
CREATE TABLE IF NOT EXISTS store_sales (
Expand Down Expand Up @@ -1117,10 +1112,9 @@ PARTITION `p70` VALUES LESS THAN ("2452945"),
PARTITION `p71` VALUES LESS THAN ("2452975"),
PARTITION `p72` VALUES LESS THAN (MAXVALUE)
)
-DISTRIBUTED BY HASH(ss_item_sk, ss_ticket_number) BUCKETS 32
+DISTRIBUTED BY HASH(ss_item_sk, ss_ticket_number) BUCKETS 3
PROPERTIES (
-"replication_num" = "1",
-"colocate_with" = "store"
+"replication_num" = "1"
);
drop table if exists ship_mode;
CREATE TABLE IF NOT EXISTS ship_mode (
Expand Down Expand Up @@ -1158,7 +1152,7 @@ CREATE TABLE IF NOT EXISTS customer (
c_last_review_date_sk integer
)
DUPLICATE KEY(c_customer_sk)
-DISTRIBUTED BY HASH(c_customer_id) BUCKETS 24
+DISTRIBUTED BY HASH(c_customer_id) BUCKETS 18
PROPERTIES (
"replication_num" = "1"
);
Expand Down

0 comments on commit 3107130

Please sign in to comment.