This is an automated email from the ASF dual-hosted git repository.

englefly pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/doris.git


The following commit(s) were added to refs/heads/master by this push:
     new aae2470ea08 [opt](tools) update tools schema (#41335)
aae2470ea08 is described below

commit aae2470ea08e31238e937450bf21fc51c05d3f51
Author: xzj7019 <131111794+xzj7...@users.noreply.github.com>
AuthorDate: Fri Sep 27 10:04:37 2024 +0800

    [opt](tools) update tools schema (#41335)
    
    optimize tpcds sf1000 schema bucket numbers & remove colocation group
    usage.
    
    Co-authored-by: zhongjian.xzj <zhongjian.xzj@zhongjianxzjdeMacBook-Pro.local>
---
 .../tpcds-tools/ddl/create-tpcds-tables-sf1000.sql | 46 ++++++++++------------
 1 file changed, 20 insertions(+), 26 deletions(-)

diff --git a/tools/tpcds-tools/ddl/create-tpcds-tables-sf1000.sql b/tools/tpcds-tools/ddl/create-tpcds-tables-sf1000.sql
index 6d332d8c548..7e950580553 100644
--- a/tools/tpcds-tools/ddl/create-tpcds-tables-sf1000.sql
+++ b/tools/tpcds-tools/ddl/create-tpcds-tables-sf1000.sql
@@ -27,7 +27,7 @@ CREATE TABLE IF NOT EXISTS customer_demographics (
     cd_dep_college_count integer
 )
 DUPLICATE KEY(cd_demo_sk)
-DISTRIBUTED BY HASH(cd_demo_sk) BUCKETS 12
+DISTRIBUTED BY HASH(cd_demo_sk) BUCKETS 9
 PROPERTIES (
   "replication_num" = "1"
 );
@@ -74,7 +74,7 @@ CREATE TABLE IF NOT EXISTS date_dim (
     d_current_year char(1)
 )
 DUPLICATE KEY(d_date_sk)
-DISTRIBUTED BY HASH(d_date_sk) BUCKETS 12
+DISTRIBUTED BY HASH(d_date_sk) BUCKETS 9
 PROPERTIES (
   "replication_num" = "1"
 );
@@ -213,10 +213,9 @@ PARTITION `p70` VALUES LESS THAN ("2452945"),
 PARTITION `p71` VALUES LESS THAN ("2452975"),
 PARTITION `p72` VALUES LESS THAN (MAXVALUE)
 )
-DISTRIBUTED BY HASH(cs_item_sk, cs_order_number) BUCKETS 32
+DISTRIBUTED BY HASH(cs_item_sk, cs_order_number) BUCKETS 3
 PROPERTIES (
-  "replication_num" = "1",
-  "colocate_with" = "catalog"
+  "replication_num" = "1"
 );
 drop table if exists call_center;
 CREATE TABLE IF NOT EXISTS call_center (
@@ -340,7 +339,7 @@ PARTITION `p70` VALUES LESS THAN ("2452945"),
 PARTITION `p71` VALUES LESS THAN ("2452975"),
 PARTITION `p72` VALUES LESS THAN (MAXVALUE)
 )
-DISTRIBUTED BY HASH(inv_item_sk, inv_warehouse_sk) BUCKETS 32
+DISTRIBUTED BY HASH(inv_item_sk, inv_warehouse_sk) BUCKETS 1
 PROPERTIES (
   "replication_num" = "1"
 );
@@ -450,10 +449,9 @@ PARTITION `p70` VALUES LESS THAN ("2452945"),
 PARTITION `p71` VALUES LESS THAN ("2452975"),
 PARTITION `p72` VALUES LESS THAN (MAXVALUE)
 )
-DISTRIBUTED BY HASH(cr_item_sk, cr_order_number) BUCKETS 32
+DISTRIBUTED BY HASH(cr_item_sk, cr_order_number) BUCKETS 1
 PROPERTIES (
-  "replication_num" = "1",
-  "colocate_with" = "catalog"
+  "replication_num" = "1"
 );
 drop table if exists household_demographics;
 CREATE TABLE IF NOT EXISTS household_demographics (
@@ -464,7 +462,7 @@ CREATE TABLE IF NOT EXISTS household_demographics (
     hd_vehicle_count integer
 )
 DUPLICATE KEY(hd_demo_sk)
-DISTRIBUTED BY HASH(hd_demo_sk) BUCKETS 3
+DISTRIBUTED BY HASH(hd_demo_sk) BUCKETS 1
 PROPERTIES (
   "replication_num" = "1"
 );
@@ -485,7 +483,7 @@ CREATE TABLE IF NOT EXISTS customer_address (
     ca_location_type char(20)
 )
 DUPLICATE KEY(ca_address_sk)
-DISTRIBUTED BY HASH(ca_address_sk) BUCKETS 32
+DISTRIBUTED BY HASH(ca_address_sk) BUCKETS 18
 PROPERTIES (
   "replication_num" = "1"
 );
@@ -543,7 +541,7 @@ CREATE TABLE IF NOT EXISTS item (
     i_product_name char(50)
 )
 DUPLICATE KEY(i_item_sk)
-DISTRIBUTED BY HASH(i_item_sk) BUCKETS 32
+DISTRIBUTED BY HASH(i_item_sk) BUCKETS 9
 PROPERTIES (
   "replication_num" = "1"
 );
@@ -650,10 +648,9 @@ PARTITION `p70` VALUES LESS THAN ("2452945"),
 PARTITION `p71` VALUES LESS THAN ("2452975"),
 PARTITION `p72` VALUES LESS THAN (MAXVALUE)
 )
-DISTRIBUTED BY HASH(wr_item_sk, wr_order_number) BUCKETS 32
+DISTRIBUTED BY HASH(wr_item_sk, wr_order_number) BUCKETS 1
 PROPERTIES (
-  "replication_num" = "1",
-  "colocate_with" = "web"
+  "replication_num" = "1"
 );
 drop table if exists web_site;
 CREATE TABLE IF NOT EXISTS web_site (
@@ -829,10 +826,9 @@ PARTITION `p70` VALUES LESS THAN ("2452945"),
 PARTITION `p71` VALUES LESS THAN ("2452975"),
 PARTITION `p72` VALUES LESS THAN (MAXVALUE)
 )
-DISTRIBUTED BY HASH(ws_item_sk, ws_order_number) BUCKETS 32
+DISTRIBUTED BY HASH(ws_item_sk, ws_order_number) BUCKETS 3
 PROPERTIES (
-  "replication_num" = "1",
-  "colocate_with" = "web"
+  "replication_num" = "1"
 );
 drop table if exists store;
 CREATE TABLE IF NOT EXISTS store (
@@ -885,7 +881,7 @@ CREATE TABLE IF NOT EXISTS time_dim (
     t_meal_time char(20)
 )
 DUPLICATE KEY(t_time_sk)
-DISTRIBUTED BY HASH(t_time_sk) BUCKETS 12
+DISTRIBUTED BY HASH(t_time_sk) BUCKETS 9
 PROPERTIES (
   "replication_num" = "1"
 );
@@ -1010,10 +1006,9 @@ PARTITION `p70` VALUES LESS THAN ("2452945"),
 PARTITION `p71` VALUES LESS THAN ("2452975"),
 PARTITION `p72` VALUES LESS THAN (MAXVALUE)
 )
-DISTRIBUTED BY HASH(sr_item_sk, sr_ticket_number) BUCKETS 32
+DISTRIBUTED BY HASH(sr_item_sk, sr_ticket_number) BUCKETS 1
 PROPERTIES (
-  "replication_num" = "1",
-  "colocate_with" = "store"
+  "replication_num" = "1"
 );
 drop table if exists store_sales;
 CREATE TABLE IF NOT EXISTS store_sales (
@@ -1117,10 +1112,9 @@ PARTITION `p70` VALUES LESS THAN ("2452945"),
 PARTITION `p71` VALUES LESS THAN ("2452975"),
 PARTITION `p72` VALUES LESS THAN (MAXVALUE)
 )
-DISTRIBUTED BY HASH(ss_item_sk, ss_ticket_number) BUCKETS 32
+DISTRIBUTED BY HASH(ss_item_sk, ss_ticket_number) BUCKETS 3
 PROPERTIES (
-  "replication_num" = "1",
-  "colocate_with" = "store"
+  "replication_num" = "1"
 );
 drop table if exists ship_mode;
 CREATE TABLE IF NOT EXISTS ship_mode (
@@ -1158,7 +1152,7 @@ CREATE TABLE IF NOT EXISTS customer (
     c_last_review_date_sk integer
 )
 DUPLICATE KEY(c_customer_sk)
-DISTRIBUTED BY HASH(c_customer_id) BUCKETS 24
+DISTRIBUTED BY HASH(c_customer_id) BUCKETS 18
 PROPERTIES (
   "replication_num" = "1"
 );


---------------------------------------------------------------------
To unsubscribe, e-mail: commits-unsubscr...@doris.apache.org
For additional commands, e-mail: commits-h...@doris.apache.org

Reply via email to