http://git-wip-us.apache.org/repos/asf/hive/blob/e986fc56/ql/src/test/results/clientpositive/perf/tez/constraints/query72.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/tez/constraints/query72.q.out b/ql/src/test/results/clientpositive/perf/tez/constraints/query72.q.out index fe82eda..1a9c2cf 100644 --- a/ql/src/test/results/clientpositive/perf/tez/constraints/query72.q.out +++ b/ql/src/test/results/clientpositive/perf/tez/constraints/query72.q.out @@ -81,36 +81,34 @@ POSTHOOK: Output: hdfs://### HDFS PATH ### Plan optimized by CBO. Vertex dependency in root stage -Map 1 <- Reducer 14 (BROADCAST_EDGE), Reducer 16 (BROADCAST_EDGE), Reducer 19 (BROADCAST_EDGE) -Reducer 10 <- Map 26 (SIMPLE_EDGE), Reducer 9 (SIMPLE_EDGE) +Map 1 <- Reducer 17 (BROADCAST_EDGE) +Reducer 10 <- Map 24 (SIMPLE_EDGE), Reducer 9 (SIMPLE_EDGE) Reducer 11 <- Reducer 10 (SIMPLE_EDGE) Reducer 12 <- Reducer 11 (SIMPLE_EDGE) -Reducer 14 <- Map 13 (CUSTOM_SIMPLE_EDGE) -Reducer 16 <- Map 15 (CUSTOM_SIMPLE_EDGE) -Reducer 18 <- Map 17 (SIMPLE_EDGE), Map 20 (SIMPLE_EDGE) -Reducer 19 <- Reducer 18 (CUSTOM_SIMPLE_EDGE) +Reducer 16 <- Map 15 (SIMPLE_EDGE), Map 18 (SIMPLE_EDGE) +Reducer 17 <- Reducer 16 (CUSTOM_SIMPLE_EDGE) Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 13 (SIMPLE_EDGE) -Reducer 3 <- Map 15 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) -Reducer 4 <- Reducer 18 (SIMPLE_EDGE), Reducer 3 (SIMPLE_EDGE) -Reducer 5 <- Map 21 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE) -Reducer 6 <- Map 22 (SIMPLE_EDGE), Reducer 5 (SIMPLE_EDGE) -Reducer 7 <- Map 23 (SIMPLE_EDGE), Reducer 6 (SIMPLE_EDGE) -Reducer 8 <- Map 24 (SIMPLE_EDGE), Reducer 7 (SIMPLE_EDGE) -Reducer 9 <- Map 25 (SIMPLE_EDGE), Reducer 8 (SIMPLE_EDGE) +Reducer 3 <- Map 14 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) +Reducer 4 <- Reducer 16 (SIMPLE_EDGE), Reducer 3 (SIMPLE_EDGE) +Reducer 5 <- Map 19 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE) +Reducer 6 <- Map 20 (SIMPLE_EDGE), Reducer 5 (SIMPLE_EDGE) +Reducer 7 <- Map 21 (SIMPLE_EDGE), Reducer 6 (SIMPLE_EDGE) +Reducer 8 <- Map 22 (SIMPLE_EDGE), Reducer 7 (SIMPLE_EDGE) +Reducer 9 <- Map 23 (SIMPLE_EDGE), Reducer 8 (SIMPLE_EDGE) Stage-0 Fetch Operator limit:100 Stage-1 Reducer 12 vectorized - File Output Operator [FS_287] - Limit [LIM_286] (rows=100 width=312) + File Output Operator [FS_277] + Limit [LIM_276] (rows=100 width=312) Number of rows:100 - Select Operator [SEL_285] (rows=193558220 width=312) + Select Operator [SEL_275] (rows=193558220 width=312) Output:["_col0","_col1","_col2","_col3","_col4","_col5"] <-Reducer 11 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_284] - Group By Operator [GBY_283] (rows=193558220 width=312) + SHUFFLE [RS_274] + Group By Operator [GBY_273] (rows=193558220 width=312) Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["count(VALUE._col0)","count(VALUE._col1)","count(VALUE._col2)"],keys:KEY._col0, KEY._col1, KEY._col2 <-Reducer 10 [SIMPLE_EDGE] SHUFFLE [RS_64] @@ -120,11 +118,11 @@ Stage-0 Select Operator [SEL_61] (rows=499184560 width=292) Output:["_col0","_col1","_col2","_col3","_col4"] Merge Join Operator [MERGEJOIN_243] (rows=499184560 width=292) - Conds:RS_58._col4, _col6=RS_282._col0, _col1(Left Outer),Output:["_col13","_col15","_col19","_col25"] - <-Map 26 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_282] + Conds:RS_58._col4, _col6=RS_272._col0, _col1(Left Outer),Output:["_col13","_col15","_col19","_col25"] + <-Map 24 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_272] PartitionCols:_col0, _col1 - Select Operator [SEL_281] (rows=28798881 width=8) + Select Operator [SEL_271] (rows=28798881 width=8) Output:["_col0","_col1"] TableScan [TS_56] (rows=28798881 width=8) default@catalog_returns,catalog_returns,Tbl:COMPLETE,Col:COMPLETE,Output:["cr_item_sk","cr_order_number"] @@ -134,11 +132,11 @@ Stage-0 Select Operator [SEL_55] (rows=193558220 width=300) Output:["_col4","_col6","_col13","_col15","_col19","_col25"] Merge Join Operator [MERGEJOIN_242] (rows=193558220 width=300) - Conds:RS_52._col5=RS_280._col0(Left Outer),Output:["_col4","_col6","_col13","_col20","_col24","_col25"] - <-Map 25 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_280] + Conds:RS_52._col5=RS_270._col0(Left Outer),Output:["_col4","_col6","_col13","_col20","_col24","_col25"] + <-Map 23 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_270] PartitionCols:_col0 - Select Operator [SEL_279] (rows=2300 width=4) + Select Operator [SEL_269] (rows=2300 width=4) Output:["_col0"] TableScan [TS_27] (rows=2300 width=4) default@promotion,promotion,Tbl:COMPLETE,Col:COMPLETE,Output:["p_promo_sk"] @@ -146,11 +144,11 @@ Stage-0 SHUFFLE [RS_52] PartitionCols:_col5 Merge Join Operator [MERGEJOIN_241] (rows=193558220 width=299) - Conds:RS_49._col4=RS_278._col0(Inner),Output:["_col4","_col5","_col6","_col13","_col20","_col24"] - <-Map 24 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_278] + Conds:RS_49._col4=RS_268._col0(Inner),Output:["_col4","_col5","_col6","_col13","_col20","_col24"] + <-Map 22 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_268] PartitionCols:_col0 - Select Operator [SEL_277] (rows=462000 width=188) + Select Operator [SEL_267] (rows=462000 width=188) Output:["_col0","_col1"] TableScan [TS_25] (rows=462000 width=188) default@item,item,Tbl:COMPLETE,Col:COMPLETE,Output:["i_item_sk","i_item_desc"] @@ -160,11 +158,11 @@ Stage-0 Filter Operator [FIL_48] (rows=193558220 width=131) predicate:(_col22 > _col14) Merge Join Operator [MERGEJOIN_240] (rows=580674662 width=131) - Conds:RS_45._col1=RS_276._col0(Inner),Output:["_col4","_col5","_col6","_col13","_col14","_col20","_col22"] - <-Map 23 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_276] + Conds:RS_45._col1=RS_266._col0(Inner),Output:["_col4","_col5","_col6","_col13","_col14","_col20","_col22"] + <-Map 21 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_266] PartitionCols:_col0 - Select Operator [SEL_275] (rows=73049 width=12) + Select Operator [SEL_265] (rows=73049 width=12) Output:["_col0","_col1"] TableScan [TS_23] (rows=73049 width=98) default@date_dim,d3,Tbl:COMPLETE,Col:COMPLETE,Output:["d_date_sk","d_date"] @@ -172,11 +170,11 @@ Stage-0 SHUFFLE [RS_45] PartitionCols:_col1 Merge Join Operator [MERGEJOIN_239] (rows=580674662 width=127) - Conds:RS_42._col17=RS_274._col0(Inner),Output:["_col1","_col4","_col5","_col6","_col13","_col14","_col20"] - <-Map 22 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_274] + Conds:RS_42._col17=RS_264._col0(Inner),Output:["_col1","_col4","_col5","_col6","_col13","_col14","_col20"] + <-Map 20 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_264] PartitionCols:_col0 - Select Operator [SEL_273] (rows=27 width=104) + Select Operator [SEL_263] (rows=27 width=104) Output:["_col0","_col1"] TableScan [TS_21] (rows=27 width=104) default@warehouse,warehouse,Tbl:COMPLETE,Col:COMPLETE,Output:["w_warehouse_sk","w_warehouse_name"] @@ -186,11 +184,11 @@ Stage-0 Filter Operator [FIL_41] (rows=580674662 width=39) predicate:(_col18 < _col7) Merge Join Operator [MERGEJOIN_238] (rows=1742023986 width=39) - Conds:RS_38._col10, _col4=RS_272._col0, _col1(Inner),Output:["_col1","_col4","_col5","_col6","_col7","_col13","_col14","_col17","_col18"] - <-Map 21 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_272] + Conds:RS_38._col10, _col4=RS_262._col0, _col1(Inner),Output:["_col1","_col4","_col5","_col6","_col7","_col13","_col14","_col17","_col18"] + <-Map 19 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_262] PartitionCols:_col0, _col1 - Select Operator [SEL_271] (rows=37584000 width=15) + Select Operator [SEL_261] (rows=37584000 width=15) Output:["_col0","_col1","_col2","_col3"] TableScan [TS_19] (rows=37584000 width=15) default@inventory,inventory,Tbl:COMPLETE,Col:COMPLETE,Output:["inv_date_sk","inv_item_sk","inv_warehouse_sk","inv_quantity_on_hand"] @@ -199,26 +197,26 @@ Stage-0 PartitionCols:_col10, _col4 Merge Join Operator [MERGEJOIN_237] (rows=2899758 width=30) Conds:RS_35._col0=RS_36._col2(Inner),Output:["_col1","_col4","_col5","_col6","_col7","_col10","_col13","_col14"] - <-Reducer 18 [SIMPLE_EDGE] + <-Reducer 16 [SIMPLE_EDGE] SHUFFLE [RS_36] PartitionCols:_col2 Merge Join Operator [MERGEJOIN_236] (rows=3621 width=20) - Conds:RS_262._col1=RS_265._col1(Inner),Output:["_col0","_col2","_col3","_col4"] - <-Map 17 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_262] + Conds:RS_246._col1=RS_249._col1(Inner),Output:["_col0","_col2","_col3","_col4"] + <-Map 15 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_246] PartitionCols:_col1 - Select Operator [SEL_261] (rows=73049 width=8) + Select Operator [SEL_245] (rows=73049 width=8) Output:["_col0","_col1"] - Filter Operator [FIL_260] (rows=73049 width=8) + Filter Operator [FIL_244] (rows=73049 width=8) predicate:d_week_seq is not null TableScan [TS_9] (rows=73049 width=8) default@date_dim,d2,Tbl:COMPLETE,Col:COMPLETE,Output:["d_date_sk","d_week_seq"] - <-Map 20 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_265] + <-Map 18 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_249] PartitionCols:_col1 - Select Operator [SEL_264] (rows=652 width=16) + Select Operator [SEL_248] (rows=652 width=16) Output:["_col0","_col1","_col2"] - Filter Operator [FIL_263] (rows=652 width=106) + Filter Operator [FIL_247] (rows=652 width=106) predicate:((d_year = 2001) and d_week_seq is not null) TableScan [TS_12] (rows=73049 width=106) default@date_dim,d1,Tbl:COMPLETE,Col:COMPLETE,Output:["d_date_sk","d_date","d_week_seq","d_year"] @@ -226,13 +224,13 @@ Stage-0 SHUFFLE [RS_35] PartitionCols:_col0 Merge Join Operator [MERGEJOIN_235] (rows=8179029 width=21) - Conds:RS_32._col3=RS_254._col0(Inner),Output:["_col0","_col1","_col4","_col5","_col6","_col7"] - <-Map 15 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_254] + Conds:RS_32._col3=RS_260._col0(Inner),Output:["_col0","_col1","_col4","_col5","_col6","_col7"] + <-Map 14 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_260] PartitionCols:_col0 - Select Operator [SEL_253] (rows=1440 width=4) + Select Operator [SEL_259] (rows=1440 width=4) Output:["_col0"] - Filter Operator [FIL_252] (rows=1440 width=96) + Filter Operator [FIL_258] (rows=1440 width=96) predicate:(hd_buy_potential = '1001-5000') TableScan [TS_6] (rows=7200 width=96) default@household_demographics,household_demographics,Tbl:COMPLETE,Col:COMPLETE,Output:["hd_demo_sk","hd_buy_potential"] @@ -240,56 +238,34 @@ Stage-0 SHUFFLE [RS_32] PartitionCols:_col3 Merge Join Operator [MERGEJOIN_234] (rows=40895144 width=27) - Conds:RS_270._col2=RS_246._col0(Inner),Output:["_col0","_col1","_col3","_col4","_col5","_col6","_col7"] - <-Map 13 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_246] - PartitionCols:_col0 - Select Operator [SEL_245] (rows=265971 width=4) - Output:["_col0"] - Filter Operator [FIL_244] (rows=265971 width=89) - predicate:(cd_marital_status = 'M') - TableScan [TS_3] (rows=1861800 width=89) - default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:COMPLETE,Output:["cd_demo_sk","cd_marital_status"] + Conds:RS_254._col2=RS_257._col0(Inner),Output:["_col0","_col1","_col3","_col4","_col5","_col6","_col7"] <-Map 1 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_270] + SHUFFLE [RS_254] PartitionCols:_col2 - Select Operator [SEL_269] (rows=282274763 width=31) + Select Operator [SEL_253] (rows=282274763 width=31) Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - Filter Operator [FIL_268] (rows=282274763 width=31) - predicate:((cs_bill_cdemo_sk BETWEEN DynamicValue(RS_30_customer_demographics_cd_demo_sk_min) AND DynamicValue(RS_30_customer_demographics_cd_demo_sk_max) and in_bloom_filter(cs_bill_cdemo_sk, DynamicValue(RS_30_customer_demographics_cd_demo_sk_bloom_filter))) and (cs_bill_hdemo_sk BETWEEN DynamicValue(RS_33_household_demographics_hd_demo_sk_min) AND DynamicValue(RS_33_household_demographics_hd_demo_sk_max) and in_bloom_filter(cs_bill_hdemo_sk, DynamicValue(RS_33_household_demographics_hd_demo_sk_bloom_filter))) and (cs_sold_date_sk BETWEEN DynamicValue(RS_36_d1_d_date_sk_min) AND DynamicValue(RS_36_d1_d_date_sk_max) and in_bloom_filter(cs_sold_date_sk, DynamicValue(RS_36_d1_d_date_sk_bloom_filter))) and cs_bill_cdemo_sk is not null and cs_bill_hdemo_sk is not null and cs_ship_date_sk is not null and cs_sold_date_sk is not null) + Filter Operator [FIL_252] (rows=282274763 width=31) + predicate:((cs_sold_date_sk BETWEEN DynamicValue(RS_36_d1_d_date_sk_min) AND DynamicValue(RS_36_d1_d_date_sk_max) and in_bloom_filter(cs_sold_date_sk, DynamicValue(RS_36_d1_d_date_sk_bloom_filter))) and cs_bill_cdemo_sk is not null and cs_bill_hdemo_sk is not null and cs_ship_date_sk is not null and cs_sold_date_sk is not null) TableScan [TS_0] (rows=287989836 width=31) default@catalog_sales,catalog_sales,Tbl:COMPLETE,Col:COMPLETE,Output:["cs_sold_date_sk","cs_ship_date_sk","cs_bill_cdemo_sk","cs_bill_hdemo_sk","cs_item_sk","cs_promo_sk","cs_order_number","cs_quantity"] - <-Reducer 14 [BROADCAST_EDGE] vectorized + <-Reducer 17 [BROADCAST_EDGE] vectorized BROADCAST [RS_251] Group By Operator [GBY_250] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] - <-Map 13 [CUSTOM_SIMPLE_EDGE] vectorized - SHUFFLE [RS_249] - Group By Operator [GBY_248] (rows=1 width=12) - Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] - Select Operator [SEL_247] (rows=265971 width=4) - Output:["_col0"] - Please refer to the previous Select Operator [SEL_245] - <-Reducer 16 [BROADCAST_EDGE] vectorized - BROADCAST [RS_259] - Group By Operator [GBY_258] (rows=1 width=12) - Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] - <-Map 15 [CUSTOM_SIMPLE_EDGE] vectorized - SHUFFLE [RS_257] - Group By Operator [GBY_256] (rows=1 width=12) - Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] - Select Operator [SEL_255] (rows=1440 width=4) - Output:["_col0"] - Please refer to the previous Select Operator [SEL_253] - <-Reducer 19 [BROADCAST_EDGE] vectorized - BROADCAST [RS_267] - Group By Operator [GBY_266] (rows=1 width=12) - Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] - <-Reducer 18 [CUSTOM_SIMPLE_EDGE] + <-Reducer 16 [CUSTOM_SIMPLE_EDGE] SHUFFLE [RS_138] Group By Operator [GBY_137] (rows=1 width=12) Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] Select Operator [SEL_136] (rows=3621 width=8) Output:["_col0"] Please refer to the previous Merge Join Operator [MERGEJOIN_236] + <-Map 13 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_257] + PartitionCols:_col0 + Select Operator [SEL_256] (rows=265971 width=4) + Output:["_col0"] + Filter Operator [FIL_255] (rows=265971 width=89) + predicate:(cd_marital_status = 'M') + TableScan [TS_3] (rows=1861800 width=89) + default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:COMPLETE,Output:["cd_demo_sk","cd_marital_status"]
http://git-wip-us.apache.org/repos/asf/hive/blob/e986fc56/ql/src/test/results/clientpositive/perf/tez/constraints/query73.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/perf/tez/constraints/query73.q.out b/ql/src/test/results/clientpositive/perf/tez/constraints/query73.q.out index 5334542..52b0c26 100644 --- a/ql/src/test/results/clientpositive/perf/tez/constraints/query73.q.out +++ b/ql/src/test/results/clientpositive/perf/tez/constraints/query73.q.out @@ -67,15 +67,13 @@ POSTHOOK: Output: hdfs://### HDFS PATH ### Plan optimized by CBO. Vertex dependency in root stage -Map 4 <- Reducer 10 (BROADCAST_EDGE), Reducer 12 (BROADCAST_EDGE), Reducer 14 (BROADCAST_EDGE) +Map 4 <- Reducer 10 (BROADCAST_EDGE) Reducer 10 <- Map 9 (CUSTOM_SIMPLE_EDGE) -Reducer 12 <- Map 11 (CUSTOM_SIMPLE_EDGE) -Reducer 14 <- Map 13 (CUSTOM_SIMPLE_EDGE) Reducer 2 <- Map 1 (SIMPLE_EDGE), Reducer 8 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Reducer 5 <- Map 4 (SIMPLE_EDGE), Map 9 (SIMPLE_EDGE) Reducer 6 <- Map 11 (SIMPLE_EDGE), Reducer 5 (SIMPLE_EDGE) -Reducer 7 <- Map 13 (SIMPLE_EDGE), Reducer 6 (SIMPLE_EDGE) +Reducer 7 <- Map 12 (SIMPLE_EDGE), Reducer 6 (SIMPLE_EDGE) Reducer 8 <- Reducer 7 (SIMPLE_EDGE) Stage-0 @@ -83,15 +81,15 @@ Stage-0 limit:-1 Stage-1 Reducer 3 vectorized - File Output Operator [FS_134] - Select Operator [SEL_133] (rows=5 width=364) + File Output Operator [FS_124] + Select Operator [SEL_123] (rows=5 width=364) Output:["_col0","_col1","_col2","_col3","_col4","_col5"] <-Reducer 2 [SIMPLE_EDGE] SHUFFLE [RS_34] Select Operator [SEL_33] (rows=5 width=364) Output:["_col0","_col1","_col2","_col3","_col4","_col5"] Merge Join Operator [MERGEJOIN_99] (rows=5 width=364) - Conds:RS_101._col0=RS_132._col1(Inner),Output:["_col1","_col2","_col3","_col4","_col5","_col7"] + Conds:RS_101._col0=RS_122._col1(Inner),Output:["_col1","_col2","_col3","_col4","_col5","_col7"] <-Map 1 [SIMPLE_EDGE] vectorized SHUFFLE [RS_101] PartitionCols:_col0 @@ -100,13 +98,13 @@ Stage-0 TableScan [TS_0] (rows=80000000 width=356) default@customer,customer,Tbl:COMPLETE,Col:COMPLETE,Output:["c_customer_sk","c_salutation","c_first_name","c_last_name","c_preferred_cust_flag"] <-Reducer 8 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_132] + SHUFFLE [RS_122] PartitionCols:_col1 - Filter Operator [FIL_131] (rows=5 width=12) + Filter Operator [FIL_121] (rows=5 width=12) predicate:_col2 BETWEEN 1 AND 5 - Select Operator [SEL_130] (rows=788766 width=12) + Select Operator [SEL_120] (rows=788766 width=12) Output:["_col0","_col1","_col2"] - Group By Operator [GBY_129] (rows=788766 width=12) + Group By Operator [GBY_119] (rows=788766 width=12) Output:["_col0","_col1","_col2"],aggregations:["count(VALUE._col0)"],keys:KEY._col0, KEY._col1 <-Reducer 7 [SIMPLE_EDGE] SHUFFLE [RS_25] @@ -114,13 +112,13 @@ Stage-0 Group By Operator [GBY_24] (rows=788766 width=12) Output:["_col0","_col1","_col2"],aggregations:["count()"],keys:_col1, _col4 Merge Join Operator [MERGEJOIN_98] (rows=788766 width=4) - Conds:RS_20._col3=RS_120._col0(Inner),Output:["_col1","_col4"] - <-Map 13 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_120] + Conds:RS_20._col3=RS_118._col0(Inner),Output:["_col1","_col4"] + <-Map 12 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_118] PartitionCols:_col0 - Select Operator [SEL_119] (rows=56 width=4) + Select Operator [SEL_117] (rows=56 width=4) Output:["_col0"] - Filter Operator [FIL_118] (rows=56 width=102) + Filter Operator [FIL_116] (rows=56 width=102) predicate:(s_county) IN ('Mobile County', 'Maverick County', 'Huron County', 'Kittitas County') TableScan [TS_11] (rows=1704 width=102) default@store,store,Tbl:COMPLETE,Col:COMPLETE,Output:["s_store_sk","s_county"] @@ -128,13 +126,13 @@ Stage-0 SHUFFLE [RS_20] PartitionCols:_col3 Merge Join Operator [MERGEJOIN_97] (rows=2973700 width=4) - Conds:RS_17._col2=RS_112._col0(Inner),Output:["_col1","_col3","_col4"] + Conds:RS_17._col2=RS_115._col0(Inner),Output:["_col1","_col3","_col4"] <-Map 11 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_112] + SHUFFLE [RS_115] PartitionCols:_col0 - Select Operator [SEL_111] (rows=480 width=4) + Select Operator [SEL_114] (rows=480 width=4) Output:["_col0"] - Filter Operator [FIL_110] (rows=480 width=104) + Filter Operator [FIL_113] (rows=480 width=104) predicate:((hd_buy_potential) IN ('>10000', 'unknown') and (hd_vehicle_count > 0) and CASE WHEN ((hd_vehicle_count > 0)) THEN (((UDFToDouble(hd_dep_count) / UDFToDouble(hd_vehicle_count)) > 1.0D)) ELSE (null) END) TableScan [TS_8] (rows=7200 width=104) default@household_demographics,household_demographics,Tbl:COMPLETE,Col:COMPLETE,Output:["hd_demo_sk","hd_buy_potential","hd_dep_count","hd_vehicle_count"] @@ -142,7 +140,7 @@ Stage-0 SHUFFLE [RS_17] PartitionCols:_col2 Merge Join Operator [MERGEJOIN_96] (rows=44605486 width=10) - Conds:RS_128._col0=RS_104._col0(Inner),Output:["_col1","_col2","_col3","_col4"] + Conds:RS_112._col0=RS_104._col0(Inner),Output:["_col1","_col2","_col3","_col4"] <-Map 9 [SIMPLE_EDGE] vectorized SHUFFLE [RS_104] PartitionCols:_col0 @@ -153,12 +151,12 @@ Stage-0 TableScan [TS_5] (rows=73049 width=12) default@date_dim,date_dim,Tbl:COMPLETE,Col:COMPLETE,Output:["d_date_sk","d_year","d_dom"] <-Map 4 [SIMPLE_EDGE] vectorized - SHUFFLE [RS_128] + SHUFFLE [RS_112] PartitionCols:_col0 - Select Operator [SEL_127] (rows=479121995 width=19) + Select Operator [SEL_111] (rows=479121995 width=19) Output:["_col0","_col1","_col2","_col3","_col4"] - Filter Operator [FIL_126] (rows=479121995 width=19) - predicate:((ss_hdemo_sk BETWEEN DynamicValue(RS_18_household_demographics_hd_demo_sk_min) AND DynamicValue(RS_18_household_demographics_hd_demo_sk_max) and in_bloom_filter(ss_hdemo_sk, DynamicValue(RS_18_household_demographics_hd_demo_sk_bloom_filter))) and (ss_sold_date_sk BETWEEN DynamicValue(RS_15_date_dim_d_date_sk_min) AND DynamicValue(RS_15_date_dim_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_15_date_dim_d_date_sk_bloom_filter))) and (ss_store_sk BETWEEN DynamicValue(RS_21_store_s_store_sk_min) AND DynamicValue(RS_21_store_s_store_sk_max) and in_bloom_filter(ss_store_sk, DynamicValue(RS_21_store_s_store_sk_bloom_filter))) and ss_customer_sk is not null and ss_hdemo_sk is not null and ss_sold_date_sk is not null and ss_store_sk is not null) + Filter Operator [FIL_110] (rows=479121995 width=19) + predicate:((ss_sold_date_sk BETWEEN DynamicValue(RS_15_date_dim_d_date_sk_min) AND DynamicValue(RS_15_date_dim_d_date_sk_max) and in_bloom_filter(ss_sold_date_sk, DynamicValue(RS_15_date_dim_d_date_sk_bloom_filter))) and ss_customer_sk is not null and ss_hdemo_sk is not null and ss_sold_date_sk is not null and ss_store_sk is not null) TableScan [TS_2] (rows=575995635 width=19) default@store_sales,store_sales,Tbl:COMPLETE,Col:COMPLETE,Output:["ss_sold_date_sk","ss_customer_sk","ss_hdemo_sk","ss_store_sk","ss_ticket_number"] <-Reducer 10 [BROADCAST_EDGE] vectorized @@ -172,26 +170,4 @@ Stage-0 Select Operator [SEL_105] (rows=170 width=4) Output:["_col0"] Please refer to the previous Select Operator [SEL_103] - <-Reducer 12 [BROADCAST_EDGE] vectorized - BROADCAST [RS_117] - Group By Operator [GBY_116] (rows=1 width=12) - Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] - <-Map 11 [CUSTOM_SIMPLE_EDGE] vectorized - SHUFFLE [RS_115] - Group By Operator [GBY_114] (rows=1 width=12) - Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] - Select Operator [SEL_113] (rows=480 width=4) - Output:["_col0"] - Please refer to the previous Select Operator [SEL_111] - <-Reducer 14 [BROADCAST_EDGE] vectorized - BROADCAST [RS_125] - Group By Operator [GBY_124] (rows=1 width=12) - Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)","bloom_filter(VALUE._col2, expectedEntries=1000000)"] - <-Map 13 [CUSTOM_SIMPLE_EDGE] vectorized - SHUFFLE [RS_123] - Group By Operator [GBY_122] (rows=1 width=12) - Output:["_col0","_col1","_col2"],aggregations:["min(_col0)","max(_col0)","bloom_filter(_col0, expectedEntries=1000000)"] - Select Operator [SEL_121] (rows=56 width=4) - Output:["_col0"] - Please refer to the previous Select Operator [SEL_119]