http://git-wip-us.apache.org/repos/asf/hive/blob/6eaa32c8/ql/src/test/results/clientpositive/spark/mapjoin_mapjoin.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/spark/mapjoin_mapjoin.q.out b/ql/src/test/results/clientpositive/spark/mapjoin_mapjoin.q.out index 7089004..3b2c80e 100644 --- a/ql/src/test/results/clientpositive/spark/mapjoin_mapjoin.q.out +++ b/ql/src/test/results/clientpositive/spark/mapjoin_mapjoin.q.out @@ -65,25 +65,25 @@ STAGE PLANS: Spark #### A masked pattern was here #### Vertices: - Map 1 + Map 2 Map Operator Tree: TableScan - alias: src - Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + alias: src1 + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE GatherStats: false Filter Operator isSamplingPred: false - predicate: value is not null (type: boolean) - Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE + predicate: key is not null (type: boolean) + Statistics: Num rows: 13 Data size: 99 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: value (type: string) + expressions: key (type: string) outputColumnNames: _col0 - Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 13 Data size: 99 Basic stats: COMPLETE Column stats: NONE Spark HashTable Sink Operator keys: 0 _col0 (type: string) - 1 _col1 (type: string) - Position of Big Table: 1 + 1 _col0 (type: string) + Position of Big Table: 0 Local Work: Map Reduce Local Work Path -> Alias: @@ -91,7 +91,7 @@ STAGE PLANS: Path -> Partition: #### A masked pattern was here #### Partition - base file name: src + base file name: src1 input format: org.apache.hadoop.mapred.TextInputFormat output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat properties: @@ -101,14 +101,14 @@ STAGE PLANS: columns.comments 'default','default' columns.types string:string #### A masked pattern was here #### - name default.src + name default.src1 numFiles 1 - numRows 500 - rawDataSize 5312 - serialization.ddl struct src { string key, string value} + numRows 25 + rawDataSize 191 + serialization.ddl struct src1 { string key, string value} serialization.format 1 serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe - totalSize 5812 + totalSize 216 #### A masked pattern was here #### serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe @@ -121,37 +121,37 @@ STAGE PLANS: columns.comments 'default','default' columns.types string:string #### A masked pattern was here #### - name default.src + name default.src1 numFiles 1 - numRows 500 - rawDataSize 5312 - serialization.ddl struct src { string key, string value} + numRows 25 + rawDataSize 191 + serialization.ddl struct src1 { string key, string value} serialization.format 1 serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe - totalSize 5812 + totalSize 216 #### A masked pattern was here #### serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe - name: default.src - name: default.src + name: default.src1 + name: default.src1 Truncated Path -> Alias: - /src [src] + /src1 [src1] Map 3 Map Operator Tree: TableScan - alias: src1 - Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + alias: src + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE GatherStats: false Filter Operator isSamplingPred: false - predicate: key is not null (type: boolean) - Statistics: Num rows: 13 Data size: 99 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null (type: boolean) + Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: key (type: string) + expressions: value (type: string) outputColumnNames: _col0 - Statistics: Num rows: 13 Data size: 99 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE Spark HashTable Sink Operator keys: - 0 _col0 (type: string) + 0 _col1 (type: string) 1 _col0 (type: string) Position of Big Table: 0 Local Work: @@ -161,7 +161,7 @@ STAGE PLANS: Path -> Partition: #### A masked pattern was here #### Partition - base file name: src1 + base file name: src input format: org.apache.hadoop.mapred.TextInputFormat output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat properties: @@ -171,14 +171,14 @@ STAGE PLANS: columns.comments 'default','default' columns.types string:string #### A masked pattern was here #### - name default.src1 + name default.src numFiles 1 - numRows 25 - rawDataSize 191 - serialization.ddl struct src1 { string key, string value} + numRows 500 + rawDataSize 5312 + serialization.ddl struct src { string key, string value} serialization.format 1 serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe - totalSize 216 + totalSize 5812 #### A masked pattern was here #### serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe @@ -191,26 +191,26 @@ STAGE PLANS: columns.comments 'default','default' columns.types string:string #### A masked pattern was here #### - name default.src1 + name default.src numFiles 1 - numRows 25 - rawDataSize 191 - serialization.ddl struct src1 { string key, string value} + numRows 500 + rawDataSize 5312 + serialization.ddl struct src { string key, string value} serialization.format 1 serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe - totalSize 216 + totalSize 5812 #### A masked pattern was here #### serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe - name: default.src1 - name: default.src1 + name: default.src + name: default.src Truncated Path -> Alias: - /src1 [src1] + /src [src] Stage: Stage-1 Spark #### A masked pattern was here #### Vertices: - Map 2 + Map 1 Map Operator Tree: TableScan alias: srcpart @@ -232,45 +232,41 @@ STAGE PLANS: 1 _col0 (type: string) outputColumnNames: _col0, _col1 input vertices: - 1 Map 3 + 1 Map 2 Position of Big Table: 0 Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: string) - 1 _col1 (type: string) - outputColumnNames: _col1 + 0 _col1 (type: string) + 1 _col0 (type: string) + outputColumnNames: _col0 input vertices: - 0 Map 1 - Position of Big Table: 1 + 1 Map 3 + Position of Big Table: 0 Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE - Select Operator - expressions: _col1 (type: string) - outputColumnNames: _col0 - Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE - File Output Operator - compressed: false - GlobalTableId: 0 + File Output Operator + compressed: false + GlobalTableId: 0 #### A masked pattern was here #### - NumFilesPerFileSink: 1 - Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE + NumFilesPerFileSink: 1 + Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE #### A masked pattern was here #### - table: - input format: org.apache.hadoop.mapred.TextInputFormat - output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat - properties: - columns _col0 - columns.types string - escape.delim \ - hive.serialization.extend.additional.nesting.levels true - serialization.format 1 - serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe - serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe - TotalFiles: 1 - GatherStats: false - MultiFileSpray: false + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + properties: + columns _col0 + columns.types string + escape.delim \ + hive.serialization.extend.additional.nesting.levels true + serialization.format 1 + serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + TotalFiles: 1 + GatherStats: false + MultiFileSpray: false Local Work: Map Reduce Local Work Path -> Alias: @@ -488,39 +484,39 @@ STAGE PLANS: Spark #### A masked pattern was here #### Vertices: - Map 1 + Map 2 Map Operator Tree: TableScan - alias: src - Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + alias: src1 + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: (value > 'val_450') (type: boolean) - Statistics: Num rows: 166 Data size: 1763 Basic stats: COMPLETE Column stats: NONE + predicate: key is not null (type: boolean) + Statistics: Num rows: 13 Data size: 99 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: value (type: string) + expressions: key (type: string) outputColumnNames: _col0 - Statistics: Num rows: 166 Data size: 1763 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 13 Data size: 99 Basic stats: COMPLETE Column stats: NONE Spark HashTable Sink Operator keys: 0 _col0 (type: string) - 1 _col1 (type: string) + 1 _col0 (type: string) Local Work: Map Reduce Local Work Map 3 Map Operator Tree: TableScan - alias: src1 - Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + alias: src + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE Filter Operator - predicate: key is not null (type: boolean) - Statistics: Num rows: 13 Data size: 99 Basic stats: COMPLETE Column stats: NONE + predicate: (value > 'val_450') (type: boolean) + Statistics: Num rows: 166 Data size: 1763 Basic stats: COMPLETE Column stats: NONE Select Operator - expressions: key (type: string) + expressions: value (type: string) outputColumnNames: _col0 - Statistics: Num rows: 13 Data size: 99 Basic stats: COMPLETE Column stats: NONE + Statistics: Num rows: 166 Data size: 1763 Basic stats: COMPLETE Column stats: NONE Spark HashTable Sink Operator keys: - 0 _col0 (type: string) + 0 _col1 (type: string) 1 _col0 (type: string) Local Work: Map Reduce Local Work @@ -529,7 +525,7 @@ STAGE PLANS: Spark #### A masked pattern was here #### Vertices: - Map 2 + Map 1 Map Operator Tree: TableScan alias: srcpart @@ -549,29 +545,25 @@ STAGE PLANS: 1 _col0 (type: string) outputColumnNames: _col0, _col1 input vertices: - 1 Map 3 + 1 Map 2 Statistics: Num rows: 183 Data size: 1951 Basic stats: COMPLETE Column stats: NONE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: string) - 1 _col1 (type: string) - outputColumnNames: _col1 + 0 _col1 (type: string) + 1 _col0 (type: string) + outputColumnNames: _col0 input vertices: - 0 Map 1 + 1 Map 3 Statistics: Num rows: 201 Data size: 2146 Basic stats: COMPLETE Column stats: NONE - Select Operator - expressions: _col1 (type: string) - outputColumnNames: _col0 + File Output Operator + compressed: false Statistics: Num rows: 201 Data size: 2146 Basic stats: COMPLETE Column stats: NONE - File Output Operator - compressed: false - Statistics: Num rows: 201 Data size: 2146 Basic stats: COMPLETE Column stats: NONE - table: - input format: org.apache.hadoop.mapred.TextInputFormat - output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat - serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe Local Work: Map Reduce Local Work
http://git-wip-us.apache.org/repos/asf/hive/blob/6eaa32c8/ql/src/test/results/clientpositive/tez/explainuser_1.q.out ---------------------------------------------------------------------- diff --git a/ql/src/test/results/clientpositive/tez/explainuser_1.q.out b/ql/src/test/results/clientpositive/tez/explainuser_1.q.out index c1bfaff..2147984 100644 --- a/ql/src/test/results/clientpositive/tez/explainuser_1.q.out +++ b/ql/src/test/results/clientpositive/tez/explainuser_1.q.out @@ -6427,77 +6427,74 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Vertex dependency in root stage -Map 3 <- Map 4 (BROADCAST_EDGE) -Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) +Map 1 <- Map 3 (BROADCAST_EDGE) +Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Stage-0 Fetch Operator limit:-1 Stage-1 Reducer 2 - File Output Operator [FS_20] + File Output Operator [FS_19] compressed:true Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE table:{"serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat"} - Select Operator [SEL_19] - outputColumnNames:["_col0"] - Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_30] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"1":"_col1 (type: string)","0":"_col0 (type: string)"} - | outputColumnNames:["_col1"] - | Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_15] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_2] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_26] - | predicate:(value > 'val_450') (type: boolean) - | Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:src - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_17] - key expressions:_col1 (type: string) - Map-reduce partition columns:_col1 (type: string) - sort order:+ - Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: string) - Map Join Operator [MAPJOIN_29] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"Map 3":"_col0 (type: string)","Map 4":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [BROADCAST_EDGE] - | Reduce Output Operator [RS_11] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_7] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_28] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_6] - | alias:src1 - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: COMPLETE - |<-Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_27] - predicate:(((value > 'val_450') and key is not null) and value is not null) (type: boolean) - Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_3] - alias:srcpart - Statistics:Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: COMPLETE + Merge Join Operator [MERGEJOIN_29] + | condition map:[{"":"Inner Join 0 to 1"}] + | keys:{"1":"_col0 (type: string)","0":"_col1 (type: string)"} + | outputColumnNames:["_col0"] + | Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE + |<-Map 1 [SIMPLE_EDGE] + | Reduce Output Operator [RS_14] + | key expressions:_col1 (type: string) + | Map-reduce partition columns:_col1 (type: string) + | sort order:+ + | Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE + | value expressions:_col0 (type: string) + | Map Join Operator [MAPJOIN_28] + | | condition map:[{"":"Inner Join 0 to 1"}] + | | keys:{"Map 1":"_col0 (type: string)","Map 3":"_col0 (type: string)"} + | | outputColumnNames:["_col0","_col1"] + | | Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE + | |<-Map 3 [BROADCAST_EDGE] + | | Reduce Output Operator [RS_11] + | | key expressions:_col0 (type: string) + | | Map-reduce partition columns:_col0 (type: string) + | | sort order:+ + | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE + | | Select Operator [SEL_4] + | | outputColumnNames:["_col0"] + | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE + | | Filter Operator [FIL_26] + | | predicate:key is not null (type: boolean) + | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE + | | TableScan [TS_3] + | | alias:src1 + | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: COMPLETE + | |<-Select Operator [SEL_2] + | outputColumnNames:["_col0","_col1"] + | Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE + | Filter Operator [FIL_25] + | predicate:(((value > 'val_450') and key is not null) and value is not null) (type: boolean) + | Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE + | TableScan [TS_0] + | alias:srcpart + | Statistics:Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: COMPLETE + |<-Map 4 [SIMPLE_EDGE] + Reduce Output Operator [RS_16] + key expressions:_col0 (type: string) + Map-reduce partition columns:_col0 (type: string) + sort order:+ + Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator [SEL_7] + outputColumnNames:["_col0"] + Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE + Filter Operator [FIL_27] + predicate:(value > 'val_450') (type: boolean) + Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE + TableScan [TS_5] + alias:src + Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: COMPLETE PREHOOK: query: explain select srcpart.key from srcpart join src on (srcpart.value=src.value) join src1 on (srcpart.key=src1.key) where srcpart.value > 'val_450' PREHOOK: type: QUERY @@ -6506,77 +6503,74 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Vertex dependency in root stage -Map 3 <- Map 4 (BROADCAST_EDGE) -Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) +Map 1 <- Map 3 (BROADCAST_EDGE) +Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Stage-0 Fetch Operator limit:-1 Stage-1 Reducer 2 - File Output Operator [FS_20] + File Output Operator [FS_19] compressed:true Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE table:{"serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat"} - Select Operator [SEL_19] - outputColumnNames:["_col0"] - Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_30] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"1":"_col1 (type: string)","0":"_col0 (type: string)"} - | outputColumnNames:["_col1"] - | Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_15] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_2] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_26] - | predicate:(value > 'val_450') (type: boolean) - | Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:src - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_17] - key expressions:_col1 (type: string) - Map-reduce partition columns:_col1 (type: string) - sort order:+ - Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: string) - Map Join Operator [MAPJOIN_29] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"Map 3":"_col0 (type: string)","Map 4":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [BROADCAST_EDGE] - | Reduce Output Operator [RS_11] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_7] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_28] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_6] - | alias:src1 - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: COMPLETE - |<-Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_27] - predicate:(((value > 'val_450') and key is not null) and value is not null) (type: boolean) - Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_3] - alias:srcpart - Statistics:Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: COMPLETE + Merge Join Operator [MERGEJOIN_29] + | condition map:[{"":"Inner Join 0 to 1"}] + | keys:{"1":"_col0 (type: string)","0":"_col1 (type: string)"} + | outputColumnNames:["_col0"] + | Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE + |<-Map 1 [SIMPLE_EDGE] + | Reduce Output Operator [RS_14] + | key expressions:_col1 (type: string) + | Map-reduce partition columns:_col1 (type: string) + | sort order:+ + | Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE + | value expressions:_col0 (type: string) + | Map Join Operator [MAPJOIN_28] + | | condition map:[{"":"Inner Join 0 to 1"}] + | | keys:{"Map 1":"_col0 (type: string)","Map 3":"_col0 (type: string)"} + | | outputColumnNames:["_col0","_col1"] + | | Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE + | |<-Map 3 [BROADCAST_EDGE] + | | Reduce Output Operator [RS_11] + | | key expressions:_col0 (type: string) + | | Map-reduce partition columns:_col0 (type: string) + | | sort order:+ + | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE + | | Select Operator [SEL_4] + | | outputColumnNames:["_col0"] + | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE + | | Filter Operator [FIL_26] + | | predicate:key is not null (type: boolean) + | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE + | | TableScan [TS_3] + | | alias:src1 + | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: COMPLETE + | |<-Select Operator [SEL_2] + | outputColumnNames:["_col0","_col1"] + | Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE + | Filter Operator [FIL_25] + | predicate:(((value > 'val_450') and key is not null) and value is not null) (type: boolean) + | Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE + | TableScan [TS_0] + | alias:srcpart + | Statistics:Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: COMPLETE + |<-Map 4 [SIMPLE_EDGE] + Reduce Output Operator [RS_16] + key expressions:_col0 (type: string) + Map-reduce partition columns:_col0 (type: string) + sort order:+ + Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator [SEL_7] + outputColumnNames:["_col0"] + Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE + Filter Operator [FIL_27] + predicate:(value > 'val_450') (type: boolean) + Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE + TableScan [TS_5] + alias:src + Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: COMPLETE PREHOOK: query: explain select srcpart.key from srcpart join src on (srcpart.value=src.value) join src1 on (srcpart.key=src1.key) where srcpart.value > 'val_450' PREHOOK: type: QUERY @@ -6585,77 +6579,74 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Vertex dependency in root stage -Map 3 <- Map 4 (BROADCAST_EDGE) -Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) +Map 1 <- Map 3 (BROADCAST_EDGE) +Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Stage-0 Fetch Operator limit:-1 Stage-1 Reducer 2 - File Output Operator [FS_20] + File Output Operator [FS_19] compressed:true Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE table:{"serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat"} - Select Operator [SEL_19] - outputColumnNames:["_col0"] - Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_30] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"1":"_col1 (type: string)","0":"_col0 (type: string)"} - | outputColumnNames:["_col1"] - | Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_15] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_2] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_26] - | predicate:(value > 'val_450') (type: boolean) - | Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:src - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_17] - key expressions:_col1 (type: string) - Map-reduce partition columns:_col1 (type: string) - sort order:+ - Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: string) - Map Join Operator [MAPJOIN_29] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"Map 3":"_col0 (type: string)","Map 4":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [BROADCAST_EDGE] - | Reduce Output Operator [RS_11] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_7] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_28] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_6] - | alias:src1 - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: COMPLETE - |<-Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_27] - predicate:(((value > 'val_450') and key is not null) and value is not null) (type: boolean) - Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_3] - alias:srcpart - Statistics:Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: COMPLETE + Merge Join Operator [MERGEJOIN_29] + | condition map:[{"":"Inner Join 0 to 1"}] + | keys:{"1":"_col0 (type: string)","0":"_col1 (type: string)"} + | outputColumnNames:["_col0"] + | Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE + |<-Map 1 [SIMPLE_EDGE] + | Reduce Output Operator [RS_14] + | key expressions:_col1 (type: string) + | Map-reduce partition columns:_col1 (type: string) + | sort order:+ + | Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE + | value expressions:_col0 (type: string) + | Map Join Operator [MAPJOIN_28] + | | condition map:[{"":"Inner Join 0 to 1"}] + | | keys:{"Map 1":"_col0 (type: string)","Map 3":"_col0 (type: string)"} + | | outputColumnNames:["_col0","_col1"] + | | Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE + | |<-Map 3 [BROADCAST_EDGE] + | | Reduce Output Operator [RS_11] + | | key expressions:_col0 (type: string) + | | Map-reduce partition columns:_col0 (type: string) + | | sort order:+ + | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE + | | Select Operator [SEL_4] + | | outputColumnNames:["_col0"] + | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE + | | Filter Operator [FIL_26] + | | predicate:key is not null (type: boolean) + | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE + | | TableScan [TS_3] + | | alias:src1 + | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: COMPLETE + | |<-Select Operator [SEL_2] + | outputColumnNames:["_col0","_col1"] + | Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE + | Filter Operator [FIL_25] + | predicate:(((value > 'val_450') and key is not null) and value is not null) (type: boolean) + | Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE + | TableScan [TS_0] + | alias:srcpart + | Statistics:Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: COMPLETE + |<-Map 4 [SIMPLE_EDGE] + Reduce Output Operator [RS_16] + key expressions:_col0 (type: string) + Map-reduce partition columns:_col0 (type: string) + sort order:+ + Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator [SEL_7] + outputColumnNames:["_col0"] + Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE + Filter Operator [FIL_27] + predicate:(value > 'val_450') (type: boolean) + Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE + TableScan [TS_5] + alias:src + Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: COMPLETE PREHOOK: query: explain select p_mfgr, p_name, p_size,