[ https://issues.apache.org/jira/browse/PHOENIX-2743?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=15238852#comment-15238852 ]
ASF GitHub Bot commented on PHOENIX-2743: ----------------------------------------- Github user ss77892 commented on a diff in the pull request: https://github.com/apache/phoenix/pull/155#discussion_r59511383 --- Diff: phoenix-hive/src/main/java/org/apache/phoenix/hive/ql/index/IndexPredicateAnalyzer.java --- @@ -0,0 +1,486 @@ +/** + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ +package org.apache.phoenix.hive.ql.index; + +import java.util.ArrayList; +import java.util.Arrays; +import java.util.HashMap; +import java.util.HashSet; +import java.util.LinkedHashMap; +import java.util.List; +import java.util.Map; +import java.util.Set; +import java.util.Stack; + +import org.apache.commons.logging.Log; +import org.apache.commons.logging.LogFactory; +import org.apache.hadoop.hive.ql.exec.FunctionRegistry; +import org.apache.hadoop.hive.ql.lib.DefaultGraphWalker; +import org.apache.hadoop.hive.ql.lib.DefaultRuleDispatcher; +import org.apache.hadoop.hive.ql.lib.Dispatcher; +import org.apache.hadoop.hive.ql.lib.GraphWalker; +import org.apache.hadoop.hive.ql.lib.Node; +import org.apache.hadoop.hive.ql.lib.NodeProcessor; +import org.apache.hadoop.hive.ql.lib.NodeProcessorCtx; +import org.apache.hadoop.hive.ql.lib.Rule; +import org.apache.hadoop.hive.ql.parse.SemanticException; +import org.apache.hadoop.hive.ql.plan.ExprNodeColumnDesc; +import org.apache.hadoop.hive.ql.plan.ExprNodeConstantDesc; +import org.apache.hadoop.hive.ql.plan.ExprNodeDesc; +import org.apache.hadoop.hive.ql.plan.ExprNodeDescUtils; +import org.apache.hadoop.hive.ql.plan.ExprNodeFieldDesc; +import org.apache.hadoop.hive.ql.plan.ExprNodeGenericFuncDesc; +import org.apache.hadoop.hive.ql.udf.generic.GenericUDF; +import org.apache.hadoop.hive.ql.udf.generic.GenericUDFBaseCompare; +import org.apache.hadoop.hive.ql.udf.generic.GenericUDFBetween; +import org.apache.hadoop.hive.ql.udf.generic.GenericUDFBridge; +import org.apache.hadoop.hive.ql.udf.generic.GenericUDFIn; +import org.apache.hadoop.hive.ql.udf.generic.GenericUDFOPNot; +import org.apache.hadoop.hive.ql.udf.generic.GenericUDFOPNotNull; +import org.apache.hadoop.hive.ql.udf.generic.GenericUDFOPNull; +import org.apache.hadoop.hive.ql.udf.generic.GenericUDFToBinary; +import org.apache.hadoop.hive.ql.udf.generic.GenericUDFToChar; +import org.apache.hadoop.hive.ql.udf.generic.GenericUDFToDate; +import 
org.apache.hadoop.hive.ql.udf.generic.GenericUDFToDecimal; +import org.apache.hadoop.hive.ql.udf.generic.GenericUDFToUnixTimeStamp; +import org.apache.hadoop.hive.ql.udf.generic.GenericUDFToUtcTimestamp; +import org.apache.hadoop.hive.ql.udf.generic.GenericUDFToVarchar; +import org.apache.hadoop.hive.serde2.typeinfo.TypeInfoFactory; + +import com.google.common.collect.Lists; + +/** + * Clone of org.apache.hadoop.hive.ql.index.IndexPredicateAnalyzer with modifying + * analyzePredicate method. + * + * + */ +public class IndexPredicateAnalyzer { + + private static final Log LOG = LogFactory.getLog(IndexPredicateAnalyzer.class); + + private final Set<String> udfNames; + private final Map<String, Set<String>> columnToUDFs; + private FieldValidator fieldValidator; + + private boolean acceptsFields; + + public IndexPredicateAnalyzer() { + udfNames = new HashSet<String>(); + columnToUDFs = new HashMap<String, Set<String>>(); + } + + public void setFieldValidator(FieldValidator fieldValidator) { + this.fieldValidator = fieldValidator; + } + + /** + * Registers a comparison operator as one which can be satisfied by an index + * search. Unless this is called, analyzePredicate will never find any + * indexable conditions. + * + * @param udfName name of comparison operator as returned by either + * {@link GenericUDFBridge#getUdfName} (for simple UDF's) or + * udf.getClass().getName() (for generic UDF's). + */ + public void addComparisonOp(String udfName) { + udfNames.add(udfName); + } + + /** + * Clears the set of column names allowed in comparisons. (Initially, all + * column names are allowed.) + */ + public void clearAllowedColumnNames() { + columnToUDFs.clear(); + } + + /** + * Adds a column name to the set of column names allowed. 
+ * + * @param columnName name of column to be allowed + */ + public void allowColumnName(String columnName) { + columnToUDFs.put(columnName, udfNames); + } + + /** + * add allowed functions per column + * + * @param columnName + * @param udfs + */ + public void addComparisonOp(String columnName, String... udfs) { + Set<String> allowed = columnToUDFs.get(columnName); + if (allowed == null || allowed == udfNames) { + // override + columnToUDFs.put(columnName, new HashSet<String>(Arrays.asList(udfs))); + } else { + allowed.addAll(Arrays.asList(udfs)); + } + } + + /** + * Analyzes a predicate. + * + * @param predicate predicate to be analyzed + * @param searchConditions receives conditions produced by analysis + * @return residual predicate which could not be translated to + * searchConditions + */ + public ExprNodeDesc analyzePredicate(ExprNodeDesc predicate, final List<IndexSearchCondition> searchConditions) { + + Map<Rule, NodeProcessor> opRules = new LinkedHashMap<Rule, NodeProcessor>(); + NodeProcessor nodeProcessor = new NodeProcessor() { + @Override + public Object process(Node nd, Stack<Node> stack, NodeProcessorCtx procCtx, Object... nodeOutputs) throws SemanticException { + + // We can only push down stuff which appears as part of + // a pure conjunction: reject OR, CASE, etc. 
+ for (Node ancestor : stack) { + if (nd == ancestor) { + break; + } + if (!FunctionRegistry.isOpAnd((ExprNodeDesc) ancestor)) { + return nd; + } + } + + return analyzeExpr((ExprNodeGenericFuncDesc) nd, searchConditions, nodeOutputs); + } + }; + + Dispatcher disp = new DefaultRuleDispatcher(nodeProcessor, opRules, null); + GraphWalker ogw = new DefaultGraphWalker(disp); + ArrayList<Node> topNodes = new ArrayList<Node>(); + topNodes.add(predicate); + HashMap<Node, Object> nodeOutput = new HashMap<Node, Object>(); + + try { + ogw.startWalking(topNodes, nodeOutput); + } catch (SemanticException ex) { + throw new RuntimeException(ex); + } + + ExprNodeDesc residualPredicate = (ExprNodeDesc) nodeOutput.get(predicate); + return residualPredicate; + } + + // Check if ExprNodeColumnDesc is wrapped in expr. + // If so, peel off. Otherwise return itself. + private ExprNodeDesc getColumnExpr(ExprNodeDesc expr) { + if (expr instanceof ExprNodeColumnDesc) { + return expr; + } + ExprNodeGenericFuncDesc funcDesc = null; + if (expr instanceof ExprNodeGenericFuncDesc) { + funcDesc = (ExprNodeGenericFuncDesc) expr; + } + if (null == funcDesc) { + return expr; + } + GenericUDF udf = funcDesc.getGenericUDF(); + // check if its a simple cast expression. + if ((udf instanceof GenericUDFBridge || udf instanceof GenericUDFToBinary || udf instanceof GenericUDFToChar + || udf instanceof GenericUDFToVarchar || udf instanceof GenericUDFToDecimal + || udf instanceof GenericUDFToDate || udf instanceof GenericUDFToUnixTimeStamp + || udf instanceof GenericUDFToUtcTimestamp) && funcDesc.getChildren().size() == 1 + && funcDesc.getChildren().get(0) instanceof ExprNodeColumnDesc) { + return expr.getChildren().get(0); + } + return expr; + } + + private void processingBetweenOperator(ExprNodeGenericFuncDesc expr, List<IndexSearchCondition> searchConditions, Object... 
nodeOutputs) { + ExprNodeColumnDesc columnDesc = null; + String[] fields = null; + + if (nodeOutputs[1] instanceof ExprNodeFieldDesc) { + // rowKey field + ExprNodeFieldDesc fieldDesc = (ExprNodeFieldDesc) nodeOutputs[1]; + fields = ExprNodeDescUtils.extractFields(fieldDesc); + + ExprNodeDesc[] extracted = ExprNodeDescUtils.extractComparePair((ExprNodeDesc) nodeOutputs[1], (ExprNodeDesc) nodeOutputs[2]); + columnDesc = (ExprNodeColumnDesc) extracted[0]; + } else if (nodeOutputs[0] instanceof ExprNodeGenericFuncDesc) { + columnDesc = (ExprNodeColumnDesc) ((ExprNodeGenericFuncDesc) nodeOutputs[1]).getChildren().get(0); + } else { + columnDesc = (ExprNodeColumnDesc) nodeOutputs[1]; + } + + String udfName = expr.getGenericUDF().getUdfName(); + ExprNodeConstantDesc[] betweenConstants = new ExprNodeConstantDesc[]{(ExprNodeConstantDesc) nodeOutputs[2], (ExprNodeConstantDesc) nodeOutputs[3]}; + boolean isNot = (Boolean) ((ExprNodeConstantDesc) nodeOutputs[0]).getValue(); + + searchConditions.add(new IndexSearchCondition(columnDesc, udfName, betweenConstants, expr, fields, isNot)); + } + + private void processingInOperator(ExprNodeGenericFuncDesc expr, List<IndexSearchCondition> searchConditions, boolean isNot, Object... nodeOutputs) { + ExprNodeColumnDesc columnDesc = null; + String[] fields = null; + + if (LOG.isTraceEnabled()) { + LOG.trace("Processing In Operator. 
nodeOutputs : " + Lists.newArrayList(nodeOutputs)); + } + + if (nodeOutputs[0] instanceof ExprNodeFieldDesc) { + // rowKey field + ExprNodeFieldDesc fieldDesc = (ExprNodeFieldDesc) nodeOutputs[0]; + fields = ExprNodeDescUtils.extractFields(fieldDesc); + + ExprNodeDesc[] extracted = ExprNodeDescUtils.extractComparePair((ExprNodeDesc) nodeOutputs[0], (ExprNodeDesc) nodeOutputs[1]); + + if (extracted == null) { // adding for tez + return; + } + + if (LOG.isTraceEnabled()) { + LOG.trace("nodeOutputs[0] : " + nodeOutputs[0] + ", nodeOutputs[1] : " + + nodeOutputs[1] + " => " + Lists.newArrayList(extracted)); + } + + columnDesc = (ExprNodeColumnDesc) extracted[0]; + } else if (nodeOutputs[0] instanceof ExprNodeGenericFuncDesc) { + columnDesc = (ExprNodeColumnDesc) ((ExprNodeGenericFuncDesc) nodeOutputs[0]).getChildren().get(0); + } else { + columnDesc = (ExprNodeColumnDesc) nodeOutputs[0]; + } + + String udfName = expr.getGenericUDF().getUdfName(); + ExprNodeConstantDesc[] inConstantDescs = new ExprNodeConstantDesc[nodeOutputs.length - 1]; + + for (int i = 0, limit = inConstantDescs.length; i < limit; i++) { + if (!(nodeOutputs[i + 1] instanceof ExprNodeConstantDesc)) { // adding for tez + return; + } + + inConstantDescs[i] = (ExprNodeConstantDesc) nodeOutputs[i + 1]; + } + + searchConditions.add(new IndexSearchCondition(columnDesc, udfName, inConstantDescs, expr, fields, isNot)); + } + + private void processingNullOperator(ExprNodeGenericFuncDesc expr, List<IndexSearchCondition> searchConditions, Object... 
nodeOutputs) { + ExprNodeColumnDesc columnDesc = null; + String[] fields = null; + + if (nodeOutputs[0] instanceof ExprNodeFieldDesc) { + // rowKey field + ExprNodeFieldDesc fieldDesc = (ExprNodeFieldDesc) nodeOutputs[0]; + fields = ExprNodeDescUtils.extractFields(fieldDesc); + + ExprNodeDesc[] extracted = ExprNodeDescUtils.extractComparePair((ExprNodeDesc) nodeOutputs[0], new ExprNodeConstantDesc()); + columnDesc = (ExprNodeColumnDesc) extracted[0]; + } else if (nodeOutputs[0] instanceof ExprNodeGenericFuncDesc) { + columnDesc = (ExprNodeColumnDesc) ((ExprNodeGenericFuncDesc) nodeOutputs[0]).getChildren().get(0); + } else { + columnDesc = (ExprNodeColumnDesc) nodeOutputs[0]; + } + + String udfName = expr.getGenericUDF().getUdfName(); + + searchConditions.add(new IndexSearchCondition(columnDesc, udfName, null, expr, fields, false)); + } + + private void processingNotNullOperator(ExprNodeGenericFuncDesc expr, List<IndexSearchCondition> searchConditions, Object... nodeOutputs) { + ExprNodeColumnDesc columnDesc = null; + String[] fields = null; + + if (nodeOutputs[0] instanceof ExprNodeFieldDesc) { + // rowKey field + ExprNodeFieldDesc fieldDesc = (ExprNodeFieldDesc) nodeOutputs[0]; + fields = ExprNodeDescUtils.extractFields(fieldDesc); + + ExprNodeDesc[] extracted = ExprNodeDescUtils.extractComparePair((ExprNodeDesc) nodeOutputs[0], new ExprNodeConstantDesc()); + columnDesc = (ExprNodeColumnDesc) extracted[0]; + } else if (nodeOutputs[0] instanceof ExprNodeGenericFuncDesc) { + columnDesc = (ExprNodeColumnDesc) ((ExprNodeGenericFuncDesc) nodeOutputs[0]).getChildren().get(0); + } else { + columnDesc = (ExprNodeColumnDesc) nodeOutputs[0]; + } + + String udfName = expr.getGenericUDF().getUdfName(); + + searchConditions.add(new IndexSearchCondition(columnDesc, udfName, null, expr, fields, true)); + } + + private ExprNodeDesc analyzeExpr(ExprNodeGenericFuncDesc expr, List<IndexSearchCondition> searchConditions, Object... 
nodeOutputs) throws SemanticException { + + if (FunctionRegistry.isOpAnd(expr)) { + assert (nodeOutputs.length == 2); + ExprNodeDesc residual1 = (ExprNodeDesc) nodeOutputs[0]; + ExprNodeDesc residual2 = (ExprNodeDesc) nodeOutputs[1]; + if (residual1 == null) { + return residual2; + } + if (residual2 == null) { + return residual1; + } + List<ExprNodeDesc> residuals = new ArrayList<ExprNodeDesc>(); + residuals.add(residual1); + residuals.add(residual2); + return new ExprNodeGenericFuncDesc(TypeInfoFactory.booleanTypeInfo, FunctionRegistry.getGenericUDFForAnd(), residuals); + } + + GenericUDF genericUDF = expr.getGenericUDF(); + if (!(genericUDF instanceof GenericUDFBaseCompare)) { + // 2015-10-22 Added by JeongMin Ju : Processing Between/In Operator + if (genericUDF instanceof GenericUDFBetween) { + // In case of not between, The value of first element of nodeOutputs is true. otherwise false. + processingBetweenOperator(expr, searchConditions, nodeOutputs); + return expr; + } else if (genericUDF instanceof GenericUDFIn) { + // In case of not in operator, in operator exist as child of not operator. + processingInOperator(expr, searchConditions, false, nodeOutputs); + return expr; + } else if (genericUDF instanceof GenericUDFOPNot && + ((ExprNodeGenericFuncDesc) expr.getChildren().get(0)).getGenericUDF() instanceof GenericUDFIn) { + // In case of not in operator, in operator exist as child of not operator. 
+ processingInOperator((ExprNodeGenericFuncDesc) expr.getChildren().get(0), + searchConditions, true, ((ExprNodeGenericFuncDesc) nodeOutputs[0]).getChildren().toArray()); + return expr; + } else if (genericUDF instanceof GenericUDFOPNull) { + processingNullOperator(expr, searchConditions, nodeOutputs); + return expr; + } else if (genericUDF instanceof GenericUDFOPNotNull) { + processingNotNullOperator(expr, searchConditions, nodeOutputs); + return expr; + } else { + return expr; + } + } + ExprNodeDesc expr1 = (ExprNodeDesc) nodeOutputs[0]; + ExprNodeDesc expr2 = (ExprNodeDesc) nodeOutputs[1]; + // We may need to peel off the GenericUDFBridge that is added by CBO or + // user + if (expr1.getTypeInfo().equals(expr2.getTypeInfo())) { + expr1 = getColumnExpr(expr1); + expr2 = getColumnExpr(expr2); + } + + ExprNodeDesc[] extracted = ExprNodeDescUtils.extractComparePair(expr1, expr2); + if (extracted == null || (extracted.length > 2 && !acceptsFields)) { + return expr; + } + + ExprNodeColumnDesc columnDesc; + ExprNodeConstantDesc constantDesc; + if (extracted[0] instanceof ExprNodeConstantDesc) { + genericUDF = genericUDF.flip(); + columnDesc = (ExprNodeColumnDesc) extracted[1]; + constantDesc = (ExprNodeConstantDesc) extracted[0]; + } else { + columnDesc = (ExprNodeColumnDesc) extracted[0]; + constantDesc = (ExprNodeConstantDesc) extracted[1]; + } + + Set<String> allowed = columnToUDFs.get(columnDesc.getColumn()); + if (allowed == null) { + return expr; + } + + String udfName = genericUDF.getUdfName(); + if (!allowed.contains(genericUDF.getUdfName())) { + return expr; + } + + String[] fields = null; + if (extracted.length > 2) { + ExprNodeFieldDesc fieldDesc = (ExprNodeFieldDesc) extracted[2]; + if (!isValidField(fieldDesc)) { + return expr; + } + fields = ExprNodeDescUtils.extractFields(fieldDesc); + } + + // We also need to update the expr so that the index query can be + // generated. + // Note that, hive does not support UDFToDouble etc in the query text. 
+ List<ExprNodeDesc> list = new ArrayList<ExprNodeDesc>(); + list.add(expr1); + list.add(expr2); + expr = new ExprNodeGenericFuncDesc(expr.getTypeInfo(), expr.getGenericUDF(), list); + + searchConditions.add(new IndexSearchCondition(columnDesc, udfName, constantDesc, expr, fields)); + + // we converted the expression to a search condition, so + // remove it from the residual predicate + return fields == null ? null : expr; + } + + private boolean isValidField(ExprNodeFieldDesc field) { + return fieldValidator == null || fieldValidator.validate(field); + } + + /** + * Translates search conditions back to ExprNodeDesc form (as a left-deep + * conjunction). + * + * @param searchConditions (typically produced by analyzePredicate) + * @return ExprNodeGenericFuncDesc form of search conditions + */ + public ExprNodeGenericFuncDesc translateSearchConditions(List<IndexSearchCondition> searchConditions) { + + ExprNodeGenericFuncDesc expr = null; + + for (IndexSearchCondition searchCondition : searchConditions) { + if (expr == null) { + expr = searchCondition.getComparisonExpr(); + continue; + } + + List<ExprNodeDesc> children = new ArrayList<ExprNodeDesc>(); + children.add(expr); + children.add(searchCondition.getComparisonExpr()); + expr = new ExprNodeGenericFuncDesc(TypeInfoFactory.booleanTypeInfo, FunctionRegistry.getGenericUDFForAnd(), children); + } + + return expr; + } + + public void setAcceptsFields(boolean acceptsFields) { + this.acceptsFields = acceptsFields; + } + + public static interface FieldValidator { + boolean validate(ExprNodeFieldDesc exprNodeDesc); + } + + public static IndexPredicateAnalyzer createAnalyzer(boolean equalOnly) { + IndexPredicateAnalyzer analyzer = new IndexPredicateAnalyzer(); + analyzer.addComparisonOp("org.apache.hadoop.hive.ql.udf.generic.GenericUDFOPEqual"); + + if (equalOnly) { + return analyzer; + } + + analyzer.addComparisonOp("org.apache.hadoop.hive.ql.udf.generic.GenericUDFOPEqualOrGreaterThan"); --- End diff -- Actually not, but 
it was done in the same way as it's done in Hive's IndexPredicateAnalyzer.java > HivePhoenixHandler for big-big join with predicate push down > ------------------------------------------------------------ > > Key: PHOENIX-2743 > URL: https://issues.apache.org/jira/browse/PHOENIX-2743 > Project: Phoenix > Issue Type: New Feature > Affects Versions: 4.5.0, 4.6.0 > Environment: hive-1.2.1 > Reporter: JeongMin Ju > Labels: features, performance > Attachments: PHOENIX-2743-1.patch > > Original Estimate: 168h > Remaining Estimate: 168h > > Phoenix supports hash join & sort-merge join, but in the case of a big-big join it does > not process well. > Therefore another method, like Hive's, is needed. > I implemented a hive-phoenix-handler that can access an Apache Phoenix table on > HBase using HiveQL. > hive-phoenix-handler is much faster than hive-hbase-handler because it > applies predicate push down. > I am publishing the source code to GitHub for contribution, and it will likely be > completed by next week. > https://github.com/mini666/hive-phoenix-handler > Please review my proposal. -- This message was sent by Atlassian JIRA (v6.3.4#6332)