http://git-wip-us.apache.org/repos/asf/hbase-site/blob/315ffef7/apidocs/src-html/org/apache/hadoop/hbase/io/encoding/DataBlockEncoding.html ---------------------------------------------------------------------- diff --git a/apidocs/src-html/org/apache/hadoop/hbase/io/encoding/DataBlockEncoding.html b/apidocs/src-html/org/apache/hadoop/hbase/io/encoding/DataBlockEncoding.html index 7c9a820..940a0dd 100644 --- a/apidocs/src-html/org/apache/hadoop/hbase/io/encoding/DataBlockEncoding.html +++ b/apidocs/src-html/org/apache/hadoop/hbase/io/encoding/DataBlockEncoding.html @@ -47,7 +47,7 @@ <span class="sourceLineNo">039</span> FAST_DIFF(4, "org.apache.hadoop.hbase.io.encoding.FastDiffDeltaEncoder"),<a name="line.39"></a> <span class="sourceLineNo">040</span> // id 5 is reserved for the COPY_KEY algorithm for benchmarking<a name="line.40"></a> <span class="sourceLineNo">041</span> // COPY_KEY(5, "org.apache.hadoop.hbase.io.encoding.CopyKeyDataBlockEncoder"),<a name="line.41"></a> -<span class="sourceLineNo">042</span> PREFIX_TREE(6, "org.apache.hadoop.hbase.codec.prefixtree.PrefixTreeCodec"),<a name="line.42"></a> +<span class="sourceLineNo">042</span> // PREFIX_TREE(6, "org.apache.hadoop.hbase.codec.prefixtree.PrefixTreeCodec"),<a name="line.42"></a> <span class="sourceLineNo">043</span> ROW_INDEX_V1(7, "org.apache.hadoop.hbase.io.encoding.RowIndexCodecV1");<a name="line.43"></a> <span class="sourceLineNo">044</span><a name="line.44"></a> <span class="sourceLineNo">045</span> private final short id;<a name="line.45"></a>
http://git-wip-us.apache.org/repos/asf/hbase-site/blob/315ffef7/apidocs/src-html/org/apache/hadoop/hbase/mapreduce/TableMapReduceUtil.html ---------------------------------------------------------------------- diff --git a/apidocs/src-html/org/apache/hadoop/hbase/mapreduce/TableMapReduceUtil.html b/apidocs/src-html/org/apache/hadoop/hbase/mapreduce/TableMapReduceUtil.html index 9bafe24..739356b 100644 --- a/apidocs/src-html/org/apache/hadoop/hbase/mapreduce/TableMapReduceUtil.html +++ b/apidocs/src-html/org/apache/hadoop/hbase/mapreduce/TableMapReduceUtil.html @@ -809,271 +809,254 @@ <span class="sourceLineNo">801</span> * @see <a href="https://issues.apache.org/jira/browse/PIG-3285">PIG-3285</a><a name="line.801"></a> <span class="sourceLineNo">802</span> */<a name="line.802"></a> <span class="sourceLineNo">803</span> public static void addHBaseDependencyJars(Configuration conf) throws IOException {<a name="line.803"></a> -<span class="sourceLineNo">804</span><a name="line.804"></a> -<span class="sourceLineNo">805</span> // PrefixTreeCodec is part of the hbase-prefix-tree module. If not included in MR jobs jar<a name="line.805"></a> -<span class="sourceLineNo">806</span> // dependencies, MR jobs that write encoded hfiles will fail.<a name="line.806"></a> -<span class="sourceLineNo">807</span> // We used reflection here so to prevent a circular module dependency.<a name="line.807"></a> -<span class="sourceLineNo">808</span> // TODO - if we extract the MR into a module, make it depend on hbase-prefix-tree.<a name="line.808"></a> -<span class="sourceLineNo">809</span> Class prefixTreeCodecClass = null;<a name="line.809"></a> -<span class="sourceLineNo">810</span> try {<a name="line.810"></a> -<span class="sourceLineNo">811</span> prefixTreeCodecClass =<a name="line.811"></a> -<span class="sourceLineNo">812</span> Class.forName("org.apache.hadoop.hbase.codec.prefixtree.PrefixTreeCodec");<a name="line.812"></a> -<span class="sourceLineNo">813</span> } catch (ClassNotFoundException e) {<a name="line.813"></a> -<span class="sourceLineNo">814</span> // this will show up in unit tests but should not show in real deployments<a name="line.814"></a> -<span class="sourceLineNo">815</span> LOG.warn("The hbase-prefix-tree module jar containing PrefixTreeCodec is not present." +<a name="line.815"></a> -<span class="sourceLineNo">816</span> " Continuing without it.");<a name="line.816"></a> -<span class="sourceLineNo">817</span> }<a name="line.817"></a> -<span class="sourceLineNo">818</span><a name="line.818"></a> -<span class="sourceLineNo">819</span> addDependencyJarsForClasses(conf,<a name="line.819"></a> -<span class="sourceLineNo">820</span> // explicitly pull a class from each module<a name="line.820"></a> -<span class="sourceLineNo">821</span> org.apache.hadoop.hbase.HConstants.class, // hbase-common<a name="line.821"></a> -<span class="sourceLineNo">822</span> org.apache.hadoop.hbase.protobuf.generated.ClientProtos.class, // hbase-protocol<a name="line.822"></a> -<span class="sourceLineNo">823</span> org.apache.hadoop.hbase.shaded.protobuf.generated.ClientProtos.class, // hbase-protocol-shaded<a name="line.823"></a> -<span class="sourceLineNo">824</span> org.apache.hadoop.hbase.client.Put.class, // hbase-client<a name="line.824"></a> -<span class="sourceLineNo">825</span> org.apache.hadoop.hbase.ipc.RpcServer.class, // hbase-server<a name="line.825"></a> -<span class="sourceLineNo">826</span> org.apache.hadoop.hbase.CompatibilityFactory.class, // hbase-hadoop-compat<a name="line.826"></a> -<span class="sourceLineNo">827</span> org.apache.hadoop.hbase.mapreduce.JobUtil.class, // hbase-hadoop2-compat<a name="line.827"></a> -<span class="sourceLineNo">828</span> org.apache.hadoop.hbase.mapreduce.TableMapper.class, // hbase-mapreduce<a name="line.828"></a> -<span class="sourceLineNo">829</span> org.apache.hadoop.hbase.metrics.impl.FastLongHistogram.class, // hbase-metrics<a name="line.829"></a> -<span class="sourceLineNo">830</span> org.apache.hadoop.hbase.metrics.Snapshot.class, // hbase-metrics-api<a name="line.830"></a> -<span class="sourceLineNo">831</span> prefixTreeCodecClass, // hbase-prefix-tree (if null will be skipped)<a name="line.831"></a> -<span class="sourceLineNo">832</span> // pull necessary dependencies<a name="line.832"></a> -<span class="sourceLineNo">833</span> org.apache.zookeeper.ZooKeeper.class,<a name="line.833"></a> -<span class="sourceLineNo">834</span> org.apache.hadoop.hbase.shaded.io.netty.channel.Channel.class,<a name="line.834"></a> -<span class="sourceLineNo">835</span> com.google.protobuf.Message.class,<a name="line.835"></a> -<span class="sourceLineNo">836</span> org.apache.hadoop.hbase.shaded.com.google.protobuf.UnsafeByteOperations.class,<a name="line.836"></a> -<span class="sourceLineNo">837</span> org.apache.hadoop.hbase.shaded.com.google.common.collect.Lists.class,<a name="line.837"></a> -<span class="sourceLineNo">838</span> org.apache.htrace.Trace.class,<a name="line.838"></a> -<span class="sourceLineNo">839</span> com.codahale.metrics.MetricRegistry.class,<a name="line.839"></a> -<span class="sourceLineNo">840</span> org.apache.commons.lang3.ArrayUtils.class);<a name="line.840"></a> -<span class="sourceLineNo">841</span> }<a name="line.841"></a> -<span class="sourceLineNo">842</span><a name="line.842"></a> -<span class="sourceLineNo">843</span> /**<a name="line.843"></a> -<span class="sourceLineNo">844</span> * Returns a classpath string built from the content of the "tmpjars" value in {@code conf}.<a name="line.844"></a> -<span class="sourceLineNo">845</span> * Also exposed to shell scripts via `bin/hbase mapredcp`.<a name="line.845"></a> -<span class="sourceLineNo">846</span> */<a name="line.846"></a> -<span class="sourceLineNo">847</span> public static String buildDependencyClasspath(Configuration conf) {<a name="line.847"></a> -<span class="sourceLineNo">848</span> if (conf == null) {<a name="line.848"></a> -<span class="sourceLineNo">849</span> throw new IllegalArgumentException("Must provide a configuration object.");<a name="line.849"></a> -<span class="sourceLineNo">850</span> }<a name="line.850"></a> -<span class="sourceLineNo">851</span> Set<String> paths = new HashSet<>(conf.getStringCollection("tmpjars"));<a name="line.851"></a> -<span class="sourceLineNo">852</span> if (paths.isEmpty()) {<a name="line.852"></a> -<span class="sourceLineNo">853</span> throw new IllegalArgumentException("Configuration contains no tmpjars.");<a name="line.853"></a> -<span class="sourceLineNo">854</span> }<a name="line.854"></a> -<span class="sourceLineNo">855</span> StringBuilder sb = new StringBuilder();<a name="line.855"></a> -<span class="sourceLineNo">856</span> for (String s : paths) {<a name="line.856"></a> -<span class="sourceLineNo">857</span> // entries can take the form 'file:/path/to/file.jar'.<a name="line.857"></a> -<span class="sourceLineNo">858</span> int idx = s.indexOf(":");<a name="line.858"></a> -<span class="sourceLineNo">859</span> if (idx != -1) s = s.substring(idx + 1);<a name="line.859"></a> -<span class="sourceLineNo">860</span> if (sb.length() > 0) sb.append(File.pathSeparator);<a name="line.860"></a> -<span class="sourceLineNo">861</span> sb.append(s);<a name="line.861"></a> -<span class="sourceLineNo">862</span> }<a name="line.862"></a> -<span class="sourceLineNo">863</span> return sb.toString();<a name="line.863"></a> -<span class="sourceLineNo">864</span> }<a name="line.864"></a> -<span class="sourceLineNo">865</span><a name="line.865"></a> -<span class="sourceLineNo">866</span> /**<a name="line.866"></a> -<span class="sourceLineNo">867</span> * Add the HBase dependency jars as well as jars for any of the configured<a name="line.867"></a> -<span class="sourceLineNo">868</span> * job classes to the job configuration, so that JobClient will ship them<a name="line.868"></a> -<span class="sourceLineNo">869</span> * to the cluster and add them to the DistributedCache.<a name="line.869"></a> -<span class="sourceLineNo">870</span> */<a name="line.870"></a> -<span class="sourceLineNo">871</span> public static void addDependencyJars(Job job) throws IOException {<a name="line.871"></a> -<span class="sourceLineNo">872</span> addHBaseDependencyJars(job.getConfiguration());<a name="line.872"></a> -<span class="sourceLineNo">873</span> try {<a name="line.873"></a> -<span class="sourceLineNo">874</span> addDependencyJarsForClasses(job.getConfiguration(),<a name="line.874"></a> -<span class="sourceLineNo">875</span> // when making changes here, consider also mapred.TableMapReduceUtil<a name="line.875"></a> -<span class="sourceLineNo">876</span> // pull job classes<a name="line.876"></a> -<span class="sourceLineNo">877</span> job.getMapOutputKeyClass(),<a name="line.877"></a> -<span class="sourceLineNo">878</span> job.getMapOutputValueClass(),<a name="line.878"></a> -<span class="sourceLineNo">879</span> job.getInputFormatClass(),<a name="line.879"></a> -<span class="sourceLineNo">880</span> job.getOutputKeyClass(),<a name="line.880"></a> -<span class="sourceLineNo">881</span> job.getOutputValueClass(),<a name="line.881"></a> -<span class="sourceLineNo">882</span> job.getOutputFormatClass(),<a name="line.882"></a> -<span class="sourceLineNo">883</span> job.getPartitionerClass(),<a name="line.883"></a> -<span class="sourceLineNo">884</span> job.getCombinerClass());<a name="line.884"></a> -<span class="sourceLineNo">885</span> } catch (ClassNotFoundException e) {<a name="line.885"></a> -<span class="sourceLineNo">886</span> throw new IOException(e);<a name="line.886"></a> -<span class="sourceLineNo">887</span> }<a name="line.887"></a> -<span class="sourceLineNo">888</span> }<a name="line.888"></a> -<span class="sourceLineNo">889</span><a name="line.889"></a> -<span class="sourceLineNo">890</span> /**<a name="line.890"></a> -<span class="sourceLineNo">891</span> * Add the jars containing the given classes to the job's configuration<a name="line.891"></a> -<span class="sourceLineNo">892</span> * such that JobClient will ship them to the cluster and add them to<a name="line.892"></a> -<span class="sourceLineNo">893</span> * the DistributedCache.<a name="line.893"></a> -<span class="sourceLineNo">894</span> * @deprecated rely on {@link #addDependencyJars(Job)} instead.<a name="line.894"></a> -<span class="sourceLineNo">895</span> */<a name="line.895"></a> -<span class="sourceLineNo">896</span> @Deprecated<a name="line.896"></a> -<span class="sourceLineNo">897</span> public static void addDependencyJars(Configuration conf,<a name="line.897"></a> -<span class="sourceLineNo">898</span> Class<?>... classes) throws IOException {<a name="line.898"></a> -<span class="sourceLineNo">899</span> LOG.warn("The addDependencyJars(Configuration, Class<?>...) method has been deprecated since it"<a name="line.899"></a> -<span class="sourceLineNo">900</span> + " is easy to use incorrectly. Most users should rely on addDependencyJars(Job) " +<a name="line.900"></a> -<span class="sourceLineNo">901</span> "instead. See HBASE-8386 for more details.");<a name="line.901"></a> -<span class="sourceLineNo">902</span> addDependencyJarsForClasses(conf, classes);<a name="line.902"></a> -<span class="sourceLineNo">903</span> }<a name="line.903"></a> +<span class="sourceLineNo">804</span> addDependencyJarsForClasses(conf,<a name="line.804"></a> +<span class="sourceLineNo">805</span> // explicitly pull a class from each module<a name="line.805"></a> +<span class="sourceLineNo">806</span> org.apache.hadoop.hbase.HConstants.class, // hbase-common<a name="line.806"></a> +<span class="sourceLineNo">807</span> org.apache.hadoop.hbase.protobuf.generated.ClientProtos.class, // hbase-protocol<a name="line.807"></a> +<span class="sourceLineNo">808</span> org.apache.hadoop.hbase.shaded.protobuf.generated.ClientProtos.class, // hbase-protocol-shaded<a name="line.808"></a> +<span class="sourceLineNo">809</span> org.apache.hadoop.hbase.client.Put.class, // hbase-client<a name="line.809"></a> +<span class="sourceLineNo">810</span> org.apache.hadoop.hbase.ipc.RpcServer.class, // hbase-server<a name="line.810"></a> +<span class="sourceLineNo">811</span> org.apache.hadoop.hbase.CompatibilityFactory.class, // hbase-hadoop-compat<a name="line.811"></a> +<span class="sourceLineNo">812</span> org.apache.hadoop.hbase.mapreduce.JobUtil.class, // hbase-hadoop2-compat<a name="line.812"></a> +<span class="sourceLineNo">813</span> org.apache.hadoop.hbase.mapreduce.TableMapper.class, // hbase-mapreduce<a name="line.813"></a> +<span class="sourceLineNo">814</span> org.apache.hadoop.hbase.metrics.impl.FastLongHistogram.class, // hbase-metrics<a name="line.814"></a> +<span class="sourceLineNo">815</span> org.apache.hadoop.hbase.metrics.Snapshot.class, // hbase-metrics-api<a name="line.815"></a> +<span class="sourceLineNo">816</span> org.apache.zookeeper.ZooKeeper.class,<a name="line.816"></a> +<span class="sourceLineNo">817</span> org.apache.hadoop.hbase.shaded.io.netty.channel.Channel.class,<a name="line.817"></a> +<span class="sourceLineNo">818</span> com.google.protobuf.Message.class,<a name="line.818"></a> +<span class="sourceLineNo">819</span> org.apache.hadoop.hbase.shaded.com.google.protobuf.UnsafeByteOperations.class,<a name="line.819"></a> +<span class="sourceLineNo">820</span> org.apache.hadoop.hbase.shaded.com.google.common.collect.Lists.class,<a name="line.820"></a> +<span class="sourceLineNo">821</span> org.apache.htrace.Trace.class,<a name="line.821"></a> +<span class="sourceLineNo">822</span> com.codahale.metrics.MetricRegistry.class,<a name="line.822"></a> +<span class="sourceLineNo">823</span> org.apache.commons.lang3.ArrayUtils.class);<a name="line.823"></a> +<span class="sourceLineNo">824</span> }<a name="line.824"></a> +<span class="sourceLineNo">825</span><a name="line.825"></a> +<span class="sourceLineNo">826</span> /**<a name="line.826"></a> +<span class="sourceLineNo">827</span> * Returns a classpath string built from the content of the "tmpjars" value in {@code conf}.<a name="line.827"></a> +<span class="sourceLineNo">828</span> * Also exposed to shell scripts via `bin/hbase mapredcp`.<a name="line.828"></a> +<span class="sourceLineNo">829</span> */<a name="line.829"></a> +<span class="sourceLineNo">830</span> public static String buildDependencyClasspath(Configuration conf) {<a name="line.830"></a> +<span class="sourceLineNo">831</span> if (conf == null) {<a name="line.831"></a> +<span class="sourceLineNo">832</span> throw new IllegalArgumentException("Must provide a configuration object.");<a name="line.832"></a> +<span class="sourceLineNo">833</span> }<a name="line.833"></a> +<span class="sourceLineNo">834</span> Set<String> paths = new HashSet<>(conf.getStringCollection("tmpjars"));<a name="line.834"></a> +<span class="sourceLineNo">835</span> if (paths.isEmpty()) {<a name="line.835"></a> +<span class="sourceLineNo">836</span> throw new IllegalArgumentException("Configuration contains no tmpjars.");<a name="line.836"></a> +<span class="sourceLineNo">837</span> }<a name="line.837"></a> +<span class="sourceLineNo">838</span> StringBuilder sb = new StringBuilder();<a name="line.838"></a> +<span class="sourceLineNo">839</span> for (String s : paths) {<a name="line.839"></a> +<span class="sourceLineNo">840</span> // entries can take the form 'file:/path/to/file.jar'.<a name="line.840"></a> +<span class="sourceLineNo">841</span> int idx = s.indexOf(":");<a name="line.841"></a> +<span class="sourceLineNo">842</span> if (idx != -1) s = s.substring(idx + 1);<a name="line.842"></a> +<span class="sourceLineNo">843</span> if (sb.length() > 0) sb.append(File.pathSeparator);<a name="line.843"></a> +<span class="sourceLineNo">844</span> sb.append(s);<a name="line.844"></a> +<span class="sourceLineNo">845</span> }<a name="line.845"></a> +<span class="sourceLineNo">846</span> return sb.toString();<a name="line.846"></a> +<span class="sourceLineNo">847</span> }<a name="line.847"></a> +<span class="sourceLineNo">848</span><a name="line.848"></a> +<span class="sourceLineNo">849</span> /**<a name="line.849"></a> +<span class="sourceLineNo">850</span> * Add the HBase dependency jars as well as jars for any of the configured<a name="line.850"></a> +<span class="sourceLineNo">851</span> * job classes to the job configuration, so that JobClient will ship them<a name="line.851"></a> +<span class="sourceLineNo">852</span> * to the cluster and add them to the DistributedCache.<a name="line.852"></a> +<span class="sourceLineNo">853</span> */<a name="line.853"></a> +<span class="sourceLineNo">854</span> public static void addDependencyJars(Job job) throws IOException {<a name="line.854"></a> +<span class="sourceLineNo">855</span> addHBaseDependencyJars(job.getConfiguration());<a name="line.855"></a> +<span class="sourceLineNo">856</span> try {<a name="line.856"></a> +<span class="sourceLineNo">857</span> addDependencyJarsForClasses(job.getConfiguration(),<a name="line.857"></a> +<span class="sourceLineNo">858</span> // when making changes here, consider also mapred.TableMapReduceUtil<a name="line.858"></a> +<span class="sourceLineNo">859</span> // pull job classes<a name="line.859"></a> +<span class="sourceLineNo">860</span> job.getMapOutputKeyClass(),<a name="line.860"></a> +<span class="sourceLineNo">861</span> job.getMapOutputValueClass(),<a name="line.861"></a> +<span class="sourceLineNo">862</span> job.getInputFormatClass(),<a name="line.862"></a> +<span class="sourceLineNo">863</span> job.getOutputKeyClass(),<a name="line.863"></a> +<span class="sourceLineNo">864</span> job.getOutputValueClass(),<a name="line.864"></a> +<span class="sourceLineNo">865</span> job.getOutputFormatClass(),<a name="line.865"></a> +<span class="sourceLineNo">866</span> job.getPartitionerClass(),<a name="line.866"></a> +<span class="sourceLineNo">867</span> job.getCombinerClass());<a name="line.867"></a> +<span class="sourceLineNo">868</span> } catch (ClassNotFoundException e) {<a name="line.868"></a> +<span class="sourceLineNo">869</span> throw new IOException(e);<a name="line.869"></a> +<span class="sourceLineNo">870</span> }<a name="line.870"></a> +<span class="sourceLineNo">871</span> }<a name="line.871"></a> +<span class="sourceLineNo">872</span><a name="line.872"></a> +<span class="sourceLineNo">873</span> /**<a name="line.873"></a> +<span class="sourceLineNo">874</span> * Add the jars containing the given classes to the job's configuration<a name="line.874"></a> +<span class="sourceLineNo">875</span> * such that JobClient will ship them to the cluster and add them to<a name="line.875"></a> +<span class="sourceLineNo">876</span> * the DistributedCache.<a name="line.876"></a> +<span class="sourceLineNo">877</span> * @deprecated rely on {@link #addDependencyJars(Job)} instead.<a name="line.877"></a> +<span class="sourceLineNo">878</span> */<a name="line.878"></a> +<span class="sourceLineNo">879</span> @Deprecated<a name="line.879"></a> +<span class="sourceLineNo">880</span> public static void addDependencyJars(Configuration conf,<a name="line.880"></a> +<span class="sourceLineNo">881</span> Class<?>... classes) throws IOException {<a name="line.881"></a> +<span class="sourceLineNo">882</span> LOG.warn("The addDependencyJars(Configuration, Class<?>...) method has been deprecated since it"<a name="line.882"></a> +<span class="sourceLineNo">883</span> + " is easy to use incorrectly. Most users should rely on addDependencyJars(Job) " +<a name="line.883"></a> +<span class="sourceLineNo">884</span> "instead. See HBASE-8386 for more details.");<a name="line.884"></a> +<span class="sourceLineNo">885</span> addDependencyJarsForClasses(conf, classes);<a name="line.885"></a> +<span class="sourceLineNo">886</span> }<a name="line.886"></a> +<span class="sourceLineNo">887</span><a name="line.887"></a> +<span class="sourceLineNo">888</span> /**<a name="line.888"></a> +<span class="sourceLineNo">889</span> * Add the jars containing the given classes to the job's configuration<a name="line.889"></a> +<span class="sourceLineNo">890</span> * such that JobClient will ship them to the cluster and add them to<a name="line.890"></a> +<span class="sourceLineNo">891</span> * the DistributedCache.<a name="line.891"></a> +<span class="sourceLineNo">892</span> *<a name="line.892"></a> +<span class="sourceLineNo">893</span> * N.B. that this method at most adds one jar per class given. If there is more than one<a name="line.893"></a> +<span class="sourceLineNo">894</span> * jar available containing a class with the same name as a given class, we don't define<a name="line.894"></a> +<span class="sourceLineNo">895</span> * which of those jars might be chosen.<a name="line.895"></a> +<span class="sourceLineNo">896</span> *<a name="line.896"></a> +<span class="sourceLineNo">897</span> * @param conf The Hadoop Configuration to modify<a name="line.897"></a> +<span class="sourceLineNo">898</span> * @param classes will add just those dependencies needed to find the given classes<a name="line.898"></a> +<span class="sourceLineNo">899</span> * @throws IOException if an underlying library call fails.<a name="line.899"></a> +<span class="sourceLineNo">900</span> */<a name="line.900"></a> +<span class="sourceLineNo">901</span> @InterfaceAudience.Private<a name="line.901"></a> +<span class="sourceLineNo">902</span> public static void addDependencyJarsForClasses(Configuration conf,<a name="line.902"></a> +<span class="sourceLineNo">903</span> Class<?>... classes) throws IOException {<a name="line.903"></a> <span class="sourceLineNo">904</span><a name="line.904"></a> -<span class="sourceLineNo">905</span> /**<a name="line.905"></a> -<span class="sourceLineNo">906</span> * Add the jars containing the given classes to the job's configuration<a name="line.906"></a> -<span class="sourceLineNo">907</span> * such that JobClient will ship them to the cluster and add them to<a name="line.907"></a> -<span class="sourceLineNo">908</span> * the DistributedCache.<a name="line.908"></a> -<span class="sourceLineNo">909</span> *<a name="line.909"></a> -<span class="sourceLineNo">910</span> * N.B. that this method at most adds one jar per class given. If there is more than one<a name="line.910"></a> -<span class="sourceLineNo">911</span> * jar available containing a class with the same name as a given class, we don't define<a name="line.911"></a> -<span class="sourceLineNo">912</span> * which of those jars might be chosen.<a name="line.912"></a> -<span class="sourceLineNo">913</span> *<a name="line.913"></a> -<span class="sourceLineNo">914</span> * @param conf The Hadoop Configuration to modify<a name="line.914"></a> -<span class="sourceLineNo">915</span> * @param classes will add just those dependencies needed to find the given classes<a name="line.915"></a> -<span class="sourceLineNo">916</span> * @throws IOException if an underlying library call fails.<a name="line.916"></a> -<span class="sourceLineNo">917</span> */<a name="line.917"></a> -<span class="sourceLineNo">918</span> @InterfaceAudience.Private<a name="line.918"></a> -<span class="sourceLineNo">919</span> public static void addDependencyJarsForClasses(Configuration conf,<a name="line.919"></a> -<span class="sourceLineNo">920</span> Class<?>... classes) throws IOException {<a name="line.920"></a> -<span class="sourceLineNo">921</span><a name="line.921"></a> -<span class="sourceLineNo">922</span> FileSystem localFs = FileSystem.getLocal(conf);<a name="line.922"></a> -<span class="sourceLineNo">923</span> Set<String> jars = new HashSet<>();<a name="line.923"></a> -<span class="sourceLineNo">924</span> // Add jars that are already in the tmpjars variable<a name="line.924"></a> -<span class="sourceLineNo">925</span> jars.addAll(conf.getStringCollection("tmpjars"));<a name="line.925"></a> -<span class="sourceLineNo">926</span><a name="line.926"></a> -<span class="sourceLineNo">927</span> // add jars as we find them to a map of contents jar name so that we can avoid<a name="line.927"></a> -<span class="sourceLineNo">928</span> // creating new jars for classes that have already been packaged.<a name="line.928"></a> -<span class="sourceLineNo">929</span> Map<String, String> packagedClasses = new HashMap<>();<a name="line.929"></a> -<span class="sourceLineNo">930</span><a name="line.930"></a> -<span class="sourceLineNo">931</span> // Add jars containing the specified classes<a name="line.931"></a> -<span class="sourceLineNo">932</span> for (Class<?> clazz : classes) {<a name="line.932"></a> -<span class="sourceLineNo">933</span> if (clazz == null) continue;<a name="line.933"></a> -<span class="sourceLineNo">934</span><a name="line.934"></a> -<span class="sourceLineNo">935</span> Path path = findOrCreateJar(clazz, localFs, packagedClasses);<a name="line.935"></a> -<span class="sourceLineNo">936</span> if (path == null) {<a name="line.936"></a> -<span class="sourceLineNo">937</span> LOG.warn("Could not find jar for class " + clazz +<a name="line.937"></a> -<span class="sourceLineNo">938</span> " in order to ship it to the cluster.");<a name="line.938"></a> -<span class="sourceLineNo">939</span> continue;<a name="line.939"></a> -<span class="sourceLineNo">940</span> }<a name="line.940"></a> -<span class="sourceLineNo">941</span> if (!localFs.exists(path)) {<a name="line.941"></a> -<span class="sourceLineNo">942</span> LOG.warn("Could not validate jar file " + path + " for class "<a name="line.942"></a> -<span class="sourceLineNo">943</span> + clazz);<a name="line.943"></a> -<span class="sourceLineNo">944</span> continue;<a name="line.944"></a> -<span class="sourceLineNo">945</span> }<a name="line.945"></a> -<span class="sourceLineNo">946</span> jars.add(path.toString());<a name="line.946"></a> -<span class="sourceLineNo">947</span> }<a name="line.947"></a> -<span class="sourceLineNo">948</span> if (jars.isEmpty()) return;<a name="line.948"></a> -<span class="sourceLineNo">949</span><a name="line.949"></a> -<span class="sourceLineNo">950</span> conf.set("tmpjars", StringUtils.arrayToString(jars.toArray(new String[jars.size()])));<a name="line.950"></a> -<span class="sourceLineNo">951</span> }<a name="line.951"></a> -<span class="sourceLineNo">952</span><a name="line.952"></a> -<span class="sourceLineNo">953</span> /**<a name="line.953"></a> -<span class="sourceLineNo">954</span> * Finds the Jar for a class or creates it if it doesn't exist. If the class is in<a name="line.954"></a> -<span class="sourceLineNo">955</span> * a directory in the classpath, it creates a Jar on the fly with the<a name="line.955"></a> -<span class="sourceLineNo">956</span> * contents of the directory and returns the path to that Jar. If a Jar is<a name="line.956"></a> -<span class="sourceLineNo">957</span> * created, it is created in the system temporary directory. Otherwise,<a name="line.957"></a> -<span class="sourceLineNo">958</span> * returns an existing jar that contains a class of the same name. Maintains<a name="line.958"></a> -<span class="sourceLineNo">959</span> * a mapping from jar contents to the tmp jar created.<a name="line.959"></a> -<span class="sourceLineNo">960</span> * @param my_class the class to find.<a name="line.960"></a> -<span class="sourceLineNo">961</span> * @param fs the FileSystem with which to qualify the returned path.<a name="line.961"></a> -<span class="sourceLineNo">962</span> * @param packagedClasses a map of class name to path.<a name="line.962"></a> -<span class="sourceLineNo">963</span> * @return a jar file that contains the class.<a name="line.963"></a> -<span class="sourceLineNo">964</span> * @throws IOException<a name="line.964"></a> -<span class="sourceLineNo">965</span> */<a name="line.965"></a> -<span class="sourceLineNo">966</span> private static Path findOrCreateJar(Class<?> my_class, FileSystem fs,<a name="line.966"></a> -<span class="sourceLineNo">967</span> Map<String, String> packagedClasses)<a name="line.967"></a> -<span class="sourceLineNo">968</span> throws IOException {<a name="line.968"></a> -<span class="sourceLineNo">969</span> // attempt to locate an existing jar for the class.<a name="line.969"></a> -<span class="sourceLineNo">970</span> String jar = findContainingJar(my_class, packagedClasses);<a name="line.970"></a> -<span class="sourceLineNo">971</span> if (null == jar || jar.isEmpty()) {<a name="line.971"></a> -<span class="sourceLineNo">972</span> jar = getJar(my_class);<a name="line.972"></a> -<span class="sourceLineNo">973</span> updateMap(jar, packagedClasses);<a name="line.973"></a> -<span class="sourceLineNo">974</span> }<a name="line.974"></a> -<span class="sourceLineNo">975</span><a name="line.975"></a> -<span class="sourceLineNo">976</span> if (null == jar || jar.isEmpty()) {<a name="line.976"></a> -<span class="sourceLineNo">977</span> return null;<a name="line.977"></a> -<span class="sourceLineNo">978</span> }<a name="line.978"></a> -<span class="sourceLineNo">979</span><a name="line.979"></a> -<span class="sourceLineNo">980</span> LOG.debug(String.format("For class %s, using jar %s", my_class.getName(), jar));<a name="line.980"></a> -<span class="sourceLineNo">981</span> return new Path(jar).makeQualified(fs);<a name="line.981"></a> -<span class="sourceLineNo">982</span> }<a name="line.982"></a> -<span class="sourceLineNo">983</span><a name="line.983"></a> -<span class="sourceLineNo">984</span> /**<a name="line.984"></a> -<span class="sourceLineNo">985</span> * Add entries to <code>packagedClasses</code> corresponding to class files<a name="line.985"></a> -<span class="sourceLineNo">986</span> * contained in <code>jar</code>.<a name="line.986"></a> -<span class="sourceLineNo">987</span> * @param jar The jar who's content to list.<a name="line.987"></a> -<span class="sourceLineNo">988</span> * @param packagedClasses map[class -> jar]<a name="line.988"></a> -<span class="sourceLineNo">989</span> */<a name="line.989"></a> -<span class="sourceLineNo">990</span> private static void updateMap(String jar, Map<String, String> packagedClasses) throws IOException {<a name="line.990"></a> -<span class="sourceLineNo">991</span> if (null == jar || jar.isEmpty()) {<a name="line.991"></a> -<span class="sourceLineNo">992</span> return;<a name="line.992"></a> -<span class="sourceLineNo">993</span> }<a name="line.993"></a> -<span class="sourceLineNo">994</span> ZipFile zip = null;<a name="line.994"></a> -<span class="sourceLineNo">995</span> try {<a name="line.995"></a> -<span class="sourceLineNo">996</span> zip = new ZipFile(jar);<a name="line.996"></a> -<span class="sourceLineNo">997</span> for (Enumeration<? extends ZipEntry> iter = zip.entries(); iter.hasMoreElements();) {<a name="line.997"></a> -<span class="sourceLineNo">998</span> ZipEntry entry = iter.nextElement();<a name="line.998"></a> -<span class="sourceLineNo">999</span> if (entry.getName().endsWith("class")) {<a name="line.999"></a> -<span class="sourceLineNo">1000</span> packagedClasses.put(entry.getName(), jar);<a name="line.1000"></a> -<span class="sourceLineNo">1001</span> }<a name="line.1001"></a> -<span class="sourceLineNo">1002</span> }<a name="line.1002"></a> -<span class="sourceLineNo">1003</span> } finally {<a name="line.1003"></a> -<span class="sourceLineNo">1004</span> if (null != zip) zip.close();<a name="line.1004"></a> -<span class="sourceLineNo">1005</span> }<a name="line.1005"></a> -<span class="sourceLineNo">1006</span> }<a name="line.1006"></a> -<span class="sourceLineNo">1007</span><a name="line.1007"></a> -<span class="sourceLineNo">1008</span> /**<a name="line.1008"></a> -<span class="sourceLineNo">1009</span> * Find a jar that contains a class of the same name, if any. It will return<a name="line.1009"></a> -<span class="sourceLineNo">1010</span> * a jar file, even if that is not the first thing on the class path that<a name="line.1010"></a> -<span class="sourceLineNo">1011</span> * has a class with the same name. Looks first on the classpath and then in<a name="line.1011"></a> -<span class="sourceLineNo">1012</span> * the <code>packagedClasses</code> map.<a name="line.1012"></a> -<span class="sourceLineNo">1013</span> * @param my_class the class to find.<a name="line.1013"></a> -<span class="sourceLineNo">1014</span> * @return a jar file that contains the class, or null.<a name="line.1014"></a> -<span class="sourceLineNo">1015</span> * @throws IOException<a name="line.1015"></a> -<span class="sourceLineNo">1016</span> */<a name="line.1016"></a> -<span class="sourceLineNo">1017</span> private static String findContainingJar(Class<?> my_class, Map<String, String> packagedClasses)<a name="line.1017"></a> -<span class="sourceLineNo">1018</span> throws IOException {<a name="line.1018"></a> -<span class="sourceLineNo">1019</span> ClassLoader loader = my_class.getClassLoader();<a name="line.1019"></a> -<span class="sourceLineNo">1020</span><a name="line.1020"></a> -<span class="sourceLineNo">1021</span> String class_file = my_class.getName().replaceAll("\\.", "/") + ".class";<a name="line.1021"></a> -<span class="sourceLineNo">1022</span><a name="line.1022"></a> -<span class="sourceLineNo">1023</span> if (loader != null) {<a name="line.1023"></a> -<span class="sourceLineNo">1024</span> // first search the classpath<a name="line.1024"></a> -<span class="sourceLineNo">1025</span> for (Enumeration<URL> itr = loader.getResources(class_file); itr.hasMoreElements();) {<a name="line.1025"></a> -<span class="sourceLineNo">1026</span> URL url = itr.nextElement();<a name="line.1026"></a> -<span class="sourceLineNo">1027</span> if ("jar".equals(url.getProtocol())) {<a name="line.1027"></a> -<span class="sourceLineNo">1028</span> String toReturn = url.getPath();<a name="line.1028"></a> -<span class="sourceLineNo">1029</span> if (toReturn.startsWith("file:")) {<a name="line.1029"></a> -<span class="sourceLineNo">1030</span> toReturn = toReturn.substring("file:".length());<a name="line.1030"></a> -<span class="sourceLineNo">1031</span> }<a name="line.1031"></a> -<span class="sourceLineNo">1032</span> // URLDecoder is a misnamed class, since it actually decodes<a name="line.1032"></a> -<span class="sourceLineNo">1033</span> // x-www-form-urlencoded MIME type rather than actual<a name="line.1033"></a> -<span class="sourceLineNo">1034</span> // URL encoding (which the file path has). Therefore it would<a name="line.1034"></a> -<span class="sourceLineNo">1035</span> // decode +s to ' 's which is incorrect (spaces are actually<a name="line.1035"></a> -<span class="sourceLineNo">1036</span> // either unencoded or encoded as "%20"). Replace +s first, so<a name="line.1036"></a> -<span class="sourceLineNo">1037</span> // that they are kept sacred during the decoding process.<a name="line.1037"></a> -<span class="sourceLineNo">1038</span> toReturn = toReturn.replaceAll("\\+", "%2B");<a name="line.1038"></a> -<span class="sourceLineNo">1039</span> toReturn = URLDecoder.decode(toReturn, "UTF-8");<a name="line.1039"></a> -<span class="sourceLineNo">1040</span> return toReturn.replaceAll("!.*$", "");<a name="line.1040"></a> -<span class="sourceLineNo">1041</span> }<a name="line.1041"></a> -<span class="sourceLineNo">1042</span> }<a name="line.1042"></a> -<span class="sourceLineNo">1043</span> }<a name="line.1043"></a> -<span class="sourceLineNo">1044</span><a name="line.1044"></a> -<span class="sourceLineNo">1045</span> // now look in any jars we've packaged using JarFinder. Returns null when<a name="line.1045"></a> -<span class="sourceLineNo">1046</span> // no jar is found.<a name="line.1046"></a> -<span class="sourceLineNo">1047</span> return packagedClasses.get(class_file);<a name="line.1047"></a> -<span class="sourceLineNo">1048</span> }<a name="line.1048"></a> -<span class="sourceLineNo">1049</span><a name="line.1049"></a> -<span class="sourceLineNo">1050</span> /**<a name="line.1050"></a> -<span class="sourceLineNo">1051</span> * Invoke 'getJar' on a custom JarFinder implementation. Useful for some job<a name="line.1051"></a> -<span class="sourceLineNo">1052</span> * configuration contexts (HBASE-8140) and also for testing on MRv2.<a name="line.1052"></a> -<span class="sourceLineNo">1053</span> * check if we have HADOOP-9426.<a name="line.1053"></a> -<span class="sourceLineNo">1054</span> * @param my_class the class to find.<a name="line.1054"></a> -<span class="sourceLineNo">1055</span> * @return a jar file that contains the class, or null.<a name="line.1055"></a> -<span class="sourceLineNo">1056</span> */<a name="line.1056"></a> -<span class="sourceLineNo">1057</span> private static String getJar(Class<?> my_class) {<a name="line.1057"></a> -<span class="sourceLineNo">1058</span> String ret = null;<a name="line.1058"></a> -<span class="sourceLineNo">1059</span> try {<a name="line.1059"></a> -<span class="sourceLineNo">1060</span> ret = JarFinder.getJar(my_class);<a name="line.1060"></a> -<span class="sourceLineNo">1061</span> } catch (Exception e) {<a name="line.1061"></a> -<span class="sourceLineNo">1062</span> // toss all other exceptions, related to reflection failure<a name="line.1062"></a> -<span class="sourceLineNo">1063</span> throw new RuntimeException("getJar invocation failed.", e);<a name="line.1063"></a> -<span class="sourceLineNo">1064</span> }<a name="line.1064"></a> -<span class="sourceLineNo">1065</span><a name="line.1065"></a> -<span class="sourceLineNo">1066</span> return ret;<a name="line.1066"></a> -<span class="sourceLineNo">1067</span> }<a name="line.1067"></a> -<span class="sourceLineNo">1068</span>}<a name="line.1068"></a> +<span class="sourceLineNo">905</span> FileSystem localFs = FileSystem.getLocal(conf);<a name="line.905"></a> +<span class="sourceLineNo">906</span> Set<String> jars = new HashSet<>();<a name="line.906"></a> +<span class="sourceLineNo">907</span> // Add jars that are already in the tmpjars variable<a name="line.907"></a> +<span class="sourceLineNo">908</span> jars.addAll(conf.getStringCollection("tmpjars"));<a name="line.908"></a> +<span class="sourceLineNo">909</span><a name="line.909"></a> +<span class="sourceLineNo">910</span> // add jars as we find them to a map of contents jar name so that we can avoid<a name="line.910"></a> +<span class="sourceLineNo">911</span> // creating new jars for classes that have already been packaged.<a name="line.911"></a> +<span class="sourceLineNo">912</span> Map<String, String> packagedClasses = new HashMap<>();<a name="line.912"></a> +<span class="sourceLineNo">913</span><a name="line.913"></a> +<span class="sourceLineNo">914</span> // Add jars containing the specified classes<a name="line.914"></a> +<span class="sourceLineNo">915</span> for (Class<?> clazz : classes) {<a name="line.915"></a> +<span class="sourceLineNo">916</span> if (clazz == null) continue;<a name="line.916"></a> +<span class="sourceLineNo">917</span><a name="line.917"></a> +<span class="sourceLineNo">918</span> Path path = findOrCreateJar(clazz, localFs, packagedClasses);<a name="line.918"></a> +<span class="sourceLineNo">919</span> if (path == null) {<a name="line.919"></a> +<span class="sourceLineNo">920</span> LOG.warn("Could not find jar for class " + clazz +<a name="line.920"></a> +<span class="sourceLineNo">921</span> " in order to ship it to the cluster.");<a name="line.921"></a> +<span class="sourceLineNo">922</span> continue;<a name="line.922"></a> +<span class="sourceLineNo">923</span> }<a name="line.923"></a> +<span class="sourceLineNo">924</span> if (!localFs.exists(path)) {<a name="line.924"></a> +<span class="sourceLineNo">925</span> LOG.warn("Could not validate jar file " + path + " for class "<a name="line.925"></a> +<span class="sourceLineNo">926</span> + clazz);<a name="line.926"></a> +<span class="sourceLineNo">927</span> continue;<a name="line.927"></a> +<span class="sourceLineNo">928</span> }<a name="line.928"></a> +<span class="sourceLineNo">929</span> jars.add(path.toString());<a name="line.929"></a> +<span class="sourceLineNo">930</span> }<a name="line.930"></a> +<span class="sourceLineNo">931</span> if (jars.isEmpty()) return;<a name="line.931"></a> +<span class="sourceLineNo">932</span><a name="line.932"></a> +<span class="sourceLineNo">933</span> conf.set("tmpjars", StringUtils.arrayToString(jars.toArray(new String[jars.size()])));<a name="line.933"></a> +<span class="sourceLineNo">934</span> }<a name="line.934"></a> +<span class="sourceLineNo">935</span><a name="line.935"></a> +<span class="sourceLineNo">936</span> /**<a name="line.936"></a> +<span class="sourceLineNo">937</span> * Finds the Jar for a class or creates it if it doesn't exist. If the class is in<a name="line.937"></a> +<span class="sourceLineNo">938</span> * a directory in the classpath, it creates a Jar on the fly with the<a name="line.938"></a> +<span class="sourceLineNo">939</span> * contents of the directory and returns the path to that Jar. If a Jar is<a name="line.939"></a> +<span class="sourceLineNo">940</span> * created, it is created in the system temporary directory. Otherwise,<a name="line.940"></a> +<span class="sourceLineNo">941</span> * returns an existing jar that contains a class of the same name. Maintains<a name="line.941"></a> +<span class="sourceLineNo">942</span> * a mapping from jar contents to the tmp jar created.<a name="line.942"></a> +<span class="sourceLineNo">943</span> * @param my_class the class to find.<a name="line.943"></a> +<span class="sourceLineNo">944</span> * @param fs the FileSystem with which to qualify the returned path.<a name="line.944"></a> +<span class="sourceLineNo">945</span> * @param packagedClasses a map of class name to path.<a name="line.945"></a> +<span class="sourceLineNo">946</span> * @return a jar file that contains the class.<a name="line.946"></a> +<span class="sourceLineNo">947</span> * @throws IOException<a name="line.947"></a> +<span class="sourceLineNo">948</span> */<a name="line.948"></a> +<span class="sourceLineNo">949</span> private static Path findOrCreateJar(Class<?> my_class, FileSystem fs,<a name="line.949"></a> +<span class="sourceLineNo">950</span> Map<String, String> packagedClasses)<a name="line.950"></a> +<span class="sourceLineNo">951</span> throws IOException {<a name="line.951"></a> +<span class="sourceLineNo">952</span> // attempt to locate an existing jar for the class.<a name="line.952"></a> +<span class="sourceLineNo">953</span> String jar = findContainingJar(my_class, packagedClasses);<a name="line.953"></a> +<span class="sourceLineNo">954</span> if (null == jar || jar.isEmpty()) {<a name="line.954"></a> +<span class="sourceLineNo">955</span> jar = getJar(my_class);<a name="line.955"></a> +<span class="sourceLineNo">956</span> updateMap(jar, packagedClasses);<a name="line.956"></a> +<span class="sourceLineNo">957</span> }<a name="line.957"></a> +<span class="sourceLineNo">958</span><a name="line.958"></a> +<span class="sourceLineNo">959</span> if (null == jar || jar.isEmpty()) {<a name="line.959"></a> +<span class="sourceLineNo">960</span> return null;<a name="line.960"></a> +<span class="sourceLineNo">961</span> }<a name="line.961"></a> +<span class="sourceLineNo">962</span><a name="line.962"></a> +<span class="sourceLineNo">963</span> LOG.debug(String.format("For class %s, using jar %s", my_class.getName(), jar));<a name="line.963"></a> +<span class="sourceLineNo">964</span> return new Path(jar).makeQualified(fs);<a name="line.964"></a> +<span class="sourceLineNo">965</span> }<a name="line.965"></a> +<span class="sourceLineNo">966</span><a name="line.966"></a> +<span class="sourceLineNo">967</span> /**<a name="line.967"></a> +<span class="sourceLineNo">968</span> * Add entries to <code>packagedClasses</code> corresponding to class files<a name="line.968"></a> +<span class="sourceLineNo">969</span> * contained in <code>jar</code>.<a name="line.969"></a> +<span class="sourceLineNo">970</span> * @param jar The jar who's content to list.<a name="line.970"></a> +<span class="sourceLineNo">971</span> * @param packagedClasses map[class -> jar]<a name="line.971"></a> +<span class="sourceLineNo">972</span> */<a name="line.972"></a> +<span class="sourceLineNo">973</span> private static void updateMap(String jar, Map<String, String> packagedClasses) throws IOException {<a name="line.973"></a> +<span class="sourceLineNo">974</span> if (null == jar || jar.isEmpty()) {<a name="line.974"></a> +<span class="sourceLineNo">975</span> return;<a name="line.975"></a> +<span class="sourceLineNo">976</span> }<a name="line.976"></a> +<span class="sourceLineNo">977</span> ZipFile zip = null;<a name="line.977"></a> +<span class="sourceLineNo">978</span> try {<a name="line.978"></a> +<span class="sourceLineNo">979</span> zip = new ZipFile(jar);<a name="line.979"></a> +<span class="sourceLineNo">980</span> for (Enumeration<? extends ZipEntry> iter = zip.entries(); iter.hasMoreElements();) {<a name="line.980"></a> +<span class="sourceLineNo">981</span> ZipEntry entry = iter.nextElement();<a name="line.981"></a> +<span class="sourceLineNo">982</span> if (entry.getName().endsWith("class")) {<a name="line.982"></a> +<span class="sourceLineNo">983</span> packagedClasses.put(entry.getName(), jar);<a name="line.983"></a> +<span class="sourceLineNo">984</span> }<a name="line.984"></a> +<span class="sourceLineNo">985</span> }<a name="line.985"></a> +<span class="sourceLineNo">986</span> } finally {<a name="line.986"></a> +<span class="sourceLineNo">987</span> if (null != zip) zip.close();<a name="line.987"></a> +<span class="sourceLineNo">988</span> }<a name="line.988"></a> +<span class="sourceLineNo">989</span> }<a name="line.989"></a> +<span class="sourceLineNo">990</span><a name="line.990"></a> +<span class="sourceLineNo">991</span> /**<a name="line.991"></a> +<span class="sourceLineNo">992</span> * Find a jar that contains a class of the same name, if any. It will return<a name="line.992"></a> +<span class="sourceLineNo">993</span> * a jar file, even if that is not the first thing on the class path that<a name="line.993"></a> +<span class="sourceLineNo">994</span> * has a class with the same name. Looks first on the classpath and then in<a name="line.994"></a> +<span class="sourceLineNo">995</span> * the <code>packagedClasses</code> map.<a name="line.995"></a> +<span class="sourceLineNo">996</span> * @param my_class the class to find.<a name="line.996"></a> +<span class="sourceLineNo">997</span> * @return a jar file that contains the class, or null.<a name="line.997"></a> +<span class="sourceLineNo">998</span> * @throws IOException<a name="line.998"></a> +<span class="sourceLineNo">999</span> */<a name="line.999"></a> +<span class="sourceLineNo">1000</span> private static String findContainingJar(Class<?> my_class, Map<String, String> packagedClasses)<a name="line.1000"></a> +<span class="sourceLineNo">1001</span> throws IOException {<a name="line.1001"></a> +<span class="sourceLineNo">1002</span> ClassLoader loader = my_class.getClassLoader();<a name="line.1002"></a> +<span class="sourceLineNo">1003</span><a name="line.1003"></a> +<span class="sourceLineNo">1004</span> String class_file = my_class.getName().replaceAll("\\.", "/") + ".class";<a name="line.1004"></a> +<span class="sourceLineNo">1005</span><a name="line.1005"></a> +<span class="sourceLineNo">1006</span> if (loader != null) {<a name="line.1006"></a> +<span class="sourceLineNo">1007</span> // first search the classpath<a name="line.1007"></a> +<span class="sourceLineNo">1008</span> for (Enumeration<URL> itr = loader.getResources(class_file); itr.hasMoreElements();) {<a name="line.1008"></a> +<span class="sourceLineNo">1009</span> URL url = itr.nextElement();<a name="line.1009"></a> +<span class="sourceLineNo">1010</span> if ("jar".equals(url.getProtocol())) {<a name="line.1010"></a> +<span class="sourceLineNo">1011</span> String toReturn = url.getPath();<a name="line.1011"></a> +<span class="sourceLineNo">1012</span> if (toReturn.startsWith("file:")) {<a name="line.1012"></a> +<span class="sourceLineNo">1013</span> toReturn = toReturn.substring("file:".length());<a name="line.1013"></a> +<span class="sourceLineNo">1014</span> }<a name="line.1014"></a> +<span class="sourceLineNo">1015</span> // URLDecoder is a misnamed class, since it actually decodes<a name="line.1015"></a> +<span class="sourceLineNo">1016</span> // x-www-form-urlencoded MIME type rather than actual<a name="line.1016"></a> +<span class="sourceLineNo">1017</span> // URL encoding (which the file path has). Therefore it would<a name="line.1017"></a> +<span class="sourceLineNo">1018</span> // decode +s to ' 's which is incorrect (spaces are actually<a name="line.1018"></a> +<span class="sourceLineNo">1019</span> // either unencoded or encoded as "%20"). Replace +s first, so<a name="line.1019"></a> +<span class="sourceLineNo">1020</span> // that they are kept sacred during the decoding process.<a name="line.1020"></a> +<span class="sourceLineNo">1021</span> toReturn = toReturn.replaceAll("\\+", "%2B");<a name="line.1021"></a> +<span class="sourceLineNo">1022</span> toReturn = URLDecoder.decode(toReturn, "UTF-8");<a name="line.1022"></a> +<span class="sourceLineNo">1023</span> return toReturn.replaceAll("!.*$", "");<a name="line.1023"></a> +<span class="sourceLineNo">1024</span> }<a name="line.1024"></a> +<span class="sourceLineNo">1025</span> }<a name="line.1025"></a> +<span class="sourceLineNo">1026</span> }<a name="line.1026"></a> +<span class="sourceLineNo">1027</span><a name="line.1027"></a> +<span class="sourceLineNo">1028</span> // now look in any jars we've packaged using JarFinder. Returns null when<a name="line.1028"></a> +<span class="sourceLineNo">1029</span> // no jar is found.<a name="line.1029"></a> +<span class="sourceLineNo">1030</span> return packagedClasses.get(class_file);<a name="line.1030"></a> +<span class="sourceLineNo">1031</span> }<a name="line.1031"></a> +<span class="sourceLineNo">1032</span><a name="line.1032"></a> +<span class="sourceLineNo">1033</span> /**<a name="line.1033"></a> +<span class="sourceLineNo">1034</span> * Invoke 'getJar' on a custom JarFinder implementation. Useful for some job<a name="line.1034"></a> +<span class="sourceLineNo">1035</span> * configuration contexts (HBASE-8140) and also for testing on MRv2.<a name="line.1035"></a> +<span class="sourceLineNo">1036</span> * check if we have HADOOP-9426.<a name="line.1036"></a> +<span class="sourceLineNo">1037</span> * @param my_class the class to find.<a name="line.1037"></a> +<span class="sourceLineNo">1038</span> * @return a jar file that contains the class, or null.<a name="line.1038"></a> +<span class="sourceLineNo">1039</span> */<a name="line.1039"></a> +<span class="sourceLineNo">1040</span> private static String getJar(Class<?> my_class) {<a name="line.1040"></a> +<span class="sourceLineNo">1041</span> String ret = null;<a name="line.1041"></a> +<span class="sourceLineNo">1042</span> try {<a name="line.1042"></a> +<span class="sourceLineNo">1043</span> ret = JarFinder.getJar(my_class);<a name="line.1043"></a> +<span class="sourceLineNo">1044</span> } catch (Exception e) {<a name="line.1044"></a> +<span class="sourceLineNo">1045</span> // toss all other exceptions, related to reflection failure<a name="line.1045"></a> +<span class="sourceLineNo">1046</span> throw new RuntimeException("getJar invocation failed.", e);<a name="line.1046"></a> +<span class="sourceLineNo">1047</span> }<a name="line.1047"></a> +<span class="sourceLineNo">1048</span><a name="line.1048"></a> +<span class="sourceLineNo">1049</span> return ret;<a name="line.1049"></a> +<span class="sourceLineNo">1050</span> }<a name="line.1050"></a> +<span class="sourceLineNo">1051</span>}<a name="line.1051"></a> http://git-wip-us.apache.org/repos/asf/hbase-site/blob/315ffef7/book.html ---------------------------------------------------------------------- diff --git a/book.html b/book.html index 41332bd..1782584 100644 --- a/book.html +++ b/book.html @@ -33437,6 +33437,11 @@ In case the table goes out of date, the unit tests which check for accuracy of p <td class="tableblock halign-left valign-top"><p class="tableblock">superuser|global(A)</p></td> </tr> <tr> +<td class="tableblock halign-left valign-top"></td> +<td class="tableblock halign-left valign-top"><p class="tableblock">getClusterStatus</p></td> +<td class="tableblock halign-left valign-top"><p class="tableblock">superuser|global(A)</p></td> +</tr> +<tr> <td class="tableblock halign-left valign-top"><p class="tableblock">Region</p></td> <td class="tableblock halign-left valign-top"><p class="tableblock">openRegion</p></td> <td class="tableblock halign-left valign-top"><p class="tableblock">superuser|global(A)</p></td> @@ -33787,15 +33792,8 @@ Given the two row keys in the Prefix example, and given an exact match on timest <dt class="hdlist1">Prefix Tree</dt> <dd> <p>Prefix tree encoding was introduced as an experimental feature in HBase 0.96. -It provides similar memory savings to the Prefix, Diff, and Fast Diff encoder, but provides faster random access at a cost of slower encoding speed.</p> -<div class="paragraph"> -<p>Prefix Tree may be appropriate for applications that have high block cache hit ratios. It introduces new 'tree' fields for the row and column. -The row tree field contains a list of offsets/references corresponding to the cells in that row. This allows for a good deal of compression. -For more details about Prefix Tree encoding, see <a href="https://issues.apache.org/jira/browse/HBASE-4676">HBASE-4676</a>.</p> -</div> -<div class="paragraph"> -<p>It is difficult to graphically illustrate a prefix tree, so no image is included. See the Wikipedia article for <a href="http://en.wikipedia.org/wiki/Trie">Trie</a> for more general information about this data structure.</p> -</div> +It provides similar memory savings to the Prefix, Diff, and Fast Diff encoder, but provides faster random access at a cost of slower encoding speed. +It was removed in hbase-2.0.0. It was a good idea but little uptake. If interested in reviving this effort, write the hbase dev list.</p> </dd> </dl> </div> @@ -35486,7 +35484,7 @@ The server will return cellblocks compressed using this same compressor as long <div id="footer"> <div id="footer-text"> Version 3.0.0-SNAPSHOT<br> -Last updated 2017-11-04 14:29:51 UTC +Last updated 2017-11-05 14:29:37 UTC </div> </div> </body> http://git-wip-us.apache.org/repos/asf/hbase-site/blob/315ffef7/bulk-loads.html ---------------------------------------------------------------------- diff --git a/bulk-loads.html b/bulk-loads.html index 2c0b85a..ec0d697 100644 --- a/bulk-loads.html +++ b/bulk-loads.html @@ -7,7 +7,7 @@ <head> <meta charset="UTF-8" /> <meta name="viewport" content="width=device-width, initial-scale=1.0" /> - <meta name="Date-Revision-yyyymmdd" content="20171104" /> + <meta name="Date-Revision-yyyymmdd" content="20171105" /> <meta http-equiv="Content-Language" content="en" /> <title>Apache HBase – Bulk Loads in Apache HBase (TM) @@ -311,7 +311,7 @@ under the License. --> <a href="https://www.apache.org/">The Apache Software Foundation</a>. All rights reserved. - <li id="publishDate" class="pull-right">Last Published: 2017-11-04</li> + <li id="publishDate" class="pull-right">Last Published: 2017-11-05</li> </p> </div>
