http://git-wip-us.apache.org/repos/asf/hbase-site/blob/dccdd274/devapidocs/src-html/org/apache/hadoop/hbase/regionserver/HRegionServer.SystemExitWhenAbortTimeout.html ---------------------------------------------------------------------- diff --git a/devapidocs/src-html/org/apache/hadoop/hbase/regionserver/HRegionServer.SystemExitWhenAbortTimeout.html b/devapidocs/src-html/org/apache/hadoop/hbase/regionserver/HRegionServer.SystemExitWhenAbortTimeout.html index 6369c27..ea05301 100644 --- a/devapidocs/src-html/org/apache/hadoop/hbase/regionserver/HRegionServer.SystemExitWhenAbortTimeout.html +++ b/devapidocs/src-html/org/apache/hadoop/hbase/regionserver/HRegionServer.SystemExitWhenAbortTimeout.html @@ -603,3251 +603,3256 @@ <span class="sourceLineNo">595</span> // init superusers and add the server principal (if using security)<a name="line.595"></a> <span class="sourceLineNo">596</span> // or process owner as default super user.<a name="line.596"></a> <span class="sourceLineNo">597</span> Superusers.initialize(conf);<a name="line.597"></a> -<span class="sourceLineNo">598</span><a name="line.598"></a> -<span class="sourceLineNo">599</span> regionServerAccounting = new RegionServerAccounting(conf);<a name="line.599"></a> +<span class="sourceLineNo">598</span> regionServerAccounting = new RegionServerAccounting(conf);<a name="line.598"></a> +<span class="sourceLineNo">599</span><a name="line.599"></a> <span class="sourceLineNo">600</span> boolean isMasterNotCarryTable =<a name="line.600"></a> <span class="sourceLineNo">601</span> this instanceof HMaster && !LoadBalancer.isTablesOnMaster(conf);<a name="line.601"></a> -<span class="sourceLineNo">602</span> cacheConfig = new CacheConfig(conf, !isMasterNotCarryTable);<a name="line.602"></a> -<span class="sourceLineNo">603</span> mobCacheConfig = new MobCacheConfig(conf, !isMasterNotCarryTable);<a name="line.603"></a> -<span class="sourceLineNo">604</span> uncaughtExceptionHandler = new UncaughtExceptionHandler() {<a name="line.604"></a> -<span class="sourceLineNo">605</span> @Override<a name="line.605"></a> -<span class="sourceLineNo">606</span> public void uncaughtException(Thread t, Throwable e) {<a name="line.606"></a> -<span class="sourceLineNo">607</span> abort("Uncaught exception in executorService thread " + t.getName(), e);<a name="line.607"></a> -<span class="sourceLineNo">608</span> }<a name="line.608"></a> -<span class="sourceLineNo">609</span> };<a name="line.609"></a> -<span class="sourceLineNo">610</span><a name="line.610"></a> -<span class="sourceLineNo">611</span> initializeFileSystem();<a name="line.611"></a> -<span class="sourceLineNo">612</span> spanReceiverHost = SpanReceiverHost.getInstance(getConfiguration());<a name="line.612"></a> -<span class="sourceLineNo">613</span><a name="line.613"></a> -<span class="sourceLineNo">614</span> this.configurationManager = new ConfigurationManager();<a name="line.614"></a> -<span class="sourceLineNo">615</span> setupWindows(getConfiguration(), getConfigurationManager());<a name="line.615"></a> -<span class="sourceLineNo">616</span><a name="line.616"></a> -<span class="sourceLineNo">617</span> // Some unit tests don't need a cluster, so no zookeeper at all<a name="line.617"></a> -<span class="sourceLineNo">618</span> if (!conf.getBoolean("hbase.testing.nocluster", false)) {<a name="line.618"></a> -<span class="sourceLineNo">619</span> // Open connection to zookeeper and set primary watcher<a name="line.619"></a> -<span class="sourceLineNo">620</span> zooKeeper = new ZKWatcher(conf, getProcessName() + ":" +<a name="line.620"></a> -<span class="sourceLineNo">621</span> rpcServices.isa.getPort(), this, canCreateBaseZNode());<a name="line.621"></a> -<span class="sourceLineNo">622</span> // If no master in cluster, skip trying to track one or look for a cluster status.<a name="line.622"></a> -<span class="sourceLineNo">623</span> if (!this.masterless) {<a name="line.623"></a> -<span class="sourceLineNo">624</span> this.csm = new ZkCoordinatedStateManager(this);<a name="line.624"></a> -<span class="sourceLineNo">625</span><a name="line.625"></a> -<span class="sourceLineNo">626</span> masterAddressTracker = new MasterAddressTracker(getZooKeeper(), this);<a name="line.626"></a> -<span class="sourceLineNo">627</span> masterAddressTracker.start();<a name="line.627"></a> -<span class="sourceLineNo">628</span><a name="line.628"></a> -<span class="sourceLineNo">629</span> clusterStatusTracker = new ClusterStatusTracker(zooKeeper, this);<a name="line.629"></a> -<span class="sourceLineNo">630</span> clusterStatusTracker.start();<a name="line.630"></a> -<span class="sourceLineNo">631</span> } else {<a name="line.631"></a> -<span class="sourceLineNo">632</span> masterAddressTracker = null;<a name="line.632"></a> -<span class="sourceLineNo">633</span> clusterStatusTracker = null;<a name="line.633"></a> -<span class="sourceLineNo">634</span> }<a name="line.634"></a> -<span class="sourceLineNo">635</span> } else {<a name="line.635"></a> -<span class="sourceLineNo">636</span> zooKeeper = null;<a name="line.636"></a> -<span class="sourceLineNo">637</span> masterAddressTracker = null;<a name="line.637"></a> -<span class="sourceLineNo">638</span> clusterStatusTracker = null;<a name="line.638"></a> -<span class="sourceLineNo">639</span> }<a name="line.639"></a> -<span class="sourceLineNo">640</span> this.rpcServices.start(zooKeeper);<a name="line.640"></a> -<span class="sourceLineNo">641</span> // This violates 'no starting stuff in Constructor' but Master depends on the below chore<a name="line.641"></a> -<span class="sourceLineNo">642</span> // and executor being created and takes a different startup route. Lots of overlap between HRS<a name="line.642"></a> -<span class="sourceLineNo">643</span> // and M (An M IS A HRS now). Need to refactor so less duplication between M and its super<a name="line.643"></a> -<span class="sourceLineNo">644</span> // Master expects Constructor to put up web servers. Ugh.<a name="line.644"></a> -<span class="sourceLineNo">645</span> // class HRS. TODO.<a name="line.645"></a> -<span class="sourceLineNo">646</span> this.choreService = new ChoreService(getName(), true);<a name="line.646"></a> -<span class="sourceLineNo">647</span> this.executorService = new ExecutorService(getName());<a name="line.647"></a> -<span class="sourceLineNo">648</span> putUpWebUI();<a name="line.648"></a> -<span class="sourceLineNo">649</span> } catch (Throwable t) {<a name="line.649"></a> -<span class="sourceLineNo">650</span> // Make sure we log the exception. HRegionServer is often started via reflection and the<a name="line.650"></a> -<span class="sourceLineNo">651</span> // cause of failed startup is lost.<a name="line.651"></a> -<span class="sourceLineNo">652</span> LOG.error("Failed construction RegionServer", t);<a name="line.652"></a> -<span class="sourceLineNo">653</span> throw t;<a name="line.653"></a> -<span class="sourceLineNo">654</span> }<a name="line.654"></a> -<span class="sourceLineNo">655</span> }<a name="line.655"></a> -<span class="sourceLineNo">656</span><a name="line.656"></a> -<span class="sourceLineNo">657</span> // HMaster should override this method to load the specific config for master<a name="line.657"></a> -<span class="sourceLineNo">658</span> protected String getUseThisHostnameInstead(Configuration conf) throws IOException {<a name="line.658"></a> -<span class="sourceLineNo">659</span> String hostname = conf.get(RS_HOSTNAME_KEY);<a name="line.659"></a> -<span class="sourceLineNo">660</span> if (conf.getBoolean(RS_HOSTNAME_DISABLE_MASTER_REVERSEDNS_KEY, false)) {<a name="line.660"></a> -<span class="sourceLineNo">661</span> if (!StringUtils.isBlank(hostname)) {<a name="line.661"></a> -<span class="sourceLineNo">662</span> String msg = RS_HOSTNAME_DISABLE_MASTER_REVERSEDNS_KEY + " and " + RS_HOSTNAME_KEY +<a name="line.662"></a> -<span class="sourceLineNo">663</span> " are mutually exclusive. Do not set " + RS_HOSTNAME_DISABLE_MASTER_REVERSEDNS_KEY +<a name="line.663"></a> -<span class="sourceLineNo">664</span> " to true while " + RS_HOSTNAME_KEY + " is used";<a name="line.664"></a> -<span class="sourceLineNo">665</span> throw new IOException(msg);<a name="line.665"></a> -<span class="sourceLineNo">666</span> } else {<a name="line.666"></a> -<span class="sourceLineNo">667</span> return rpcServices.isa.getHostName();<a name="line.667"></a> -<span class="sourceLineNo">668</span> }<a name="line.668"></a> -<span class="sourceLineNo">669</span> } else {<a name="line.669"></a> -<span class="sourceLineNo">670</span> return hostname;<a name="line.670"></a> -<span class="sourceLineNo">671</span> }<a name="line.671"></a> -<span class="sourceLineNo">672</span> }<a name="line.672"></a> -<span class="sourceLineNo">673</span><a name="line.673"></a> -<span class="sourceLineNo">674</span> /**<a name="line.674"></a> -<span class="sourceLineNo">675</span> * If running on Windows, do windows-specific setup.<a name="line.675"></a> -<span class="sourceLineNo">676</span> */<a name="line.676"></a> -<span class="sourceLineNo">677</span> private static void setupWindows(final Configuration conf, ConfigurationManager cm) {<a name="line.677"></a> -<span class="sourceLineNo">678</span> if (!SystemUtils.IS_OS_WINDOWS) {<a name="line.678"></a> -<span class="sourceLineNo">679</span> Signal.handle(new Signal("HUP"), new SignalHandler() {<a name="line.679"></a> -<span class="sourceLineNo">680</span> @Override<a name="line.680"></a> -<span class="sourceLineNo">681</span> public void handle(Signal signal) {<a name="line.681"></a> -<span class="sourceLineNo">682</span> conf.reloadConfiguration();<a name="line.682"></a> -<span class="sourceLineNo">683</span> cm.notifyAllObservers(conf);<a name="line.683"></a> -<span class="sourceLineNo">684</span> }<a name="line.684"></a> -<span class="sourceLineNo">685</span> });<a name="line.685"></a> -<span class="sourceLineNo">686</span> }<a name="line.686"></a> -<span class="sourceLineNo">687</span> }<a name="line.687"></a> -<span class="sourceLineNo">688</span><a name="line.688"></a> -<span class="sourceLineNo">689</span> private static NettyEventLoopGroupConfig setupNetty(Configuration conf) {<a name="line.689"></a> -<span class="sourceLineNo">690</span> // Initialize netty event loop group at start as we may use it for rpc server, rpc client & WAL.<a name="line.690"></a> -<span class="sourceLineNo">691</span> NettyEventLoopGroupConfig nelgc =<a name="line.691"></a> -<span class="sourceLineNo">692</span> new NettyEventLoopGroupConfig(conf, "RS-EventLoopGroup");<a name="line.692"></a> -<span class="sourceLineNo">693</span> NettyRpcClientConfigHelper.setEventLoopConfig(conf, nelgc.group(), nelgc.clientChannelClass());<a name="line.693"></a> -<span class="sourceLineNo">694</span> NettyAsyncFSWALConfigHelper.setEventLoopConfig(conf, nelgc.group(), nelgc.clientChannelClass());<a name="line.694"></a> -<span class="sourceLineNo">695</span> return nelgc;<a name="line.695"></a> -<span class="sourceLineNo">696</span> }<a name="line.696"></a> -<span class="sourceLineNo">697</span><a name="line.697"></a> -<span class="sourceLineNo">698</span> private void initializeFileSystem() throws IOException {<a name="line.698"></a> -<span class="sourceLineNo">699</span> // Get fs instance used by this RS. Do we use checksum verification in the hbase? If hbase<a name="line.699"></a> -<span class="sourceLineNo">700</span> // checksum verification enabled, then automatically switch off hdfs checksum verification.<a name="line.700"></a> -<span class="sourceLineNo">701</span> boolean useHBaseChecksum = conf.getBoolean(HConstants.HBASE_CHECKSUM_VERIFICATION, true);<a name="line.701"></a> -<span class="sourceLineNo">702</span> FSUtils.setFsDefault(this.conf, FSUtils.getWALRootDir(this.conf));<a name="line.702"></a> -<span class="sourceLineNo">703</span> this.walFs = new HFileSystem(this.conf, useHBaseChecksum);<a name="line.703"></a> -<span class="sourceLineNo">704</span> this.walRootDir = FSUtils.getWALRootDir(this.conf);<a name="line.704"></a> -<span class="sourceLineNo">705</span> // Set 'fs.defaultFS' to match the filesystem on hbase.rootdir else<a name="line.705"></a> -<span class="sourceLineNo">706</span> // underlying hadoop hdfs accessors will be going against wrong filesystem<a name="line.706"></a> -<span class="sourceLineNo">707</span> // (unless all is set to defaults).<a name="line.707"></a> -<span class="sourceLineNo">708</span> FSUtils.setFsDefault(this.conf, FSUtils.getRootDir(this.conf));<a name="line.708"></a> -<span class="sourceLineNo">709</span> this.fs = new HFileSystem(this.conf, useHBaseChecksum);<a name="line.709"></a> -<span class="sourceLineNo">710</span> this.rootDir = FSUtils.getRootDir(this.conf);<a name="line.710"></a> -<span class="sourceLineNo">711</span> this.tableDescriptors = getFsTableDescriptors();<a name="line.711"></a> -<span class="sourceLineNo">712</span> }<a name="line.712"></a> -<span class="sourceLineNo">713</span><a name="line.713"></a> -<span class="sourceLineNo">714</span> protected TableDescriptors getFsTableDescriptors() throws IOException {<a name="line.714"></a> -<span class="sourceLineNo">715</span> return new FSTableDescriptors(this.conf,<a name="line.715"></a> -<span class="sourceLineNo">716</span> this.fs, this.rootDir, !canUpdateTableDescriptor(), false, getMetaTableObserver());<a name="line.716"></a> +<span class="sourceLineNo">602</span> // no need to instantiate global block cache when master not carry table<a name="line.602"></a> +<span class="sourceLineNo">603</span> if (!isMasterNotCarryTable) {<a name="line.603"></a> +<span class="sourceLineNo">604</span> CacheConfig.instantiateBlockCache(conf);<a name="line.604"></a> +<span class="sourceLineNo">605</span> }<a name="line.605"></a> +<span class="sourceLineNo">606</span> cacheConfig = new CacheConfig(conf);<a name="line.606"></a> +<span class="sourceLineNo">607</span> mobCacheConfig = new MobCacheConfig(conf);<a name="line.607"></a> +<span class="sourceLineNo">608</span><a name="line.608"></a> +<span class="sourceLineNo">609</span> uncaughtExceptionHandler = new UncaughtExceptionHandler() {<a name="line.609"></a> +<span class="sourceLineNo">610</span> @Override<a name="line.610"></a> +<span class="sourceLineNo">611</span> public void uncaughtException(Thread t, Throwable e) {<a name="line.611"></a> +<span class="sourceLineNo">612</span> abort("Uncaught exception in executorService thread " + t.getName(), e);<a name="line.612"></a> +<span class="sourceLineNo">613</span> }<a name="line.613"></a> +<span class="sourceLineNo">614</span> };<a name="line.614"></a> +<span class="sourceLineNo">615</span><a name="line.615"></a> +<span class="sourceLineNo">616</span> initializeFileSystem();<a name="line.616"></a> +<span class="sourceLineNo">617</span> spanReceiverHost = SpanReceiverHost.getInstance(getConfiguration());<a name="line.617"></a> +<span class="sourceLineNo">618</span><a name="line.618"></a> +<span class="sourceLineNo">619</span> this.configurationManager = new ConfigurationManager();<a name="line.619"></a> +<span class="sourceLineNo">620</span> setupWindows(getConfiguration(), getConfigurationManager());<a name="line.620"></a> +<span class="sourceLineNo">621</span><a name="line.621"></a> +<span class="sourceLineNo">622</span> // Some unit tests don't need a cluster, so no zookeeper at all<a name="line.622"></a> +<span class="sourceLineNo">623</span> if (!conf.getBoolean("hbase.testing.nocluster", false)) {<a name="line.623"></a> +<span class="sourceLineNo">624</span> // Open connection to zookeeper and set primary watcher<a name="line.624"></a> +<span class="sourceLineNo">625</span> zooKeeper = new ZKWatcher(conf, getProcessName() + ":" +<a name="line.625"></a> +<span class="sourceLineNo">626</span> rpcServices.isa.getPort(), this, canCreateBaseZNode());<a name="line.626"></a> +<span class="sourceLineNo">627</span> // If no master in cluster, skip trying to track one or look for a cluster status.<a name="line.627"></a> +<span class="sourceLineNo">628</span> if (!this.masterless) {<a name="line.628"></a> +<span class="sourceLineNo">629</span> this.csm = new ZkCoordinatedStateManager(this);<a name="line.629"></a> +<span class="sourceLineNo">630</span><a name="line.630"></a> +<span class="sourceLineNo">631</span> masterAddressTracker = new MasterAddressTracker(getZooKeeper(), this);<a name="line.631"></a> +<span class="sourceLineNo">632</span> masterAddressTracker.start();<a name="line.632"></a> +<span class="sourceLineNo">633</span><a name="line.633"></a> +<span class="sourceLineNo">634</span> clusterStatusTracker = new ClusterStatusTracker(zooKeeper, this);<a name="line.634"></a> +<span class="sourceLineNo">635</span> clusterStatusTracker.start();<a name="line.635"></a> +<span class="sourceLineNo">636</span> } else {<a name="line.636"></a> +<span class="sourceLineNo">637</span> masterAddressTracker = null;<a name="line.637"></a> +<span class="sourceLineNo">638</span> clusterStatusTracker = null;<a name="line.638"></a> +<span class="sourceLineNo">639</span> }<a name="line.639"></a> +<span class="sourceLineNo">640</span> } else {<a name="line.640"></a> +<span class="sourceLineNo">641</span> zooKeeper = null;<a name="line.641"></a> +<span class="sourceLineNo">642</span> masterAddressTracker = null;<a name="line.642"></a> +<span class="sourceLineNo">643</span> clusterStatusTracker = null;<a name="line.643"></a> +<span class="sourceLineNo">644</span> }<a name="line.644"></a> +<span class="sourceLineNo">645</span> this.rpcServices.start(zooKeeper);<a name="line.645"></a> +<span class="sourceLineNo">646</span> // This violates 'no starting stuff in Constructor' but Master depends on the below chore<a name="line.646"></a> +<span class="sourceLineNo">647</span> // and executor being created and takes a different startup route. Lots of overlap between HRS<a name="line.647"></a> +<span class="sourceLineNo">648</span> // and M (An M IS A HRS now). Need to refactor so less duplication between M and its super<a name="line.648"></a> +<span class="sourceLineNo">649</span> // Master expects Constructor to put up web servers. Ugh.<a name="line.649"></a> +<span class="sourceLineNo">650</span> // class HRS. TODO.<a name="line.650"></a> +<span class="sourceLineNo">651</span> this.choreService = new ChoreService(getName(), true);<a name="line.651"></a> +<span class="sourceLineNo">652</span> this.executorService = new ExecutorService(getName());<a name="line.652"></a> +<span class="sourceLineNo">653</span> putUpWebUI();<a name="line.653"></a> +<span class="sourceLineNo">654</span> } catch (Throwable t) {<a name="line.654"></a> +<span class="sourceLineNo">655</span> // Make sure we log the exception. HRegionServer is often started via reflection and the<a name="line.655"></a> +<span class="sourceLineNo">656</span> // cause of failed startup is lost.<a name="line.656"></a> +<span class="sourceLineNo">657</span> LOG.error("Failed construction RegionServer", t);<a name="line.657"></a> +<span class="sourceLineNo">658</span> throw t;<a name="line.658"></a> +<span class="sourceLineNo">659</span> }<a name="line.659"></a> +<span class="sourceLineNo">660</span> }<a name="line.660"></a> +<span class="sourceLineNo">661</span><a name="line.661"></a> +<span class="sourceLineNo">662</span> // HMaster should override this method to load the specific config for master<a name="line.662"></a> +<span class="sourceLineNo">663</span> protected String getUseThisHostnameInstead(Configuration conf) throws IOException {<a name="line.663"></a> +<span class="sourceLineNo">664</span> String hostname = conf.get(RS_HOSTNAME_KEY);<a name="line.664"></a> +<span class="sourceLineNo">665</span> if (conf.getBoolean(RS_HOSTNAME_DISABLE_MASTER_REVERSEDNS_KEY, false)) {<a name="line.665"></a> +<span class="sourceLineNo">666</span> if (!StringUtils.isBlank(hostname)) {<a name="line.666"></a> +<span class="sourceLineNo">667</span> String msg = RS_HOSTNAME_DISABLE_MASTER_REVERSEDNS_KEY + " and " + RS_HOSTNAME_KEY +<a name="line.667"></a> +<span class="sourceLineNo">668</span> " are mutually exclusive. Do not set " + RS_HOSTNAME_DISABLE_MASTER_REVERSEDNS_KEY +<a name="line.668"></a> +<span class="sourceLineNo">669</span> " to true while " + RS_HOSTNAME_KEY + " is used";<a name="line.669"></a> +<span class="sourceLineNo">670</span> throw new IOException(msg);<a name="line.670"></a> +<span class="sourceLineNo">671</span> } else {<a name="line.671"></a> +<span class="sourceLineNo">672</span> return rpcServices.isa.getHostName();<a name="line.672"></a> +<span class="sourceLineNo">673</span> }<a name="line.673"></a> +<span class="sourceLineNo">674</span> } else {<a name="line.674"></a> +<span class="sourceLineNo">675</span> return hostname;<a name="line.675"></a> +<span class="sourceLineNo">676</span> }<a name="line.676"></a> +<span class="sourceLineNo">677</span> }<a name="line.677"></a> +<span class="sourceLineNo">678</span><a name="line.678"></a> +<span class="sourceLineNo">679</span> /**<a name="line.679"></a> +<span class="sourceLineNo">680</span> * If running on Windows, do windows-specific setup.<a name="line.680"></a> +<span class="sourceLineNo">681</span> */<a name="line.681"></a> +<span class="sourceLineNo">682</span> private static void setupWindows(final Configuration conf, ConfigurationManager cm) {<a name="line.682"></a> +<span class="sourceLineNo">683</span> if (!SystemUtils.IS_OS_WINDOWS) {<a name="line.683"></a> +<span class="sourceLineNo">684</span> Signal.handle(new Signal("HUP"), new SignalHandler() {<a name="line.684"></a> +<span class="sourceLineNo">685</span> @Override<a name="line.685"></a> +<span class="sourceLineNo">686</span> public void handle(Signal signal) {<a name="line.686"></a> +<span class="sourceLineNo">687</span> conf.reloadConfiguration();<a name="line.687"></a> +<span class="sourceLineNo">688</span> cm.notifyAllObservers(conf);<a name="line.688"></a> +<span class="sourceLineNo">689</span> }<a name="line.689"></a> +<span class="sourceLineNo">690</span> });<a name="line.690"></a> +<span class="sourceLineNo">691</span> }<a name="line.691"></a> +<span class="sourceLineNo">692</span> }<a name="line.692"></a> +<span class="sourceLineNo">693</span><a name="line.693"></a> +<span class="sourceLineNo">694</span> private static NettyEventLoopGroupConfig setupNetty(Configuration conf) {<a name="line.694"></a> +<span class="sourceLineNo">695</span> // Initialize netty event loop group at start as we may use it for rpc server, rpc client & WAL.<a name="line.695"></a> +<span class="sourceLineNo">696</span> NettyEventLoopGroupConfig nelgc =<a name="line.696"></a> +<span class="sourceLineNo">697</span> new NettyEventLoopGroupConfig(conf, "RS-EventLoopGroup");<a name="line.697"></a> +<span class="sourceLineNo">698</span> NettyRpcClientConfigHelper.setEventLoopConfig(conf, nelgc.group(), nelgc.clientChannelClass());<a name="line.698"></a> +<span class="sourceLineNo">699</span> NettyAsyncFSWALConfigHelper.setEventLoopConfig(conf, nelgc.group(), nelgc.clientChannelClass());<a name="line.699"></a> +<span class="sourceLineNo">700</span> return nelgc;<a name="line.700"></a> +<span class="sourceLineNo">701</span> }<a name="line.701"></a> +<span class="sourceLineNo">702</span><a name="line.702"></a> +<span class="sourceLineNo">703</span> private void initializeFileSystem() throws IOException {<a name="line.703"></a> +<span class="sourceLineNo">704</span> // Get fs instance used by this RS. Do we use checksum verification in the hbase? If hbase<a name="line.704"></a> +<span class="sourceLineNo">705</span> // checksum verification enabled, then automatically switch off hdfs checksum verification.<a name="line.705"></a> +<span class="sourceLineNo">706</span> boolean useHBaseChecksum = conf.getBoolean(HConstants.HBASE_CHECKSUM_VERIFICATION, true);<a name="line.706"></a> +<span class="sourceLineNo">707</span> FSUtils.setFsDefault(this.conf, FSUtils.getWALRootDir(this.conf));<a name="line.707"></a> +<span class="sourceLineNo">708</span> this.walFs = new HFileSystem(this.conf, useHBaseChecksum);<a name="line.708"></a> +<span class="sourceLineNo">709</span> this.walRootDir = FSUtils.getWALRootDir(this.conf);<a name="line.709"></a> +<span class="sourceLineNo">710</span> // Set 'fs.defaultFS' to match the filesystem on hbase.rootdir else<a name="line.710"></a> +<span class="sourceLineNo">711</span> // underlying hadoop hdfs accessors will be going against wrong filesystem<a name="line.711"></a> +<span class="sourceLineNo">712</span> // (unless all is set to defaults).<a name="line.712"></a> +<span class="sourceLineNo">713</span> FSUtils.setFsDefault(this.conf, FSUtils.getRootDir(this.conf));<a name="line.713"></a> +<span class="sourceLineNo">714</span> this.fs = new HFileSystem(this.conf, useHBaseChecksum);<a name="line.714"></a> +<span class="sourceLineNo">715</span> this.rootDir = FSUtils.getRootDir(this.conf);<a name="line.715"></a> +<span class="sourceLineNo">716</span> this.tableDescriptors = getFsTableDescriptors();<a name="line.716"></a> <span class="sourceLineNo">717</span> }<a name="line.717"></a> <span class="sourceLineNo">718</span><a name="line.718"></a> -<span class="sourceLineNo">719</span> protected Function<TableDescriptorBuilder, TableDescriptorBuilder> getMetaTableObserver() {<a name="line.719"></a> -<span class="sourceLineNo">720</span> return null;<a name="line.720"></a> -<span class="sourceLineNo">721</span> }<a name="line.721"></a> -<span class="sourceLineNo">722</span><a name="line.722"></a> -<span class="sourceLineNo">723</span> protected void login(UserProvider user, String host) throws IOException {<a name="line.723"></a> -<span class="sourceLineNo">724</span> user.login("hbase.regionserver.keytab.file",<a name="line.724"></a> -<span class="sourceLineNo">725</span> "hbase.regionserver.kerberos.principal", host);<a name="line.725"></a> +<span class="sourceLineNo">719</span> protected TableDescriptors getFsTableDescriptors() throws IOException {<a name="line.719"></a> +<span class="sourceLineNo">720</span> return new FSTableDescriptors(this.conf,<a name="line.720"></a> +<span class="sourceLineNo">721</span> this.fs, this.rootDir, !canUpdateTableDescriptor(), false, getMetaTableObserver());<a name="line.721"></a> +<span class="sourceLineNo">722</span> }<a name="line.722"></a> +<span class="sourceLineNo">723</span><a name="line.723"></a> +<span class="sourceLineNo">724</span> protected Function<TableDescriptorBuilder, TableDescriptorBuilder> getMetaTableObserver() {<a name="line.724"></a> +<span class="sourceLineNo">725</span> return null;<a name="line.725"></a> <span class="sourceLineNo">726</span> }<a name="line.726"></a> <span class="sourceLineNo">727</span><a name="line.727"></a> -<span class="sourceLineNo">728</span><a name="line.728"></a> -<span class="sourceLineNo">729</span> /**<a name="line.729"></a> -<span class="sourceLineNo">730</span> * Wait for an active Master.<a name="line.730"></a> -<span class="sourceLineNo">731</span> * See override in Master superclass for how it is used.<a name="line.731"></a> -<span class="sourceLineNo">732</span> */<a name="line.732"></a> -<span class="sourceLineNo">733</span> protected void waitForMasterActive() {}<a name="line.733"></a> -<span class="sourceLineNo">734</span><a name="line.734"></a> -<span class="sourceLineNo">735</span> protected String getProcessName() {<a name="line.735"></a> -<span class="sourceLineNo">736</span> return REGIONSERVER;<a name="line.736"></a> -<span class="sourceLineNo">737</span> }<a name="line.737"></a> -<span class="sourceLineNo">738</span><a name="line.738"></a> -<span class="sourceLineNo">739</span> protected boolean canCreateBaseZNode() {<a name="line.739"></a> -<span class="sourceLineNo">740</span> return this.masterless;<a name="line.740"></a> -<span class="sourceLineNo">741</span> }<a name="line.741"></a> -<span class="sourceLineNo">742</span><a name="line.742"></a> -<span class="sourceLineNo">743</span> protected boolean canUpdateTableDescriptor() {<a name="line.743"></a> -<span class="sourceLineNo">744</span> return false;<a name="line.744"></a> -<span class="sourceLineNo">745</span> }<a name="line.745"></a> -<span class="sourceLineNo">746</span><a name="line.746"></a> -<span class="sourceLineNo">747</span> protected RSRpcServices createRpcServices() throws IOException {<a name="line.747"></a> -<span class="sourceLineNo">748</span> return new RSRpcServices(this);<a name="line.748"></a> -<span class="sourceLineNo">749</span> }<a name="line.749"></a> -<span class="sourceLineNo">750</span><a name="line.750"></a> -<span class="sourceLineNo">751</span> protected void configureInfoServer() {<a name="line.751"></a> -<span class="sourceLineNo">752</span> infoServer.addServlet("rs-status", "/rs-status", RSStatusServlet.class);<a name="line.752"></a> -<span class="sourceLineNo">753</span> infoServer.setAttribute(REGIONSERVER, this);<a name="line.753"></a> +<span class="sourceLineNo">728</span> protected void login(UserProvider user, String host) throws IOException {<a name="line.728"></a> +<span class="sourceLineNo">729</span> user.login("hbase.regionserver.keytab.file",<a name="line.729"></a> +<span class="sourceLineNo">730</span> "hbase.regionserver.kerberos.principal", host);<a name="line.730"></a> +<span class="sourceLineNo">731</span> }<a name="line.731"></a> +<span class="sourceLineNo">732</span><a name="line.732"></a> +<span class="sourceLineNo">733</span><a name="line.733"></a> +<span class="sourceLineNo">734</span> /**<a name="line.734"></a> +<span class="sourceLineNo">735</span> * Wait for an active Master.<a name="line.735"></a> +<span class="sourceLineNo">736</span> * See override in Master superclass for how it is used.<a name="line.736"></a> +<span class="sourceLineNo">737</span> */<a name="line.737"></a> +<span class="sourceLineNo">738</span> protected void waitForMasterActive() {}<a name="line.738"></a> +<span class="sourceLineNo">739</span><a name="line.739"></a> +<span class="sourceLineNo">740</span> protected String getProcessName() {<a name="line.740"></a> +<span class="sourceLineNo">741</span> return REGIONSERVER;<a name="line.741"></a> +<span class="sourceLineNo">742</span> }<a name="line.742"></a> +<span class="sourceLineNo">743</span><a name="line.743"></a> +<span class="sourceLineNo">744</span> protected boolean canCreateBaseZNode() {<a name="line.744"></a> +<span class="sourceLineNo">745</span> return this.masterless;<a name="line.745"></a> +<span class="sourceLineNo">746</span> }<a name="line.746"></a> +<span class="sourceLineNo">747</span><a name="line.747"></a> +<span class="sourceLineNo">748</span> protected boolean canUpdateTableDescriptor() {<a name="line.748"></a> +<span class="sourceLineNo">749</span> return false;<a name="line.749"></a> +<span class="sourceLineNo">750</span> }<a name="line.750"></a> +<span class="sourceLineNo">751</span><a name="line.751"></a> +<span class="sourceLineNo">752</span> protected RSRpcServices createRpcServices() throws IOException {<a name="line.752"></a> +<span class="sourceLineNo">753</span> return new RSRpcServices(this);<a name="line.753"></a> <span class="sourceLineNo">754</span> }<a name="line.754"></a> <span class="sourceLineNo">755</span><a name="line.755"></a> -<span class="sourceLineNo">756</span> protected Class<? extends HttpServlet> getDumpServlet() {<a name="line.756"></a> -<span class="sourceLineNo">757</span> return RSDumpServlet.class;<a name="line.757"></a> -<span class="sourceLineNo">758</span> }<a name="line.758"></a> -<span class="sourceLineNo">759</span><a name="line.759"></a> -<span class="sourceLineNo">760</span> @Override<a name="line.760"></a> -<span class="sourceLineNo">761</span> public boolean registerService(com.google.protobuf.Service instance) {<a name="line.761"></a> -<span class="sourceLineNo">762</span> /*<a name="line.762"></a> -<span class="sourceLineNo">763</span> * No stacking of instances is allowed for a single executorService name<a name="line.763"></a> -<span class="sourceLineNo">764</span> */<a name="line.764"></a> -<span class="sourceLineNo">765</span> com.google.protobuf.Descriptors.ServiceDescriptor serviceDesc =<a name="line.765"></a> -<span class="sourceLineNo">766</span> instance.getDescriptorForType();<a name="line.766"></a> -<span class="sourceLineNo">767</span> String serviceName = CoprocessorRpcUtils.getServiceName(serviceDesc);<a name="line.767"></a> -<span class="sourceLineNo">768</span> if (coprocessorServiceHandlers.containsKey(serviceName)) {<a name="line.768"></a> -<span class="sourceLineNo">769</span> LOG.error("Coprocessor executorService " + serviceName<a name="line.769"></a> -<span class="sourceLineNo">770</span> + " already registered, rejecting request from " + instance);<a name="line.770"></a> -<span class="sourceLineNo">771</span> return false;<a name="line.771"></a> -<span class="sourceLineNo">772</span> }<a name="line.772"></a> -<span class="sourceLineNo">773</span><a name="line.773"></a> -<span class="sourceLineNo">774</span> coprocessorServiceHandlers.put(serviceName, instance);<a name="line.774"></a> -<span class="sourceLineNo">775</span> if (LOG.isDebugEnabled()) {<a name="line.775"></a> -<span class="sourceLineNo">776</span> LOG.debug("Registered regionserver coprocessor executorService: executorService=" + serviceName);<a name="line.776"></a> +<span class="sourceLineNo">756</span> protected void configureInfoServer() {<a name="line.756"></a> +<span class="sourceLineNo">757</span> infoServer.addServlet("rs-status", "/rs-status", RSStatusServlet.class);<a name="line.757"></a> +<span class="sourceLineNo">758</span> infoServer.setAttribute(REGIONSERVER, this);<a name="line.758"></a> +<span class="sourceLineNo">759</span> }<a name="line.759"></a> +<span class="sourceLineNo">760</span><a name="line.760"></a> +<span class="sourceLineNo">761</span> protected Class<? extends HttpServlet> getDumpServlet() {<a name="line.761"></a> +<span class="sourceLineNo">762</span> return RSDumpServlet.class;<a name="line.762"></a> +<span class="sourceLineNo">763</span> }<a name="line.763"></a> +<span class="sourceLineNo">764</span><a name="line.764"></a> +<span class="sourceLineNo">765</span> @Override<a name="line.765"></a> +<span class="sourceLineNo">766</span> public boolean registerService(com.google.protobuf.Service instance) {<a name="line.766"></a> +<span class="sourceLineNo">767</span> /*<a name="line.767"></a> +<span class="sourceLineNo">768</span> * No stacking of instances is allowed for a single executorService name<a name="line.768"></a> +<span class="sourceLineNo">769</span> */<a name="line.769"></a> +<span class="sourceLineNo">770</span> com.google.protobuf.Descriptors.ServiceDescriptor serviceDesc =<a name="line.770"></a> +<span class="sourceLineNo">771</span> instance.getDescriptorForType();<a name="line.771"></a> +<span class="sourceLineNo">772</span> String serviceName = CoprocessorRpcUtils.getServiceName(serviceDesc);<a name="line.772"></a> +<span class="sourceLineNo">773</span> if (coprocessorServiceHandlers.containsKey(serviceName)) {<a name="line.773"></a> +<span class="sourceLineNo">774</span> LOG.error("Coprocessor executorService " + serviceName<a name="line.774"></a> +<span class="sourceLineNo">775</span> + " already registered, rejecting request from " + instance);<a name="line.775"></a> +<span class="sourceLineNo">776</span> return false;<a name="line.776"></a> <span class="sourceLineNo">777</span> }<a name="line.777"></a> -<span class="sourceLineNo">778</span> return true;<a name="line.778"></a> -<span class="sourceLineNo">779</span> }<a name="line.779"></a> -<span class="sourceLineNo">780</span><a name="line.780"></a> -<span class="sourceLineNo">781</span> /**<a name="line.781"></a> -<span class="sourceLineNo">782</span> * Create a 'smarter' Connection, one that is capable of by-passing RPC if the request is to the<a name="line.782"></a> -<span class="sourceLineNo">783</span> * local server; i.e. a short-circuit Connection. Safe to use going to local or remote server.<a name="line.783"></a> -<span class="sourceLineNo">784</span> */<a name="line.784"></a> -<span class="sourceLineNo">785</span> private ClusterConnection createClusterConnection() throws IOException {<a name="line.785"></a> -<span class="sourceLineNo">786</span> Configuration conf = this.conf;<a name="line.786"></a> -<span class="sourceLineNo">787</span> if (conf.get(HConstants.CLIENT_ZOOKEEPER_QUORUM) != null) {<a name="line.787"></a> -<span class="sourceLineNo">788</span> // Use server ZK cluster for server-issued connections, so we clone<a name="line.788"></a> -<span class="sourceLineNo">789</span> // the conf and unset the client ZK related properties<a name="line.789"></a> -<span class="sourceLineNo">790</span> conf = new Configuration(this.conf);<a name="line.790"></a> -<span class="sourceLineNo">791</span> conf.unset(HConstants.CLIENT_ZOOKEEPER_QUORUM);<a name="line.791"></a> -<span class="sourceLineNo">792</span> }<a name="line.792"></a> -<span class="sourceLineNo">793</span> // Create a cluster connection that when appropriate, can short-circuit and go directly to the<a name="line.793"></a> -<span class="sourceLineNo">794</span> // local server if the request is to the local server bypassing RPC. Can be used for both local<a name="line.794"></a> -<span class="sourceLineNo">795</span> // and remote invocations.<a name="line.795"></a> -<span class="sourceLineNo">796</span> ClusterConnection conn = ConnectionUtils.createShortCircuitConnection(conf, null,<a name="line.796"></a> -<span class="sourceLineNo">797</span> userProvider.getCurrent(), serverName, rpcServices, rpcServices);<a name="line.797"></a> -<span class="sourceLineNo">798</span> // This is used to initialize the batch thread pool inside the connection implementation.<a name="line.798"></a> -<span class="sourceLineNo">799</span> // When deploy a fresh cluster, we may first use the cluster connection in InitMetaProcedure,<a name="line.799"></a> -<span class="sourceLineNo">800</span> // which will be executed inside the PEWorker, and then the batch thread pool will inherit the<a name="line.800"></a> -<span class="sourceLineNo">801</span> // thread group of PEWorker, which will be destroy when shutting down the ProcedureExecutor. It<a name="line.801"></a> -<span class="sourceLineNo">802</span> // will cause lots of procedure related UTs to fail, so here let's initialize it first, no harm.<a name="line.802"></a> -<span class="sourceLineNo">803</span> conn.getTable(TableName.META_TABLE_NAME).close();<a name="line.803"></a> -<span class="sourceLineNo">804</span> return conn;<a name="line.804"></a> -<span class="sourceLineNo">805</span> }<a name="line.805"></a> -<span class="sourceLineNo">806</span><a name="line.806"></a> -<span class="sourceLineNo">807</span> /**<a name="line.807"></a> -<span class="sourceLineNo">808</span> * Run test on configured codecs to make sure supporting libs are in place.<a name="line.808"></a> -<span class="sourceLineNo">809</span> * @param c<a name="line.809"></a> -<span class="sourceLineNo">810</span> * @throws IOException<a name="line.810"></a> -<span class="sourceLineNo">811</span> */<a name="line.811"></a> -<span class="sourceLineNo">812</span> private static void checkCodecs(final Configuration c) throws IOException {<a name="line.812"></a> -<span class="sourceLineNo">813</span> // check to see if the codec list is available:<a name="line.813"></a> -<span class="sourceLineNo">814</span> String [] codecs = c.getStrings("hbase.regionserver.codecs", (String[])null);<a name="line.814"></a> -<span class="sourceLineNo">815</span> if (codecs == null) return;<a name="line.815"></a> -<span class="sourceLineNo">816</span> for (String codec : codecs) {<a name="line.816"></a> -<span class="sourceLineNo">817</span> if (!CompressionTest.testCompression(codec)) {<a name="line.817"></a> -<span class="sourceLineNo">818</span> throw new IOException("Compression codec " + codec +<a name="line.818"></a> -<span class="sourceLineNo">819</span> " not supported, aborting RS construction");<a name="line.819"></a> -<span class="sourceLineNo">820</span> }<a name="line.820"></a> -<span class="sourceLineNo">821</span> }<a name="line.821"></a> -<span class="sourceLineNo">822</span> }<a name="line.822"></a> -<span class="sourceLineNo">823</span><a name="line.823"></a> -<span class="sourceLineNo">824</span> public String getClusterId() {<a name="line.824"></a> -<span class="sourceLineNo">825</span> return this.clusterId;<a name="line.825"></a> -<span class="sourceLineNo">826</span> }<a name="line.826"></a> -<span class="sourceLineNo">827</span><a name="line.827"></a> -<span class="sourceLineNo">828</span> /**<a name="line.828"></a> -<span class="sourceLineNo">829</span> * Setup our cluster connection if not already initialized.<a name="line.829"></a> -<span class="sourceLineNo">830</span> */<a name="line.830"></a> -<span class="sourceLineNo">831</span> protected synchronized void setupClusterConnection() throws IOException {<a name="line.831"></a> -<span class="sourceLineNo">832</span> if (clusterConnection == null) {<a name="line.832"></a> -<span class="sourceLineNo">833</span> clusterConnection = createClusterConnection();<a name="line.833"></a> -<span class="sourceLineNo">834</span> metaTableLocator = new MetaTableLocator();<a name="line.834"></a> -<span class="sourceLineNo">835</span> }<a name="line.835"></a> -<span class="sourceLineNo">836</span> }<a name="line.836"></a> -<span class="sourceLineNo">837</span><a name="line.837"></a> -<span class="sourceLineNo">838</span> /**<a name="line.838"></a> -<span class="sourceLineNo">839</span> * All initialization needed before we go register with Master.<br><a name="line.839"></a> -<span class="sourceLineNo">840</span> * Do bare minimum. Do bulk of initializations AFTER we've connected to the Master.<br><a name="line.840"></a> -<span class="sourceLineNo">841</span> * In here we just put up the RpcServer, setup Connection, and ZooKeeper.<a name="line.841"></a> -<span class="sourceLineNo">842</span> */<a name="line.842"></a> -<span class="sourceLineNo">843</span> private void preRegistrationInitialization() {<a name="line.843"></a> -<span class="sourceLineNo">844</span> try {<a name="line.844"></a> -<span class="sourceLineNo">845</span> initializeZooKeeper();<a name="line.845"></a> -<span class="sourceLineNo">846</span> setupClusterConnection();<a name="line.846"></a> -<span class="sourceLineNo">847</span> // Setup RPC client for master communication<a name="line.847"></a> -<span class="sourceLineNo">848</span> this.rpcClient = RpcClientFactory.createClient(conf, clusterId, new InetSocketAddress(<a name="line.848"></a> -<span class="sourceLineNo">849</span> this.rpcServices.isa.getAddress(), 0), clusterConnection.getConnectionMetrics());<a name="line.849"></a> -<span class="sourceLineNo">850</span> } catch (Throwable t) {<a name="line.850"></a> -<span class="sourceLineNo">851</span> // Call stop if error or process will stick around for ever since server<a name="line.851"></a> -<span class="sourceLineNo">852</span> // puts up non-daemon threads.<a name="line.852"></a> -<span class="sourceLineNo">853</span> this.rpcServices.stop();<a name="line.853"></a> -<span class="sourceLineNo">854</span> abort("Initialization of RS failed. Hence aborting RS.", t);<a name="line.854"></a> -<span class="sourceLineNo">855</span> }<a name="line.855"></a> -<span class="sourceLineNo">856</span> }<a name="line.856"></a> -<span class="sourceLineNo">857</span><a name="line.857"></a> -<span class="sourceLineNo">858</span> /**<a name="line.858"></a> -<span class="sourceLineNo">859</span> * Bring up connection to zk ensemble and then wait until a master for this cluster and then after<a name="line.859"></a> -<span class="sourceLineNo">860</span> * that, wait until cluster 'up' flag has been set. This is the order in which master does things.<a name="line.860"></a> -<span class="sourceLineNo">861</span> * <p><a name="line.861"></a> -<span class="sourceLineNo">862</span> * Finally open long-living server short-circuit connection.<a name="line.862"></a> -<span class="sourceLineNo">863</span> */<a name="line.863"></a> -<span class="sourceLineNo">864</span> @edu.umd.cs.findbugs.annotations.SuppressWarnings(value="RV_RETURN_VALUE_IGNORED_BAD_PRACTICE",<a name="line.864"></a> -<span class="sourceLineNo">865</span> justification="cluster Id znode read would give us correct response")<a name="line.865"></a> -<span class="sourceLineNo">866</span> private void initializeZooKeeper() throws IOException, InterruptedException {<a name="line.866"></a> -<span class="sourceLineNo">867</span> // Nothing to do in here if no Master in the mix.<a name="line.867"></a> -<span class="sourceLineNo">868</span> if (this.masterless) {<a name="line.868"></a> -<span class="sourceLineNo">869</span> return;<a name="line.869"></a> -<span class="sourceLineNo">870</span> }<a name="line.870"></a> -<span class="sourceLineNo">871</span><a name="line.871"></a> -<span class="sourceLineNo">872</span> // Create the master address tracker, register with zk, and start it. Then<a name="line.872"></a> -<span class="sourceLineNo">873</span> // block until a master is available. No point in starting up if no master<a name="line.873"></a> -<span class="sourceLineNo">874</span> // running.<a name="line.874"></a> -<span class="sourceLineNo">875</span> blockAndCheckIfStopped(this.masterAddressTracker);<a name="line.875"></a> +<span class="sourceLineNo">778</span><a name="line.778"></a> +<span class="sourceLineNo">779</span> coprocessorServiceHandlers.put(serviceName, instance);<a name="line.779"></a> +<span class="sourceLineNo">780</span> if (LOG.isDebugEnabled()) {<a name="line.780"></a> +<span class="sourceLineNo">781</span> LOG.debug("Registered regionserver coprocessor executorService: executorService=" + serviceName);<a name="line.781"></a> +<span class="sourceLineNo">782</span> }<a name="line.782"></a> +<span class="sourceLineNo">783</span> return true;<a name="line.783"></a> +<span class="sourceLineNo">784</span> }<a name="line.784"></a> +<span class="sourceLineNo">785</span><a name="line.785"></a> +<span class="sourceLineNo">786</span> /**<a name="line.786"></a> +<span class="sourceLineNo">787</span> * Create a 'smarter' Connection, one that is capable of by-passing RPC if the request is to the<a name="line.787"></a> +<span class="sourceLineNo">788</span> * local server; i.e. a short-circuit Connection. Safe to use going to local or remote server.<a name="line.788"></a> +<span class="sourceLineNo">789</span> */<a name="line.789"></a> +<span class="sourceLineNo">790</span> private ClusterConnection createClusterConnection() throws IOException {<a name="line.790"></a> +<span class="sourceLineNo">791</span> Configuration conf = this.conf;<a name="line.791"></a> +<span class="sourceLineNo">792</span> if (conf.get(HConstants.CLIENT_ZOOKEEPER_QUORUM) != null) {<a name="line.792"></a> +<span class="sourceLineNo">793</span> // Use server ZK cluster for server-issued connections, so we clone<a name="line.793"></a> +<span class="sourceLineNo">794</span> // the conf and unset the client ZK related properties<a name="line.794"></a> +<span class="sourceLineNo">795</span> conf = new Configuration(this.conf);<a name="line.795"></a> +<span class="sourceLineNo">796</span> conf.unset(HConstants.CLIENT_ZOOKEEPER_QUORUM);<a name="line.796"></a> +<span class="sourceLineNo">797</span> }<a name="line.797"></a> +<span class="sourceLineNo">798</span> // Create a cluster connection that when appropriate, can short-circuit and go directly to the<a name="line.798"></a> +<span class="sourceLineNo">799</span> // local server if the request is to the local server bypassing RPC. Can be used for both local<a name="line.799"></a> +<span class="sourceLineNo">800</span> // and remote invocations.<a name="line.800"></a> +<span class="sourceLineNo">801</span> ClusterConnection conn = ConnectionUtils.createShortCircuitConnection(conf, null,<a name="line.801"></a> +<span class="sourceLineNo">802</span> userProvider.getCurrent(), serverName, rpcServices, rpcServices);<a name="line.802"></a> +<span class="sourceLineNo">803</span> // This is used to initialize the batch thread pool inside the connection implementation.<a name="line.803"></a> +<span class="sourceLineNo">804</span> // When deploy a fresh cluster, we may first use the cluster connection in InitMetaProcedure,<a name="line.804"></a> +<span class="sourceLineNo">805</span> // which will be executed inside the PEWorker, and then the batch thread pool will inherit the<a name="line.805"></a> +<span class="sourceLineNo">806</span> // thread group of PEWorker, which will be destroy when shutting down the ProcedureExecutor. It<a name="line.806"></a> +<span class="sourceLineNo">807</span> // will cause lots of procedure related UTs to fail, so here let's initialize it first, no harm.<a name="line.807"></a> +<span class="sourceLineNo">808</span> conn.getTable(TableName.META_TABLE_NAME).close();<a name="line.808"></a> +<span class="sourceLineNo">809</span> return conn;<a name="line.809"></a> +<span class="sourceLineNo">810</span> }<a name="line.810"></a> +<span class="sourceLineNo">811</span><a name="line.811"></a> +<span class="sourceLineNo">812</span> /**<a name="line.812"></a> +<span class="sourceLineNo">813</span> * Run test on configured codecs to make sure supporting libs are in place.<a name="line.813"></a> +<span class="sourceLineNo">814</span> * @param c<a name="line.814"></a> +<span class="sourceLineNo">815</span> * @throws IOException<a name="line.815"></a> +<span class="sourceLineNo">816</span> */<a name="line.816"></a> +<span class="sourceLineNo">817</span> private static void checkCodecs(final Configuration c) throws IOException {<a name="line.817"></a> +<span class="sourceLineNo">818</span> // check to see if the codec list is available:<a name="line.818"></a> +<span class="sourceLineNo">819</span> String [] codecs = c.getStrings("hbase.regionserver.codecs", (String[])null);<a name="line.819"></a> +<span class="sourceLineNo">820</span> if (codecs == null) return;<a name="line.820"></a> +<span class="sourceLineNo">821</span> for (String codec : codecs) {<a name="line.821"></a> +<span class="sourceLineNo">822</span> if (!CompressionTest.testCompression(codec)) {<a name="line.822"></a> +<span class="sourceLineNo">823</span> throw new IOException("Compression codec " + codec +<a name="line.823"></a> +<span class="sourceLineNo">824</span> " not supported, aborting RS construction");<a name="line.824"></a> +<span class="sourceLineNo">825</span> }<a name="line.825"></a> +<span class="sourceLineNo">826</span> }<a name="line.826"></a> +<span class="sourceLineNo">827</span> }<a name="line.827"></a> +<span class="sourceLineNo">828</span><a name="line.828"></a> +<span class="sourceLineNo">829</span> public String getClusterId() {<a name="line.829"></a> +<span class="sourceLineNo">830</span> return this.clusterId;<a name="line.830"></a> +<span class="sourceLineNo">831</span> }<a name="line.831"></a> +<span class="sourceLineNo">832</span><a name="line.832"></a> +<span class="sourceLineNo">833</span> /**<a name="line.833"></a> +<span class="sourceLineNo">834</span> * Setup our cluster connection if not already initialized.<a name="line.834"></a> +<span class="sourceLineNo">835</span> */<a name="line.835"></a> +<span class="sourceLineNo">836</span> protected synchronized void setupClusterConnection() throws IOException {<a name="line.836"></a> +<span class="sourceLineNo">837</span> if (clusterConnection == null) {<a name="line.837"></a> +<span class="sourceLineNo">838</span> clusterConnection = createClusterConnection();<a name="line.838"></a> +<span class="sourceLineNo">839</span> metaTableLocator = new MetaTableLocator();<a name="line.839"></a> +<span class="sourceLineNo">840</span> }<a name="line.840"></a> +<span class="sourceLineNo">841</span> }<a name="line.841"></a> +<span class="sourceLineNo">842</span><a name="line.842"></a> +<span class="sourceLineNo">843</span> /**<a name="line.843"></a> +<span class="sourceLineNo">844</span> * All initialization needed before we go register with Master.<br><a name="line.844"></a> +<span class="sourceLineNo">845</span> * Do bare minimum. Do bulk of initializations AFTER we've connected to the Master.<br><a name="line.845"></a> +<span class="sourceLineNo">846</span> * In here we just put up the RpcServer, setup Connection, and ZooKeeper.<a name="line.846"></a> +<span class="sourceLineNo">847</span> */<a name="line.847"></a> +<span class="sourceLineNo">848</span> private void preRegistrationInitialization() {<a name="line.848"></a> +<span class="sourceLineNo">849</span> try {<a name="line.849"></a> +<span class="sourceLineNo">850</span> initializeZooKeeper();<a name="line.850"></a> +<span class="sourceLineNo">851</span> setupClusterConnection();<a name="line.851"></a> +<span class="sourceLineNo">852</span> // Setup RPC client for master communication<a name="line.852"></a> +<span class="sourceLineNo">853</span> this.rpcClient = RpcClientFactory.createClient(conf, clusterId, new InetSocketAddress(<a name="line.853"></a> +<span class="sourceLineNo">854</span> this.rpcServices.isa.getAddress(), 0), clusterConnection.getConnectionMetrics());<a name="line.854"></a> +<span class="sourceLineNo">855</span> } catch (Throwable t) {<a name="line.855"></a> +<span class="sourceLineNo">856</span> // Call stop if error or process will stick around for ever since server<a name="line.856"></a> +<span class="sourceLineNo">857</span> // puts up non-daemon threads.<a name="line.857"></a> +<span class="sourceLineNo">858</span> this.rpcServices.stop();<a name="line.858"></a> +<span class="sourceLineNo">859</span> abort("Initialization of RS failed. Hence aborting RS.", t);<a name="line.859"></a> +<span class="sourceLineNo">860</span> }<a name="line.860"></a> +<span class="sourceLineNo">861</span> }<a name="line.861"></a> +<span class="sourceLineNo">862</span><a name="line.862"></a> +<span class="sourceLineNo">863</span> /**<a name="line.863"></a> +<span class="sourceLineNo">864</span> * Bring up connection to zk ensemble and then wait until a master for this cluster and then after<a name="line.864"></a> +<span class="sourceLineNo">865</span> * that, wait until cluster 'up' flag has been set. This is the order in which master does things.<a name="line.865"></a> +<span class="sourceLineNo">866</span> * <p><a name="line.866"></a> +<span class="sourceLineNo">867</span> * Finally open long-living server short-circuit connection.<a name="line.867"></a> +<span class="sourceLineNo">868</span> */<a name="line.868"></a> +<span class="sourceLineNo">869</span> @edu.umd.cs.findbugs.annotations.SuppressWarnings(value="RV_RETURN_VALUE_IGNORED_BAD_PRACTICE",<a name="line.869"></a> +<span class="sourceLineNo">870</span> justification="cluster Id znode read would give us correct response")<a name="line.870"></a> +<span class="sourceLineNo">871</span> private void initializeZooKeeper() throws IOException, InterruptedException {<a name="line.871"></a> +<span class="sourceLineNo">872</span> // Nothing to do in here if no Master in the mix.<a name="line.872"></a> +<span class="sourceLineNo">873</span> if (this.masterless) {<a name="line.873"></a> +<span class="sourceLineNo">874</span> return;<a name="line.874"></a> +<span class="sourceLineNo">875</span> }<a name="line.875"></a> <span class="sourceLineNo">876</span><a name="line.876"></a> -<span class="sourceLineNo">877</span> // Wait on cluster being up. Master will set this flag up in zookeeper<a name="line.877"></a> -<span class="sourceLineNo">878</span> // when ready.<a name="line.878"></a> -<span class="sourceLineNo">879</span> blockAndCheckIfStopped(this.clusterStatusTracker);<a name="line.879"></a> -<span class="sourceLineNo">880</span><a name="line.880"></a> -<span class="sourceLineNo">881</span> // If we are HMaster then the cluster id should have already been set.<a name="line.881"></a> -<span class="sourceLineNo">882</span> if (clusterId == null) {<a name="line.882"></a> -<span class="sourceLineNo">883</span> // Retrieve clusterId<a name="line.883"></a> -<span class="sourceLineNo">884</span> // Since cluster status is now up<a name="line.884"></a> -<span class="sourceLineNo">885</span> // ID should have already been set by HMaster<a name="line.885"></a> -<span class="sourceLineNo">886</span> try {<a name="line.886"></a> -<span class="sourceLineNo">887</span> clusterId = ZKClusterId.readClusterIdZNode(this.zooKeeper);<a name="line.887"></a> -<span class="sourceLineNo">888</span> if (clusterId == null) {<a name="line.888"></a> -<span class="sourceLineNo">889</span> this.abort("Cluster ID has not been set");<a name="line.889"></a> -<span class="sourceLineNo">890</span> }<a name="line.890"></a> -<span class="sourceLineNo">891</span> LOG.info("ClusterId : " + clusterId);<a name="line.891"></a> -<span class="sourceLineNo">892</span> } catch (KeeperException e) {<a name="line.892"></a> -<span class="sourceLineNo">893</span> this.abort("Failed to retrieve Cluster ID", e);<a name="line.893"></a> -<span class="sourceLineNo">894</span> }<a name="line.894"></a> -<span class="sourceLineNo">895</span> }<a name="line.895"></a> -<span class="sourceLineNo">896</span><a name="line.896"></a> -<span class="sourceLineNo">897</span> waitForMasterActive();<a name="line.897"></a> -<span class="sourceLineNo">898</span> if (isStopped() || isAborted()) {<a name="line.898"></a> -<span class="sourceLineNo">899</span> return; // No need for further initialization<a name="line.899"></a> +<span class="sourceLineNo">877</span> // Create the master address tracker, register with zk, and start it. Then<a name="line.877"></a> +<span class="sourceLineNo">878</span> // block until a master is available. No point in starting up if no master<a name="line.878"></a> +<span class="sourceLineNo">879</span> // running.<a name="line.879"></a> +<span class="sourceLineNo">880</span> blockAndCheckIfStopped(this.masterAddressTracker);<a name="line.880"></a> +<span class="sourceLineNo">881</span><a name="line.881"></a> +<span class="sourceLineNo">882</span> // Wait on cluster being up. Master will set this flag up in zookeeper<a name="line.882"></a> +<span class="sourceLineNo">883</span> // when ready.<a name="line.883"></a> +<span class="sourceLineNo">884</span> blockAndCheckIfStopped(this.clusterStatusTracker);<a name="line.884"></a> +<span class="sourceLineNo">885</span><a name="line.885"></a> +<span class="sourceLineNo">886</span> // If we are HMaster then the cluster id should have already been set.<a name="line.886"></a> +<span class="sourceLineNo">887</span> if (clusterId == null) {<a name="line.887"></a> +<span class="sourceLineNo">888</span> // Retrieve clusterId<a name="line.888"></a> +<span class="sourceLineNo">889</span> // Since cluster status is now up<a name="line.889"></a> +<span class="sourceLineNo">890</span> // ID should have already been set by HMaster<a name="line.890"></a> +<span class="sourceLineNo">891</span> try {<a name="line.891"></a> +<span class="sourceLineNo">892</span> clusterId = ZKClusterId.readClusterIdZNode(this.zooKeeper);<a name="line.892"></a> +<span class="sourceLineNo">893</span> if (clusterId == null) {<a name="line.893"></a> +<span class="sourceLineNo">894</span> this.abort("Cluster ID has not been set");<a name="line.894"></a> +<span class="sourceLineNo">895</span> }<a name="line.895"></a> +<span class="sourceLineNo">896</span> LOG.info("ClusterId : " + clusterId);<a name="line.896"></a> +<span class="sourceLineNo">897</span> } catch (KeeperException e) {<a name="line.897"></a> +<span class="sourceLineNo">898</span> this.abort("Failed to retrieve Cluster ID", e);<a name="line.898"></a> +<span class="sourceLineNo">899</span> }<a name="line.899"></a> <span class="sourceLineNo">900</span> }<a name="line.900"></a> <span class="sourceLineNo">901</span><a name="line.901"></a> -<span class="sourceLineNo">902</span> // watch for snapshots and other procedures<a name="line.902"></a> -<span class="sourceLineNo">903</span> try {<a name="line.903"></a> -<span class="sourceLineNo">904</span> rspmHost = new RegionServerProcedureManagerHost();<a name="line.904"></a> -<span class="sourceLineNo">905</span> rspmHost.loadProcedures(conf);<a name="line.905"></a> -<span class="sourceLineNo">906</span> rspmHost.initialize(this);<a name="line.906"></a> -<span class="sourceLineNo">907</span> } catch (KeeperException e) {<a name="line.907"></a> -<span class="sourceLineNo">908</span> this.abort("Failed to reach coordination cluster when creating procedure handler.", e);<a name="line.908"></a> -<span class="sourceLineNo">909</span> }<a name="line.909"></a> -<span class="sourceLineNo">910</span> }<a name="line.910"></a> -<span class="sourceLineNo">911</span><a name="line.911"></a> -<span class="sourceLineNo">912</span> /**<a name="line.912"></a> -<span class="sourceLineNo">913</span> * Utilty method to wait indefinitely on a znode availability while checking<a name="line.913"></a> -<span class="sourceLineNo">914</span> * if the region server is shut down<a name="line.914"></a> -<span class="sourceLineNo">915</span> * @param tracker znode tracker to use<a name="line.915"></a> -<span class="sourceLineNo">916</span> * @throws IOException any IO exception, plus if the RS is stopped<a name="line.916"></a> -<span class="sourceLineNo">917</span> * @throws InterruptedException<a name="line.917"></a> -<span class="sourceLineNo">918</span> */<a name="line.918"></a> -<span class="sourceLineNo">919</span> private void blockAndCheckIfStopped(ZKNodeTracker tracker)<a name="line.919"></a> -<span class="sourceLineNo">920</span> throws IOException, InterruptedException {<a name="line.920"></a> -<span class="sourceLineNo">921</span> while (tracker.blockUntilAvailable(this.msgInterval, false) == null) {<a name="line.921"></a> -<span class="sourceLineNo">922</span> if (this.stopped) {<a name="line.922"></a> -<span class="sourceLineNo">923</span> throw new IOException("Received the shutdown message while waiting.");<a name="line.923"></a> -<span class="sourceLineNo">924</span> }<a name="line.924"></a> -<span class="sourceLineNo">925</span> }<a name="line.925"></a> -<span class="sourceLineNo">926</span> }<a name="line.926"></a> -<span class="sourceLineNo">927</span><a name="line.927"></a> -<span class="sourceLineNo">928</span> /**<a name="line.928"></a> -<span class="sourceLineNo">929</span> * @return True if the cluster is up.<a name="line.929"></a> -<span class="sourceLineNo">930</span> */<a name="line.930"></a> -<span class="sourceLineNo">931</span> @Override<a name="line.931"></a> -<span class="sourceLineNo">932</span> public boolean isClusterUp() {<a name="line.932"></a> -<span class="sourceLineNo">933</span> return this.masterless ||<a name="line.933"></a> -<span class="sourceLineNo">934</span> (this.clusterStatusTracker != null && this.clusterStatusTracker.isClusterUp());<a name="line.934"></a> -<span class="sourceLineNo">935</span> }<a name="line.935"></a> -<span class="sourceLineNo">936</span><a name="line.936"></a> -<span class="sourceLineNo">937</span> /**<a name="line.937"></a> -<span class="sourceLineNo">938</span> * The HRegionServer sticks in this loop until closed.<a name="line.938"></a> -<span class="sourceLineNo">939</span> */<a name="line.939"></a> -<span class="sourceLineNo">940</span> @Override<a name="line.940"></a> -<span class="sourceLineNo">941</span> public void run() {<a name="line.941"></a> -<span class="sourceLineNo">942</span> try {<a name="line.942"></a> -<span class="sourceLineNo">943</span> // Do pre-registration initializations; zookeeper, lease threads, etc.<a name="line.943"></a> -<span class="sourceLineNo">944</span> preRegistrationInitialization();<a name="line.944"></a> -<span class="sourceLineNo">945</span> } catch (Throwable e) {<a name="line.945"></a> -<span class="sourceLineNo">946</span> abort("Fatal exception during initialization", e);<a name="line.946"></a> -<span class="sourceLineNo">947</span> }<a name="line.947"></a> -<span class="sourceLineNo">948</span><a name="line.948"></a> -<span class="sourceLineNo">949</span> try {<a name="line.949"></a> -<span class="sourceLineNo">950</span> if (!isStopped() && !isAborted()) {<a name="line.950"></a> -<span class="sourceLineNo">951</span> ShutdownHook.install(conf, fs, this, Thread.currentThread());<a name="line.951"></a> -<span class="sourceLineNo">952</span> // Initialize the RegionServerCoprocessorHost now that our ephemeral<a name="line.952"></a> -<span class="sourceLineNo">953</span> // node was created, in case any coprocessors want to use ZooKeeper<a name="line.953"></a> -<span class="sourceLineNo">954</span> this.rsHost = new RegionServerCoprocessorHost(this, this.conf);<a name="line.954"></a> -<span class="sourceLineNo">955</span> }<a name="line.955"></a> -<span class="sourceLineNo">956</span><a name="line.956"></a> -<span class="sourceLineNo">957</span> // Try and register with the Master; tell it we are here. Break if server is stopped or the<a name="line.957"></a> -<span class="sourceLineNo">958</span> // clusterup flag is down or hdfs went wacky. Once registered successfully, go ahead and start<a name="line.958"></a> -<span class="sourceLineNo">959</span> // up all Services. Use RetryCounter to get backoff in case Master is struggling to come up.<a name="line.959"></a> -<span class="sourceLineNo">960</span> LOG.debug("About to register with Master.");<a name="line.960"></a> -<span class="sourceLineNo">961</span> RetryCounterFactory rcf = new RetryCounterFactory(Integer.MAX_VALUE,<a name="line.961"></a> -<span class="sourceLineNo">962</span> this.sleeper.getPeriod(), 1000 * 60 * 5);<a name="line.962"></a> -<span class="sourceLineNo">963</span> RetryCounter rc = rcf.create();<a name="line.963"></a> -<span class="sourceLineNo">964</span> while (keepLooping()) {<a name="line.964"></a> -<span class="sourceLineNo">965</span> RegionServerStartupResponse w = reportForDuty();<a name="line.965"></a> -<span class="sourceLineNo">966</span> if (w == null) {<a name="line.966"></a> -<span class="sourceLineNo">967</span> long sleepTime = rc.getBackoffTimeAndIncrementAttempts();<a name="line.967"></a> -<span class="sourceLineNo">968</span> LOG.warn("reportForDuty failed; sleeping {} ms and then retrying.", sleepTime);<a name="line.968"></a> -<span class="sourceLineNo">969</span> this.sleeper.sleep(sleepTime);<a name="line.969"></a> -<span class="sourceLineNo">970</span> } else {<a name="line.970"></a> -<span class="sourceLineNo">971</span> handleReportForDutyResponse(w);<a name="line.971"></a> -<span class="sourceLineNo">972</span> break;<a name="line.972"></a> -<span class="sourceLineNo">973</span> }<a name="line.973"></a> -<span class="sourceLineNo">974</span> }<a name="line.974"></a> -<span class="sourceLineNo">975</span><a name="line.975"></a> -<span class="sourceLineNo">976</span> if (!isStopped() && isHealthy()) {<a name="line.976"></a> -<span class="sourceLineNo">977</span> // start the snapshot handler and other procedure handlers,<a name="line.977"></a> -<span class="sourceLineNo">978</span> // since the server is ready to run<a name="line.978"></a> -<span class="sourceLineNo">979</span> if (this.rspmHost != null) {<a name="line.979"></a> -<span class="sourceLineNo">980</span> this.rspmHost.start();<a name="line.980"></a> -<span class="sourceLineNo">981</span> }<a name="line.981"></a> -<span class="sourceLineNo">982</span> // Start the Quota Manager<a name="line.982"></a> -<span class="sourceLineNo">983</span> if (this.rsQuotaManager != null) {<a name="line.983"></a> -<span class="sourceLineNo">984</span> rsQuotaManager.start(getRpcServer().getScheduler());<a name="line.984"></a> -<span class="sourceLineNo">985</span> }<a name="line.985"></a> -<span class="sourceLineNo">986</span> if (this.rsSpaceQuotaManager != null) {<a name="line.986"></a> -<span class="sourceLineNo">987</span> this.rsSpaceQuotaManager.start();<a name="line.987"></a> -<span class="sourceLineNo">988</span> }<a name="line.988"></a> -<span class="sourceLineNo">989</span> }<a name="line.989"></a> -<span class="sourceLineNo">990</span><a name="line.990"></a> -<span class="sourceLineNo">991</span> // We registered with the Master. Go into run mode.<a name="line.991"></a> -<span class="sourceLineNo">992</span> long lastMsg = System.currentTimeMillis();<a name="line.992"></a> -<span class="sourceLineNo">993</span> long oldRequestCount = -1;<a name="line.993"></a> -<span class="sourceLineNo">994</span> // The main run loop.<a name="line.994"></a> -<span class="sourceLineNo">995</span> while (!isStopped() && isHealthy()) {<a name="line.995"></a> -<span class="sourceLineNo">996</span> if (!isClusterUp()) {<a name="line.996"></a> -<span class="sourceLineNo">997</span> if (isOnlineRegionsEmpty()) {<a name="line.997"></a> -<span class="sourceLineNo">998</span> stop("Exiting; cluster shutdown set and not carrying any regions");<a name="line.998"></a> -<span class="sourceLineNo">999</span> } else if (!this.stopping) {<a name="line.999"></a> -<span class="sourceLineNo">1000</span> this.stopping = true;<a name="line.1000"></a> -<span class="sourceLineNo">1001</span> LOG.info("Closing user regions");<a name="line.1001"></a> -<span class="sourceLineNo">1002</span> closeUserRegions(this.abortRequested);<a name="line.1002"></a> -<span class="sourceLineNo">1003</span> } else if (this.stopping) {<a name="line.1003"></a> -<span class="sourceLineNo">1004</span> boolean allUserRegionsOffline = areAllUserRegionsOffline();<a name="line.1004"></a> -<span class="sourceLineNo">1005</span> if (allUserRegionsOffline) {<a name="line.1005"></a> -<span class="sourceLineNo">1006</span> // Set stopped if no more write requests tp meta tables<a name="line.1006"></a> -<span class="sourceLineNo">1007</span> // since last time we went around the loop. Any open<a name="line.1007"></a> -<span class="sourceLineNo">1008</span> // meta regions will be closed on our way out.<a name="line.1008"></a> -<span class="sourceLineNo">1009</span> if (oldRequestCount == getWriteRequestCount()) {<a name="line.1009"></a> -<span class="sourceLineNo">1010</span> stop("Stopped; only catalog regions remaining online");<a name="line.1010"></a> -<span class="sourceLineNo">1011</span> break;<a name="line.1011"></a> -<span class="sourceLineNo">1012</span> }<a name="line.1012"></a> -<span class="sourceLineNo">1013</span> oldRequestCount = getWriteRequestCount();<a name="line.1013"></a> -<span class="sourceLineNo">1014</span> } else {<a name="line.1014"></a> -<span class="sourceLineNo">1015</span> // Make sure all regions have been closed -- some regions may<a name="line.1015"></a> -<span class="sourceLineNo">1016</span> // have not got it because we were splitting at the time of<a name="line.1016"></a> -<span class="sourceLineNo">1017</span> // the call to closeUserRegions.<a name="line.1017"></a> -<span class="sourceLineNo">1018</span> closeUserRegions(this.abortRequested);<a name="line.1018"></a> -<span class="sourceLineNo">1019</span> }<a name="line.1019"></a> -<span class="sourceLineNo">1020</span> LOG.debug("Waiting on " + getOnlineRegionsAsPrintableString());<a name="line.1020"></a> -<span class="sourceLineNo">1021</span> }<a name="line.1021"></a> -<span class="sourceLineNo">1022</span> }<a name="line.1022"></a> -<span class="sourceLineNo">1023</span> long now = System.currentTimeMillis();<a name="line.1023"></a> -<span class="sourceLineNo">1024</span> if ((now - lastMsg) >= msgInterval) {<a name="line.1024"></a> -<span class="sourceLineNo">1025</span> tryRegionServerReport(lastMsg, now);<a name="line.1025"></a> -<span class="sourceLineNo">1026</span> lastMsg = System.currentTimeMillis();<a name="line.1026"></a> +<span class="sourceLineNo">902</span> waitForMasterActive();<a name="line.902"></a> +<span class="sourceLineNo">903</span> if (isStopped() || isAborted()) {<a name="line.903"></a> +<span class="sourceLineNo">904</span> return; // No need for further initialization<a name="line.904"></a> +<span class="sourceLineNo">905</span> }<a name="line.905"></a> +<span class="sourceLineNo">906</span><a name="line.906"></a> +<span class="sourceLineNo">907</span> // watch for snapshots and other procedures<a name="line.907"></a> +<span class="sourceLineNo">908</span> try {<a name="line.908"></a> +<span class="sourceLineNo">909</span> rspmHost = new RegionServerProcedureManagerHost();<a name="line.909"></a> +<span class="sourceLineNo">910</span> rspmHost.loadProcedures(conf);<a name="line.910"></a> +<span class="sourceLineNo">911</span> rspmHost.initialize(this);<a name="line.911"></a> +<span class="sourceLineNo">912</span> } catch (KeeperException e) {<a name="line.912"></a> +<span class="sourceLineNo">913</span> this.abort("Failed to reach coordination cluster when creating procedure handler.", e);<a name="line.913"></a> +<span class="sourceLineNo">914</span> }<a name="line.914"></a> +<span class="sourceLineNo">915</span> }<a name="line.915"></a> +<span class="sourceLineNo">916</span><a name="line.916"></a> +<span class="sourceLineNo">917</span> /**<a name="line.917"></a> +<span class="sourceLineNo">918</span> * Utilty method to wait indefinitely on a znode availability while checking<a name="line.918"></a> +<span class="sourceLineNo">919</span> * if the region server is shut down<a name="line.919"></a> +<span class="sourceLineNo">920</span> * @param tracker znode tracker to use<a name="line.920"></a> +<span class="sourceLineNo">921</span> * @throws IOException any IO exception, plus if the RS is stopped<a name="line.921"></a> +<span class="sourceLineNo">922</span> * @throws InterruptedException<a name="line.922"></a> +<span class="sourceLineNo">923</span> */<a name="line.923"></a> +<span class="sourceLineNo">924</span> private void blockAndCheckIfStopped(ZKNodeTracker tracker)<a name="line.924"></a> +<span class="sourceLineNo">925</span> throws IOException, InterruptedException {<a name="line.925"></a> +<span class="sourceLineNo">926</span> while (tracker.blockUntilAvailable(this.msgInterval, false) == null) {<a name="line.926"></a> +<span class="sourceLineNo">927</span> if (this.stopped) {<a name="line.927"></a> +<span class="sourceLineNo">928</span> throw new IOException("Received the shutdown message while waiting.");<a name="line.928"></a> +<span class="sourceLineNo">929</span> }<a name="line.929"></a> +<span class="sourceLineNo">930</span> }<a name="line.930"></a> +<span class="sourceLineNo">931</span> }<a name="line.931"></a> +<span class="sourceLineNo">932</span><a name="line.932"></a> +<span class="sourceLineNo">933</span> /**<a name="line.933"></a> +<span class="sourceLineNo">934</span> * @return True if the cluster is up.<a name="line.934"></a> +<span class="sourceLineNo">935</span> */<a name="line.935"></a> +<span class="sourceLineNo">936</span> @Override<a name="line.936"></a> +<span class="sourceLineNo">937</span> public boolean isClusterUp() {<a name="line.937"></a> +<span class="sourceLineNo">938</span> return this.masterless ||<a name="line.938"></a> +<span class="sourceLineNo">939</span> (this.clusterStatusTracker != null && this.clusterStatusTracker.isClusterUp());<a name="line.939"></a> +<span class="sourceLineNo">940</span> }<a name="line.940"></a> +<span class="sourceLineNo">941</span><a name="line.941"></a> +<span class="sourceLineNo">942</span> /**<a name="line.942"></a> +<span class="sourceLineNo">943</span> * The HRegionServer sticks in this loop until closed.<a name="line.943"></a> +<span class="sourceLineNo">944</span> */<a name="line.944"></a> +<span class="sourceLineNo">945</span> @Override<a name="line.945"></a> +<span class="sourceLineNo">946</span> public void run() {<a name="line.946"></a> +<span class="sourceLineNo">947</span> try {<a name="line.947"></a> +<span class="sourceLineNo">948</span> // Do pre-registration initializations; zookeeper, lease threads, etc.<a name="line.948"></a> +<span class="sourceLineNo">949</span> preRegistrationInitialization();<a name="line.949"></a> +<span class="sourceLineNo">950</span> } catch (Throwable e) {<a name="line.950"></a> +<span class="sourceLineNo">951</span> abort("Fatal exception during initialization", e);<a name="line.951"></a> +<span class="sourceLineNo">952</span> }<a name="line.952"></a> +<span class="sourceLineNo">953</span><a name="line.953"></a> +<span class="sourceLineNo">954</span> try {<a name="line.954"></a> +<span class="sourceLineNo">955</span> if (!isStopped() && !isAborted()) {<a name="line.955"></a> +<span class="sourceLineNo">956</span> ShutdownHook.install(conf, fs, this, Thread.currentThread());<a name="line.956"></a> +<span class="sourceLineNo">957</span> // Initialize the RegionServerCoprocessorHost now that our ephemeral<a name="line.957"></a> +<span class="sourceLineNo">958</span> // node was created, in case any coprocessors want to use ZooKeeper<a name="line.958"></a> +<span class="sourceLineNo">959</span> this.rsHost = new RegionServerCoprocessorHost(this, this.conf);<a name="line.959"></a> +<span class="sourceLineNo">960</span> }<a name="line.960"></a> +<span class="sourceLineNo">961</span><a name="line.961"></a> +<span class="sourceLineNo">962</span> // Try and register with the Master; tell it we are here. Break if server is stopped or the<a name="line.962"></a> +<span class="sourceLineNo">963</span> // clusterup flag is down or hdfs went wacky. Once registered successfully, go ahead and start<a name="line.963"></a> +<span class="sourceLineNo">964</span> // up all Services. Use RetryCounter to get backoff in case Master is struggling to come up.<a name="line.964"></a> +<span class="sourceLineNo">965</span> LOG.debug("About to register with Master.");<a name="line.965"></a> +<span class="sourceLineNo">966</span> RetryCounterFactory rcf = new RetryCounterFactory(Integer.MAX_VALUE,<a name="line.966"></a> +<span class="sourceLineNo">967</span> this.sleeper.getPeriod(), 1000 * 60 * 5);<a name="line.967"></a> +<span class="sourceLineNo">968</span> RetryCounter rc = rcf.create();<a name="line.968"></a> +<span class="sourceLineNo">969</span> while (keepLooping()) {<a name="line.969"></a> +<span class="sourceLineNo">970</span> RegionServerStartupResponse w = reportForDuty();<a name="line.970"></a> +<span class="sourceLineNo">971</span> if (w == null) {<a name="line.971"></a> +<span class="sourceLineNo">972</span> long sleepTime = rc.getBackoffTimeAndIncrementAttempts();<a name="line.972"></a> +<span class="sourceLineNo">973</span> LOG.warn("reportForDuty failed; sleeping {} ms and then retrying.", sleepTime);<a name="line.973"></a> +<span class="sourceLineNo">974</span> this.sleeper.sleep(sleepTime);<a name="line.974"></a> +<span class="sourceLineNo">975</span> } else {<a name="line.975"></a> +<span class="sourceLineNo">976</span> handleReportForDutyResponse(w);<a name="line.976"></a> +<span class="sourceLineNo">977</span> break;<a name="line.977"></a> +<span class="sourceLineNo">978</span> }<a name="line.978"></a> +<span class="sourceLineNo">979</span> }<a name="line.979"></a> +<span class="sourceLineNo">980</span><a name="line.980"></a> +<span class="sourceLineNo">981</span> if (!isStopped() && isHealthy()) {<a name="line.981"></a> +<span class="sourceLineNo">982</span> // start the snapshot handler and other procedure handlers,<a name="line.982"></a> +<span class="sourceLineNo">983</span> // since the server is ready to run<a name="line.983"></a> +<span class="sourceLineNo">984</span> if (this.rspmHost != null) {<a name="line.984"></a> +<span class="sourceLineNo">985</span> this.rspmHost.start();<a name="line.985"></a> +<span class="sourceLineNo">986</span> }<a name="line.986"></a> +<span class="sourceLineNo">987</span> // Start the Quota Manager<a name="line.987"></a> +<span class="sourceLineNo">988</span> if (this.rsQuotaManager != null) {<a name="line.988"></a> +<span class="sourceLineNo">989</span> rsQuotaManager.start(getRpcServer().getScheduler());<a name="line.989"></a> +<span class="sourceLineNo">990</span> }<a name="line.990"></a> +<span class="sourceLineNo">991</span> if (this.rsSpaceQuotaManager != null) {<a name="line.991"></a> +<span class="sourceLineNo">992</span> this.rsSpaceQuotaManager.start();<a name="line.992"></a> +<span class="sourceLineNo">993</span> }<a name="line.993"></a> +<span class="sourceLineNo">994</span> }<a name="line.994"></a> +<span class="sourceLineNo">995</span><a name="line.995"></a> +<span class="sourceLineNo">996</span> // We registered with the Master. Go into run mode.<a name="line.996"></a> +<span class="sourceLineNo">997</span> long lastMsg = System.currentTimeMillis();<a name="line.997"></a> +<span class="sourceLineNo">998</span> long oldRequestCount = -1;<a name="line.998"></a> +<span class="sourceLineNo">999</span> // The main run loop.<a name="line.999"></a> +<span class="sourceLineNo">1000</span> while (!isStopped() && isHealthy()) {<a name="line.1000"></a> +<span class="sourceLineNo">1001</span> if (!isClusterUp()) {<a name="line.1001"></a> +<span class="sourceLineNo">1002</span> if (isOnlineRegionsEmpty()) {<a name="line.1002"></a> +<span class="sourceLineNo">1003</span> stop("Exiting; cluster shutdown set and not carrying any regions");<a name="line.1003"></a> +<span class="sourceLineNo">1004</span> } else if (!this.stopping) {<a name="line.1004"></a> +<span class="sourceLineNo">1005</span> this.stopping = true;<a name="line.1005"></a> +<span class="sourceLineNo">1006</span> LOG.info("Closing user regions");<a name="line.1006"></a> +<span class="sourceLineNo">1007</span> closeUserRegions(this.abortRequested);<a name="line.1007"></a> +<span class="sourceLineNo">1008</span> } else if (this.stopping) {<a name="line.1008"></a> +<span class="sourceLineNo">1009</span> boolean allUserRegionsOffline = areAllUserRegionsOffline();<a name="line.1009"></a> +<span class="sourceLineNo">1010</span> if (allUserRegionsOffline) {<a name="line.1010"></a> +<span class="sourceLineNo">1011</span> // Set stopped if no more write requests tp meta tables<a name="line.1011"></a> +<span class="sourceLineNo">1012</span> // since last time we went around the loop. Any open<a name="line.1012"></a> +<span class="sourceLineNo">1013</span> // meta regions will be closed on our way out.<a name="line.1013"></a> +<span class="sourceLineNo">1014</span> if (oldRequestCount == getWriteRequestCount()) {<a name="line.1014"></a> +<span class="sourceLineNo">1015</span> stop("Stopped; only catalog regions remaining online");<a name="line.1015"></a> +<span class="sourceLineNo">1016</span> break;<a name="line.1016"></a> +<span class="sourceLineNo">1017</span> }<a name="line.1017"></a> +<span class="sourceLineNo">1018</span> oldRequestCount = getWriteRequestCount();<a name="line.1018"></a> +<span class="sourceLineNo">1019</span> } else {<a name="line.1019"></a> +<span class="sourceLineNo">1020</span> // Make sure all regions have been closed -- some regions may<a name="line.1020"></a> +<span class="sourceLineNo">1021</span> // have not got it because we were splitting at the time of<a name="line.1021"></a> +<span class="sourceLineNo">1022</span> // the call to closeUserRegions.<a name="line.1022"></a> +<span class="sourceLineNo">1023</span> closeUserRegions(this.abortRequested);<a name="line.1023"></a> +<span class="sourceLineNo">1024</span> }<a name="line.1024"></a> +<span class="sourceLineNo">1025</span> LOG.debug("Waiting on " + getOnlineRegionsAsPrintableString());<a name="line.1025"></a> +<span class="sourceLineNo">1026</span> }<a name="line.1026"></a> <span class="sourceLineNo">1027</span> }<a name="line.1027"></a> -<span class="sourceLineNo">1028</span> if (!isStopped() && !isAborted()) {<a name="line.1028"></a> -<span class="sourceLineNo">1029</span> this.sleeper.sleep();<a name="line.1029"></a> -<span class="sourceLineNo">1030</span> }<a name="line.1030"></a> -<span class="sourceLineNo">1031</span> } // for<a name="line.1031"></a> -<span class="sourceLineNo">1032</span> } catch (Throwable t) {<a name="line.1032"></a> -<span class="sourceLineNo">1033</span> if (!rpcServices.checkOOME(t)) {<a name="line.1033"></a> -<span class="sourceLineNo">1034</span> String prefix = t instanceof YouAreDeadException? "": "Unhandled: ";<a name="line.1034"></a> -<span class="sourceLineNo">1035</span> abort(prefix + t.getMessage(), t);<a name="line.1035"></a> -<span class="sourceLineNo">1036</span> }<a name="line.1036"></a> -<span class="sourceLineNo">1037</span> }<a name="line.1037"></a> -<span class="sourceLineNo">1038</span><a name="line.1038"></a> -<span class="sourceLineNo">1039</span> if (abortRequested) {<a name="line.1039"></a> -<span class="sourceLineNo">1040</span> Timer abortMonitor = new Timer("Abort regionserver monitor", true);<a name="line.1040"></a> -<span class="sourceLineNo">1041</span> TimerTask abortTimeoutTask = null;<a name="line.1041"></a> -<span class="sourceLineNo">1042</span> try {<a name="line.1042"></a> -<span class="sourceLineNo">1043</span> abortTimeoutTask =<a name="line.1043"></a> -<span class="sourceLineNo">1044</span> Class.forName(conf.get(ABORT_TIMEOUT_TASK, SystemExitWhenAbortTimeout.class.getName()))<a name="line.1044"></a> -<span class="sourceLineNo">1045</span> .asSubclass(TimerTask.class).getDeclaredConstructor().newInstance();<a name="line.1045"></a> -<span class="sourceLineNo">1046</span> } catch (Exception e) {<a name="line.1046"></a> -<span class="sourceLineNo">1047</span> LOG.warn("Initialize abort timeout task failed", e);<a name="line.1047"></a> -<span class="sourceLineNo">1048</span> }<a name="line.1048"></a> -<span class="sourceLineNo">1049</span>
<TRUNCATED>