Added: helix/site-content/1.4.3-docs/Quickstart.html
URL: 
http://svn.apache.org/viewvc/helix/site-content/1.4.3-docs/Quickstart.html?rev=1923435&view=auto
==============================================================================
--- helix/site-content/1.4.3-docs/Quickstart.html (added)
+++ helix/site-content/1.4.3-docs/Quickstart.html Wed Jan 29 07:13:35 2025
@@ -0,0 +1,869 @@
+
+<!DOCTYPE html>
+
+
+
+
+
+
+<!--
+ Generated by Apache Maven Doxia at 2025-01-28  Rendered using Reflow Maven 
Skin 2.0.0 (https://olamy.github.io/reflow-maven-skin)
+-->
+<html  xml:lang="en" lang="en">
+
+       <head>
+               <meta charset="UTF-8" />
+               <title>Apache Helix &#x2013; Quickstart</title>
+               <meta name="viewport" content="width=device-width, 
initial-scale=1.0" />
+               <meta name="description" content="" />
+               <meta http-equiv="content-language" content="en" />
+
+               <link href="./css/bootstrap.min.css" rel="stylesheet" />
+               <link href="./css/bootstrap-responsive.min.css" 
rel="stylesheet" />
+               <link href="./css/docs.css" rel="stylesheet" />
+               <link href="./css/reflow-skin.css" rel="stylesheet" />
+
+
+               <link href="./css/lightbox.css" rel="stylesheet" />
+
+               <link href="./css/site.css" rel="stylesheet" />
+               <link href="./css/print.css" rel="stylesheet" media="print" />
+
+               <!-- Le HTML5 shim, for IE6-8 support of HTML5 elements -->
+               <!--[if lt IE 9]>
+                       <script src="./js/html5.js"></script>
+               <![endif]-->
+
+
+
+
+
+    
+<!-- Matomo -->
+<script>
+    var _paq = window._paq = window._paq || [];
+                        _paq.push(['disableCookies']);
+                                    _paq.push(['trackPageView']);
+                                    _paq.push(['enableLinkTracking']);
+                    
+    (function() {
+        var u="https://analytics.apache.org";
+        _paq.push(['setTrackerUrl', u+'/matomo.php']);
+        _paq.push(['setSiteId', '15']);
+        var d=document, g=d.createElement('script'), 
s=d.getElementsByTagName('script')[0];
+        g.async=true; g.src=u+'/matomo.js'; s.parentNode.insertBefore(g,s);
+    })();
+</script>
+<!-- End Matomo Code -->
+       </head>
+
+       <body class="page-quickstart project-143-docs" data-spy="scroll" 
data-offset="60" data-target="#toc-scroll-target">
+
+    
+               <div class="navbar navbar-fixed-top">
+                       <div class="navbar-inner">
+                               <div class="container">
+                                       <a class="btn btn-navbar" 
data-toggle="collapse" data-target="#top-nav-collapse">
+                                               <span class="icon-bar"></span>
+                                               <span class="icon-bar"></span>
+                                               <span class="icon-bar"></span>
+                                       </a>
+                                       <a class="brand" 
href="http://helix.apache.org">Apache Helix</a>
+                                       <div class="nav-collapse collapse" 
id="top-nav-collapse">
+                                               <ul class="nav pull-right">
+                                                       <li ><a 
href="index.html" title="Helix 1.4.3">Helix 1.4.3</a></li>
+                                                       <li class="dropdown">
+                                                               <a href="#" 
class="dropdown-toggle" data-toggle="dropdown">Get Helix <b 
class="caret"></b></a>
+                                                               <ul 
class="dropdown-menu">
+                                                                       <li ><a 
href="download.html" title="Download">Download</a></li>
+                                                                       <li ><a 
href="Building.html" title="Building">Building</a></li>
+                                                                       <li ><a 
href="releasenotes/release-1.4.3.html" title="Release Notes">Release 
Notes</a></li>
+                                                               </ul>
+                                                       </li>
+                                                       <li class="dropdown 
active">
+                                                               <a href="#" 
class="dropdown-toggle" data-toggle="dropdown">Hands-On <b 
class="caret"></b></a>
+                                                               <ul 
class="dropdown-menu">
+                                                                       <li 
class="active"><a href="" title="Quick Start">Quick Start</a></li>
+                                                                       <li ><a 
href="Tutorial.html" title="Tutorial">Tutorial</a></li>
+                                                                       <li ><a 
href="../javadocs/1.4.3" title="Javadocs">Javadocs</a></li>
+                                                               </ul>
+                                                       </li>
+                                                       <li class="dropdown">
+                                                               <a href="#" 
class="dropdown-toggle" data-toggle="dropdown">Recipes <b class="caret"></b></a>
+                                                               <ul 
class="dropdown-menu">
+                                                                       <li ><a 
href="recipes/lock_manager.html" title="Distributed lock manager">Distributed 
lock manager</a></li>
+                                                                       <li ><a 
href="recipes/rabbitmq_consumer_group.html" title="Rabbit MQ consumer 
group">Rabbit MQ consumer group</a></li>
+                                                                       <li ><a 
href="recipes/rsync_replicated_file_store.html" title="Rsync replicated file 
store">Rsync replicated file store</a></li>
+                                                                       <li ><a 
href="recipes/service_discovery.html" title="Service discovery">Service 
discovery</a></li>
+                                                                       <li ><a 
href="recipes/task_dag_execution.html" title="Distributed task DAG 
execution">Distributed task DAG execution</a></li>
+                                                               </ul>
+                                                       </li>
+                                               </ul>
+                                       </div><!--/.nav-collapse -->
+                               </div>
+                       </div>
+               </div>
+
+       <div class="container">
+
+       <!-- Masthead
+       ================================================== -->
+
+       <header>
+       <div class="jumbotron subhead">
+               <div class="row" id="banner">
+                       <div class="span12">
+                               <div class="pull-left">
+                                       <a href="http://helix.apache.org/" 
id="bannerLeft"><img src="../images/helix-logo.jpg" alt="Apache Helix" /></a>
+                                       <p class="lead">A cluster management 
framework for partitioned and replicated distributed resources</p>
+                               </div>
+                               <div class="pull-right">
+                                       <a href="http://www.apache.org/" 
id="bannerRight"><img src="../images/feather_small.gif" alt="Apache Software Foundation" /></a>
+                               </div>
+                       </div>
+               </div>
+       </div>
+               <div>
+                       <ul class="breadcrumb">
+                               <li><a href="../" title="Apache Helix">Apache 
Helix</a></li>
+                               <li class="divider">/</li>
+                               <li><a href="./" title="Release 1.4.3">Release 
1.4.3</a></li>
+                               <li class="divider">/</li>
+                               <li>Quickstart</li>
+                               <li class="publishDate version-date 
pull-right">Last Published: 2025-01-28</li>
+                       </ul>
+               </div>
+       </header>
+
+       <div class="main-body">
+       <div class="row">
+               <div class="span12">
+                       <div class="body-content">
+<!--
+Licensed to the Apache Software Foundation (ASF) under one
+or more contributor license agreements.  See the NOTICE file
+distributed with this work for additional information
+regarding copyright ownership.  The ASF licenses this file
+to you under the Apache License, Version 2.0 (the
+"License"); you may not use this file except in compliance
+with the License.  You may obtain a copy of the License at
+
+  http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing,
+software distributed under the License is distributed on an
+"AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+KIND, either express or implied.  See the License for the
+specific language governing permissions and limitations
+under the License.
+--> 
+<section> 
+ <div class="page-header">
+  <h2 id="Quickstart">Quickstart</h2>
+ </div> 
+</section> 
+<section> 
+ <h2 id="Get_Helix">Get Helix</h2> 
+ <p>First, let's get Helix. Either build it, or download it.</p> 
+ <section> 
+  <h3 id="Build">Build</h3> 
+  <div class="source"> 
+   <pre><code>git clone https://git-wip-us.apache.org/repos/asf/helix.git
+cd helix
+git checkout tags/helix-1.4.3
+mvn install package -DskipTests
+cd helix-core/target/helix-core-pkg/bin # This folder contains all the scripts 
used in following sections
+chmod +x *
+</code></pre> 
+  </div> 
+ </section> 
+ <section> 
+  <h3 id="Download">Download</h3> 
+  <p>Download the 1.4.3 release package <a href="./download.html">here</a></p> 
+ </section> 
+</section> 
+<section> 
+ <h2 id="Overview">Overview</h2> 
+ <p>In this Quickstart, we'll set up a leader-standby replicated, partitioned 
system. Then we'll demonstrate how to add a node, rebalance the partitions, and 
show how Helix manages failover.</p> 
+</section> 
+<section> 
+ <h2 id="Let.27s_Do_It">Let's Do It</h2> 
+ <p>Helix provides command line interfaces to set up the cluster and view the 
cluster state. The best way to understand how Helix views a cluster is to build 
a cluster.</p> 
+ <section> 
+  <h3 id="Get_to_the_Tools_Directory">Get to the Tools Directory</h3> 
+  <p>If you built the code:</p> 
+  <div class="source"> 
+   <pre><code>cd helix/helix/helix-core/target/helix-core-pkg/bin
+</code></pre> 
+  </div> 
+  <p>If you downloaded the release package, extract it.</p> 
+ </section> 
+</section> 
+<section> 
+ <h2 id="Short_Version">Short Version</h2> 
+ <p>You can observe the components working together in this demo, which does 
the following:</p> 
+ <ul> 
+  <li>Create a cluster</li> 
+  <li>Add 2 nodes (participants) to the cluster</li> 
+  <li>Set up a resource with 6 partitions and 2 replicas: 1 Leader, and 1 
Standby per partition</li> 
+  <li>Show the cluster state after Helix balances the partitions</li> 
+  <li>Add a third node</li> 
+  <li>Show the cluster state. Note that the third node has taken leadership of 
2 partitions.</li> 
+  <li>Kill the third node (Helix takes care of failover)</li> 
+  <li>Show the cluster state. Note that the two surviving nodes take over 
leadership of the partitions from the failed node</li> 
+ </ul> 
+ <section> 
+  <h3 id="Run_the_Demo">Run the Demo</h3> 
+  <div class="source"> 
+   <pre><code>cd helix/helix/helix-core/target/helix-core-pkg/bin
+./quickstart.sh
+</code></pre> 
+  </div> 
+  <section> 
+   <h4 id="The_Initial_Setup">The Initial Setup</h4> 
+   <p>2 nodes are set up and the partitions are rebalanced.</p> 
+   <p>The cluster state is as follows:</p> 
+   <div class="source"> 
+    <pre><code>CLUSTER STATE: After starting 2 nodes
+                localhost_12000    localhost_12001
+MyResource_0           L                  S
+MyResource_1           S                  L
+MyResource_2           L                  S
+MyResource_3           L                  S
+MyResource_4           S                  L
+MyResource_5           S                  L
+</code></pre> 
+   </div> 
+   <p>Note there is one leader and one standby per partition.</p> 
+  </section> 
+  <section> 
+   <h4 id="Add_a_Node">Add a Node</h4> 
+   <p>A third node is added and the cluster is rebalanced.</p> 
+   <p>The cluster state changes to:</p> 
+   <div class="source"> 
+    <pre><code>CLUSTER STATE: After adding a third node
+               localhost_12000    localhost_12001    localhost_12002
+MyResource_0          S                  L                  S
+MyResource_1          S                  S                  L
+MyResource_2          L                  S                  S
+MyResource_3          S                  S                  L
+MyResource_4          L                  S                  S
+MyResource_5          S                  L                  S
+</code></pre> 
+   </div> 
+   <p>Note there is one leader and <i>two</i> standbys per partition. This is 
expected because there are three nodes.</p> 
+  </section> 
+  <section> 
+   <h4 id="Kill_a_Node">Kill a Node</h4> 
+   <p>Finally, a node is killed to simulate a failure.</p> 
+   <p>Helix makes sure each partition has a leader. The cluster state changes 
to:</p> 
+   <div class="source"> 
+    <pre><code>CLUSTER STATE: After the 3rd node stops/crashes
+               localhost_12000    localhost_12001    localhost_12002
+MyResource_0          S                  L                  -
+MyResource_1          S                  L                  -
+MyResource_2          L                  S                  -
+MyResource_3          L                  S                  -
+MyResource_4          L                  S                  -
+MyResource_5          S                  L                  -
+</code></pre> 
+   </div> 
+  </section> 
+ </section> 
+</section> 
+<section> 
+ <h2 id="Long_Version">Long Version</h2> 
+ <p>Now you can run the same steps by hand. In this detailed version, we'll do 
the following:</p> 
+ <ul> 
+  <li>Define a cluster</li> 
+  <li>Add three nodes to the cluster</li> 
+  <li>Add a 6-partition resource with 1 leader and 2 standby replicas per 
partition</li> 
+  <li>Verify that the cluster is healthy and inspect the Helix view</li> 
+  <li>Expand the cluster: add a few nodes and rebalance the partitions</li> 
+  <li>Failover: stop a node and verify the leadership transfer</li> 
+ </ul> 
+ <section> 
+  <h3 id="Install_and_Start_ZooKeeper">Install and Start ZooKeeper</h3> 
+  <p>ZooKeeper can be started in standalone mode or replicated mode.</p> 
+  <p>More information is available at</p> 
+  <ul> 
+   <li><a class="externalLink" 
href="http://zookeeper.apache.org/doc/r3.3.3/zookeeperStarted.html">http://zookeeper.apache.org/doc/r3.3.3/zookeeperStarted.html</a></li>
 
+   <li><a class="externalLink" 
href="http://zookeeper.apache.org/doc/trunk/zookeeperAdmin.html#sc_zkMulitServerSetup">http://zookeeper.apache.org/doc/trunk/zookeeperAdmin.html#sc_zkMulitServerSetup</a></li>
 
+  </ul> 
+  <p>In this example, let's start ZooKeeper in local mode.</p> 
+  <section> 
+   <h4 id="Start_ZooKeeper_Locally_on_Port_2199">Start ZooKeeper Locally on 
Port 2199</h4> 
+   <div class="source"> 
+    <pre><code>./start-standalone-zookeeper.sh 2199 &amp;
+</code></pre> 
+   </div> 
+  </section> 
+ </section> 
+ <section> 
+  <h3 id="Define_the_Cluster">Define the Cluster</h3> 
+  <p>The helix-admin tool is used for cluster administration tasks. In the 
Quickstart, we'll use the command line interface. Helix supports a REST 
interface as well.</p> 
+  <p>zookeeper_address is of the format host:port, e.g. localhost:2199 for 
standalone or host1:port,host2:port for multi-node.</p> 
+  <p>Next, we'll set up a cluster named MYCLUSTER with these attributes:</p> 
+  <ul> 
+   <li>3 instances running on localhost at ports 12913,12914,12915</li> 
+   <li>One database named myDB with 6 partitions</li> 
+   <li>Each partition will have 3 replicas with 1 leader, 2 standbys</li> 
+   <li>ZooKeeper running locally at localhost:2199</li> 
+  </ul> 
+  <section> 
+   <h4 id="Create_the_Cluster_MYCLUSTER">Create the Cluster MYCLUSTER</h4> 
+   <div class="source"> 
+    <pre><code># ./helix-admin.sh --zkSvr &lt;zk_address&gt; --addCluster 
&lt;clustername&gt;
+./helix-admin.sh --zkSvr localhost:2199 --addCluster MYCLUSTER
+</code></pre> 
+   </div> 
+  </section> 
+ </section> 
+ <section> 
+  <h3 id="Add_Nodes_to_the_Cluster">Add Nodes to the Cluster</h3> 
+  <p>In this case we'll add three nodes: localhost:12913, localhost:12914, 
localhost:12915</p> 
+  <div class="source"> 
+   <pre><code># helix-admin.sh --zkSvr &lt;zk_address&gt;  --addNode 
&lt;clustername&gt; &lt;host:port&gt;
+./helix-admin.sh --zkSvr localhost:2199  --addNode MYCLUSTER localhost:12913
+./helix-admin.sh --zkSvr localhost:2199  --addNode MYCLUSTER localhost:12914
+./helix-admin.sh --zkSvr localhost:2199  --addNode MYCLUSTER localhost:12915
+</code></pre> 
+  </div> 
+ </section> 
+ <section> 
+  <h3 id="Define_the_Resource_and_Partitioning">Define the Resource and 
Partitioning</h3> 
+  <p>In this example, the resource is a database, partitioned 6 ways. Note 
that in a production system, it's common to over-partition for better load 
balancing. Helix has been used in production to manage hundreds of databases 
each with 10s or 100s of partitions running on 10s of physical nodes.</p> 
+  <section> 
+   <h4 
id="Create_a_Database_with_6_Partitions_using_the_LeaderStandby_State_Model">Create
 a Database with 6 Partitions using the LeaderStandby State Model</h4> 
+   <p>Helix ensures there will be exactly one leader for each partition.</p> 
+   <div class="source"> 
+    <pre><code># helix-admin.sh --zkSvr &lt;zk_address&gt; --addResource 
&lt;clustername&gt; &lt;resourceName&gt; &lt;numPartitions&gt; 
&lt;StateModelName&gt;
+./helix-admin.sh --zkSvr localhost:2199 --addResource MYCLUSTER myDB 6 
LeaderStandby
+</code></pre> 
+   </div> 
+  </section> 
+  <section> 
+   <h4 id="Let_Helix_Assign_Partitions_to_Nodes">Let Helix Assign Partitions 
to Nodes</h4> 
+   <p>This command will distribute the partitions amongst all the nodes in the 
cluster. In this example, each partition has 3 replicas.</p> 
+   <div class="source"> 
+    <pre><code># helix-admin.sh --zkSvr &lt;zk_address&gt; --rebalance 
&lt;clustername&gt; &lt;resourceName&gt; &lt;replication factor&gt;
+./helix-admin.sh --zkSvr localhost:2199 --rebalance MYCLUSTER myDB 3
+</code></pre> 
+   </div> 
+   <p>Now the cluster is defined in ZooKeeper. The nodes (localhost:12913, 
localhost:12914, localhost:12915) and resource (myDB, with 6 partitions using 
the LeaderStandby model) are all properly configured. And the <i>IdealState</i> 
has been calculated, assuming a replication factor of 3.</p> 
+  </section> 
+ </section> 
+ <section> 
+  <h3 id="Start_the_Helix_Controller">Start the Helix Controller</h3> 
+  <p>Now that the cluster is defined in ZooKeeper, the Helix controller can 
manage the cluster.</p> 
+  <div class="source"> 
+   <pre><code># Start the cluster manager, which will manage MYCLUSTER
+./run-helix-controller.sh --zkSvr localhost:2199 --cluster MYCLUSTER 
2&gt;&amp;1 &gt; /tmp/controller.log &amp;
+</code></pre> 
+  </div> 
+ </section> 
+ <section> 
+  <h3 id="Start_up_the_Cluster_to_be_Managed">Start up the Cluster to be 
Managed</h3> 
+  <p>We've started up ZooKeeper, defined the cluster, the resources, the 
partitioning, and started up the Helix controller. Next, we'll start up the 
nodes of the system to be managed. Each node is a Participant, which is an 
instance of the system component to be managed. Helix assigns work to 
Participants, keeps track of their roles and health, and takes action when a 
node fails.</p> 
+  <div class="source"> 
+   <pre><code># start up each instance.  These are mock implementations that 
are actively managed by Helix
+./start-helix-participant.sh --zkSvr localhost:2199 --cluster MYCLUSTER --host 
localhost --port 12913 --stateModelType LeaderStandby 2&gt;&amp;1 &gt; 
/tmp/participant_12913.log
+./start-helix-participant.sh --zkSvr localhost:2199 --cluster MYCLUSTER --host 
localhost --port 12914 --stateModelType LeaderStandby 2&gt;&amp;1 &gt; 
/tmp/participant_12914.log
+./start-helix-participant.sh --zkSvr localhost:2199 --cluster MYCLUSTER --host 
localhost --port 12915 --stateModelType LeaderStandby 2&gt;&amp;1 &gt; 
/tmp/participant_12915.log
+</code></pre> 
+  </div> 
+ </section> 
+ <section> 
+  <h3 id="Inspect_the_Cluster">Inspect the Cluster</h3> 
+  <p>Now, let's see the Helix view of our cluster. We'll work our way down as 
follows:</p> 
+  <div class="source"> 
+   <pre><code>Clusters -&gt; MYCLUSTER -&gt; instances -&gt; instance detail
+                      -&gt; resources -&gt; resource detail
+                      -&gt; partitions
+</code></pre> 
+  </div> 
+  <p>A single Helix controller can manage multiple clusters, though so far, 
we've only defined one cluster. Let's see:</p> 
+  <div class="source"> 
+   <pre><code># List existing clusters
+./helix-admin.sh --zkSvr localhost:2199 --listClusters
+
+Existing clusters:
+MYCLUSTER
+</code></pre> 
+  </div> 
+  <p>Now, let's see the Helix view of MYCLUSTER:</p> 
+  <div class="source"> 
+   <pre><code># helix-admin.sh --zkSvr &lt;zk_address&gt; --listClusterInfo 
&lt;clusterName&gt;
+./helix-admin.sh --zkSvr localhost:2199 --listClusterInfo MYCLUSTER
+
+Existing resources in cluster MYCLUSTER:
+myDB
+Instances in cluster MYCLUSTER:
+localhost_12915
+localhost_12914
+localhost_12913
+</code></pre> 
+  </div> 
+  <p>Let's look at the details of an instance:</p> 
+  <div class="source"> 
+   <pre><code># ./helix-admin.sh --zkSvr &lt;zk_address&gt; --listInstanceInfo 
&lt;clusterName&gt; &lt;InstanceName&gt;
+./helix-admin.sh --zkSvr localhost:2199 --listInstanceInfo MYCLUSTER 
localhost_12913
+
+InstanceConfig: {
+  "id" : "localhost_12913",
+  "mapFields" : {
+  },
+  "listFields" : {
+  },
+  "simpleFields" : {
+    "HELIX_ENABLED" : "true",
+    "HELIX_HOST" : "localhost",
+    "HELIX_PORT" : "12913"
+  }
+}
+</code></pre> 
+  </div> 
+  <section> 
+   <h4 id="Query_Information_about_a_Resource">Query Information about a 
Resource</h4> 
+   <div class="source"> 
+    <pre><code># helix-admin.sh --zkSvr &lt;zk_address&gt; --listResourceInfo 
&lt;clusterName&gt; &lt;resourceName&gt;
+./helix-admin.sh --zkSvr localhost:2199 --listResourceInfo MYCLUSTER myDB
+
+IdealState for myDB:
+{
+  "id" : "myDB",
+  "mapFields" : {
+    "myDB_0" : {
+      "localhost_12913" : "STANDBY",
+      "localhost_12914" : "LEADER",
+      "localhost_12915" : "STANDBY"
+    },
+    "myDB_1" : {
+      "localhost_12913" : "STANDBY",
+      "localhost_12914" : "STANDBY",
+      "localhost_12915" : "LEADER"
+    },
+    "myDB_2" : {
+      "localhost_12913" : "LEADER",
+      "localhost_12914" : "STANDBY",
+      "localhost_12915" : "STANDBY"
+    },
+    "myDB_3" : {
+      "localhost_12913" : "STANDBY",
+      "localhost_12914" : "STANDBY",
+      "localhost_12915" : "LEADER"
+    },
+    "myDB_4" : {
+      "localhost_12913" : "LEADER",
+      "localhost_12914" : "STANDBY",
+      "localhost_12915" : "STANDBY"
+    },
+    "myDB_5" : {
+      "localhost_12913" : "STANDBY",
+      "localhost_12914" : "LEADER",
+      "localhost_12915" : "STANDBY"
+    }
+  },
+  "listFields" : {
+    "myDB_0" : [ "localhost_12914", "localhost_12913", "localhost_12915" ],
+    "myDB_1" : [ "localhost_12915", "localhost_12913", "localhost_12914" ],
+    "myDB_2" : [ "localhost_12913", "localhost_12915", "localhost_12914" ],
+    "myDB_3" : [ "localhost_12915", "localhost_12913", "localhost_12914" ],
+    "myDB_4" : [ "localhost_12913", "localhost_12914", "localhost_12915" ],
+    "myDB_5" : [ "localhost_12914", "localhost_12915", "localhost_12913" ]
+  },
+  "simpleFields" : {
+    "IDEAL_STATE_MODE" : "AUTO",
+    "REBALANCE_MODE" : "SEMI_AUTO",
+    "NUM_PARTITIONS" : "6",
+    "REPLICAS" : "3",
+    "STATE_MODEL_DEF_REF" : "LeaderStandby",
+    "STATE_MODEL_FACTORY_NAME" : "DEFAULT"
+  }
+}
+
+ExternalView for myDB:
+{
+  "id" : "myDB",
+  "mapFields" : {
+    "myDB_0" : {
+      "localhost_12913" : "STANDBY",
+      "localhost_12914" : "LEADER",
+      "localhost_12915" : "STANDBY"
+    },
+    "myDB_1" : {
+      "localhost_12913" : "STANDBY",
+      "localhost_12914" : "STANDBY",
+      "localhost_12915" : "LEADER"
+    },
+    "myDB_2" : {
+      "localhost_12913" : "LEADER",
+      "localhost_12914" : "STANDBY",
+      "localhost_12915" : "STANDBY"
+    },
+    "myDB_3" : {
+      "localhost_12913" : "STANDBY",
+      "localhost_12914" : "STANDBY",
+      "localhost_12915" : "LEADER"
+    },
+    "myDB_4" : {
+      "localhost_12913" : "LEADER",
+      "localhost_12914" : "STANDBY",
+      "localhost_12915" : "STANDBY"
+    },
+    "myDB_5" : {
+      "localhost_12913" : "STANDBY",
+      "localhost_12914" : "LEADER",
+      "localhost_12915" : "STANDBY"
+    }
+  },
+  "listFields" : {
+  },
+  "simpleFields" : {
+    "BUCKET_SIZE" : "0"
+  }
+}
+</code></pre> 
+   </div> 
+   <p>Now, let's look at one of the partitions:</p> 
+   <div class="source"> 
+    <pre><code># helix-admin.sh --zkSvr &lt;zk_address&gt; --listResourceInfo 
&lt;clusterName&gt; &lt;partition&gt;
+./helix-admin.sh --zkSvr localhost:2199 --listResourceInfo MYCLUSTER myDB_0
+</code></pre> 
+   </div> 
+  </section> 
+ </section> 
+ <section> 
+  <h3 id="Expand_the_Cluster">Expand the Cluster</h3> 
+  <p>Next, we'll show how Helix does the work that you'd otherwise have to 
build into your system. When you add capacity to your cluster, you want the 
work to be evenly distributed. In this example, we started with 3 nodes, with 6 
partitions. The partitions were evenly balanced, 2 leaders and 4 standbys per 
node. Let's add 3 more nodes: localhost:12916, localhost:12917, 
localhost:12918</p> 
+  <div class="source"> 
+   <pre><code>./helix-admin.sh --zkSvr localhost:2199  --addNode MYCLUSTER 
localhost:12916
+./helix-admin.sh --zkSvr localhost:2199  --addNode MYCLUSTER localhost:12917
+./helix-admin.sh --zkSvr localhost:2199  --addNode MYCLUSTER localhost:12918
+</code></pre> 
+  </div> 
+  <p>And start up these instances:</p> 
+  <div class="source"> 
+   <pre><code># start up each instance.  These are mock implementations that 
are actively managed by Helix
+./start-helix-participant.sh --zkSvr localhost:2199 --cluster MYCLUSTER --host 
localhost --port 12916 --stateModelType LeaderStandby 2&gt;&amp;1 &gt; 
/tmp/participant_12916.log
+./start-helix-participant.sh --zkSvr localhost:2199 --cluster MYCLUSTER --host 
localhost --port 12917 --stateModelType LeaderStandby 2&gt;&amp;1 &gt; 
/tmp/participant_12917.log
+./start-helix-participant.sh --zkSvr localhost:2199 --cluster MYCLUSTER --host 
localhost --port 12918 --stateModelType LeaderStandby 2&gt;&amp;1 &gt; 
/tmp/participant_12918.log
+</code></pre> 
+  </div> 
+  <p>And now, let Helix do the work for you. To shift the work, simply 
rebalance. After the rebalance, each node will have one leader and two 
standbys.</p> 
+  <div class="source"> 
+   <pre><code>./helix-admin.sh --zkSvr localhost:2199 --rebalance MYCLUSTER 
myDB 3
+</code></pre> 
+  </div> 
+ </section> 
+ <section> 
+  <h3 id="View_the_Cluster">View the Cluster</h3> 
+  <p>OK, let's see how it looks:</p> 
+  <div class="source"> 
+   <pre><code>./helix-admin.sh --zkSvr localhost:2199 --listResourceInfo 
MYCLUSTER myDB
+
+IdealState for myDB:
+{
+  "id" : "myDB",
+  "mapFields" : {
+    "myDB_0" : {
+      "localhost_12913" : "STANDBY",
+      "localhost_12914" : "STANDBY",
+      "localhost_12917" : "LEADER"
+    },
+    "myDB_1" : {
+      "localhost_12916" : "STANDBY",
+      "localhost_12917" : "STANDBY",
+      "localhost_12918" : "LEADER"
+    },
+    "myDB_2" : {
+      "localhost_12913" : "LEADER",
+      "localhost_12917" : "STANDBY",
+      "localhost_12918" : "STANDBY"
+    },
+    "myDB_3" : {
+      "localhost_12915" : "LEADER",
+      "localhost_12917" : "STANDBY",
+      "localhost_12918" : "STANDBY"
+    },
+    "myDB_4" : {
+      "localhost_12916" : "LEADER",
+      "localhost_12917" : "STANDBY",
+      "localhost_12918" : "STANDBY"
+    },
+    "myDB_5" : {
+      "localhost_12913" : "STANDBY",
+      "localhost_12914" : "LEADER",
+      "localhost_12915" : "STANDBY"
+    }
+  },
+  "listFields" : {
+    "myDB_0" : [ "localhost_12917", "localhost_12913", "localhost_12914" ],
+    "myDB_1" : [ "localhost_12918", "localhost_12917", "localhost_12916" ],
+    "myDB_2" : [ "localhost_12913", "localhost_12917", "localhost_12918" ],
+    "myDB_3" : [ "localhost_12915", "localhost_12917", "localhost_12918" ],
+    "myDB_4" : [ "localhost_12916", "localhost_12917", "localhost_12918" ],
+    "myDB_5" : [ "localhost_12914", "localhost_12915", "localhost_12913" ]
+  },
+  "simpleFields" : {
+    "IDEAL_STATE_MODE" : "AUTO",
+    "REBALANCE_MODE" : "SEMI_AUTO",
+    "NUM_PARTITIONS" : "6",
+    "REPLICAS" : "3",
+    "STATE_MODEL_DEF_REF" : "LeaderStandby",
+    "STATE_MODEL_FACTORY_NAME" : "DEFAULT"
+  }
+}
+
+ExternalView for myDB:
+{
+  "id" : "myDB",
+  "mapFields" : {
+    "myDB_0" : {
+      "localhost_12913" : "STANDBY",
+      "localhost_12914" : "STANDBY",
+      "localhost_12917" : "LEADER"
+    },
+    "myDB_1" : {
+      "localhost_12916" : "STANDBY",
+      "localhost_12917" : "STANDBY",
+      "localhost_12918" : "LEADER"
+    },
+    "myDB_2" : {
+      "localhost_12913" : "LEADER",
+      "localhost_12917" : "STANDBY",
+      "localhost_12918" : "STANDBY"
+    },
+    "myDB_3" : {
+      "localhost_12915" : "LEADER",
+      "localhost_12917" : "STANDBY",
+      "localhost_12918" : "STANDBY"
+    },
+    "myDB_4" : {
+      "localhost_12916" : "LEADER",
+      "localhost_12917" : "STANDBY",
+      "localhost_12918" : "STANDBY"
+    },
+    "myDB_5" : {
+      "localhost_12913" : "STANDBY",
+      "localhost_12914" : "LEADER",
+      "localhost_12915" : "STANDBY"
+    }
+  },
+  "listFields" : {
+  },
+  "simpleFields" : {
+    "BUCKET_SIZE" : "0"
+  }
+}
+</code></pre> 
+  </div> 
+  <p>Mission accomplished. The partitions are nicely balanced.</p> 
+ </section> 
+ <section> 
+  <h3 id="How_about_Failover.3F">How about Failover?</h3> 
+  <p>Building a fault tolerant system isn't trivial, but with Helix, it's 
easy. Helix detects a failed instance, and triggers leadership transfer 
automatically.</p> 
+  <p>First, let's fail an instance. In this example, we'll kill 
localhost:12918 to simulate a failure.</p> 
+  <p>We lost localhost:12918, so myDB_1 lost its LEADER. Helix can fix that: 
it will transfer leadership to a healthy node that is currently a STANDBY, say 
localhost:12917. Helix balances the load as best as it can, given there are 6 
partitions on 5 nodes. Let's see:</p> 
+  <div class="source"> 
+   <pre><code>./helix-admin.sh --zkSvr localhost:2199 --listResourceInfo 
MYCLUSTER myDB
+
+IdealState for myDB:
+{
+  "id" : "myDB",
+  "mapFields" : {
+    "myDB_0" : {
+      "localhost_12913" : "STANDBY",
+      "localhost_12914" : "STANDBY",
+      "localhost_12917" : "LEADER"
+    },
+    "myDB_1" : {
+      "localhost_12916" : "STANDBY",
+      "localhost_12917" : "STANDBY",
+      "localhost_12918" : "LEADER"
+    },
+    "myDB_2" : {
+      "localhost_12913" : "LEADER",
+      "localhost_12917" : "STANDBY",
+      "localhost_12918" : "STANDBY"
+    },
+    "myDB_3" : {
+      "localhost_12915" : "LEADER",
+      "localhost_12917" : "STANDBY",
+      "localhost_12918" : "STANDBY"
+    },
+    "myDB_4" : {
+      "localhost_12916" : "LEADER",
+      "localhost_12917" : "STANDBY",
+      "localhost_12918" : "STANDBY"
+    },
+    "myDB_5" : {
+      "localhost_12913" : "STANDBY",
+      "localhost_12914" : "LEADER",
+      "localhost_12915" : "STANDBY"
+    }
+  },
+  "listFields" : {
+    "myDB_0" : [ "localhost_12917", "localhost_12913", "localhost_12914" ],
+    "myDB_1" : [ "localhost_12918", "localhost_12917", "localhost_12916" ],
+    "myDB_2" : [ "localhost_12913", "localhost_12918", "localhost_12917" ],
+    "myDB_3" : [ "localhost_12915", "localhost_12918", "localhost_12917" ],
+    "myDB_4" : [ "localhost_12916", "localhost_12917", "localhost_12918" ],
+    "myDB_5" : [ "localhost_12914", "localhost_12915", "localhost_12913" ]
+  },
+  "simpleFields" : {
+    "IDEAL_STATE_MODE" : "AUTO",
+    "REBALANCE_MODE" : "SEMI_AUTO",
+    "NUM_PARTITIONS" : "6",
+    "REPLICAS" : "3",
+    "STATE_MODEL_DEF_REF" : "LeaderStandby",
+    "STATE_MODEL_FACTORY_NAME" : "DEFAULT"
+  }
+}
+
+ExternalView for myDB:
+{
+  "id" : "myDB",
+  "mapFields" : {
+    "myDB_0" : {
+      "localhost_12913" : "STANDBY",
+      "localhost_12914" : "STANDBY",
+      "localhost_12917" : "LEADER"
+    },
+    "myDB_1" : {
+      "localhost_12916" : "STANDBY",
+      "localhost_12917" : "LEADER"
+    },
+    "myDB_2" : {
+      "localhost_12913" : "LEADER",
+      "localhost_12917" : "STANDBY"
+    },
+    "myDB_3" : {
+      "localhost_12915" : "LEADER",
+      "localhost_12917" : "STANDBY"
+    },
+    "myDB_4" : {
+      "localhost_12916" : "LEADER",
+      "localhost_12917" : "STANDBY"
+    },
+    "myDB_5" : {
+      "localhost_12913" : "STANDBY",
+      "localhost_12914" : "LEADER",
+      "localhost_12915" : "STANDBY"
+    }
+  },
+  "listFields" : {
+  },
+  "simpleFields" : {
+    "BUCKET_SIZE" : "0"
+  }
+}
+</code></pre> 
+  </div> 
+  <p>As we've seen in this Quickstart, Helix takes care of partitioning, load 
balancing, elasticity, failure detection and recovery.</p> 
+ </section> 
+ <section> 
+  <h3 id="ZooInspector">ZooInspector</h3> 
+  <p>You can view all of the underlying data by going directly to ZooKeeper. Use 
the ZooInspector tool that comes with ZooKeeper to browse the data. This is a Java 
GUI application (make sure you have X Windows available).</p> 
+  <p>To start zooinspector run the following command from 
&lt;zk_install_directory&gt;/contrib/ZooInspector</p> 
+  <div class="source"> 
+   <pre><code>java -cp 
zookeeper-3.3.3-ZooInspector.jar:lib/jtoaster-1.0.4.jar:../../lib/log4j-1.2.15.jar:../../zookeeper-3.3.3.jar
 org.apache.zookeeper.inspector.ZooInspector
+</code></pre> 
+  </div> 
+ </section> 
+ <section> 
+  <h3 id="Next">Next</h3> 
+  <p>Now that you understand the idea of Helix, read the <a 
href="./Tutorial.html">tutorial</a> to learn how to choose the right state 
model and constraints for your system, and how to implement it. In many cases, 
the built-in features meet your requirements. And best of all, Helix is a 
customizable framework, so you can plug in your own behavior, while retaining 
the automation provided by Helix.</p> 
+ </section> 
+</section>
+                       </div>
+               </div>
+       </div>
+       </div>
+
+       </div><!-- /container -->
+
+       <!-- Footer
+       ================================================== -->
+       <footer class="well">
+               <div class="container">
+                       <div class="row">
+                               <div class="span3 bottom-nav">
+                                       <ul class="nav nav-list">
+                                               <li class="nav-header">Get 
Helix</li>
+                                               <li >
+                                                       <a href="download.html" 
title="Download">Download</a>
+                                               </li>
+                                               <li >
+                                                       <a href="Building.html" 
title="Building">Building</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="releasenotes/release-1.4.3.html" title="Release Notes">Release Notes</a>
+                                               </li>
+                                       </ul>
+                               </div>
+                               <div class="span3 bottom-nav">
+                                       <ul class="nav nav-list">
+                                               <li 
class="nav-header">Hands-On</li>
+                                               <li class="active">
+                                                       <a href="#" 
title="Quick Start">Quick Start</a>
+                                               </li>
+                                               <li >
+                                                       <a href="Tutorial.html" 
title="Tutorial">Tutorial</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="../javadocs/1.4.3" title="Javadocs">Javadocs</a>
+                                               </li>
+                                       </ul>
+                               </div>
+                               <div class="span3 bottom-nav">
+                                       <ul class="nav nav-list">
+                                               <li 
class="nav-header">Recipes</li>
+                                               <li >
+                                                       <a 
href="recipes/lock_manager.html" title="Distributed lock manager">Distributed 
lock manager</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="recipes/rabbitmq_consumer_group.html" title="Rabbit MQ consumer 
group">Rabbit MQ consumer group</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="recipes/rsync_replicated_file_store.html" title="Rsync replicated file 
store">Rsync replicated file store</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="recipes/service_discovery.html" title="Service discovery">Service 
discovery</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="recipes/task_dag_execution.html" title="Distributed task DAG 
execution">Distributed task DAG execution</a>
+                                               </li>
+                                       </ul>
+                               </div>
+                       </div>
+               </div>
+       </footer>
+
+       <div class="container subfooter">
+               <div class="row">
+                       <div class="span12">
+                               <p class="pull-right"><a href="#">Back to 
top</a></p>
+                               <p class="copyright">Copyright &copy;2025 <a 
href="http://www.apache.org">Apache Software Foundation</a>. All Rights 
Reserved.</p>
+                               <p><a 
href="https://github.com/olamy/reflow-maven-skin" title="Reflow Maven 
skin">Reflow Maven skin</a> maintained by <a href="https://twitter.com/olamy" 
target="_blank" title="Olivier Lamy">Olivier Lamy</a>.</p>
+               <div class="row span16"><div>Apache Helix, Apache, the Apache 
feather logo, and the Apache Helix project logos are trademarks of The Apache 
Software Foundation.
+        All other marks mentioned may be trademarks or registered trademarks 
of their respective owners.</div>
+        <a 
href="https://helix.apache.org/1.4.3-docs/privacy-policy.html">Privacy 
Policy</a>
+      </div>
+                       </div>
+               </div>
+       </div>
+
+       <!-- Le javascript
+       ================================================== -->
+       <!-- Placed at the end of the document so the pages load faster -->
+       <script src="./js/jquery.min.js"></script>
+
+       <script src="./js/bootstrap.min.js"></script>
+       <script src="./js/lightbox.min.js"></script>
+       <script src="./js/reflow-scroll.js"></script>
+
+       <script src="./js/reflow-skin.js"></script>
+
+       </body>
+</html>
\ No newline at end of file

Added: helix/site-content/1.4.3-docs/Tutorial.html
URL: 
http://svn.apache.org/viewvc/helix/site-content/1.4.3-docs/Tutorial.html?rev=1923435&view=auto
==============================================================================
--- helix/site-content/1.4.3-docs/Tutorial.html (added)
+++ helix/site-content/1.4.3-docs/Tutorial.html Wed Jan 29 07:13:35 2025
@@ -0,0 +1,442 @@
+
+<!DOCTYPE html>
+
+
+
+
+
+
+<!--
+ Generated by Apache Maven Doxia at 2025-01-28  Rendered using Reflow Maven 
Skin 2.0.0 (https://olamy.github.io/reflow-maven-skin)
+-->
+<html  xml:lang="en" lang="en">
+
+       <head>
+               <meta charset="UTF-8" />
+               <title>Apache Helix &#x2013; Tutorial</title>
+               <meta name="viewport" content="width=device-width, 
initial-scale=1.0" />
+               <meta name="description" content="" />
+               <meta http-equiv="content-language" content="en" />
+
+               <link href="./css/bootstrap.min.css" rel="stylesheet" />
+               <link href="./css/bootstrap-responsive.min.css" 
rel="stylesheet" />
+               <link href="./css/docs.css" rel="stylesheet" />
+               <link href="./css/reflow-skin.css" rel="stylesheet" />
+
+
+               <link href="./css/lightbox.css" rel="stylesheet" />
+
+               <link href="./css/site.css" rel="stylesheet" />
+               <link href="./css/print.css" rel="stylesheet" media="print" />
+
+               <!-- Le HTML5 shim, for IE6-8 support of HTML5 elements -->
+               <!--[if lt IE 9]>
+                       <script src="./js/html5.js"></script>
+               <![endif]-->
+
+
+
+
+
+    
+<!-- Matomo -->
+<script>
+    var _paq = window._paq = window._paq || [];
+                        _paq.push(['disableCookies']);
+                                    _paq.push(['trackPageView']);
+                                    _paq.push(['enableLinkTracking']);
+                    
+    (function() {
+        var u="https://analytics.apache.org";;
+        _paq.push(['setTrackerUrl', u+'/matomo.php']);
+        _paq.push(['setSiteId', '15']);
+        var d=document, g=d.createElement('script'), 
s=d.getElementsByTagName('script')[0];
+        g.async=true; g.src=u+'/matomo.js'; s.parentNode.insertBefore(g,s);
+    })();
+</script>
+<!-- End Matomo Code -->
+       </head>
+
+       <body class="page-tutorial project-143-docs" data-spy="scroll" 
data-offset="60" data-target="#toc-scroll-target">
+
+    
+               <div class="navbar navbar-fixed-top">
+                       <div class="navbar-inner">
+                               <div class="container">
+                                       <a class="btn btn-navbar" 
data-toggle="collapse" data-target="#top-nav-collapse">
+                                               <span class="icon-bar"></span>
+                                               <span class="icon-bar"></span>
+                                               <span class="icon-bar"></span>
+                                       </a>
+                                       <a class="brand" 
href="http://helix.apache.org">Apache Helix</a>
+                                       <div class="nav-collapse collapse" 
id="top-nav-collapse">
+                                               <ul class="nav pull-right">
+                                                       <li ><a 
href="index.html" title="Helix 1.4.3">Helix 1.4.3</a></li>
+                                                       <li class="dropdown">
+                                                               <a href="#" 
class="dropdown-toggle" data-toggle="dropdown">Get Helix <b 
class="caret"></b></a>
+                                                               <ul 
class="dropdown-menu">
+                                                                       <li ><a 
href="download.html" title="Download">Download</a></li>
+                                                                       <li ><a 
href="Building.html" title="Building">Building</a></li>
+                                                                       <li ><a 
href="releasenotes/release-1.4.3.html" title="Release Notes">Release 
Notes</a></li>
+                                                               </ul>
+                                                       </li>
+                                                       <li class="dropdown 
active">
+                                                               <a href="#" 
class="dropdown-toggle" data-toggle="dropdown">Hands-On <b 
class="caret"></b></a>
+                                                               <ul 
class="dropdown-menu">
+                                                                       <li ><a 
href="Quickstart.html" title="Quick Start">Quick Start</a></li>
+                                                                       <li 
class="active"><a href="" title="Tutorial">Tutorial</a></li>
+                                                                       <li ><a 
href="../javadocs/1.4.3" title="Javadocs">Javadocs</a></li>
+                                                               </ul>
+                                                       </li>
+                                                       <li class="dropdown">
+                                                               <a href="#" 
class="dropdown-toggle" data-toggle="dropdown">Recipes <b class="caret"></b></a>
+                                                               <ul 
class="dropdown-menu">
+                                                                       <li ><a 
href="recipes/lock_manager.html" title="Distributed lock manager">Distributed 
lock manager</a></li>
+                                                                       <li ><a 
href="recipes/rabbitmq_consumer_group.html" title="Rabbit MQ consumer 
group">Rabbit MQ consumer group</a></li>
+                                                                       <li ><a 
href="recipes/rsync_replicated_file_store.html" title="Rsync replicated file 
store">Rsync replicated file store</a></li>
+                                                                       <li ><a 
href="recipes/service_discovery.html" title="Service discovery">Service 
discovery</a></li>
+                                                                       <li ><a 
href="recipes/task_dag_execution.html" title="Distributed task DAG 
execution">Distributed task DAG execution</a></li>
+                                                               </ul>
+                                                       </li>
+                                               </ul>
+                                       </div><!--/.nav-collapse -->
+                               </div>
+                       </div>
+               </div>
+
+       <div class="container">
+
+       <!-- Masthead
+       ================================================== -->
+
+       <header>
+       <div class="jumbotron subhead">
+               <div class="row" id="banner">
+                       <div class="span12">
+                               <div class="pull-left">
+                                       <a href="http://helix.apache.org/" 
id="bannerLeft"><img src="../images/helix-logo.jpg" alt="Apache Helix" /></a>
+                                       <p class="lead">A cluster management 
framework for partitioned and replicated distributed resources</p>
+                               </div>
+                               <div class="pull-right">
+                                       <a href="http://www.apache.org/" 
id="bannerRight"><img src="../images/feather_small.gif" alt="Apache Software Foundation" /></a>
+                               </div>
+                       </div>
+               </div>
+       </div>
+               <div>
+                       <ul class="breadcrumb">
+                               <li><a href="../" title="Apache Helix">Apache 
Helix</a></li>
+                               <li class="divider">/</li>
+                               <li><a href="./" title="Release 1.4.3">Release 
1.4.3</a></li>
+                               <li class="divider">/</li>
+                               <li>Tutorial</li>
+                               <li class="publishDate version-date 
pull-right">Last Published: 2025-01-28</li>
+                       </ul>
+               </div>
+       </header>
+
+       <div class="main-body">
+       <div class="row">
+               <div class="span12">
+                       <div class="body-content">
+<!--
+Licensed to the Apache Software Foundation (ASF) under one
+or more contributor license agreements.  See the NOTICE file
+distributed with this work for additional information
+regarding copyright ownership.  The ASF licenses this file
+to you under the Apache License, Version 2.0 (the
+"License"); you may not use this file except in compliance
+with the License.  You may obtain a copy of the License at
+
+  http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing,
+software distributed under the License is distributed on an
+"AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+KIND, either express or implied.  See the License for the
+specific language governing permissions and limitations
+under the License.
+--> 
+<div class="page-header">
+ <h1>Helix Tutorial</h1>
+</div> 
+<p>In this tutorial, we will cover the roles of a Helix-managed cluster, and 
show the code you need to write to integrate with it. In many cases, there is a 
simple default behavior that is often appropriate, but you can also customize 
the behavior.</p> 
+<p>Convention: we first cover the <i>basic</i> approach, which is the easiest 
to implement. Then, we'll describe <i>advanced</i> options, which give you more 
control over the system behavior, but require you to write more code.</p> 
+<section> 
+ <section> 
+  <h3 id="Prerequisites">Prerequisites</h3> 
+  <ol style="list-style-type: decimal"> 
+   <li>Read <a href="../Concepts.html">Concepts/Terminology</a> and <a 
href="../Architecture.html">Architecture</a></li> 
+   <li>Read the <a href="./Quickstart.html">Quickstart guide</a> to learn how 
Helix models and manages a cluster</li> 
+   <li>Install Helix source. See: <a href="./Quickstart.html">Quickstart</a> 
for the steps.</li> 
+  </ol> 
+ </section> 
+ <section> 
+  <h3 id="Tutorial_Outline">Tutorial Outline</h3> 
+  <ol style="list-style-type: decimal"> 
+   <li><a href="./tutorial_participant.html">Participant</a></li> 
+   <li><a href="./tutorial_spectator.html">Spectator</a></li> 
+   <li><a href="./tutorial_controller.html">Controller</a></li> 
+   <li><a href="./tutorial_rebalance.html">Rebalancing Algorithms</a></li> 
+   <li><a href="./tutorial_user_def_rebalancer.html">User-Defined 
Rebalancing</a></li> 
+   <li><a href="./tutorial_state.html">State Machines</a></li> 
+   <li><a href="./tutorial_messaging.html">Messaging</a></li> 
+   <li><a href="./tutorial_health.html">Customized health check</a></li> 
+   <li><a href="./tutorial_throttling.html">Throttling</a></li> 
+   <li><a href="./tutorial_propstore.html">Application Property Store</a></li> 
+   <li><a href="./tutorial_admin.html">Admin Interface</a></li> 
+   <li><a href="./tutorial_yaml.html">YAML Cluster Setup</a></li> 
+   <li><a href="./tutorial_agent.html">Helix Agent (for non-JVM 
systems)</a></li> 
+   <li><a href="./tutorial_task_framework.html">Task Framework</a> 
+    <ol style="list-style-type: decimal"> 
+     <li><a href="./tutorial_user_content_store.html">Task with User Defined 
Content Store</a></li> 
+     <li><a href="./tutorial_task_throttling.html">Task Throttling</a></li> 
+     <li><a href="./quota_scheduling.html">Quota-based Scheduling</a></li> 
+    </ol> </li> 
+   <li><a href="./tutorial_rest_service.html">Helix REST Service 2.0</a></li> 
+   <li><a href="./tutorial_ui.html">Helix UI Setup</a></li> 
+   <li><a href="./tutorial_customized_view.html">Helix Customized 
View</a></li> 
+   <li><a href="./tutorial_cloud_support.html">Helix Cloud Support</a></li> 
+   <li><a href="./tutorial_distributed_lock.html">Helix Distributed 
Lock</a></li> 
+  </ol> 
+ </section> 
+ <section> 
+  <h3 id="Preliminaries">Preliminaries</h3> 
+  <p>First, we need to set up the system. Let's walk through the steps in 
building a distributed system using Helix.</p> 
+  <section> 
+   <h4 id="Start_ZooKeeper">Start ZooKeeper</h4> 
+   <p>This starts a ZooKeeper server in standalone mode. For production deployment, 
see <a class="externalLink" href="http://zookeeper.apache.org">Apache 
ZooKeeper</a> for instructions.</p> 
+   <div class="source"> 
+    <pre><code>./start-standalone-zookeeper.sh 2199 &amp;
+</code></pre> 
+   </div> 
+  </section> 
+  <section> 
+   <h4 id="Create_a_Cluster">Create a Cluster</h4> 
+   <p>Creating a cluster will define the cluster in appropriate znodes on 
ZooKeeper.</p> 
+   <p>Using the Java API:</p> 
+   <div class="source"> 
+    <pre><code>// Create setup tool instance
+// Note: ZK_ADDRESS is the host:port of Zookeeper
+String ZK_ADDRESS = "localhost:2199";
+admin = new ZKHelixAdmin(ZK_ADDRESS);
+
+String CLUSTER_NAME = "helix-demo";
+//Create cluster namespace in zookeeper
+admin.addCluster(CLUSTER_NAME);
+</code></pre> 
+   </div> 
+   <p>OR</p> 
+   <p>Using the command-line interface:</p> 
+   <div class="source"> 
+    <pre><code>./helix-admin.sh --zkSvr localhost:2199 --addCluster helix-demo
+</code></pre> 
+   </div> 
+  </section> 
+  <section> 
+   <h4 id="Configure_the_Nodes_of_the_Cluster">Configure the Nodes of the 
Cluster</h4> 
+   <p>First we'll add new nodes to the cluster, then configure the nodes in 
the cluster. Each node in the cluster must be uniquely identifiable. The most 
commonly used convention is hostname:port.</p> 
+   <div class="source"> 
+    <pre><code>String CLUSTER_NAME = "helix-demo";
+int NUM_NODES = 2;
+String hosts[] = new String[]{"localhost","localhost"};
+String ports[] = new String[]{"7000","7001"};
+for (int i = 0; i &lt; NUM_NODES; i++)
+{
+  InstanceConfig instanceConfig = new InstanceConfig(hosts[i]+ "_" + ports[i]);
+  instanceConfig.setHostName(hosts[i]);
+  instanceConfig.setPort(ports[i]);
+  instanceConfig.setInstanceEnabled(true);
+
+  //Add additional system specific configuration if needed. These can be 
accessed during the node start up.
+  instanceConfig.getRecord().setSimpleField("key", "value");
+  admin.addInstance(CLUSTER_NAME, instanceConfig);
+}
+</code></pre> 
+   </div> 
+  </section> 
+  <section> 
+   <h4 id="Configure_the_Resource">Configure the Resource</h4> 
+   <p>A <b>resource</b> represents the actual task performed by the nodes. It 
can be a database, index, topic, queue or any other processing entity. A 
resource can be divided into many sub-parts known as <b>partitions</b>.</p> 
+   <section> 
+    <h5 id="Define_the_State_Model_and_Constraints">Define the State Model and 
Constraints</h5> 
+    <p>For scalability and fault tolerance, each partition can have one or 
more replicas. The <b>state model</b> allows one to declare the system behavior 
by first enumerating the various STATES, and the TRANSITIONS between them. A 
simple model is ONLINE-OFFLINE where ONLINE means the task is active and 
OFFLINE means it's not active. You can also specify how many replicas must be 
in each state; these are known as <b>constraints</b>. For example, in a search 
system, one might need more than one node serving the same index to handle the 
load.</p> 
+    <p>The allowed states:</p> 
+    <ul> 
+     <li>LEADER</li> 
+     <li>STANDBY</li> 
+     <li>OFFLINE</li> 
+    </ul> 
+    <p>The allowed transitions:</p> 
+    <ul> 
+     <li>OFFLINE to STANDBY</li> 
+     <li>STANDBY to OFFLINE</li> 
+     <li>STANDBY to LEADER</li> 
+     <li>LEADER to STANDBY</li> 
+    </ul> 
+    <p>The constraints:</p> 
+    <ul> 
+     <li>no more than 1 LEADER per partition</li> 
+     <li>the rest of the replicas should be STANDBYs</li> 
+    </ul> 
+    <p>The following snippet shows how to declare the state model and 
constraints for the LEADER-STANDBY model.</p> 
+    <div class="source"> 
+     <pre><code>String STATE_MODEL_NAME = "LeaderStandby";
+StateModelDefinition.Builder builder = new 
StateModelDefinition.Builder(STATE_MODEL_NAME);
+// Define your own states: those are opaque strings to Helix
+// Only the topology of the state machine (initial state, transitions, 
priorities, final DROPPED state) is meaningful to Helix
+String LEADER = "LEADER";
+String STANDBY = "STANDBY";
+String OFFLINE = "OFFLINE";
+
+// Add states and their rank to indicate priority. A lower rank corresponds to 
a higher priority
+builder.addState(LEADER, 1);
+builder.addState(STANDBY, 2);
+builder.addState(OFFLINE);
+// Note the special inclusion of the DROPPED state (REQUIRED)
+builder.addState(HelixDefinedState.DROPPED.name());
+
+// Set the initial state when the node starts
+builder.initialState(OFFLINE);
+
+// Add transitions between the states.
+builder.addTransition(OFFLINE, STANDBY);
+builder.addTransition(STANDBY, OFFLINE);
+builder.addTransition(STANDBY, LEADER);
+builder.addTransition(LEADER, STANDBY);
+
+// There must be a path to DROPPED from each state (REQUIRED)
+builder.addTransition(OFFLINE, HelixDefinedState.DROPPED.name());
+
+// set constraints on states
+
+// static constraint: upper bound of 1 LEADER
+builder.upperBound(LEADER, 1);
+
+// dynamic constraint: R means it should be derived based on the replication 
factor for the cluster
+// this allows a different replication factor for each resource without
+// having to define a new state model
+
+builder.dynamicUpperBound(STANDBY, "R");
+
+StateModelDefinition myStateModel = builder.build();
+admin.addStateModelDef(CLUSTER_NAME, STATE_MODEL_NAME, myStateModel);
+</code></pre> 
+    </div> 
+   </section> 
+   <section> 
+    <h5 id="Assigning_Partitions_to_Nodes">Assigning Partitions to Nodes</h5> 
+    <p>The final goal of Helix is to ensure that the constraints on the state 
model are satisfied. Helix does this by assigning a <b>state</b> to a partition 
(such as LEADER, STANDBY), and placing it on a particular node.</p> 
+    <p>There are 3 assignment modes Helix can operate in:</p> 
+    <ul> 
+     <li>FULL_AUTO: Helix decides the placement and state of a partition.</li> 
+     <li>SEMI_AUTO: Application decides the placement but Helix decides the 
state of a partition.</li> 
+     <li>CUSTOMIZED: Application controls the placement and state of a 
partition.</li> 
+    </ul> 
+    <p>For more information on the assignment modes, see the <a 
href="./tutorial_rebalance.html">Rebalancing Algorithms</a> section of this 
tutorial.</p> 
+    <div class="source"> 
+     <pre><code>String RESOURCE_NAME = "MyDB";
+int NUM_PARTITIONS = 6;
+String STATE_MODEL_NAME = "LeaderStandby";
+String MODE = "SEMI_AUTO";
+int NUM_REPLICAS = 2;
+
+admin.addResource(CLUSTER_NAME, RESOURCE_NAME, NUM_PARTITIONS, 
STATE_MODEL_NAME, MODE);
+admin.rebalance(CLUSTER_NAME, RESOURCE_NAME, NUM_REPLICAS);
+</code></pre> 
+    </div> 
+   </section> 
+  </section> 
+ </section> 
+</section>
+                       </div>
+               </div>
+       </div>
+       </div>
+
+       </div><!-- /container -->
+
+       <!-- Footer
+       ================================================== -->
+       <footer class="well">
+               <div class="container">
+                       <div class="row">
+                               <div class="span3 bottom-nav">
+                                       <ul class="nav nav-list">
+                                               <li class="nav-header">Get 
Helix</li>
+                                               <li >
+                                                       <a href="download.html" 
title="Download">Download</a>
+                                               </li>
+                                               <li >
+                                                       <a href="Building.html" 
title="Building">Building</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="releasenotes/release-1.4.3.html" title="Release Notes">Release Notes</a>
+                                               </li>
+                                       </ul>
+                               </div>
+                               <div class="span3 bottom-nav">
+                                       <ul class="nav nav-list">
+                                               <li 
class="nav-header">Hands-On</li>
+                                               <li >
+                                                       <a 
href="Quickstart.html" title="Quick Start">Quick Start</a>
+                                               </li>
+                                               <li class="active">
+                                                       <a href="#" 
title="Tutorial">Tutorial</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="../javadocs/1.4.3" title="Javadocs">Javadocs</a>
+                                               </li>
+                                       </ul>
+                               </div>
+                               <div class="span3 bottom-nav">
+                                       <ul class="nav nav-list">
+                                               <li 
class="nav-header">Recipes</li>
+                                               <li >
+                                                       <a 
href="recipes/lock_manager.html" title="Distributed lock manager">Distributed 
lock manager</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="recipes/rabbitmq_consumer_group.html" title="Rabbit MQ consumer 
group">Rabbit MQ consumer group</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="recipes/rsync_replicated_file_store.html" title="Rsync replicated file 
store">Rsync replicated file store</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="recipes/service_discovery.html" title="Service discovery">Service 
discovery</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="recipes/task_dag_execution.html" title="Distributed task DAG 
execution">Distributed task DAG execution</a>
+                                               </li>
+                                       </ul>
+                               </div>
+                       </div>
+               </div>
+       </footer>
+
+       <div class="container subfooter">
+               <div class="row">
+                       <div class="span12">
+                               <p class="pull-right"><a href="#">Back to 
top</a></p>
+                               <p class="copyright">Copyright &copy;2025 <a 
href="http://www.apache.org">Apache Software Foundation</a>. All Rights 
Reserved.</p>
+                               <p><a 
href="https://github.com/olamy/reflow-maven-skin" title="Reflow Maven 
skin">Reflow Maven skin</a> maintained by <a href="https://twitter.com/olamy" 
target="_blank" title="Olivier Lamy">Olivier Lamy</a>.</p>
+               <div class="row span16"><div>Apache Helix, Apache, the Apache 
feather logo, and the Apache Helix project logos are trademarks of The Apache 
Software Foundation.
+        All other marks mentioned may be trademarks or registered trademarks 
of their respective owners.</div>
+        <a 
href="https://helix.apache.org/1.4.3-docs/privacy-policy.html">Privacy 
Policy</a>
+      </div>
+                       </div>
+               </div>
+       </div>
+
+       <!-- Le javascript
+       ================================================== -->
+       <!-- Placed at the end of the document so the pages load faster -->
+       <script src="./js/jquery.min.js"></script>
+
+       <script src="./js/bootstrap.min.js"></script>
+       <script src="./js/lightbox.min.js"></script>
+       <script src="./js/reflow-scroll.js"></script>
+
+       <script src="./js/reflow-skin.js"></script>
+
+       </body>
+</html>
\ No newline at end of file

Added: helix/site-content/1.4.3-docs/WorkflowExample.json
URL: 
http://svn.apache.org/viewvc/helix/site-content/1.4.3-docs/WorkflowExample.json?rev=1923435&view=auto
==============================================================================
--- helix/site-content/1.4.3-docs/WorkflowExample.json (added)
+++ helix/site-content/1.4.3-docs/WorkflowExample.json Wed Jan 29 07:13:35 2025
@@ -0,0 +1,46 @@
+{"id":"Workflow1",
+ "WorkflowConfig":{
+    "id":"Workflow1",
+    "Expiry":"43200000",
+    "FailureThreshold":"0",
+    "IsJobQueue":"true",
+    "TargetState":"START",
+    "Terminable":"false",
+    "capacity":"500"
+ },
+ "Jobs":[
+         {
+          "id" : "Job1",
+          "simpleFields": {
+              "JobID":"Job1",
+              "WorkflowID" : "Workflow1"
+          },
+          "mapFields":{
+              "Task1" : {
+                   "TASK_ID" : "Task1",
+                   "TASK_COMMAND" : "Backup",
+                   "TASK_TARGET_PARTITION" : "p1"
+               },
+               "Task2" : {
+                   "TASK_ID" : "Task2",
+                   "TASK_COMMAND" : "ReIndex"
+               }
+           },
+           "listFields":{}
+         },
+         {
+           "id":"Job2",
+           "Command":"Cleanup",
+           "TargetResource":"DB2"
+         },
+         {
+           "id":"Job3",
+           "Command":"Backup",
+           "TargetResource":"DB3"
+        }
+  ],
+  "ParentJobs":{
+      "Job1":["Job2","Job3"],
+      "Job2":["Job3"]
+  }
+}
\ No newline at end of file

Added: helix/site-content/1.4.3-docs/auto_exit_maintenance.html
URL: 
http://svn.apache.org/viewvc/helix/site-content/1.4.3-docs/auto_exit_maintenance.html?rev=1923435&view=auto
==============================================================================
--- helix/site-content/1.4.3-docs/auto_exit_maintenance.html (added)
+++ helix/site-content/1.4.3-docs/auto_exit_maintenance.html Wed Jan 29 
07:13:35 2025
@@ -0,0 +1,398 @@
+
+<!DOCTYPE html>
+
+
+
+
+
+
+<!--
+ Generated by Apache Maven Doxia at 2025-01-28  Rendered using Reflow Maven 
Skin 2.0.0 (https://olamy.github.io/reflow-maven-skin)
+-->
+<html  xml:lang="en" lang="en">
+
+       <head>
+               <meta charset="UTF-8" />
+               <title>Apache Helix &#x2013; Auto-exit of Maintenance 
Mode</title>
+               <meta name="viewport" content="width=device-width, 
initial-scale=1.0" />
+               <meta name="description" content="" />
+               <meta http-equiv="content-language" content="en" />
+
+               <link href="./css/bootstrap.min.css" rel="stylesheet" />
+               <link href="./css/bootstrap-responsive.min.css" 
rel="stylesheet" />
+               <link href="./css/docs.css" rel="stylesheet" />
+               <link href="./css/reflow-skin.css" rel="stylesheet" />
+
+
+               <link href="./css/lightbox.css" rel="stylesheet" />
+
+               <link href="./css/site.css" rel="stylesheet" />
+               <link href="./css/print.css" rel="stylesheet" media="print" />
+
+               <!-- Le HTML5 shim, for IE6-8 support of HTML5 elements -->
+               <!--[if lt IE 9]>
+                       <script src="./js/html5.js"></script>
+               <![endif]-->
+
+
+
+
+
+    
+<!-- Matomo -->
+<script>
+    var _paq = window._paq = window._paq || [];
+                        _paq.push(['disableCookies']);
+                                    _paq.push(['trackPageView']);
+                                    _paq.push(['enableLinkTracking']);
+                    
+    (function() {
+        var u="https://analytics.apache.org";
+        _paq.push(['setTrackerUrl', u+'/matomo.php']);
+        _paq.push(['setSiteId', '15']);
+        var d=document, g=d.createElement('script'), 
s=d.getElementsByTagName('script')[0];
+        g.async=true; g.src=u+'/matomo.js'; s.parentNode.insertBefore(g,s);
+    })();
+</script>
+<!-- End Matomo Code -->
+       </head>
+
+       <body class="page-auto_exit_maintenance project-143-docs" 
data-spy="scroll" data-offset="60" data-target="#toc-scroll-target">
+
+    
+               <div class="navbar navbar-fixed-top">
+                       <div class="navbar-inner">
+                               <div class="container">
+                                       <a class="btn btn-navbar" 
data-toggle="collapse" data-target="#top-nav-collapse">
+                                               <span class="icon-bar"></span>
+                                               <span class="icon-bar"></span>
+                                               <span class="icon-bar"></span>
+                                       </a>
+                                       <a class="brand" 
href="http://helix.apache.org">Apache Helix</a>
+                                       <div class="nav-collapse collapse" 
id="top-nav-collapse">
+                                               <ul class="nav pull-right">
+                                                       <li ><a 
href="index.html" title="Helix 1.4.3">Helix 1.4.3</a></li>
+                                                       <li class="dropdown">
+                                                               <a href="#" 
class="dropdown-toggle" data-toggle="dropdown">Get Helix <b 
class="caret"></b></a>
+                                                               <ul 
class="dropdown-menu">
+                                                                       <li ><a 
href="download.html" title="Download">Download</a></li>
+                                                                       <li ><a 
href="Building.html" title="Building">Building</a></li>
+                                                                       <li ><a 
href="releasenotes/release-1.4.3.html" title="Release Notes">Release 
Notes</a></li>
+                                                               </ul>
+                                                       </li>
+                                                       <li class="dropdown">
+                                                               <a href="#" 
class="dropdown-toggle" data-toggle="dropdown">Hands-On <b 
class="caret"></b></a>
+                                                               <ul 
class="dropdown-menu">
+                                                                       <li ><a 
href="Quickstart.html" title="Quick Start">Quick Start</a></li>
+                                                                       <li ><a 
href="Tutorial.html" title="Tutorial">Tutorial</a></li>
+                                                                       <li ><a 
href="../javadocs/1.4.3" title="Javadocs">Javadocs</a></li>
+                                                               </ul>
+                                                       </li>
+                                                       <li class="dropdown">
+                                                               <a href="#" 
class="dropdown-toggle" data-toggle="dropdown">Recipes <b class="caret"></b></a>
+                                                               <ul 
class="dropdown-menu">
+                                                                       <li ><a 
href="recipes/lock_manager.html" title="Distributed lock manager">Distributed 
lock manager</a></li>
+                                                                       <li ><a 
href="recipes/rabbitmq_consumer_group.html" title="Rabbit MQ consumer 
group">Rabbit MQ consumer group</a></li>
+                                                                       <li ><a 
href="recipes/rsync_replicated_file_store.html" title="Rsync replicated file 
store">Rsync replicated file store</a></li>
+                                                                       <li ><a 
href="recipes/service_discovery.html" title="Service discovery">Service 
discovery</a></li>
+                                                                       <li ><a 
href="recipes/task_dag_execution.html" title="Distributed task DAG 
execution">Distributed task DAG execution</a></li>
+                                                               </ul>
+                                                       </li>
+                                               </ul>
+                                       </div><!--/.nav-collapse -->
+                               </div>
+                       </div>
+               </div>
+
+       <div class="container">
+
+       <!-- Masthead
+       ================================================== -->
+
+       <header>
+       <div class="jumbotron subhead">
+               <div class="row" id="banner">
+                       <div class="span12">
+                               <div class="pull-left">
+                                       <a href="http://helix.apache.org/" 
id="bannerLeft"><img src="../images/helix-logo.jpg" alt="Apache Helix" /></a>
+                                       <p class="lead">A cluster management 
framework for partitioned and replicated distributed resources</p>
+                               </div>
+                               <div class="pull-right">
+                                       <a href="http://www.apache.org/" 
id="bannerRight"><img src="../images/feather_small.gif" alt="Apache Software Foundation" /></a>
+                               </div>
+                       </div>
+               </div>
+       </div>
+               <div>
+                       <ul class="breadcrumb">
+                               <li><a href="../" title="Apache Helix">Apache 
Helix</a></li>
+                               <li class="divider">/</li>
+                               <li><a href="./" title="Release 1.4.3">Release 
1.4.3</a></li>
+                               <li class="divider">/</li>
+                               <li>Auto-exit of Maintenance Mode</li>
+                               <li class="publishDate version-date 
pull-right">Last Published: 2025-01-28</li>
+                       </ul>
+               </div>
+       </header>
+
+       <div class="main-body">
+       <div class="row">
+               <div class="span12">
+                       <div class="body-content">
+<!--
+Licensed to the Apache Software Foundation (ASF) under one
+or more contributor license agreements.  See the NOTICE file
+distributed with this work for additional information
+regarding copyright ownership.  The ASF licenses this file
+to you under the Apache License, Version 2.0 (the
+"License"); you may not use this file except in compliance
+with the License.  You may obtain a copy of the License at
+
+  http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing,
+software distributed under the License is distributed on an
+"AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+KIND, either express or implied.  See the License for the
+specific language governing permissions and limitations
+under the License.
+--> 
+<div class="page-header">
+ <h1>Auto-exit of Maintenance Mode</h1>
+</div> 
+<section> 
+ <h2 id="Introduction">Introduction</h2> 
+ <p>Auto-exit of maintenance mode is a feature addition to Helix. It concerns 
a feature that allows clusters to switch out of maintenance mode automatically 
to save operational costs and to improve availability.</p> 
+</section> 
+<section> 
+ <h2 id="Background">Background</h2> 
+ <section> 
+  <h3 id="Maintenance_Mode">Maintenance Mode</h3> 
+  <p>The maintenance mode in Helix refers to a Helix cluster state where the 
Helix Controller will not trigger any type of rebalance. In short, if a cluster 
is in maintenance, the Controller will not bootstrap any new partitions. 
However, this does not mean that there won't be any (upward) state transitions. 
For example, partitions missing a top-state (e.g. <b>MASTER/LEADER</b>) replica 
will get a state transition in order to fill in the void for a top-state 
replica.</p> 
+  <section> 
+   <h4 id="Possible_Scenarios">Possible Scenarios</h4> 
+   <p>There are two possible conditions under which a cluster will go into 
maintenance mode automatically.</p> 
+   <ol style="list-style-type: decimal"> 
+    <li>There are more offline/disabled instances than ClusterConfig's 
<b>MAX_OFFLINE_INSTANCES_ALLOWED</b>.</li> 
+    <li>There exist instances that have more partitions than ClusterConfig's 
<b>MAX_PARTITIONS_PER_INSTANCE</b>.</li> 
+   </ol> 
+   <p>Difficulty in Manually Exiting Maintenance Mode</p> 
+   <p>Maintenance mode has been designed to prevent a large-scale 
reshuffling of replicas when there are intermittent, transient Participant 
connection issues. However, when in maintenance, no new partitions will be 
bootstrapped, which will block many native operations such as creation of stores/DBs. 
Currently, in order to unblock, an operator must manually disable maintenance 
mode via Helix REST API. Since it's difficult to predict when temporary 
disconnects will happen, it has been a challenge to address them in a prompt 
manner.</p> 
+  </section> 
+ </section> 
+</section> 
+<section> 
+ <h2 id="Problem_Statement">Problem Statement</h2> 
+ <p>Currently, once clusters enter maintenance mode automatically, exiting 
must be done manually. This is an added human effort. We want a feature to 
automate this to reduce downtime and increase availability.</p> 
+</section> 
+<section> 
+ <h2 id="Architecture.2FImplementation">Architecture/Implementation</h2> 
+ <section> 
+  <h3 id="Maintenance_Recovery_Threshold">Maintenance Recovery Threshold</h3> 
+  <p>Recall that there are two cases in which a cluster may enter maintenance 
mode automatically:</p> 
+  <blockquote> 
+   <ol style="list-style-type: decimal"> 
+    <li>There are more offline/disabled instances than ClusterConfig's 
MAX_OFFLINE_INSTANCES_ALLOWED.</li> 
+    <li>There exist instances that have more partitions than ClusterConfig's 
MAX_PARTITIONS_PER_INSTANCE.</li> 
+   </ol> 
+  </blockquote> 
+  <p>It is important to note that we are mainly concerned with Case 1. Case 2 
is meant to be a sanity check against Helix's CRUSH-ed rebalance algorithm, and 
this has little to do with the original motivation behind cluster maintenance 
mode. So, although we will <i>still</i> check against Case 2 when determining 
whether it is safe to exit maintenance mode, we will only address Case 1 in 
this section.</p> 
+  <p>With that said, it is not hard to imagine a cluster in production 
experiencing a flip-flop behavior around the exact value of <b>ClusterConfig's 
MAX_OFFLINE_INSTANCES_ALLOWED</b> field. Such behavior is undesirable and may 
defeat the purpose of using this feature. One way to mitigate it in the design is to have a 
separate, <i>more strict</i> threshold for recovering out of maintenance mode. 
We therefore propose to add a new field, <b>MAINTENANCE_RECOVERY_THRESHOLD</b>. 
<b>MAINTENANCE_RECOVERY_THRESHOLD</b> will be defined by the user and hold a 
more conservative value than <b>MAX_OFFLINE_INSTANCES_ALLOWED</b> to allow for 
some wiggle room in deciding what value is enough to call a cluster 
“<i>sufficiently recovered</i>”. Additionally, we will also give users the 
flexibility to <i>“opt-out”</i> of the auto-exit feature by treating a 
<b>MAINTENANCE_RECOVERY_THRESHOLD</b> value of -1 as a disable signal.</p> 
+  <p>In short,</p> 
+  <ul> 
+   <li>If NumOfflineDisabledInstances &lt; 
NUM_OFFLINE_INSTANCES_FOR_AUTO_EXIT, exit maintenance mode</li> 
+   <li>NUM_OFFLINE_INSTANCES_FOR_AUTO_EXIT &lt;= 
MAX_OFFLINE_INSTANCES_ALLOWED</li> 
+   <li>NUM_OFFLINE_INSTANCES_FOR_AUTO_EXIT &lt; 0 or not set → Opt-out of 
auto-exiting of maintenance mode</li> 
+  </ul> 
+ </section> 
+ <section> 
+  <h3 id="Additional_Fields_in_MaintenanceSignal">Additional Fields in 
MaintenanceSignal</h3> 
+  <p>Currently, Helix stores the maintenance signal in 
/{CLUSTER_NAME}/CONTROLLER/MAINTENANCE. A sample maintenance signal ZNode will 
look like the following:</p> 
+  <div class="source"> 
+   <pre><code class="language-json">{
+  "id" : "maintenance",
+  "simpleFields" : {
+    "REASON" : "Offline Instances count 5 greater than allowed count 4. Stop 
rebalance and put the cluster 
CLUSTER_TestClusterInMaintenanceModeWhenReachingOfflineInstancesLimit into 
maintenance mode.",
+    "TRIGGERED_BY" : "CONTROLLER",
+    "TIMESTAMP" : "12312838831***",
+    // The following are sample user-defined fields from the REST call payload 
//
+    "id" : "hulee",
+    "jira" : "HELIX-123",
+    "cluster" : "testCluster"
+  },
+  "listFields" : {
+  },
+  "mapFields" : {
+  }
+}
+</code></pre> 
+  </div> 
+  <p>A simpleField will be newly added (notice the “<b>TRIGGERED_BY</b>” 
field) to denote whether the current maintenance signal has been generated 
automatically by the Controller. There will initially be <b>two</b> possible 
entries for this field:</p> 
+  <ul> 
+   <li><b>CONTROLLER</b></li> 
+   <li><b>USER</b></li> 
+  </ul> 
+  <p>Also, the TIMESTAMP field will be added so that the value could be 
retrieved via REST.</p> 
+  <p>In addition, we will allow addition of custom fields in simpleFields. See 
the example above. Users will be able to add these fields by using the REST 
endpoints that will be provided when <b>enabling</b> the maintenance mode. Note 
that when disabling maintenance mode, these fields will no longer be available 
because disabling maintenance mode will remove the maintenance signal 
altogether.</p> 
+ </section> 
+ <section> 
+  <h3 id="Recording_Maintenance_History">Recording Maintenance History</h3> 
+  <p>Currently, Helix maintains the controller history in the 
/{clusterName}/CONTROLLER/HISTORY ZNode. We plan to add a history for 
maintenance mode. This way, users will be able to access the history in 
ZooKeeper directly, or utilize the REST endpoint for viewing. The format will 
be in a human-readable format like the following (this is how Helix maintains 
the Controller leader history):</p> 
+  <div class="source"> 
+   <pre><code class="language-java">long currentTime = 
System.currentTimeMillis();
+DateFormat df = new SimpleDateFormat("yyyy-MM-dd-HH:mm:ss");
+df.setTimeZone(TimeZone.getTimeZone("UTC"));
+String dateTime = df.format(new Date(currentTime));
+</code></pre> 
+  </div> 
+  <p>Note that Helix only records the <i>10 most recent</i> changes in the HISTORY 
ZNode. We will follow a similar protocol for persisting maintenance 
mode-related history. Note that <b>all changes around maintenance mode will be 
recorded</b> (both entering and exiting of the mode).</p> 
+ </section> 
+ <section> 
+  <h3 id="Backward_Compatibility">Backward Compatibility</h3> 
+  <p>Old versions of Helix Controllers will not refer to the newly-added 
fields, in which case they will simply lack the auto-exit functionality.</p> 
+ </section> 
+ <section> 
+  <h3 id="Asynchronous_Processing">Asynchronous Processing</h3> 
+  <p>Note that in order for a cluster to exit maintenance mode, the Controller 
must check against <i>all conditions</i> that are outlined above. That is, it 
needs to make sure <b>1) the total count of offline/disabled instances is less 
than the threshold and that 2) there are no instances with more partitions than 
the threshold</b>. Checking against Condition 2 requires traversing all 
resources' states, which could be costly in clusters of large scale. From this, 
we potentially risk adding a significant latency to the pipeline, which is 
undesirable because it could cause problems regarding availability (for 
example, longer pipeline runs may exacerbate the rate at which ZooKeeper Event 
Callbacks accumulate. Helix currently deals with a large number of ZK Event 
Callbacks by re-booting the Controller, which could nick Helix's as well as 
applications' availability numbers).</p> 
+  <p>For this reason, we will make the checks happen asynchronously. 
Additional tweaks may be required to ensure that the maintenance signal is 
cached appropriately through each run of the pipeline to avoid the race 
condition.</p> 
+ </section> 
+ <section> 
+  <h3 id="Periodic_Check_on_Cluster_Recovery_Status">Periodic Check on Cluster 
Recovery Status</h3> 
+  <p>Auto-exit is inherently triggered as part of Helix's rebalance pipeline; 
that is, if there is no rebalance triggered, there wouldn't be any auto-exits 
triggered either. In theory, this is a non-issue because whether a cluster goes 
into or recovers out of maintenance mode is determined by changes around 
LiveInstances, and a LiveInstance change is an event that triggers Helix's 
rebalance pipeline.</p> 
+  <p>Regardless, there have been anecdotal reports where such events seemed to 
have been “swallowed” or “disappeared” - if that is true for any reason 
(mostly a ZK callback queue issue), one way to mitigate it is to enable 
periodically-triggered rebalances. Note that this is actually a feature 
<i>already supported</i> by Helix.</p> 
+ </section> 
+</section> 
+<section> 
+ <h2 id="How_to_Use_the_Auto-Exit_Feature">How to Use the Auto-Exit 
Feature</h2> 
+ <section> 
+  <h3 id="Why_Use_Auto-Exit">Why Use Auto-Exit</h3> 
+  <p>Helix is used to manage resources in distributed clusters; therefore, it 
inevitably gets to have hundreds of instances. With so many clusters and 
traffic to the ZooKeeper, Helix's metadata store, there are cases in which some 
Participants in the cluster experience transient connection failure, which may 
cause Helix to respond to each little change that happens to the cluster. For 
users of stateful systems, this may be undesirable, so they opt to set a config 
for entering maintenance mode automatically. Maintenance mode is a temporary 
mode that the cluster can enter in order to ensure that there are no 
bootstrapping state transitions on instances.</p> 
+  <p>However, no bootstrapping state transitions could mean that some 
operations such as addition of resources would be halted, which causes periods 
of unavailability. It was the cluster operator's responsibility to determine 
whether the given cluster has recovered sufficiently to exit maintenance 
mode. The auto-exit feature removes such overhead.</p> 
+ </section> 
+ <section> 
+  <h3 id="Guide">Guide</h3> 
+  <p>First, we encourage all users of this feature to understand Helix's 
workflow below:</p> 
+  <p><img src="./images/auto-exit-maintenance.jpg" alt="Intro"></p> 
+  <p>In order to use this feature, you'd need to set the following config 
parameters in your cluster's ClusterConfig.</p> 
+  <section> 
+   <h4 id="Auto-enter_maintenance_mode">Auto-enter maintenance mode</h4> 
+   <p><b>MAX_OFFLINE_INSTANCES_ALLOWED</b>: the number of offline and disabled 
instances allowed before the cluster automatically enters maintenance mode.</p> 
+   <p><b>MAX_PARTITIONS_PER_INSTANCE</b>: the number of partitions on any 
given instance, where, if any instance in the cluster happens to have more 
partitions than this number, the cluster automatically enters maintenance 
mode</p> 
+  </section> 
+  <section> 
+   <h4 id="Auto-exit_maintenance_mode">Auto-exit maintenance mode</h4> 
+   <p><b>NUM_OFFLINE_INSTANCES_FOR_AUTO_EXIT</b>: set this value to allow your 
cluster to auto-exit when the number of offline and disabled instances is at 
this value. Note that this value must be less than 
MAX_OFFLINE_INSTANCES_ALLOWED (Read the design above on why). Note that the 
appropriate value for this is dependent on the characteristics of the cluster. 
In general, start with 1, meaning that the cluster will only auto-exit 
maintenance mode when it is down to 1 offline or disabled instance, and increase 
the value as you increase tolerance.</p> 
+   <p>Note that the cluster will auto-exit only if it has <i>automatically</i> 
entered maintenance mode previously.</p> 
+  </section> 
+ </section> 
+</section> 
+<section> 
+ <h2 id="FAQ">FAQ</h2> 
+ <section> 
+  <section> 
+   <h4 id="How_is_this_related_to_DelayedAutoRebalancer.3F">How is this 
related to <b>DelayedAutoRebalancer</b>?</h4> 
+   <ul> 
+    <li>If you are using DelayedAutoRebalancer for your clusters, this 
auto-exit feature would still work as expected. Fundamentally, 
DelayedAutoRebalancer and maintenance mode are mutually independent. That is, 
under maintenance mode, Helix uses a different rebalancing strategy. Once the 
cluster auto-exits maintenance mode, it will go back to whichever rebalancing 
mode it was on previously.</li> 
+    <li>Delayed Partition Movement is a feature in Helix's FULL-AUTO 
rebalancer.</li> 
+    <li>The rebalance delay will work at the instance level and 
entering/exiting maintenance mode will not affect the time at which the 
delay-counting started.</li> 
+   </ul> 
+  </section> 
+  <section> 
+   <h4 
id="How_do_I_know_what_the_appropriate_value_is_for_MAINTENANCE_RECOVERY_THRESHOLD.3F">How
 do I know what the appropriate value is for 
<b>MAINTENANCE_RECOVERY_THRESHOLD</b>?</h4> 
+   <ul> 
+    <li>As a framework, we cannot provide the right value for this threshold. 
It should depend on the nature of the application and the risk tolerance 
thereof. Familiarize yourself with the rules outlined above and start with a 
low value (for example, 0) and increase your tolerance.</li> 
+   </ul> 
+  </section> 
+ </section> 
+</section>
+                       </div>
+               </div>
+       </div>
+       </div>
+
+       </div><!-- /container -->
+
+       <!-- Footer
+       ================================================== -->
+       <footer class="well">
+               <div class="container">
+                       <div class="row">
+                               <div class="span3 bottom-nav">
+                                       <ul class="nav nav-list">
+                                               <li class="nav-header">Get 
Helix</li>
+                                               <li >
+                                                       <a href="download.html" 
title="Download">Download</a>
+                                               </li>
+                                               <li >
+                                                       <a href="Building.html" 
title="Building">Building</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="releasenotes/release-1.4.3.html" title="Release Notes">Release Notes</a>
+                                               </li>
+                                       </ul>
+                               </div>
+                               <div class="span3 bottom-nav">
+                                       <ul class="nav nav-list">
+                                               <li 
class="nav-header">Hands-On</li>
+                                               <li >
+                                                       <a 
href="Quickstart.html" title="Quick Start">Quick Start</a>
+                                               </li>
+                                               <li >
+                                                       <a href="Tutorial.html" 
title="Tutorial">Tutorial</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="../javadocs/1.4.3" title="Javadocs">Javadocs</a>
+                                               </li>
+                                       </ul>
+                               </div>
+                               <div class="span3 bottom-nav">
+                                       <ul class="nav nav-list">
+                                               <li 
class="nav-header">Recipes</li>
+                                               <li >
+                                                       <a 
href="recipes/lock_manager.html" title="Distributed lock manager">Distributed 
lock manager</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="recipes/rabbitmq_consumer_group.html" title="Rabbit MQ consumer 
group">Rabbit MQ consumer group</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="recipes/rsync_replicated_file_store.html" title="Rsync replicated file 
store">Rsync replicated file store</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="recipes/service_discovery.html" title="Service discovery">Service 
discovery</a>
+                                               </li>
+                                               <li >
+                                                       <a 
href="recipes/task_dag_execution.html" title="Distributed task DAG 
execution">Distributed task DAG execution</a>
+                                               </li>
+                                       </ul>
+                               </div>
+                       </div>
+               </div>
+       </footer>
+
+       <div class="container subfooter">
+               <div class="row">
+                       <div class="span12">
+                               <p class="pull-right"><a href="#">Back to 
top</a></p>
+                               <p class="copyright">Copyright &copy;2025 <a 
href="http://www.apache.org">Apache Software Foundation</a>. All Rights 
Reserved.</p>
+                               <p><a 
href="https://github.com/olamy/reflow-maven-skin" title="Reflow Maven 
skin">Reflow Maven skin</a> maintained by <a href="https://twitter.com/olamy" 
target="_blank" title="Olivier Lamy">Olivier Lamy</a>.</p>
+               <div class="row span16"><div>Apache Helix, Apache, the Apache 
feather logo, and the Apache Helix project logos are trademarks of The Apache 
Software Foundation.
+        All other marks mentioned may be trademarks or registered trademarks 
of their respective owners.</div>
+        <a 
href="https://helix.apache.org/1.4.3-docs/privacy-policy.html">Privacy 
Policy</a>
+      </div>
+                       </div>
+               </div>
+       </div>
+
+       <!-- Le javascript
+       ================================================== -->
+       <!-- Placed at the end of the document so the pages load faster -->
+       <script src="./js/jquery.min.js"></script>
+
+       <script src="./js/bootstrap.min.js"></script>
+       <script src="./js/lightbox.min.js"></script>
+       <script src="./js/reflow-scroll.js"></script>
+
+       <script src="./js/reflow-skin.js"></script>
+
+       </body>
+</html>
\ No newline at end of file


Reply via email to