somandal commented on code in PR #15575:
URL: https://github.com/apache/pinot/pull/15575#discussion_r2049749036
##########
pinot-controller/src/main/java/org/apache/pinot/controller/helix/core/rebalance/DefaultRebalancePreChecker.java:
##########
@@ -379,6 +382,58 @@ private RebalancePreCheckerResult
checkRebalanceConfig(RebalanceConfig rebalance
: RebalancePreCheckerResult.warn(StringUtil.join("\n",
warnings.toArray(String[]::new)));
}
+ private RebalancePreCheckerResult checkReplicaGroups(TableConfig
tableConfig, RebalanceConfig rebalanceConfig) {
+ String message;
+ if (tableConfig.getTableType() == TableType.OFFLINE) {
+ message = "OFFLINE segments - " + getReplicaGroupInfo(tableConfig,
InstancePartitionsType.OFFLINE);
+ } else {
+ // for realtime table
+ message = "COMPLETED segments - " + getReplicaGroupInfo(tableConfig,
InstancePartitionsType.COMPLETED) + "\n"
+ + "CONSUMING segments - " + getReplicaGroupInfo(tableConfig,
InstancePartitionsType.CONSUMING);
+ }
+ String tierMessage = "";
+ if (tableConfig.getTierConfigsList() != null) {
+ List<String> tierMessageList = new ArrayList<>();
+ for (TierConfig tierConfig : tableConfig.getTierConfigsList()) {
+ tierMessageList.add(tierConfig.getName() + " tier - " +
getReplicaGroupInfo(tableConfig, tierConfig.getName()));
+ }
+ tierMessage = "\n" + StringUtil.join("\n",
tierMessageList.toArray(String[]::new));
+ }
+ if (rebalanceConfig.isReassignInstances()) {
+ return RebalancePreCheckerResult.pass(message + tierMessage);
+ }
+ return RebalancePreCheckerResult.warn(
Review Comment:
We should only warn if `replicaGroups` is enabled, right? For balanced
assignment, it doesn't matter whether we set `reassignInstances` or not, since
the assignment will always be updated based on the currently tagged list.
##########
pinot-controller/src/main/java/org/apache/pinot/controller/helix/core/rebalance/DefaultRebalancePreChecker.java:
##########
@@ -379,6 +382,58 @@ private RebalancePreCheckerResult
checkRebalanceConfig(RebalanceConfig rebalance
: RebalancePreCheckerResult.warn(StringUtil.join("\n",
warnings.toArray(String[]::new)));
}
+ private RebalancePreCheckerResult checkReplicaGroups(TableConfig
tableConfig, RebalanceConfig rebalanceConfig) {
+ String message;
+ if (tableConfig.getTableType() == TableType.OFFLINE) {
+ message = "OFFLINE segments - " + getReplicaGroupInfo(tableConfig,
InstancePartitionsType.OFFLINE);
+ } else {
+ // for realtime table
+ message = "COMPLETED segments - " + getReplicaGroupInfo(tableConfig,
InstancePartitionsType.COMPLETED) + "\n"
+ + "CONSUMING segments - " + getReplicaGroupInfo(tableConfig,
InstancePartitionsType.CONSUMING);
+ }
+ String tierMessage = "";
+ if (tableConfig.getTierConfigsList() != null) {
+ List<String> tierMessageList = new ArrayList<>();
+ for (TierConfig tierConfig : tableConfig.getTierConfigsList()) {
+ tierMessageList.add(tierConfig.getName() + " tier - " +
getReplicaGroupInfo(tableConfig, tierConfig.getName()));
+ }
+ tierMessage = "\n" + StringUtil.join("\n",
tierMessageList.toArray(String[]::new));
+ }
+ if (rebalanceConfig.isReassignInstances()) {
+ return RebalancePreCheckerResult.pass(message + tierMessage);
+ }
+ return RebalancePreCheckerResult.warn(
+ "reassignInstances is disabled, replica groups may not update.\n" +
message + tierMessage);
Review Comment:
nit: reword to "replica groups may not be updated"
##########
pinot-controller/src/main/java/org/apache/pinot/controller/helix/core/rebalance/DefaultRebalancePreChecker.java:
##########
@@ -379,6 +382,58 @@ private RebalancePreCheckerResult
checkRebalanceConfig(RebalanceConfig rebalance
: RebalancePreCheckerResult.warn(StringUtil.join("\n",
warnings.toArray(String[]::new)));
}
+ private RebalancePreCheckerResult checkReplicaGroups(TableConfig
tableConfig, RebalanceConfig rebalanceConfig) {
+ String message;
+ if (tableConfig.getTableType() == TableType.OFFLINE) {
+ message = "OFFLINE segments - " + getReplicaGroupInfo(tableConfig,
InstancePartitionsType.OFFLINE);
+ } else {
+ // for realtime table
+ message = "COMPLETED segments - " + getReplicaGroupInfo(tableConfig,
InstancePartitionsType.COMPLETED) + "\n"
+ + "CONSUMING segments - " + getReplicaGroupInfo(tableConfig,
InstancePartitionsType.CONSUMING);
+ }
+ String tierMessage = "";
+ if (tableConfig.getTierConfigsList() != null) {
+ List<String> tierMessageList = new ArrayList<>();
+ for (TierConfig tierConfig : tableConfig.getTierConfigsList()) {
+ tierMessageList.add(tierConfig.getName() + " tier - " +
getReplicaGroupInfo(tableConfig, tierConfig.getName()));
+ }
+ tierMessage = "\n" + StringUtil.join("\n",
tierMessageList.toArray(String[]::new));
+ }
+ if (rebalanceConfig.isReassignInstances()) {
+ return RebalancePreCheckerResult.pass(message + tierMessage);
+ }
+ return RebalancePreCheckerResult.warn(
+ "reassignInstances is disabled, replica groups may not update.\n" +
message + tierMessage);
+ }
+
+ private String getReplicaGroupInfo(TableConfig tableConfig,
InstancePartitionsType type) {
+ if (!InstanceAssignmentConfigUtils.allowInstanceAssignment(tableConfig,
type)) {
+ return "Replica Groups are not enabled, replication: " +
tableConfig.getReplication();
+ }
+ return getReplicaGroupInfo(tableConfig, type.toString());
+ }
+
+ private static String getReplicaGroupInfo(TableConfig tableConfig, String
type) {
+ Map<String, InstanceAssignmentConfig> instanceAssignmentConfigMap =
tableConfig.getInstanceAssignmentConfigMap();
+ if (instanceAssignmentConfigMap != null &&
instanceAssignmentConfigMap.containsKey(type)) {
+ InstanceReplicaGroupPartitionConfig instanceReplicaGroupPartitionConfig =
+
instanceAssignmentConfigMap.get(type).getReplicaGroupPartitionConfig();
+ if (!instanceReplicaGroupPartitionConfig.isReplicaGroupBased()) {
+ return "Replica Groups are not enabled, replication: " +
tableConfig.getReplication();
Review Comment:
Can you check which `replication` value is picked up when the
InstanceAssignmentConfig is present but replica groups are disabled in it
and `replication` is set? What if replica groups are disabled but we set
`numReplicaGroups` to some value and also set `replication`? Just want to
ensure the correct one is picked up. (A good way to test is to try a rebalance
dry-run locally and see which change results in NO_OP vs. showing that a
rebalance is needed.)
e.g.
```
"instanceAssignmentConfigMap": {
"OFFLINE": {
"tagPoolConfig": {
"tag": "DefaultTenant_OFFLINE",
"poolBased": false,
"numPools": 0
},
"replicaGroupPartitionConfig": {
"replicaGroupBased": false,
"numReplicaGroups": 3,
...
...
},
..
}
},
```
--
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.
To unsubscribe, e-mail: [email protected]
For queries about this service, please contact Infrastructure at:
[email protected]
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]