siddharthteotia commented on a change in pull request #4446: Add support in the
rebalancer for the user to provide minimum number of serving replicas
URL: https://github.com/apache/incubator-pinot/pull/4446#discussion_r308991002
##########
File path:
pinot-controller/src/main/java/org/apache/pinot/controller/helix/core/TableRebalancer.java
##########
@@ -139,112 +153,293 @@ public RebalanceResult rebalance(TableConfig
tableConfig, RebalanceSegmentStrate
}
if (EqualityUtils.isEqual(targetIdealState, currentIdealState)) {
- LOGGER.info("Table {} is rebalanced.", tableNameWithType);
-
LOGGER.info("Finished rebalancing table {} in {} ms.",
tableNameWithType,
TimeUnit.NANOSECONDS.toMillis(System.nanoTime() - startTime));
result.setIdealStateMapping(targetIdealState.getRecord().getMapFields());
result.setPartitionAssignment(targetPartitionAssignment);
+ result.setStatus("Successfully finished rebalancing");
+ result.setStatusCode(RebalanceResult.RebalanceStatus.DONE);
return result;
}
// if ideal state needs to change, get the next 'safe' state (based on
whether downtime is OK or not)
IdealState nextIdealState = getNextState(currentIdealState,
targetIdealState, rebalanceConfig);
+ LOGGER.info("Got new ideal state after making changes to partition map
of all segments. Will attempt to persist this in ZK. Logging the difference
between new and target ideal state");
+ printIdealStateDifference(targetIdealState, nextIdealState);
// If the ideal state is large enough, enable compression
if (HelixHelper.MAX_PARTITION_COUNT_IN_UNCOMPRESSED_IDEAL_STATE <
nextIdealState.getPartitionSet().size()) {
nextIdealState.getRecord().setBooleanField("enableCompression", true);
}
- // Check version and set ideal state
+ // Check version and set ideal state to nextIdealState
try {
- LOGGER.info("Updating IdealState for table {}", tableNameWithType);
+ LOGGER.info("Going to update current IdealState in ZK for table {},
current version {} and creation time {}",
+ tableNameWithType, currentIdealState.getRecord().getVersion(),
currentIdealState.getRecord().getCreationTime());
if (zkBaseDataAccessor
.set(idealStateKey.getPath(), nextIdealState.getRecord(),
currentIdealState.getRecord().getVersion(),
AccessOption.PERSISTENT)) {
+ LOGGER.info("Successfully persisted the ideal state for table {} in
ZK. Will wait for External view to converge",
+ tableNameWithType);
+ ++_rebalancerStats.updatestoIdealStateInZK;
// if we succeeded, wait for the change to stabilize
waitForStable(tableNameWithType);
// clear retries as it tracks failures with each idealstate update
attempt
retries = 0;
+ LOGGER.info("External view converged for the change in ideal state
for table {}. Will start the next iteration (if any)",
+ tableNameWithType);
continue;
}
- // in case of any error, we retry a bounded number of types
+ // in case of any error, we retry a bounded number of times
} catch (ZkBadVersionException e) {
- LOGGER.warn("Version changed while updating ideal state for resource:
{}", tableNameWithType);
+ // we will go back in the loop and reattempt by recomputing the target
ideal state
+ LOGGER.info("Version changed while updating ideal state for resource:
{}, was expecting version {}",
+ tableNameWithType, currentIdealState.getRecord().getVersion());
} catch (Exception e) {
- LOGGER.warn("Caught exception while updating ideal state for resource:
{}", tableNameWithType, e);
+ if (e instanceof IllegalStateException && e.getCause() instanceof
ExternalViewErrored) {
+ if (e.getCause() instanceof ExternalViewErrored) {
+ LOGGER.error("External view reported error for table {} after
updating ideal state", tableNameWithType);
+ } else if (e.getCause() instanceof ExternalViewConvergeTimeout) {
+ LOGGER.error("Timedout while waiting for external view to converge
for table {}", tableNameWithType);
Review comment:
done
----------------------------------------------------------------
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.
For queries about this service, please contact Infrastructure at:
users@infra.apache.org
With regards,
Apache Git Services
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]