kaisun2000 commented on issue #1394:
URL: https://github.com/apache/helix/issues/1394#issuecomment-699699145
The case is exactly the same, as I can confirm from the debugger.
LOG 1843
>2020-09-27T21:29:31.1669800Z END: WorkflowControllerDataProvider.refresh()
for cluster CLUSTER_TestTaskRebalancerStopResume, pipleline TASK, Cache
resrouce config
Content:**{stopAndDeleteQueue_masterJob=ZnRecord=stopAndDeleteQueue_masterJob,
{Command=Reindex, ConcurrentTasksPerInstance=1, DisableExternalView=false,
Expiry=86400000, FailureThreshold=0, IgnoreDependentJobFailure=false,
JobCommandConfig={"Delay":"2000"}, JobID=stopAndDeleteQueue_masterJob,
MONITORING_DISABLED=true, MaxAttemptsPerTask=10,
MaxForcedReassignmentsPerTask=10, RebalanceRunningTask=false,
TargetPartitionStates=MASTER, TargetResource=TestDB,
TimeoutPerPartition=3600000, WorkflowID=stopAndDeleteQueue}{}{},** Stat=Stat
{_version=0, _creationTime=1601242170561, _modifiedTime=1601242170561,
_ephemeralOwner=0},
deleteJobFromRecurrentQueueNotStarted_masterJob0=ZnRecord=deleteJobFromRecurrentQueueNotStarted_masterJob0,
{Command=Reindex, ConcurrentTasksPerInstance=1, DisableExternalView=false,
Expiry=86400000,
FailureThreshold=0, IgnoreDependentJobFailure=false,
JobCommandConfig={"Delay":"200"},
JobID=deleteJobFromRecurrentQueueNotStarted_masterJob0,
MONITORING_DISABLED=true, MaxAttemptsPerTask=10,
MaxForcedReassignmentsPerTask=10, RebalanceRunningTask=false,
TargetPartitionStates=MASTER, TargetResource=TestDB,
TimeoutPerPartition=3600000,
WorkflowID=deleteJobFromRecurrentQueueNotStarted}{}{}, Stat=Stat {_version=0,
_creationTime=1601242166392, _modifiedTime=1601242166392, _ephemeralOwner=0},
deleteJobFromRecurrentQueueNotStarted_20200927T212926_masterJob0=ZnRecord=deleteJobFromRecurrentQueueNotStarted_20200927T212926_masterJob0,
{Command=Reindex, ConcurrentTasksPerInstance=1, DisableExternalView=false,
Expiry=86400000, FailureThreshold=0, IgnoreDependentJobFailure=false,
JobCommandConfig={"Delay":"200"},
JobID=deleteJobFromRecurrentQueueNotStarted_20200927T212926_masterJob0,
MONITORING_DISABLED=true, MaxAttemptsPerTask=10,
MaxForcedReassignmentsPerTask=10, RebalanceRunningTask=false,
TargetPartitionStates=MASTER, TargetResource=TestDB, TimeoutPerPartition=3600000,
WorkflowID=deleteJobFromRecurrentQueueNotStarted_20200927T212926}{}{},
Stat=Stat {_version=0, _creationTime=1601242166409,
_modifiedTime=1601242166409, _ephemeralOwner=0},
**stopAndDeleteQueue=ZnRecord=stopAndDeleteQueue,
{AllowOverlapJobAssignment=false,
Dag={"allNodes":["stopAndDeleteQueue_masterJob","stopAndDeleteQueue_slaveJob"],"childrenToParents":{"stopAndDeleteQueue_slaveJob":["stopAndDeleteQueue_masterJob"]},"parentsToChildren":{"stopAndDeleteQueue_masterJob":["stopAndDeleteQueue_slaveJob"]}},
Expiry=120000, FailureThreshold=0, IsJobQueue=true, JobPurgeInterval=1800000,
MONITORING_DISABLED=true, ParallelJobs=1, TargetState=START, Terminable=false,
WorkflowID=stopAndDeleteQueue,** capacity=2147483647}{JobTypes={}}{}, Stat=Stat
{_version=2, _creationTime=1601242170547, _modifiedTime=1601242170572,
_ephemeralOwner=0},
deleteJobFromRecurrentQueueNotStarted=ZnRecord=deleteJobFromRecurrentQueueNotStarted,
{
AllowOverlapJobAssignment=false,
Dag={"allNodes":["deleteJobFromRecurrentQueueNotStarted_masterJob0","deleteJobFromRecurrentQueueNotStarted_slaveJob1"],"childrenToParents":{"deleteJobFromRecurrentQueueNotStarted_slaveJob1":["deleteJobFromRecurrentQueueNotStarted_masterJob0"]},"parentsToChildren":{"deleteJobFromRecurrentQueueNotStarted_masterJob0":["deleteJobFromRecurrentQueueNotStarted_slaveJob1"]}},
Expiry=120000, FailureThreshold=0, IsJobQueue=true, JobPurgeInterval=1800000,
MONITORING_DISABLED=true, ParallelJobs=1, RecurrenceInterval=60,
RecurrenceUnit=SECONDS, StartTime=09-27-2020 21:29:26, TargetState=START,
Terminable=false, WorkflowID=deleteJobFromRecurrentQueueNotStarted,
capacity=2147483647}{JobTypes={}}{}, Stat=Stat {_version=2,
_creationTime=1601242166394, _modifiedTime=1601242170517, _ephemeralOwner=0},
deleteJobFromRecurrentQueueNotStarted_slaveJob1=ZnRecord=deleteJobFromRecurrentQueueNotStarted_slaveJob1,
{Command=Reindex, ConcurrentTasksPerInstance=1,
DisableExternalView=false, Expiry=86400000, FailureThreshold=0,
IgnoreDependentJobFailure=false, JobCommandConfig={"Delay":"200"},
JobID=deleteJobFromRecurrentQueueNotStarted_slaveJob1,
MONITORING_DISABLED=true, MaxAttemptsPerTask=10,
MaxForcedReassignmentsPerTask=10, RebalanceRunningTask=false,
TargetPartitionStates=SLAVE, TargetResource=TestDB,
TimeoutPerPartition=3600000,
WorkflowID=deleteJobFromRecurrentQueueNotStarted}{}{}, Stat=Stat {_version=0,
_creationTime=1601242166392, _modifiedTime=1601242166392, _ephemeralOwner=0},
deleteJobFromRecurrentQueueNotStarted_20200927T212926=ZnRecord=deleteJobFromRecurrentQueueNotStarted_20200927T212926,
{AllowOverlapJobAssignment=false,
Dag={"allNodes":["deleteJobFromRecurrentQueueNotStarted_20200927T212926_masterJob0","deleteJobFromRecurrentQueueNotStarted_20200927T212926_slaveJob1"],"childrenToParents":{"deleteJobFromRecurrentQueueNotStarted_20200927T212926_slaveJob1":["deleteJobFromRecurrentQueueNotStarted_20200927T212926_masterJob0"]},"parentsToChildren":{"deleteJobFromRecurrentQueueNotStarted_20200927T212926_masterJob0":["deleteJobFromRecurrentQueueNotStarted_20200927T212926_slaveJob1"]}},
Expiry=120000, FailureThreshold=0, IsJobQueue=true, JobPurgeInterval=1800000,
MONITORING_DISABLED=true, ParallelJobs=1, StartTime=09-27-2020 21:29:26,
TargetState=START, Terminable=true,
WorkflowID=deleteJobFromRecurrentQueueNotStarted_20200927T212926,
capacity=2147483647}{JobTypes={}}{}, Stat=Stat {_version=0,
_creationTime=1601242166410, _modifiedTime=1601242166410, _ephemeralOwner=0},
deleteJobFromRecurrentQueueNotStarted_20200927T212926_slaveJob1=ZnRecord=deleteJobFromRecurrentQueueNotStarted_20200927T212926_slaveJob1,
{Command=Reindex, ConcurrentTasksPerInstance=1, DisableExternalView=false,
Expiry=86400000, FailureThreshold=0, IgnoreDependentJobFailure=false,
JobCommandConfig={"Delay":"200"},
JobID=deleteJobFromRecurrentQueueNotStarted_20200927T212926_slaveJob1,
MONITORING_DISABLED=true, MaxAttemptsPerTask=10,
MaxForcedReassignmentsPerTask=10, RebalanceRunningTask=false, TargetPartitionStates=SLAVE,
TargetResource=TestDB, TimeoutPerPartition=3600000,
WorkflowID=deleteJobFromRecurrentQueueNotStarted_20200927T212926}{}{},
Stat=Stat {_version=0, _creationTime=1601242166410,
_modifiedTime=1601242166410, _ephemeralOwner=0}}
2020-09-27T21:29:31.1710456Z Job stopAndDeleteQueue_slaveJob exists in
jobdag bug job config missing, expire the job
2020-09-27T21:29:31.1711452Z removed job
config:/TaskRebalancer/stopAndDeleteQueue_slaveJob
----------------------------------------------------------------
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.
For queries about this service, please contact Infrastructure at:
[email protected]
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]