Peter Bacsko created YUNIKORN-2550:
--------------------------------------
Summary: Fix locking in PartitionContext
Key: YUNIKORN-2550
URL: https://issues.apache.org/jira/browse/YUNIKORN-2550
Project: Apache YuniKorn
Issue Type: Sub-task
Components: core - common
Reporter: Peter Bacsko
Assignee: Peter Bacsko
Possible deadlock was detected:
{noformat}
~/repos/yunikorn-core/pkg/scheduler/partition.go:448
scheduler.(*PartitionContext).GetQueue { pc.RLock() } <<<<<
~/repos/yunikorn-core/pkg/scheduler/partition.go:447
scheduler.(*PartitionContext).GetQueue { func (pc *PartitionContext)
GetQueue(name string) *objects.Queue { }
~/repos/yunikorn-core/pkg/scheduler/placement/provided_rule.go:107
placement.(*providedRule).placeApplication { // if we cannot create the queue
must exist }
~/repos/yunikorn-core/pkg/scheduler/placement/placement.go:125
placement.(*AppPlacementManager).PlaceApplication { queueName, err =
checkRule.placeApplication(app, m.queueFn) }
~/repos/yunikorn-core/pkg/scheduler/partition.go:309
scheduler.(*PartitionContext).AddApplication { err :=
pc.getPlacementManager().PlaceApplication(app) }
~/repos/yunikorn-core/pkg/scheduler/context.go:523
scheduler.(*ClusterContext).handleRMUpdateApplicationEvent { schedApp :=
objects.NewApplication(app, ugi, cc.rmEventHandler, request.RmID) }
~/repos/yunikorn-core/pkg/scheduler/scheduler.go:130
scheduler.(*Scheduler).handleRMEvent { case ev := <-s.pendingEvents: }
Lock order is different between {{PartitionContext}} and {{AppPlacementManager}}
--
This message was sent by Atlassian Jira
(v8.20.10#820010)
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]