From 8ce079e9f0c2d52a54c1df0e2fb44541478739fc Mon Sep 17 00:00:00 2001 From: Simon Marlow <marlowsd@gmail.com> Date: Mon, 24 Oct 2011 13:29:32 +0100 Subject: [PATCH] fix race condition in yieldCapability() (#5552) See comment for details. I've tried quite hard, but haven't been able to make a small test case that reproduces the bug. --- rts/Capability.c | 27 ++++++++++++++++++++++++++- 1 file changed, 26 insertions(+), 1 deletion(-) diff --git a/rts/Capability.c b/rts/Capability.c index fe5dbdca4053..79c668fdfd8f 100644 --- a/rts/Capability.c +++ b/rts/Capability.c @@ -636,7 +636,15 @@ yieldCapability (Capability** pCap, Task *task) continue; } - if (task->incall->tso == NULL) { + if (task->cap != cap) { + // see Note [migrated bound threads] + debugTrace(DEBUG_sched, + "task has been migrated to cap %d", task->cap->no); + RELEASE_LOCK(&cap->lock); + continue; + } + + if (task->incall->tso == NULL) { ASSERT(cap->spare_workers != NULL); // if we're not at the front of the queue, release it // again. This is unlikely to happen. @@ -664,6 +672,23 @@ yieldCapability (Capability** pCap, Task *task) return; } +// Note [migrated bound threads] +// +// There's a tricky case where: +// - cap A is running an unbound thread T1 +// - there is a bound thread T2 at the head of the run queue on cap A +// - T1 makes a safe foreign call, the task bound to T2 is woken up on cap A +// - T1 returns quickly grabbing A again (T2 is still waking up on A) +// - T1 blocks, the scheduler migrates T2 to cap B +// - the task bound to T2 wakes up on cap B +// +// We take advantage of the following invariant: +// +// - A bound thread can only be migrated by the holder of the +// Capability on which the bound thread currently lives. So, if we +// hold Capabilty C, and task->cap == C, then task cannot be +// migrated under our feet. + /* ---------------------------------------------------------------------------- * prodCapability * -- GitLab