Browse Source

Fix edge case where a `Linearizer` could get stuck (#12358)

Just after a task acquires a contended `Linearizer` lock, it sleeps.
If the task is cancelled during this sleep, we need to release the lock.

Signed-off-by: Sean Quah <seanq@element.io>
tags/v1.57.0rc1
Sean Quah 2 years ago
committed by GitHub
parent
commit
79e7c2c426
No known key found for this signature in database GPG Key ID: 4AEE18F83AFDEB23
3 changed files with 53 additions and 5 deletions
  1. +1
    -0
      changelog.d/12358.misc
  2. +5
    -1
      synapse/util/async_helpers.py
  3. +47
    -4
      tests/util/test_linearizer.py

+ 1
- 0
changelog.d/12358.misc View File

@@ -0,0 +1 @@
Fix a long-standing bug where `Linearizer`s could get stuck if a cancellation were to happen at the wrong time.

+ 5
- 1
synapse/util/async_helpers.py View File

@@ -453,7 +453,11 @@ class Linearizer:
#
# This needs to happen while we hold the lock. We could put it on the
# exit path, but that would slow down the uncontended case.
await self._clock.sleep(0)
try:
await self._clock.sleep(0)
except CancelledError:
self._release_lock(key, entry)
raise

return entry



+ 47
- 4
tests/util/test_linearizer.py View File

@@ -13,7 +13,9 @@
# See the License for the specific language governing permissions and
# limitations under the License.

from typing import Callable, Hashable, Tuple
from typing import Hashable, Tuple

from typing_extensions import Protocol

from twisted.internet import defer, reactor
from twisted.internet.base import ReactorBase
@@ -25,10 +27,15 @@ from synapse.util.async_helpers import Linearizer
from tests import unittest


class UnblockFunction(Protocol):
def __call__(self, pump_reactor: bool = True) -> None:
...


class LinearizerTestCase(unittest.TestCase):
def _start_task(
self, linearizer: Linearizer, key: Hashable
) -> Tuple["Deferred[None]", "Deferred[None]", Callable[[], None]]:
) -> Tuple["Deferred[None]", "Deferred[None]", UnblockFunction]:
"""Starts a task which acquires the linearizer lock, blocks, then completes.

Args:
@@ -52,11 +59,12 @@ class LinearizerTestCase(unittest.TestCase):

d = defer.ensureDeferred(task())

def unblock() -> None:
def unblock(pump_reactor: bool = True) -> None:
unblock_d.callback(None)
# The next task, if it exists, will acquire the lock and require a kick of
# the reactor to advance.
self._pump()
if pump_reactor:
self._pump()

return d, acquired_d, unblock

@@ -212,3 +220,38 @@ class LinearizerTestCase(unittest.TestCase):
)
unblock3()
self.successResultOf(d3)

def test_cancellation_during_sleep(self) -> None:
"""Tests cancellation during the sleep just after waiting for a `Linearizer`."""
linearizer = Linearizer()

key = object()

d1, acquired_d1, unblock1 = self._start_task(linearizer, key)
self.assertTrue(acquired_d1.called)

# Create a second task, waiting for the first task.
d2, acquired_d2, _ = self._start_task(linearizer, key)
self.assertFalse(acquired_d2.called)

# Create a third task, waiting for the second task.
d3, acquired_d3, unblock3 = self._start_task(linearizer, key)
self.assertFalse(acquired_d3.called)

# Once the first task completes, cancel the waiting second task while it is
# sleeping just after acquiring the lock.
unblock1(pump_reactor=False)
self.successResultOf(d1)
d2.cancel()
self._pump()

self.assertTrue(d2.called)
self.failureResultOf(d2, CancelledError)

# The third task should continue running.
self.assertTrue(
acquired_d3.called,
"Third task did not get the lock after the second task was cancelled",
)
unblock3()
self.successResultOf(d3)

Loading…
Cancel
Save