Fix fs bad encryption revision in sync monitor #1730

Merged · 3 commits merged on May 27, 2021
1 change: 1 addition & 0 deletions newsfragments/1730.bugfix.rst
@@ -0,0 +1 @@
Fix possible crash when sync occurs right after a workspace reencryption.
15 changes: 11 additions & 4 deletions parsec/core/sync_monitor.py
@@ -11,6 +11,7 @@
from parsec.core.types import EntryID, WorkspaceRole
from parsec.core.fs import (
FSBackendOfflineError,
FSBadEncryptionRevision,
FSWorkspaceNotFoundError,
FSWorkspaceNoReadAccess,
FSWorkspaceNoWriteAccess,
@@ -229,8 +230,11 @@ async def tick(self) -> float:
# modifications. Hence we can forget about this change given
# it's the role of `self._local_changes` to keep track of local changes.
pass
except FSWorkspaceInMaintenance:
# Not the right time for the sync, retry later
except (FSWorkspaceInMaintenance, FSBadEncryptionRevision):
# Not the right time for the sync, retry later.
# `FSBadEncryptionRevision` occurs if the reencryption is quick enough
# to start and finish before we process the `sharing.reencrypted`
# message, so we end up trying a sync with the old encryption revision.
min_due_time = now + MAINTENANCE_MIN_WAIT
self._remote_changes.add(entry_id)

@@ -257,8 +261,11 @@ async def tick(self) -> float:
# the write access in the future) but pretend it just occurred
# to avoid a busy sync loop until the `read_only` flag is updated.
self._local_changes[entry_id] = LocalChange(now)
except FSWorkspaceInMaintenance:
# Not the right time for the sync, retry later
except (FSWorkspaceInMaintenance, FSBadEncryptionRevision):
# Not the right time for the sync, retry later.
# `FSBadEncryptionRevision` occurs if the reencryption is quick enough
# to start and finish before we process the `sharing.reencrypted`
# message, so we end up trying a sync with the old encryption revision.
Contributor
This fix seems OK, but I'm a bit worried that we can no longer tell the difference between an acceptable race condition (accessing the realm while the new encryption key hasn't been received) and a bug in the reencryption logic. Is there a way to tell those apart and maybe log the latter?

Member Author
That's a good point, however I don't see how we could tell them apart...
We could try to check whether the local encryption revision has changed between this sync and the next one, but it feels like a great way to add more complexity (and so more bugs!) into this code.

The good thing is that we send at most one request every MAINTENANCE_MIN_WAIT (i.e. 30s), so we are not flooding the server.

min_due_time = now + MAINTENANCE_MIN_WAIT
self._local_changes[entry_id] = LocalChange(now)

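For reference, a minimal sketch of the revision-tracking idea discussed above (remembering the encryption revision seen at the last failed sync and logging when it has not moved between two failures). This is not part of the PR, and the class and method names below are hypothetical rather than parsec API.

# Hypothetical sketch only, not part of this PR: distinguish the benign race
# (new key not yet received) from a stuck reencryption by remembering the
# encryption revision observed at the previous failed sync.

import structlog

logger = structlog.get_logger()


class RevisionTracker:
    def __init__(self):
        # entry_id -> encryption revision seen when the sync last failed
        self._last_bad_revision = {}

    def on_bad_encryption_revision(self, entry_id, current_revision):
        previous = self._last_bad_revision.get(entry_id)
        if previous == current_revision:
            # The revision has not moved between two failed syncs: probably
            # not the benign race, so log it for investigation.
            logger.warning(
                "Sync keeps failing with the same encryption revision",
                entry_id=entry_id,
                encryption_revision=current_revision,
            )
        self._last_bad_revision[entry_id] = current_revision

    def on_sync_success(self, entry_id):
        # Drop the bookkeeping once the sync goes through
        self._last_bad_revision.pop(entry_id, None)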
21 changes: 20 additions & 1 deletion tests/conftest.py
@@ -13,6 +13,7 @@
import contextlib
import pendulum
from unittest.mock import patch
import logging
import structlog
import trio
from trio.testing import MockClock
@@ -141,11 +142,29 @@ def _remove_colors(msg):

def _assert_occured(self, log):
__tracebackhide__ = True
assert any([r for r in self.records if log in _remove_colors(r.msg)])
record = next((r for r in self.records if log in _remove_colors(r.msg)), None)
assert record is not None
if not hasattr(self, "asserted_records"):
self.asserted_records = set()
self.asserted_records.add(record)

LogCaptureFixture.assert_occured = _assert_occured


@pytest.fixture(autouse=True)
def no_logs_gte_error(caplog):
yield
# The test should use `caplog.assert_occured` to indicate a log was expected,
# otherwise we consider error logs as *actual* errors.
asserted_records = getattr(caplog, "asserted_records", set())
errors = [
record
for record in caplog.get_records("call")
if record.levelno >= logging.ERROR and record not in asserted_records
]
assert not errors


def patch_pytest_trio():
# Fix while waiting for
# https://github.com/python-trio/pytest-trio/issues/77
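To illustrate how the new autouse fixture above is meant to be used (a sketch, not taken from the PR; it logs through a plain stdlib logger while parsec tests log through structlog): an ERROR-level record emitted during a test now fails that test at teardown unless the test claims the record with `caplog.assert_occured`.

import logging


def test_expected_error_is_claimed(caplog):
    # An ERROR record emitted during the test...
    logging.getLogger("parsec.demo").error("Something went wrong on purpose")
    # ...must be claimed with `assert_occured`; the record is then added to
    # `caplog.asserted_records` and the autouse `no_logs_gte_error` fixture
    # ignores it. An unclaimed ERROR record would fail the test at teardown.
    caplog.assert_occured("Something went wrong on purpose")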
5 changes: 4 additions & 1 deletion tests/core/backend_connection/test_authenticated_conn.py
@@ -104,7 +104,7 @@ async def test_init_with_backend_offline(event_bus, alice):

@pytest.mark.trio
@pytest.mark.parametrize("during_bootstrap", (True, False))
async def test_monitor_crash(running_backend, event_bus, alice, during_bootstrap):
async def test_monitor_crash(caplog, running_backend, event_bus, alice, during_bootstrap):
async def _bad_monitor(*, task_status=trio.TASK_STATUS_IGNORED):
if during_bootstrap:
raise RuntimeError("D'oh !")
@@ -123,6 +123,9 @@ async def _bad_monitor(*, task_status=trio.TASK_STATUS_IGNORED):
{"status": BackendConnStatus.CRASHED, "status_exc": spy.ANY},
)
assert conn.status == BackendConnStatus.CRASHED
caplog.assert_occured(
"[exception] Unhandled exception [parsec.core.backend_connection.authenticated]"
Contributor
This test seems a bit sensitive to the arbitrary number of spaces _______.

Member Author
Yes, totally agree. I thought about improving _remove_colors to also strip the spaces, but it seems a bit complicated to do, so I consider we will handle this in another PR when we hit the issue (typically if updating the structlog version breaks the tests).

)

# Test command not possible
with pytest.raises(BackendNotAvailable) as exc:
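On the whitespace concern raised above, a possible follow-up (hypothetical, not part of this PR) would be to normalize both sides before matching, so the expected log no longer depends on the padding structlog inserts between the event and the logger name:

import re

ANSI_ESCAPE = re.compile(r"\x1b\[[0-9;]*m")


def _normalize(msg: str) -> str:
    # Strip ANSI color codes, then collapse any run of whitespace to a single
    # space so column alignment does not matter.
    return re.sub(r"\s+", " ", ANSI_ESCAPE.sub("", msg)).strip()


# `assert_occured` could then compare normalized strings, e.g.:
#     record = next(
#         (r for r in self.records if _normalize(log) in _normalize(r.msg)), None
#     )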
6 changes: 6 additions & 0 deletions tests/core/gui/test_workspaces_reencrypt.py
@@ -292,6 +292,7 @@ def _assert_error():
)
@customize_fixtures(logged_gui_as_admin=True)
async def test_workspace_reencryption_do_one_batch_error(
caplog,
aqtbot,
running_backend,
logged_gui,
@@ -332,6 +333,11 @@ def _assert_error():
assert wk_button.button_reencrypt.isVisible()

await aqtbot.wait_until(_assert_error)
# Unexpected error is logged
if error_type is Exception:
caplog.assert_occured(
"[exception] Uncatched error [parsec.core.gui.trio_thread]"
)


@pytest.mark.gui
7 changes: 6 additions & 1 deletion tests/core/mountpoint/test_file_failures.py
@@ -69,7 +69,7 @@ def test_empty_read_then_reopen(tmpdir, mountpoint_service):
@pytest.mark.mountpoint
@pytest.mark.skipif(sys.platform == "darwin", reason="TODO : crash on macOS")
async def test_remote_error_event(
tmpdir, monkeypatch, running_backend, alice_user_fs, bob_user_fs, monitor
tmpdir, monkeypatch, caplog, running_backend, alice_user_fs, bob_user_fs, monitor
):
wid = await create_shared_workspace("w1", bob_user_fs, alice_user_fs)

@@ -126,6 +126,11 @@ def _crash(*args, **kwargs):
with alice_user_fs.event_bus.listen() as spy:
with pytest.raises(OSError):
os.mkdir(str(trio_w / "dummy"))
if sys.platform == "win32":
expected_log = "[exception] Unhandled exception in winfsp mountpoint [parsec.core.mountpoint.winfsp_operations]"
else:
expected_log = "[exception] Unhandled exception in fuse mountpoint [parsec.core.mountpoint.fuse_operations]"
caplog.assert_occured(expected_log)
spy.assert_event_occured(CoreEvent.MOUNTPOINT_UNHANDLED_ERROR)

await trio.to_thread.run_sync(_testbed_online)
50 changes: 50 additions & 0 deletions tests/core/test_sync_monitor.py
@@ -386,3 +386,53 @@ async def test_sync_monitor_while_changing_roles(
await bob_core.wait_idle_monitors()
info = await bob_workspace.path_info("/this-should-not-fail")
assert not info["need_sync"]


@pytest.mark.trio
async def test_sync_with_concurrent_reencryption(
running_backend, alice_core, bob_user_fs, autojump_clock, monkeypatch
):
# Create a shared workspace
wid = await create_shared_workspace("w", bob_user_fs, alice_core)
alice_workspace = alice_core.user_fs.get_workspace(wid)
bob_workspace = bob_user_fs.get_workspace(wid)

# Alice creates a file, let it sync
await alice_workspace.write_bytes("/test.txt", b"v1")
await alice_core.wait_idle_monitors()
await bob_user_fs.sync()

# Freeze Alice's message processing so she won't process `sharing.reencrypted` messages
allow_message_processing = trio.Event()

async def _mockpoint_sleep():
await allow_message_processing.wait()

monkeypatch.setattr(
"parsec.core.messages_monitor.freeze_messages_monitor_mockpoint", _mockpoint_sleep
)

# Now Bob reencrypts the workspace
reencryption_job = await bob_user_fs.workspace_start_reencryption(wid)
await bob_user_fs.process_last_messages()
total, done = await reencryption_job.do_one_batch()
assert total == done  # Sanity check to make sure the reencryption is finished

# Alice modifies the workspace and tries to do the sync...
await alice_workspace.write_bytes("/test.txt", b"v2")
# The sync monitor will try, and fail, to sync the workspace
await trio.sleep(300) # autojump, so not *really* 300s
assert not alice_core.are_monitors_idle()

# Now let Alice process the `sharing.reencrypted` messages, this should
# allow the sync to go through
allow_message_processing.set()
with trio.fail_after(60): # autojump, so not *really* 60s
await alice_core.wait_idle_monitors()

# Just make sure the sync is done
await bob_workspace.sync()
for workspace in (bob_workspace, alice_workspace):
info = await workspace.path_info("/test.txt")
assert not info["need_sync"]
assert info["base_version"] == 3
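For context on the monkeypatch used in the test above: `freeze_messages_monitor_mockpoint` is a hook awaited by the messages monitor before it processes incoming messages; it is a no-op in production and tests can replace it to pause message handling. A rough sketch of the pattern (the real parsec code may differ in details):

async def freeze_messages_monitor_mockpoint() -> None:
    # No-op in production; tests monkeypatch this module attribute with a
    # coroutine that blocks until they are ready to resume message processing.
    pass


async def _process_incoming_messages(process_last_messages):
    # Simplified for illustration: the monitor awaits the mockpoint before
    # touching the message queue, so a test can freeze it at exactly this point.
    await freeze_messages_monitor_mockpoint()
    await process_last_messages()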
4 changes: 3 additions & 1 deletion tests/test_nursery.py
@@ -15,7 +15,7 @@ async def test_open_service_nursery_exists():


@pytest.mark.trio
async def test_open_service_nursery_multierror_collapse():
async def test_open_service_nursery_multierror_collapse(caplog):
async def _raise(exc):
raise exc

@@ -34,6 +34,8 @@ async def _raise(exc):
nursery.start_soon(_raise, RuntimeError())
await _raise(ZeroDivisionError(1, 2, 3))

caplog.assert_occured("[exception] A MultiError has been detected [parsec.utils]")

exception = ctx.value
assert isinstance(exception, ZeroDivisionError)
assert exception.args == (1, 2, 3)