synapse/tests/storage/test_event_federation.py

#
# This file is licensed under the Affero General Public License (AGPL) version 3.
#
# Copyright (C) 2023 New Vector, Ltd
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as
# published by the Free Software Foundation, either version 3 of the
# License, or (at your option) any later version.
#
# See the GNU Affero General Public License for more details:
# <https://www.gnu.org/licenses/agpl-3.0.html>.
#
# Originally licensed under the Apache License, Version 2.0:
# <http://www.apache.org/licenses/LICENSE-2.0>.
#
# [This file includes modifications made by New Vector Limited]
#
#

import datetime
from typing import (
    Collection,
    Dict,
    FrozenSet,
    Iterable,
    List,
    Mapping,
    Set,
    Tuple,
    TypeVar,
    Union,
    cast,
)

import attr
from parameterized import parameterized

from twisted.test.proto_helpers import MemoryReactor

from synapse.api.constants import EventTypes
from synapse.api.room_versions import (
    KNOWN_ROOM_VERSIONS,
    EventFormatVersions,
    RoomVersion,
)
from synapse.events import EventBase
from synapse.rest import admin
from synapse.rest.client import login, room
from synapse.server import HomeServer
from synapse.storage.database import LoggingTransaction
from synapse.storage.types import Cursor
from synapse.synapse_rust.events import EventInternalMetadata
from synapse.types import JsonDict
from synapse.util import Clock, json_encoder

import tests.unittest
import tests.utils

# The silly auth graph we use to test the auth difference algorithm,
# where the top are the most recent events.
#
#   A   B
#    \ /
#  D  E
#  \  |
#   ` F   C
#     |  /|
#     G ´ |
#     | \ |
#     H   I
#     |   |
#     K   J

# Adjacency list for the diagram above: maps each event ID to the event IDs it
# points at (the events drawn directly beneath it). "k" and "j" are the roots
# and have no outgoing edges.
AUTH_GRAPH: Dict[str, List[str]] = {
    "a": ["e"],
    "b": ["e"],
    "c": ["g", "i"],
    "d": ["f"],
    "e": ["f"],
    "f": ["g"],
    "g": ["h", "i"],
    "h": ["k"],
    "i": ["j"],
    "k": [],
    "j": [],
}

# Depth given to each event of `AUTH_GRAPH` when it is inserted into the
# `events` table (used for both the `depth` and `topological_ordering`
# columns). Every event is strictly deeper than the events it points at.
DEPTH_GRAPH: Dict[str, int] = {
    "a": 7,
    "b": 7,
    "c": 4,
    "d": 6,
    "e": 6,
    "f": 5,
    "g": 3,
    "h": 2,
    "i": 2,
    "k": 1,
    "j": 1,
}

# Generic node type used by the graph helper functions below.
T = TypeVar("T")


def get_all_topologically_sorted_orders(
    nodes: Iterable[T],
    graph: Mapping[T, Collection[T]],
) -> List[List[T]]:
    """Enumerate every topological ordering of `nodes` under `graph`.

    Args:
        nodes: The nodes to order. Entries of `graph` that are not in `nodes`
            are ignored.
        graph: Maps a node to the nodes that must come *before* it. Duplicate
            entries in a node's collection are only counted once.

    Returns:
        A list of orderings, each of which is a list of nodes in which every
        node appears after all of the nodes it points at in `graph`. If there
        is nothing to order the result is `[[]]`.
    """

    # This is Kahn's algorithm, except that whenever there is a choice about
    # which node to emit next we explore *every* choice (see the helper).

    # Number of not-yet-emitted predecessors for each node under consideration.
    degree_map: Dict[T, int] = dict.fromkeys(nodes, 0)
    # For each node, the nodes that list it as a predecessor.
    reverse_graph: Dict[T, Set[T]] = {}

    for node, edges in graph.items():
        if node not in degree_map:
            continue

        reverse_graph.setdefault(node, set())
        for edge in set(edges):
            reverse_graph.setdefault(edge, set()).add(node)
            # Only predecessors that are themselves being ordered block us.
            if edge in degree_map:
                degree_map[node] += 1

    ready = [node for node in degree_map if degree_map[node] == 0]

    return _get_all_topologically_sorted_orders_inner(reverse_graph, ready, degree_map)


def _get_all_topologically_sorted_orders_inner(
    reverse_graph: Dict[T, Set[T]],
    zero_degree: List[T],
    degree_map: Dict[T, int],
) -> List[List[T]]:
    """Recursive step of `get_all_topologically_sorted_orders`.

    Args:
        reverse_graph: Maps a node to the nodes that depend on it.
        zero_degree: Nodes that currently have no outstanding predecessors
            and so may be emitted next.
        degree_map: Outstanding predecessor count for each node.

    Returns:
        Every ordering that can be produced from this state, or `[[]]` when
        no node can be emitted.
    """
    orderings: List[List[T]] = []

    # Plain Kahn's algorithm would pick a single ready node here. Instead we
    # "fork": each ready node in turn is treated as the next one emitted, and
    # we recurse on private copies of the bookkeeping.
    for position, node in enumerate(zero_degree):
        remaining_degrees = dict(degree_map)
        still_ready = zero_degree[:position] + zero_degree[position + 1 :]

        for dependent in reverse_graph.get(node, ()):
            if dependent not in remaining_degrees:
                continue

            remaining_degrees[dependent] -= 1
            if remaining_degrees[dependent] == 0:
                still_ready.append(dependent)

        orderings.extend(
            [node, *tail]
            for tail in _get_all_topologically_sorted_orders_inner(
                reverse_graph, still_ready, remaining_degrees
            )
        )

    # Nothing left to emit: the only ordering of nothing is the empty one.
    return orderings or [[]]


def get_all_topologically_consistent_subsets(
    nodes: Iterable[T],
    graph: Mapping[T, Collection[T]],
) -> Set[FrozenSet[T]]:
    """Get subsets of the graph where if node N is in the subgraph, then all
    nodes that can reach that node (i.e. for all X there exists a path X -> N)
    are in the subgraph.

    The subsets are the leading slices of each reversed topological ordering
    of `nodes`, starting with the empty set.

    NOTE(review): the slice never reaches the full length of an ordering, so
    the set containing *every* node is not returned. Confirm this is intended.
    """
    subsets: Set[FrozenSet[T]] = set()

    for ordering in get_all_topologically_sorted_orders(nodes, graph):
        # Reverse so that nodes come *before* the nodes they point at.
        reversed_ordering = ordering[::-1]

        subsets.update(
            frozenset(reversed_ordering[:size])
            for size in range(len(reversed_ordering))
        )

    return subsets


@attr.s(auto_attribs=True, frozen=True, slots=True)
class _BackfillSetupInfo:
    """Details of the fixture room built by `_setup_room_for_backfill_tests`."""

    # ID of the room that was created for the test.
    room_id: str
    # Maps event ID -> depth for every event in the fixture's event graph.
    depth_map: Dict[str, int]

class EventFederationWorkerStoreTestCase(tests.unittest.HomeserverTestCase):
    servlets = [
        admin.register_servlets,
        room.register_servlets,
        login.register_servlets,
    ]

    def prepare(self, reactor: MemoryReactor, clock: Clock, hs: HomeServer) -> None:
        """Stash the main and persist-events stores used by the tests."""
        datastores = hs.get_datastores()
        self.store = datastores.main

        # The persist-events store is optional on the datastores object; these
        # tests cannot run without it.
        persist_events = datastores.persist_events
        assert persist_events is not None
        self.persist_events = persist_events

    def test_get_prev_events_for_room(self) -> None:
        """With twenty forward extremities in a room, `get_prev_events_for_room`
        returns events 19 down to 10, in that order.
        """
        room_id = "@ROOM:local"

        insert_event_sql = (
            "INSERT INTO events ("
            "   room_id, event_id, type, depth, topological_ordering,"
            "   content, processed, outlier, stream_ordering) "
            "VALUES (?, ?, 'm.test', ?, ?, 'test', ?, ?, ?)"
        )
        insert_extremity_sql = (
            "INSERT INTO event_forward_extremities (room_id, event_id) "
            "VALUES (?, ?)"
        )

        # add a bunch of events and hashes to act as forward extremities
        def insert_event(txn: Cursor, i: int) -> None:
            event_id = "$event_%i:local" % i

            # `i` doubles as the depth, topological ordering and stream
            # ordering of the event.
            txn.execute(insert_event_sql, (room_id, event_id, i, i, True, False, i))
            txn.execute(insert_extremity_sql, (room_id, event_id))

        for i in range(20):
            self.get_success(
                self.store.db_pool.runInteraction("insert", insert_event, i)
            )

        # this should get the last ten
        expected_event_ids = ["$event_%i:local" % i for i in range(19, 9, -1)]

        r = self.get_success(self.store.get_prev_events_for_room(room_id))
        self.assertEqual(len(expected_event_ids), len(r))
        for position, expected_event_id in enumerate(expected_event_ids):
            self.assertEqual(expected_event_id, r[position])

    def test_get_rooms_with_many_extremities(self) -> None:
        """Check `get_rooms_with_many_extremities` against three rooms that
        each have twenty forward extremities, exercising the room filter and
        the limit.
        """
        room1 = "#room1"
        room2 = "#room2"
        room3 = "#room3"

        def insert_event(txn: LoggingTransaction, i: int, room_id: str) -> None:
            event_id = "$event_%i:local" % i

            # We need to insert into events table to get around the foreign key constraint.
            self.store.db_pool.simple_insert_txn(
                txn,
                table="events",
                values={
                    "instance_name": "master",
                    "stream_ordering": self.store._stream_id_gen.get_next_txn(txn),
                    "topological_ordering": 1,
                    "depth": 1,
                    "event_id": event_id,
                    "room_id": room_id,
                    "type": EventTypes.Message,
                    "processed": True,
                    "outlier": False,
                    "origin_server_ts": 0,
                    "received_ts": 0,
                    "sender": "@user:local",
                    "contains_url": False,
                    "state_key": None,
                    "rejection_reason": None,
                },
            )

            txn.execute(
                (
                    "INSERT INTO event_forward_extremities (room_id, event_id) "
                    "VALUES (?, ?)"
                ),
                (room_id, event_id),
            )

        # Offset the event numbers per room so that event IDs never collide.
        for i in range(20):
            self.get_success(
                self.store.db_pool.runInteraction("insert", insert_event, i, room1)
            )
            self.get_success(
                self.store.db_pool.runInteraction(
                    "insert", insert_event, i + 100, room2
                )
            )
            self.get_success(
                self.store.db_pool.runInteraction(
                    "insert", insert_event, i + 200, room3
                )
            )

        # Test simple case
        r = self.get_success(self.store.get_rooms_with_many_extremities(5, 5, []))
        self.assertEqual(len(r), 3)

        # Does filter work?

        # `assertCountEqual` checks "exactly room2 and room3, in any order" and
        # prints the actual result on failure, unlike `assertTrue(x in r)`.
        r = self.get_success(self.store.get_rooms_with_many_extremities(5, 5, [room1]))
        self.assertCountEqual(r, [room2, room3])

        r = self.get_success(
            self.store.get_rooms_with_many_extremities(5, 5, [room1, room2])
        )
        self.assertEqual(r, [room3])

        # Does filter and limit work?

        # Either of the two remaining rooms is an acceptable single result.
        r = self.get_success(self.store.get_rooms_with_many_extremities(5, 1, [room1]))
        self.assertIn(r, ([room2], [room3]))

    def _setup_auth_chain(self, use_chain_cover_index: bool) -> str:
        """Create a room containing the events of `AUTH_GRAPH`.

        Args:
            use_chain_cover_index: Value stored in the room's
                `has_auth_chain_index` column before the events are persisted.

        Returns:
            The ID of the room that was created.
        """
        room_id = "@ROOM:local"

        # Mark the room as maybe having a cover index.
        room_row = {
            "room_id": room_id,
            "creator": "room_creator_user_id",
            "is_public": True,
            "room_version": "6",
            "has_auth_chain_index": use_chain_cover_index,
        }

        def store_room(txn: LoggingTransaction) -> None:
            self.store.db_pool.simple_insert_txn(txn, "rooms", room_row)

        self.get_success(self.store.db_pool.runInteraction("store_room", store_room))

        # We rudely fiddle with the appropriate tables directly, as that's much
        # easier than constructing events properly.

        def insert_event(txn: LoggingTransaction) -> None:
            # Stream orderings are handed out from 1, in `AUTH_GRAPH` order.
            for stream_ordering, event_id in enumerate(AUTH_GRAPH, start=1):
                depth = DEPTH_GRAPH[event_id]

                self.store.db_pool.simple_insert_txn(
                    txn,
                    table="events",
                    values={
                        "event_id": event_id,
                        "room_id": room_id,
                        "depth": depth,
                        "topological_ordering": depth,
                        "type": "m.test",
                        "processed": True,
                        "outlier": False,
                        "stream_ordering": stream_ordering,
                    },
                )

            fake_events = [
                cast(EventBase, FakeEvent(event_id, room_id, auth_event_ids))
                for event_id, auth_event_ids in AUTH_GRAPH.items()
            ]
            self.persist_events._persist_event_auth_chain_txn(txn, fake_events)

        self.get_success(self.store.db_pool.runInteraction("insert", insert_event))

        return room_id

    @parameterized.expand([(True,), (False,)])
    def test_auth_chain_ids(self, use_chain_cover_index: bool) -> None:
        """Check `get_auth_chain_ids` for single events and combinations of
        events in `AUTH_GRAPH`, with and without the chain cover index.
        """
        room_id = self._setup_auth_chain(use_chain_cover_index)

        def auth_chain_of(event_ids: List[str], **kwargs: bool) -> Collection[str]:
            """Fetch the auth chain IDs for `event_ids` in the test room."""
            return self.get_success(
                self.store.get_auth_chain_ids(room_id, event_ids, **kwargs)
            )

        # Expected chains that show up several times below.
        g_downwards = ["g", "h", "i", "j", "k"]
        f_downwards = ["f"] + g_downwards
        e_downwards = ["e"] + f_downwards

        # a and b have the same auth chain.
        self.assertCountEqual(auth_chain_of(["a"]), e_downwards)
        self.assertCountEqual(auth_chain_of(["b"]), e_downwards)
        self.assertCountEqual(auth_chain_of(["a", "b"]), e_downwards)

        self.assertCountEqual(auth_chain_of(["c"]), g_downwards)

        # d and e have the same auth chain.
        self.assertCountEqual(auth_chain_of(["d"]), f_downwards)
        self.assertCountEqual(auth_chain_of(["e"]), f_downwards)

        self.assertCountEqual(auth_chain_of(["f"]), g_downwards)

        self.assertCountEqual(auth_chain_of(["g"]), ["h", "i", "j", "k"])

        self.assertEqual(auth_chain_of(["h"]), {"k"})

        self.assertEqual(auth_chain_of(["i"]), {"j"})

        # j and k have no parents.
        self.assertEqual(auth_chain_of(["j"]), set())
        self.assertEqual(auth_chain_of(["k"]), set())

        # More complex input sequences.
        self.assertCountEqual(auth_chain_of(["b", "c", "d"]), e_downwards)

        self.assertCountEqual(auth_chain_of(["h", "i"]), ["k", "j"])

        # e gets returned even though include_given is false, but it is in the
        # auth chain of b.
        self.assertCountEqual(auth_chain_of(["b", "e"]), e_downwards)

        # Test include_given.
        self.assertCountEqual(auth_chain_of(["i"], include_given=True), ["i", "j"])

    @parameterized.expand([(True,), (False,)])
    def test_auth_difference(self, use_chain_cover_index: bool) -> None:
        """Check the auth chain difference on the `AUTH_GRAPH` room, with and
        without the chain cover index.
        """
        # Set up the room, then check that various combinations give the
        # right result.
        self.assert_auth_diff_is_expected(
            self._setup_auth_chain(use_chain_cover_index)
        )

    @parameterized.expand(
        [
            [graph_subset]
            # The helper returns a set of frozensets of strings, whose
            # iteration order changes with string hash randomisation. Sort the
            # cases so that a generated test name always refers to the same
            # subset, whichever process or run builds the class.
            for graph_subset in sorted(
                get_all_topologically_consistent_subsets(AUTH_GRAPH, AUTH_GRAPH),
                key=lambda subset: sorted(subset),
            )
        ]
    )
    def test_auth_difference_partial(self, graph_subset: Collection[str]) -> None:
        """Test that if we only have a chain cover index on a partial subset of
        the room we still get the correct auth chain difference.

        We do this by removing the chain cover index for every valid subset of the
        graph.

        Args:
            graph_subset: The event IDs whose chain cover is removed for this
                case.
        """
        room_id = self._setup_auth_chain(True)

        for event_id in graph_subset:
            # Remove chain cover from that event.
            self.get_success(
                self.store.db_pool.simple_delete(
                    table="event_auth_chains",
                    keyvalues={"event_id": event_id},
                    desc="test_auth_difference_partial_remove",
                )
            )
            # ...and record the event in the "to calculate" table instead.
            self.get_success(
                self.store.db_pool.simple_insert(
                    table="event_auth_chain_to_calculate",
                    values={
                        "event_id": event_id,
                        "room_id": room_id,
                        "type": "",
                        "state_key": "",
                    },
                    desc="test_auth_difference_partial_remove",
                )
            )

        self.assert_auth_diff_is_expected(room_id)

    def assert_auth_diff_is_expected(self, room_id: str) -> None:
        """Assert the auth chain difference returns the correct answers.

        Args:
            room_id: A room that contains the events of `AUTH_GRAPH`.
        """
        # Each case is (state sets passed in, expected auth chain difference).
        cases: List[Tuple[List[Set[str]], Set[str]]] = [
            ([{"a"}, {"b"}], {"a", "b"}),
            ([{"a"}, {"b"}, {"c"}], {"a", "b", "c", "e", "f"}),
            ([{"a", "c"}, {"b"}], {"a", "b", "c"}),
            ([{"a", "c"}, {"b", "c"}], {"a", "b"}),
            ([{"a"}, {"b"}, {"d"}], {"a", "b", "d", "e"}),
            ([{"a"}, {"b"}, {"c"}, {"d"}], {"a", "b", "c", "d", "e", "f"}),
            ([{"a"}, {"b"}, {"e"}], {"a", "b"}),
            # A single state set has nothing to differ from.
            ([{"a"}], set()),
        ]

        for state_sets, expected_difference in cases:
            difference = self.get_success(
                self.store.get_auth_chain_difference(room_id, state_sets)
            )
            self.assertSetEqual(difference, expected_difference)

    def test_auth_difference_partial_cover(self) -> None:
        """Test that we correctly handle rooms where not all events have a chain
        cover calculated. This can happen in some obscure edge cases, including
        during the background update that calculates the chain cover for old
        rooms.

        The room holds the events of the module-level `AUTH_GRAPH` (with depths
        from `DEPTH_GRAPH`); event "b" is persisted while the room is flagged as
        having no chain cover index.
        """

        room_id = "@ROOM:local"

        # We rudely fiddle with the appropriate tables directly, as that's much
        # easier than constructing events properly.

        def set_has_auth_chain_index(txn: LoggingTransaction, value: bool) -> None:
            """Flip the room's `has_auth_chain_index` flag."""
            self.store.db_pool.simple_update_txn(
                txn,
                table="rooms",
                keyvalues={"room_id": room_id},
                updatevalues={"has_auth_chain_index": value},
            )

        def insert_event(txn: LoggingTransaction) -> None:
            # First insert the room and mark it as having a chain cover.
            self.store.db_pool.simple_insert_txn(
                txn,
                "rooms",
                {
                    "room_id": room_id,
                    "creator": "room_creator_user_id",
                    "is_public": True,
                    "room_version": "6",
                    "has_auth_chain_index": True,
                },
            )

            # Stream orderings are handed out from 1, in `AUTH_GRAPH` order.
            for stream_ordering, event_id in enumerate(AUTH_GRAPH, start=1):
                depth = DEPTH_GRAPH[event_id]

                self.store.db_pool.simple_insert_txn(
                    txn,
                    table="events",
                    values={
                        "event_id": event_id,
                        "room_id": room_id,
                        "depth": depth,
                        "topological_ordering": depth,
                        "type": "m.test",
                        "processed": True,
                        "outlier": False,
                        "stream_ordering": stream_ordering,
                    },
                )

            # Insert all events apart from 'B'
            self.persist_events._persist_event_auth_chain_txn(
                txn,
                [
                    cast(EventBase, FakeEvent(event_id, room_id, auth_event_ids))
                    for event_id, auth_event_ids in AUTH_GRAPH.items()
                    if event_id != "b"
                ],
            )

            # Now we insert the event 'B' without a chain cover, by temporarily
            # pretending the room doesn't have a chain cover.
            set_has_auth_chain_index(txn, False)

            self.persist_events._persist_event_auth_chain_txn(
                txn,
                [cast(EventBase, FakeEvent("b", room_id, AUTH_GRAPH["b"]))],
            )

            set_has_auth_chain_index(txn, True)

        self.get_success(
            self.store.db_pool.runInteraction(
                "insert",
                insert_event,
            )
        )

        # Now actually test that various combinations give the right result.
        # These are the same expectations as for a fully covered room.
        self.assert_auth_diff_is_expected(room_id)

    @parameterized.expand(
        [(room_version,) for room_version in KNOWN_ROOM_VERSIONS.values()]
    )
    def test_prune_inbound_federation_queue(self, room_version: RoomVersion) -> None:
        """Test that pruning of the inbound federation queue works.

        Args:
            room_version: The room version whose event format is used for the
                staged events.
        """

        room_id = "some_room_id"
        staging_table = "federation_inbound_events_staging"
        interaction_desc = "test_prune_inbound_federation_queue"

        def prev_event_format(prev_event_id: str) -> Union[Tuple[str, dict], str]:
            """Account for differences in prev_events format across room versions"""
            if room_version.event_format != EventFormatVersions.ROOM_V1_V2:
                return prev_event_id

            # The v1/v2 event format pairs each prev event ID with a dict.
            return prev_event_id, {}

        # Build a chain of 500 staged events that each reference the previous
        # one: event N has event N - 1 as its only prev event.
        staged_rows = [
            (
                "some_origin",
                room_id,
                0,
                f"$fake_event_id_{event_number}",
                json_encoder.encode(
                    {
                        "prev_events": [
                            prev_event_format(f"$fake_event_id_{event_number - 1}")
                        ]
                    }
                ),
                "{}",
            )
            for event_number in range(1, 501)
        ]

        self.get_success(
            self.store.db_pool.simple_insert_many(
                table=staging_table,
                keys=(
                    "origin",
                    "room_id",
                    "received_ts",
                    "event_id",
                    "event_json",
                    "internal_metadata",
                ),
                values=staged_rows,
                desc=interaction_desc,
            )
        )

        # The first prune should report that it pruned something...
        first_prune = self.get_success(
            self.store.prune_staged_events_in_room(room_id, room_version)
        )
        self.assertTrue(first_prune)

        # ...after which there is nothing left for a second prune to do.
        second_prune = self.get_success(
            self.store.prune_staged_events_in_room(room_id, room_version)
        )
        self.assertFalse(second_prune)

        # Assert that we only have a single event left in the queue, and that it
        # is the last one.
        remaining = self.get_success(
            self.store.db_pool.simple_select_one_onecol(
                table=staging_table,
                keyvalues={"room_id": room_id},
                retcol="COUNT(*)",
                desc=interaction_desc,
            )
        )
        self.assertEqual(remaining, 1)

        next_staged_event_info = self.get_success(
            self.store.get_next_staged_event_id_for_room(room_id)
        )
        assert next_staged_event_info
        _, event_id = next_staged_event_info
        self.assertEqual(event_id, "$fake_event_id_500")

    def _setup_room_for_backfill_tests(self) -> _BackfillSetupInfo:
        """
        Sets up a room with various events and backward extremities to test
        backfill functions against.

        Only events "5", "4", "B", "3" and "A" are persisted. Every prev event
        of those that is not itself persisted is recorded as a backward
        extremity.

        Returns:
            _BackfillSetupInfo including the `room_id` to test against and
            `depth_map` of events in the room
        """
        room_id = "!backfill-room-test:some-host"

        # The silly graph we use to test grabbing backward extremities,
        # where the top is the oldest events.
        #    1 (oldest)
        #    |
        #    2 ⹁
        #    |  \
        #    |   [b1, b2, b3]
        #    |   |
        #    |   A
        #    |  /
        #    3 {
        #    |  \
        #    |   [b4, b5, b6]
        #    |   |
        #    |   B
        #    |  /
        #    4 ´
        #    |
        #    5 (newest)

        # Maps event ID -> IDs of its prev events.
        event_graph: Dict[str, List[str]] = {
            "1": [],
            "2": ["1"],
            "3": ["2", "A"],
            "4": ["3", "B"],
            "5": ["4"],
            "A": ["b1", "b2", "b3"],
            "b1": ["2"],
            "b2": ["2"],
            "b3": ["2"],
            "B": ["b4", "b5", "b6"],
            "b4": ["3"],
            "b5": ["3"],
            "b6": ["3"],
        }

        depth_map: Dict[str, int] = {
            "1": 1,
            "2": 2,
            "b1": 3,
            "b2": 3,
            "b3": 3,
            "A": 4,
            "3": 5,
            "b4": 6,
            "b5": 6,
            "b6": 6,
            "B": 7,
            "4": 8,
            "5": 9,
        }

        # The events we have persisted on our server.
        # The rest are events in the room but not backfilled yet.
        our_server_events = {"5", "4", "B", "3", "A"}

        # Stream orderings count up from 0 in `event_graph` order; the same
        # number is reused as the origin server timestamp.
        complete_event_dict_map: Dict[str, JsonDict] = {
            event_id: {
                "event_id": event_id,
                "type": "test_regular_type",
                "room_id": room_id,
                "sender": "@sender",
                "prev_event_ids": prev_event_ids,
                "auth_event_ids": [],
                "origin_server_ts": stream_ordering,
                "depth": depth_map[event_id],
                "stream_ordering": stream_ordering,
                "content": {"body": "event" + event_id},
            }
            for stream_ordering, (event_id, prev_event_ids) in enumerate(
                event_graph.items()
            )
        }

        def populate_db(txn: LoggingTransaction) -> None:
            insert_row = self.store.db_pool.simple_insert_txn

            # Insert the room to satisfy the foreign key constraint of
            # `event_failed_pull_attempts`
            insert_row(
                txn,
                "rooms",
                {
                    "room_id": room_id,
                    "creator": "room_creator_user_id",
                    "is_public": True,
                    "room_version": "6",
                },
            )

            # Insert our server events
            for event_id in our_server_events:
                event_dict = complete_event_dict_map[event_id]

                insert_row(
                    txn,
                    table="events",
                    values={
                        "event_id": event_dict["event_id"],
                        "type": event_dict["type"],
                        "room_id": event_dict["room_id"],
                        "depth": event_dict["depth"],
                        "topological_ordering": event_dict["depth"],
                        "stream_ordering": event_dict["stream_ordering"],
                        "processed": True,
                        "outlier": False,
                    },
                )

            # Insert the event edges
            for event_id in our_server_events:
                for prev_event_id in event_graph[event_id]:
                    insert_row(
                        txn,
                        table="event_edges",
                        values={
                            "event_id": event_id,
                            "prev_event_id": prev_event_id,
                            "room_id": room_id,
                        },
                    )

            # Insert the backward extremities: everything our events point
            # at that we have not persisted ourselves.
            referenced_event_ids: Set[str] = set()
            for event_id in our_server_events:
                referenced_event_ids.update(
                    complete_event_dict_map[event_id]["prev_event_ids"]
                )

            for backward_extremity in referenced_event_ids - our_server_events:
                insert_row(
                    txn,
                    table="event_backward_extremities",
                    values={
                        "event_id": backward_extremity,
                        "room_id": room_id,
                    },
                )

        self.get_success(
            self.store.db_pool.runInteraction(
                "_setup_room_for_backfill_tests_populate_db",
                populate_db,
            )
        )

        return _BackfillSetupInfo(room_id=room_id, depth_map=depth_map)

    def test_get_backfill_points_in_room(self) -> None:
        """
        Test to make sure only backfill points that are older and come before
        the `current_depth` are returned.
        """
        setup_info = self._setup_room_for_backfill_tests()

        def backfill_event_ids_at(event_id: str) -> List[str]:
            """Event IDs of the backfill points found from the depth of `event_id`."""
            backfill_points = self.get_success(
                self.store.get_backfill_points_in_room(
                    setup_info.room_id, setup_info.depth_map[event_id], limit=100
                )
            )
            return [backfill_point[0] for backfill_point in backfill_points]

        # Try at "B"
        self.assertListEqual(
            backfill_event_ids_at("B"), ["b6", "b5", "b4", "2", "b3", "b2", "b1"]
        )

        # Try at "A"
        #
        # Event "2" has a depth of 2 but is not included here because we only
        # know the approximate depth of 5 from our event "3".
        self.assertListEqual(backfill_event_ids_at("A"), ["b3", "b2", "b1"])

    def test_get_backfill_points_in_room_excludes_events_we_have_attempted(
        self,
    ) -> None:
        """
        Events with a recorded failed pull attempt must not be offered as
        backfill points again while we are still within their backoff timeout.
        """
        info = self._setup_room_for_backfill_tests()

        # Record a single failed pull attempt for each of these events so that
        # `get_backfill_points_in_room` leaves them out: their backoff interval
        # has not passed yet.
        for attempted_event_id in ("b5", "b4", "b3", "b2"):
            self.get_success(
                self.store.record_event_failed_pull_attempt(
                    info.room_id, attempted_event_id, "fake cause"
                )
            )

        # The clock is deliberately not advanced: no time has passed since the
        # attempts recorded above.

        # Seen from the depth of "B"
        points_at_b = self.get_success(
            self.store.get_backfill_points_in_room(
                info.room_id, info.depth_map["B"], limit=100
            )
        )
        remaining_event_ids = [point[0] for point in points_at_b]
        # Only the backfill points without a recorded attempt are left.
        self.assertEqual(remaining_event_ids, ["b6", "2", "b1"])

    def test_get_backfill_points_in_room_attempted_event_retry_after_backoff_duration(
        self,
    ) -> None:
        """
        After one fake failed attempt on "b3" and several on "b1", each event
        should only show up as a backfill point again once its own backoff
        duration has elapsed.
        """
        info = self._setup_room_for_backfill_tests()
        room_id = info.room_id
        depth_of_a = info.depth_map["A"]

        # Record one failed attempt for "b3" followed by four for "b1". Until the
        # relevant backoff interval has passed, `get_backfill_points_in_room`
        # will leave these events out.
        for event_id, attempt_count in (("b3", 1), ("b1", 4)):
            for _ in range(attempt_count):
                self.get_success(
                    self.store.record_event_failed_pull_attempt(
                        room_id, event_id, "fake cause"
                    )
                )

        def current_backfill_event_ids() -> List[str]:
            # Backfill points as seen from the depth of "A", reduced to the
            # first element (the event ID) of each point.
            points = self.get_success(
                self.store.get_backfill_points_in_room(room_id, depth_of_a, limit=100)
            )
            return [point[0] for point in points]

        # Advance time by 2 hours. That is long enough for the single attempt on
        # "b3" (2^1 hours) but not for the four attempts on "b1", so "b1" must
        # still be missing. "b2" was never attempted, so it is visible
        # regardless.
        self.reactor.advance(datetime.timedelta(hours=2).total_seconds())
        self.assertEqual(current_backfill_event_ids(), ["b3", "b2"])

        # Advance time by a further 20 hours (above 2^4, because we made 4
        # attempts on "b1") and check that "b1" is offered again.
        self.reactor.advance(datetime.timedelta(hours=20).total_seconds())
        self.assertEqual(current_backfill_event_ids(), ["b3", "b2", "b1"])

    def test_get_backfill_points_in_room_works_after_many_failed_pull_attempts_that_could_naively_overflow(
        self,
    ) -> None:
        """
        Reproduces https://github.com/matrix-org/synapse/issues/13929 (Postgres only).

        Backfill points must still be retrievable after so many failed pull
        attempts that we back off to the limit, even when the backoff formula
        would ask us to wait for more seconds than fit in a 32 bit signed int.
        """
        info = self._setup_room_for_backfill_tests()

        # Pretend that we have tried and failed 10 times to backfill event b1.
        failed_attempts = 10
        for _ in range(failed_attempts):
            self.get_success(
                self.store.record_event_failed_pull_attempt(
                    info.room_id, "b1", "fake cause"
                )
            )

        # If the backoff periods grow without limit:
        #  - after the first failed attempt we would back off for 1 << 1 = 2 hours,
        #  - after the second for 1 << 2 = 4 hours,
        #  - ... and after the 10th for 1 << 10 == 1024 hours.
        # Wait 1100 hours just so we have a nice round number.
        wait = datetime.timedelta(hours=1100)
        self.reactor.advance(wait.total_seconds())

        # 1024 hours in milliseconds is 1024 * 3600000, which exceeds the largest
        # 32 bit signed integer. The bug being reproduced is that this overflow
        # causes an error in postgres, preventing us from fetching a set of
        # backwards extremities to retry fetching.
        points_at_a = self.get_success(
            self.store.get_backfill_points_in_room(
                info.room_id, info.depth_map["A"], limit=100
            )
        )

        # Every backfill point should be offered: b1's latest backoff period has
        # expired, and the others were never attempted.
        self.assertEqual([point[0] for point in points_at_a], ["b3", "b2", "b1"])

    def test_get_event_ids_with_failed_pull_attempts(self) -> None:
        """
        Of the event IDs we ask about, only those with a recorded failed pull
        attempt should be returned.
        """
        # Create the room
        alice = self.register_user("alice", "test")
        alice_token = self.login("alice", "test")
        room_id = self.helper.create_room_as(room_creator=alice, tok=alice_token)

        # Record a failed pull attempt for two of the four events queried below.
        for failed_event_id in ("$failed_event_id1", "$failed_event_id2"):
            self.get_success(
                self.store.record_event_failed_pull_attempt(
                    room_id, failed_event_id, "fake cause"
                )
            )

        # Query a mix of events with and without recorded failures.
        queried_event_ids = [
            "$failed_event_id1",
            "$fresh_event_id1",
            "$failed_event_id2",
            "$fresh_event_id2",
        ]
        found = self.get_success(
            self.store.get_event_ids_with_failed_pull_attempts(
                event_ids=queried_event_ids
            )
        )

        self.assertEqual(found, {"$failed_event_id1", "$failed_event_id2"})

    def test_get_event_ids_to_not_pull_from_backoff(self) -> None:
        """
        Only the event IDs that we should currently back off from are returned.
        """
        # Create the room
        alice = self.register_user("alice", "test")
        alice_token = self.login("alice", "test")
        room_id = self.helper.create_room_as(room_creator=alice, tok=alice_token)

        # Note the clock reading just before recording the failure; the expected
        # value below is computed relative to it.
        failure_time = self.clock.time_msec()
        self.get_success(
            self.store.record_event_failed_pull_attempt(
                room_id, "$failed_event_id", "fake cause"
            )
        )

        backoff_by_event_id = self.get_success(
            self.store.get_event_ids_to_not_pull_from_backoff(
                room_id=room_id, event_ids=["$failed_event_id", "$normal_event_id"]
            )
        )

        # We expect a 2^1 hour backoff after a single failed attempt.
        two_hours_ms = 2 * 60 * 60 * 1000
        self.assertEqual(
            backoff_by_event_id,
            {"$failed_event_id": failure_time + two_hours_ms},
        )

    def test_get_event_ids_to_not_pull_from_backoff_retry_after_backoff_duration(
        self,
    ) -> None:
        """
        Once the backoff duration has elapsed, no event IDs should be returned.
        """
        # Create the room
        alice = self.register_user("alice", "test")
        alice_token = self.login("alice", "test")
        room_id = self.helper.create_room_as(room_creator=alice, tok=alice_token)

        self.get_success(
            self.store.record_event_failed_pull_attempt(
                room_id, "$failed_event_id", "fake cause"
            )
        )

        # Advance time by 2 hours, which is long enough for the single failed
        # attempt (2^1 hours).
        backoff_duration = datetime.timedelta(hours=2)
        self.reactor.advance(backoff_duration.total_seconds())

        backoff_by_event_id = self.get_success(
            self.store.get_event_ids_to_not_pull_from_backoff(
                room_id=room_id, event_ids=["$failed_event_id", "$normal_event_id"]
            )
        )
        # This function only returns events we should back off from. Time has
        # moved past the backoff range, so there are no such events.
        self.assertEqual(backoff_by_event_id, {})


@attr.s(auto_attribs=True)
class FakeEvent:
    """
    Bare-bones stand-in for an event: carries an event ID, a room ID and a list
    of auth event IDs, plus a few fixed class-level attributes.

    NOTE(review): presumably passed to storage code by tests in this file in
    place of a real event — confirm against the callers.
    """

    # The annotated attributes are the attrs fields, in this order.
    event_id: str
    room_id: str
    auth_events: List[str]

    # Not annotated, so with `auto_attribs=True` these are ordinary class
    # attributes rather than attrs fields: every instance sees the same values.
    type = "foo"
    state_key = "foo"

    # A single metadata object, created once when the class body runs and
    # therefore shared by all instances.
    internal_metadata = EventInternalMetadata({})

    def auth_event_ids(self) -> List[str]:
        """Return this event's `auth_events` list as-is (no copy is made)."""
        return self.auth_events

    def is_state(self) -> bool:
        """Always report this fake event as a state event."""
        return True
-												Avoid creating events with huge numbers of prev_events

In most cases, we limit the number of prev_events for a given event to 10
events. This fixes a particular code path which created events with huge
numbers of prev_events.

											
										
										
											2018-04-16 19:41:37 +02:00
+								#
-												Update license headers

											
										
										
											2023-11-21 21:29:58 +01:00
+								# This file is licensed under the Affero General Public License (AGPL) version 3.
 								#
 								# Copyright (C) 2023 New Vector, Ltd
 								#
 								# This program is free software: you can redistribute it and/or modify
 								# it under the terms of the GNU Affero General Public License as
 								# published by the Free Software Foundation, either version 3 of the
 								# License, or (at your option) any later version.
 								#
 								# See the GNU Affero General Public License for more details:
 								# <https://www.gnu.org/licenses/agpl-3.0.html>.
 								#
 								# Originally licensed under the Apache License, Version 2.0:
 								# <http://www.apache.org/licenses/LICENSE-2.0>.
 								#
 								# [This file includes modifications made by New Vector Limited]
-												Avoid creating events with huge numbers of prev_events

In most cases, we limit the number of prev_events for a given event to 10
events. This fixes a particular code path which created events with huge
numbers of prev_events.

											
										
										
											2018-04-16 19:41:37 +02:00
+								#
 								#
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								import datetime
-												Speed up state res in rare case we don't have all events (#16116)

If we don't have all the auth events in a room then not all state events will have a chain cover index. Even so, we can still use the chain cover index on the events that do have it, rather than bailing and using the slower functions.

This situation should not arise for newly persisted rooms, as we check we have the full auth chain for each event, but can happen for existing rooms.

c.f. #15245
											
										
										
											2023-08-18 16:32:06 +02:00
+								from typing import (
 								    Collection,
 								    Dict,
 								    FrozenSet,
 								    Iterable,
 								    List,
 								    Mapping,
 								    Set,
 								    Tuple,
 								    TypeVar,
 								    Union,
 								    cast,
 								)
-												Fix logic for dropping old events in fed queue (#11806)

Co-authored-by: Brendan Abolivier <babolivier@matrix.org>
Co-authored-by: Richard van der Hoff <richard@matrix.org>
											
										
										
											2022-01-24 13:20:01 +01:00
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								import attr
 								from parameterized import parameterized
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								from twisted.test.proto_helpers import MemoryReactor
-												Add foreign key constraint to `event_forward_extremities`. (#15751)


											
										
										
											2023-07-05 11:43:19 +02:00
+								from synapse.api.constants import EventTypes
-												Fix logic for dropping old events in fed queue (#11806)

Co-authored-by: Brendan Abolivier <babolivier@matrix.org>
Co-authored-by: Richard van der Hoff <richard@matrix.org>
											
										
										
											2022-01-24 13:20:01 +01:00
+								from synapse.api.room_versions import (
 								    KNOWN_ROOM_VERSIONS,
 								    EventFormatVersions,
 								    RoomVersion,
 								)
-												Port `EventInternalMetadata` class to Rust (#16782)

There are a couple of things we need to be careful of here:

1. The current python code does no validation when loading from the DB,
so we need to be careful to ignore such errors (at least on jki.re there
are some old events with internal metadata fields of the wrong type).
2. We want to be memory efficient, as we often have many hundreds of
thousands of events in the cache at a time.

---------

Co-authored-by: Quentin Gliech <quenting@element.io>
											
										
										
											2024-01-08 15:06:48 +01:00
+								from synapse.events import EventBase
-												Stop getting missing `prev_events` after we already know their signature is invalid (#13816)

While https://github.com/matrix-org/synapse/pull/13635 stops us from doing the slow thing after we've already done it once, this PR stops us from doing one of the slow things in the first place.

Related to
 - https://github.com/matrix-org/synapse/issues/13622
    - https://github.com/matrix-org/synapse/pull/13635
 - https://github.com/matrix-org/synapse/issues/13676

Part of https://github.com/matrix-org/synapse/issues/13356

Follow-up to https://github.com/matrix-org/synapse/pull/13815 which tracks event signature failures.

With this PR, we avoid the call to the costly `_get_state_ids_after_missing_prev_event` because the signature failure will count as an attempt before and we filter events based on the backoff before calling `_get_state_ids_after_missing_prev_event` now.

For example, this will save us 156s out of the 185s total that this `matrix.org` `/messages` request takes. If you want to see the full Jaeger trace of this, you can drag and drop this `trace.json` into your own Jaeger, https://gist.github.com/MadLittleMods/4b12d0d0afe88c2f65ffcc907306b761

To explain this exact scenario around `/messages` -> backfill, we call `/backfill` and first check the signatures of the 100 events. We see bad signature for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` and `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` (both member events). Then we process the 98 events remaining that have valid signatures but one of the events references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event`. So we have to do the whole `_get_state_ids_after_missing_prev_event` rigmarole which pulls in those same events which fail again because the signatures are still invalid.

 - `backfill`
    - `outgoing-federation-request` `/backfill`
    - `_check_sigs_and_hash_and_fetch`
       - `_check_sigs_and_hash_and_fetch_one` for each event received over backfill
          - ❗ `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
          - ❗ `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
   - `_process_pulled_events`
      - `_process_pulled_event` for each validated event
         - ❗ Event `$Q0iMdqtz3IJYfZQU2Xk2WjB5NDF8Gg8cFSYYyKQgKJ0` references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event` which is missing so we try to get it
            - `_get_state_ids_after_missing_prev_event`
               - `outgoing-federation-request` `/state_ids`
               - ❗ `get_pdu` for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` which fails the signature check again
               - ❗ `get_pdu` for `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` which fails the signature check

											
										
										
											2022-10-15 07:36:49 +02:00
+								from synapse.rest import admin
 								from synapse.rest.client import login, room
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								from synapse.server import HomeServer
 								from synapse.storage.database import LoggingTransaction
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								from synapse.storage.types import Cursor
-												Port `EventInternalMetadata` class to Rust (#16782)

There are a couple of things we need to be careful of here:

1. The current python code does no validation when loading from the DB,
so we need to be careful to ignore such errors (at least on jki.re there
are some old events with internal metadata fields of the wrong type).
2. We want to be memory efficient, as we often have many hundreds of
thousands of events in the cache at a time.

---------

Co-authored-by: Quentin Gliech <quenting@element.io>
											
										
										
											2024-01-08 15:06:48 +01:00
+								from synapse.synapse_rust.events import EventInternalMetadata
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								from synapse.types import JsonDict
 								from synapse.util import Clock, json_encoder
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
-												Avoid creating events with huge numbers of prev_events

In most cases, we limit the number of prev_events for a given event to 10
events. This fixes a particular code path which created events with huge
numbers of prev_events.

											
										
										
											2018-04-16 19:41:37 +02:00
+								import tests.unittest
 								import tests.utils
-												Speed up state res in rare case we don't have all events (#16116)

If we don't have all the auth events in a room then not all state events will have a chain cover index. Even so, we can still use the chain cover index on the events that do have it, rather than bailing and using the slower functions.

This situation should not arise for newly persisted rooms, as we check we have the full auth chain for each event, but can happen for existing rooms.

c.f. #15245
											
										
										
											2023-08-18 16:32:06 +02:00
+								# The silly auth graph we use to test the auth difference algorithm,
 								# where the top are the most recent events.
 								#
 								#   A   B
 								#    \ /
 								#  D  E
 								#  \  |
 								#   ` F   C
 								#     |  /|
 								#     G ´ |
 								#     | \ |
 								#     H   I
 								#     |   |
 								#     K   J
 								AUTH_GRAPH: Dict[str, List[str]] = {
 								    "a": ["e"],
 								    "b": ["e"],
 								    "c": ["g", "i"],
 								    "d": ["f"],
 								    "e": ["f"],
 								    "f": ["g"],
 								    "g": ["h", "i"],
 								    "h": ["k"],
 								    "i": ["j"],
 								    "k": [],
 								    "j": [],
 								}
 								DEPTH_GRAPH = {
 								    "a": 7,
 								    "b": 7,
 								    "c": 4,
 								    "d": 6,
 								    "e": 6,
 								    "f": 5,
 								    "g": 3,
 								    "h": 2,
 								    "i": 2,
 								    "k": 1,
 								    "j": 1,
 								}
 								T = TypeVar("T")
 								def get_all_topologically_sorted_orders(
 								    nodes: Iterable[T],
 								    graph: Mapping[T, Collection[T]],
 								) -> List[List[T]]:
 								    """Given a set of nodes and a graph, return all possible topological
 								    orderings.
 								    """
 								    # This is implemented by Kahn's algorithm, and forking execution each time
 								    # we have a choice over which node to consider next.
 								    degree_map = {node: 0 for node in nodes}
 								    reverse_graph: Dict[T, Set[T]] = {}
 								    for node, edges in graph.items():
 								        if node not in degree_map:
 								            continue
 								        for edge in set(edges):
 								            if edge in degree_map:
 								                degree_map[node] += 1
 								            reverse_graph.setdefault(edge, set()).add(node)
 								        reverse_graph.setdefault(node, set())
 								    zero_degree = [node for node, degree in degree_map.items() if degree == 0]
 								    return _get_all_topologically_sorted_orders_inner(
 								        reverse_graph, zero_degree, degree_map
 								    )
 								def _get_all_topologically_sorted_orders_inner(
 								    reverse_graph: Dict[T, Set[T]],
 								    zero_degree: List[T],
 								    degree_map: Dict[T, int],
 								) -> List[List[T]]:
 								    new_paths = []
 								    # Rather than only choosing *one* item from the list of nodes with zero
 								    # degree, we "fork" execution and run the algorithm for each node in the
 								    # zero degree.
 								    for node in zero_degree:
 								        new_degree_map = degree_map.copy()
 								        new_zero_degree = zero_degree.copy()
 								        new_zero_degree.remove(node)
 								        for edge in reverse_graph.get(node, []):
 								            if edge in new_degree_map:
 								                new_degree_map[edge] -= 1
 								                if new_degree_map[edge] == 0:
 								                    new_zero_degree.append(edge)
 								        paths = _get_all_topologically_sorted_orders_inner(
 								            reverse_graph, new_zero_degree, new_degree_map
 								        )
 								        for path in paths:
 								            path.insert(0, node)
 								        new_paths.extend(paths)
 								    if not new_paths:
 								        return [[]]
 								    return new_paths
 								def get_all_topologically_consistent_subsets(
 								    nodes: Iterable[T],
 								    graph: Mapping[T, Collection[T]],
 								) -> Set[FrozenSet[T]]:
 								    """Get all subsets of the graph where if node N is in the subgraph, then all
 								    nodes that can reach that node (i.e. for all X there exists a path X -> N)
 								    are in the subgraph.
 								    """
 								    all_topological_orderings = get_all_topologically_sorted_orders(nodes, graph)
 								    graph_subsets = set()
 								    for ordering in all_topological_orderings:
 								        ordering.reverse()
 								        for idx in range(len(ordering)):
 								            graph_subsets.add(frozenset(ordering[:idx]))
 								    return graph_subsets
-												Avoid creating events with huge numbers of prev_events

In most cases, we limit the number of prev_events for a given event to 10
events. This fixes a particular code path which created events with huge
numbers of prev_events.

											
										
										
											2018-04-16 19:41:37 +02:00
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								@attr.s(auto_attribs=True, frozen=True, slots=True)
 								class _BackfillSetupInfo:
 								    room_id: str
 								    depth_map: Dict[str, int]
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								class EventFederationWorkerStoreTestCase(tests.unittest.HomeserverTestCase):
-												Stop getting missing `prev_events` after we already know their signature is invalid (#13816)

While https://github.com/matrix-org/synapse/pull/13635 stops us from doing the slow thing after we've already done it once, this PR stops us from doing one of the slow things in the first place.

Related to
 - https://github.com/matrix-org/synapse/issues/13622
    - https://github.com/matrix-org/synapse/pull/13635
 - https://github.com/matrix-org/synapse/issues/13676

Part of https://github.com/matrix-org/synapse/issues/13356

Follow-up to https://github.com/matrix-org/synapse/pull/13815 which tracks event signature failures.

With this PR, we avoid the call to the costly `_get_state_ids_after_missing_prev_event` because the signature failure will count as an attempt before and we filter events based on the backoff before calling `_get_state_ids_after_missing_prev_event` now.

For example, this will save us 156s out of the 185s total that this `matrix.org` `/messages` request takes. If you want to see the full Jaeger trace of this, you can drag and drop this `trace.json` into your own Jaeger, https://gist.github.com/MadLittleMods/4b12d0d0afe88c2f65ffcc907306b761

To explain this exact scenario around `/messages` -> backfill, we call `/backfill` and first check the signatures of the 100 events. We see bad signature for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` and `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` (both member events). Then we process the 98 events remaining that have valid signatures but one of the events references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event`. So we have to do the whole `_get_state_ids_after_missing_prev_event` rigmarole which pulls in those same events which fail again because the signatures are still invalid.

 - `backfill`
    - `outgoing-federation-request` `/backfill`
    - `_check_sigs_and_hash_and_fetch`
       - `_check_sigs_and_hash_and_fetch_one` for each event received over backfill
          - ❗ `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
          - ❗ `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
   - `_process_pulled_events`
      - `_process_pulled_event` for each validated event
         - ❗ Event `$Q0iMdqtz3IJYfZQU2Xk2WjB5NDF8Gg8cFSYYyKQgKJ0` references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event` which is missing so we try to get it
            - `_get_state_ids_after_missing_prev_event`
               - `outgoing-federation-request` `/state_ids`
               - ❗ `get_pdu` for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` which fails the signature check again
               - ❗ `get_pdu` for `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` which fails the signature check

											
										
										
											2022-10-15 07:36:49 +02:00
+								    servlets = [
 								        admin.register_servlets,
 								        room.register_servlets,
 								        login.register_servlets,
 								    ]
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								    def prepare(self, reactor: MemoryReactor, clock: Clock, hs: HomeServer) -> None:
-												Remove `HomeServer.get_datastore()` (#12031)

This method was confusing, and was mostly kept for backwards
compatibility. Let's get rid of it.

Part of #11733

											
										
										
											2022-02-23 12:04:02 +01:00
+								        self.store = hs.get_datastores().main
-												Add final type hint to tests.unittest. (#15072)

Adds a return type to HomeServerTestCase.make_homeserver and deals
with any variables which are no longer Any.
											
										
										
											2023-02-14 20:03:35 +01:00
+								        persist_events = hs.get_datastores().persist_events
 								        assert persist_events is not None
 								        self.persist_events = persist_events
-												Avoid creating events with huge numbers of prev_events

In most cases, we limit the number of prev_events for a given event to 10
events. This fixes a particular code path which created events with huge
numbers of prev_events.

											
										
										
											2018-04-16 19:41:37 +02:00
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								    def test_get_prev_events_for_room(self) -> None:
-												Avoid creating events with huge numbers of prev_events

In most cases, we limit the number of prev_events for a given event to 10
events. This fixes a particular code path which created events with huge
numbers of prev_events.

											
										
										
											2018-04-16 19:41:37 +02:00
+								        room_id = "@ROOM:local"
 								        # add a bunch of events and hashes to act as forward extremities
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								        def insert_event(txn: Cursor, i: int) -> None:
-												Avoid creating events with huge numbers of prev_events

In most cases, we limit the number of prev_events for a given event to 10
events. This fixes a particular code path which created events with huge
numbers of prev_events.

											
										
										
											2018-04-16 19:41:37 +02:00
+								            event_id = "$event_%i:local" % i
 								            txn.execute(
-												Run black.

											
										
										
											2018-08-10 15:54:09 +02:00
+								                (
-												Avoid creating events with huge numbers of prev_events

In most cases, we limit the number of prev_events for a given event to 10
events. This fixes a particular code path which created events with huge
numbers of prev_events.

											
										
										
											2018-04-16 19:41:37 +02:00
+								                    "INSERT INTO events ("
 								                    "   room_id, event_id, type, depth, topological_ordering,"
-												Fix tests on postgresql (#3740)


											
										
										
											2018-09-03 18:21:48 +02:00
+								                    "   content, processed, outlier, stream_ordering) "
 								                    "VALUES (?, ?, 'm.test', ?, ?, 'test', ?, ?, ?)"
-												Avoid creating events with huge numbers of prev_events

In most cases, we limit the number of prev_events for a given event to 10
events. This fixes a particular code path which created events with huge
numbers of prev_events.

											
										
										
											2018-04-16 19:41:37 +02:00
+								                ),
-												Fix tests on postgresql (#3740)


											
										
										
											2018-09-03 18:21:48 +02:00
+								                (room_id, event_id, i, i, True, False, i),
-												Avoid creating events with huge numbers of prev_events

In most cases, we limit the number of prev_events for a given event to 10
events. This fixes a particular code path which created events with huge
numbers of prev_events.

											
										
										
											2018-04-16 19:41:37 +02:00
+								            )
 								            txn.execute(
-												Run black.

											
										
										
											2018-08-10 15:54:09 +02:00
+								                (
-												Avoid creating events with huge numbers of prev_events

In most cases, we limit the number of prev_events for a given event to 10
events. This fixes a particular code path which created events with huge
numbers of prev_events.

											
										
										
											2018-04-16 19:41:37 +02:00
+								                    "INSERT INTO event_forward_extremities (room_id, event_id) "
 								                    "VALUES (?, ?)"
 								                ),
 								                (room_id, event_id),
 								            )
-												Update ruff config (#16283)

Enable additional checks & clean-up unneeded configuration.
											
										
										
											2023-09-08 17:24:36 +02:00
+								        for i in range(20):
-												Rename database classes to make some sense (#8033)


											
										
										
											2020-08-05 22:38:57 +02:00
+								            self.get_success(
 								                self.store.db_pool.runInteraction("insert", insert_event, i)
 								            )
-												Avoid creating events with huge numbers of prev_events

In most cases, we limit the number of prev_events for a given event to 10
events. This fixes a particular code path which created events with huge
numbers of prev_events.

											
										
										
											2018-04-16 19:41:37 +02:00
-												Remove unused get_prev_events_and_hashes_for_room

											
										
										
											2020-01-03 17:30:51 +01:00
+								        # this should get the last ten
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try to fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								        r = self.get_success(self.store.get_prev_events_for_room(room_id))
-												Avoid creating events with huge numbers of prev_events

In most cases, we limit the number of prev_events for a given event to 10
events. This fixes a particular code path which created events with huge
numbers of prev_events.

											
										
										
											2018-04-16 19:41:37 +02:00
+								        self.assertEqual(10, len(r))
-												Update ruff config (#16283)

Enable additional checks & clean-up unneeded configuration.
											
										
										
											2023-09-08 17:24:36 +02:00
+								        for i in range(10):
-												Remove unused get_prev_events_and_hashes_for_room

											
										
										
											2020-01-03 17:30:51 +01:00
+								            self.assertEqual("$event_%i:local" % (19 - i), r[i])
-												Fix dummy event insertion consent bug (#6053)

Fixes #5905
											
										
										
											2019-09-26 12:47:53 +02:00
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								    def test_get_rooms_with_many_extremities(self) -> None:
-												Fix dummy event insertion consent bug (#6053)

Fixes #5905
											
										
										
											2019-09-26 12:47:53 +02:00
+								        room1 = "#room1"
 								        room2 = "#room2"
 								        room3 = "#room3"
-												Add foreign key constraint to `event_forward_extremities`. (#15751)


											
										
										
											2023-07-05 11:43:19 +02:00
+								        def insert_event(txn: LoggingTransaction, i: int, room_id: str) -> None:
-												Fix dummy event insertion consent bug (#6053)

Fixes #5905
											
										
										
											2019-09-26 12:47:53 +02:00
+								            event_id = "$event_%i:local" % i
-												Add foreign key constraint to `event_forward_extremities`. (#15751)


											
										
										
											2023-07-05 11:43:19 +02:00
 								            # We need to insert into events table to get around the foreign key constraint.
 								            self.store.db_pool.simple_insert_txn(
 								                txn,
 								                table="events",
 								                values={
 								                    "instance_name": "master",
 								                    "stream_ordering": self.store._stream_id_gen.get_next_txn(txn),
 								                    "topological_ordering": 1,
 								                    "depth": 1,
 								                    "event_id": event_id,
 								                    "room_id": room_id,
 								                    "type": EventTypes.Message,
 								                    "processed": True,
 								                    "outlier": False,
 								                    "origin_server_ts": 0,
 								                    "received_ts": 0,
 								                    "sender": "@user:local",
 								                    "contains_url": False,
 								                    "state_key": None,
 								                    "rejection_reason": None,
 								                },
 								            )
-												Fix dummy event insertion consent bug (#6053)

Fixes #5905
											
										
										
											2019-09-26 12:47:53 +02:00
+								            txn.execute(
 								                (
 								                    "INSERT INTO event_forward_extremities (room_id, event_id) "
 								                    "VALUES (?, ?)"
 								                ),
 								                (room_id, event_id),
 								            )
-												Update ruff config (#16283)

Enable additional checks & clean-up unneeded configuration.
											
										
										
											2023-09-08 17:24:36 +02:00
+								        for i in range(20):
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try to fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								            self.get_success(
-												Rename database classes to make some sense (#8033)


											
										
										
											2020-08-05 22:38:57 +02:00
+								                self.store.db_pool.runInteraction("insert", insert_event, i, room1)
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try to fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								            )
 								            self.get_success(
-												Add foreign key constraint to `event_forward_extremities`. (#15751)


											
										
										
											2023-07-05 11:43:19 +02:00
+								                self.store.db_pool.runInteraction(
 								                    "insert", insert_event, i + 100, room2
 								                )
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try to fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								            )
 								            self.get_success(
-												Add foreign key constraint to `event_forward_extremities`. (#15751)


											
										
										
											2023-07-05 11:43:19 +02:00
+								                self.store.db_pool.runInteraction(
 								                    "insert", insert_event, i + 200, room3
 								                )
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try to fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								            )
-												Fix dummy event insertion consent bug (#6053)

Fixes #5905
											
										
										
											2019-09-26 12:47:53 +02:00
 								        # Test simple case
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try to fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								        r = self.get_success(self.store.get_rooms_with_many_extremities(5, 5, []))
-												Fix dummy event insertion consent bug (#6053)

Fixes #5905
											
										
										
											2019-09-26 12:47:53 +02:00
+								        self.assertEqual(len(r), 3)
 								        # Does filter work?
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try to fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								        r = self.get_success(self.store.get_rooms_with_many_extremities(5, 5, [room1]))
-												Fix dummy event insertion consent bug (#6053)

Fixes #5905
											
										
										
											2019-09-26 12:47:53 +02:00
+								        self.assertTrue(room2 in r)
 								        self.assertTrue(room3 in r)
 								        self.assertEqual(len(r), 2)
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try to fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								        r = self.get_success(
 								            self.store.get_rooms_with_many_extremities(5, 5, [room1, room2])
 								        )
-												Fix dummy event insertion consent bug (#6053)

Fixes #5905
											
										
										
											2019-09-26 12:47:53 +02:00
+								        self.assertEqual(r, [room3])
 								        # Does filter and limit work?
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try to fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								        r = self.get_success(self.store.get_rooms_with_many_extremities(5, 1, [room1]))
-												Fix dummy event insertion consent bug (#6053)

Fixes #5905
											
										
										
											2019-09-26 12:47:53 +02:00
+								        self.assertTrue(r == [room2] or r == [room3])
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try to fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
-												Use the chain cover index in get_auth_chain_ids. (#9576)

This uses a simplified version of get_chain_cover_difference to calculate
auth chain of events.
											
										
										
											2021-03-10 15:57:59 +01:00
+								    def _setup_auth_chain(self, use_chain_cover_index: bool) -> str:
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try to fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								        room_id = "@ROOM:local"
-												Use the chain cover index in get_auth_chain_ids. (#9576)

This uses a simplified version of get_chain_cover_difference to calculate
auth chain of events.
											
										
										
											2021-03-10 15:57:59 +01:00
+								        # Mark the room as maybe having a cover index.
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								        def store_room(txn: LoggingTransaction) -> None:
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								            self.store.db_pool.simple_insert_txn(
 								                txn,
 								                "rooms",
 								                {
 								                    "room_id": room_id,
 								                    "creator": "room_creator_user_id",
 								                    "is_public": True,
 								                    "room_version": "6",
 								                    "has_auth_chain_index": use_chain_cover_index,
 								                },
 								            )
 								        self.get_success(self.store.db_pool.runInteraction("store_room", store_room))
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try to fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								        # We rudely fiddle with the appropriate tables directly, as that's much
 								        # easier than constructing events properly.
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								        def insert_event(txn: LoggingTransaction) -> None:
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								            stream_ordering = 0
-												Speed up state res in rare case we don't have all events (#16116)

If we don't have all the auth events in a room then not all state events will have a chain cover index. Even so, we can still use the chain cover index on the events that do have it, rather than bailing and using the slower functions.

This situation should not arise for newly persisted rooms, as we check we have the full auth chain for each event, but can happen for existing rooms.

c.f. #15245
											
										
										
											2023-08-18 16:32:06 +02:00
+								            for event_id in AUTH_GRAPH:
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								                stream_ordering += 1
-												Speed up state res in rare case we don't have all events (#16116)

If we don't have all the auth events in a room then not all state events will have a chain cover index. Even so, we can still use the chain cover index on the events that do have it, rather than bailing and using the slower functions.

This situation should not arise for newly persisted rooms, as we check we have the full auth chain for each event, but can happen for existing rooms.

c.f. #15245
											
										
										
											2023-08-18 16:32:06 +02:00
+								                depth = DEPTH_GRAPH[event_id]
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
 								                self.store.db_pool.simple_insert_txn(
 								                    txn,
 								                    table="events",
 								                    values={
 								                        "event_id": event_id,
 								                        "room_id": room_id,
 								                        "depth": depth,
 								                        "topological_ordering": depth,
 								                        "type": "m.test",
 								                        "processed": True,
 								                        "outlier": False,
 								                        "stream_ordering": stream_ordering,
 								                    },
 								                )
-												Add final type hint to tests.unittest. (#15072)

Adds a return type to HomeServerTestCase.make_homeserver and deals
with any variables which are no longer Any.
											
										
										
											2023-02-14 20:03:35 +01:00
+								            self.persist_events._persist_event_auth_chain_txn(
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								                txn,
 								                [
-												Speed up state res in rare case we don't have all events (#16116)

If we don't have all the auth events in a room then not all state events will have a chain cover index. Even so, we can still use the chain cover index on the events that do have it, rather than bailing and using the slower functions.

This situation should not arise for newly persisted rooms, as we check we have the full auth chain for each event, but can happen for existing rooms.

c.f. #15245
											
										
										
											2023-08-18 16:32:06 +02:00
+								                    cast(EventBase, FakeEvent(event_id, room_id, AUTH_GRAPH[event_id]))
 								                    for event_id in AUTH_GRAPH
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								                ],
 								            )
 								        self.get_success(
 								            self.store.db_pool.runInteraction(
 								                "insert",
 								                insert_event,
 								            )
-												Update black, and run auto formatting over the codebase (#9381)

 - Update black version to the latest
 - Run black auto formatting over the codebase
    - Run autoformatting according to [`docs/code_style.md`](https://github.com/matrix-org/synapse/blob/80d6dc9783aa80886a133756028984dbf8920168/docs/code_style.md)
 - Update `code_style.md` docs around installing black to use the correct version
											
										
										
											2021-02-16 23:32:34 +01:00
+								        )
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
-												Use the chain cover index in get_auth_chain_ids. (#9576)

This uses a simplified version of get_chain_cover_difference to calculate
auth chain of events.
											
										
										
											2021-03-10 15:57:59 +01:00
+								        return room_id
 								    @parameterized.expand([(True,), (False,)])
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								    def test_auth_chain_ids(self, use_chain_cover_index: bool) -> None:
-												Use the chain cover index in get_auth_chain_ids. (#9576)

This uses a simplified version of get_chain_cover_difference to calculate
auth chain of events.
											
										
										
											2021-03-10 15:57:59 +01:00
+								        room_id = self._setup_auth_chain(use_chain_cover_index)
 								        # a and b have the same auth chain.
 								        auth_chain_ids = self.get_success(self.store.get_auth_chain_ids(room_id, ["a"]))
 								        self.assertCountEqual(auth_chain_ids, ["e", "f", "g", "h", "i", "j", "k"])
 								        auth_chain_ids = self.get_success(self.store.get_auth_chain_ids(room_id, ["b"]))
 								        self.assertCountEqual(auth_chain_ids, ["e", "f", "g", "h", "i", "j", "k"])
 								        auth_chain_ids = self.get_success(
 								            self.store.get_auth_chain_ids(room_id, ["a", "b"])
 								        )
 								        self.assertCountEqual(auth_chain_ids, ["e", "f", "g", "h", "i", "j", "k"])
 								        auth_chain_ids = self.get_success(self.store.get_auth_chain_ids(room_id, ["c"]))
 								        self.assertCountEqual(auth_chain_ids, ["g", "h", "i", "j", "k"])
 								        # d and e have the same auth chain.
 								        auth_chain_ids = self.get_success(self.store.get_auth_chain_ids(room_id, ["d"]))
 								        self.assertCountEqual(auth_chain_ids, ["f", "g", "h", "i", "j", "k"])
 								        auth_chain_ids = self.get_success(self.store.get_auth_chain_ids(room_id, ["e"]))
 								        self.assertCountEqual(auth_chain_ids, ["f", "g", "h", "i", "j", "k"])
 								        auth_chain_ids = self.get_success(self.store.get_auth_chain_ids(room_id, ["f"]))
 								        self.assertCountEqual(auth_chain_ids, ["g", "h", "i", "j", "k"])
 								        auth_chain_ids = self.get_success(self.store.get_auth_chain_ids(room_id, ["g"]))
 								        self.assertCountEqual(auth_chain_ids, ["h", "i", "j", "k"])
 								        auth_chain_ids = self.get_success(self.store.get_auth_chain_ids(room_id, ["h"]))
-												Implement MSC3706: partial state in `/send_join` response (#11967)

* Make `get_auth_chain_ids` return a Set

It has a set internally, and a set is often useful where it gets used, so let's
avoid converting to an intermediate list.

* Minor refactors in `on_send_join_request`

A little bit of non-functional groundwork

* Implement MSC3706: partial state in /send_join response
											
										
										
											2022-02-12 11:44:16 +01:00
+								        self.assertEqual(auth_chain_ids, {"k"})
-												Use the chain cover index in get_auth_chain_ids. (#9576)

This uses a simplified version of get_chain_cover_difference to calculate
auth chain of events.
											
										
										
											2021-03-10 15:57:59 +01:00
 								        auth_chain_ids = self.get_success(self.store.get_auth_chain_ids(room_id, ["i"]))
-												Implement MSC3706: partial state in `/send_join` response (#11967)

* Make `get_auth_chain_ids` return a Set

It has a set internally, and a set is often useful where it gets used, so let's
avoid converting to an intermediate list.

* Minor refactors in `on_send_join_request`

A little bit of non-functional groundwork

* Implement MSC3706: partial state in /send_join response
											
										
										
											2022-02-12 11:44:16 +01:00
+								        self.assertEqual(auth_chain_ids, {"j"})
-												Use the chain cover index in get_auth_chain_ids. (#9576)

This uses a simplified version of get_chain_cover_difference to calculate
auth chain of events.
											
										
										
											2021-03-10 15:57:59 +01:00
 								        # j and k have no parents.
 								        auth_chain_ids = self.get_success(self.store.get_auth_chain_ids(room_id, ["j"]))
-												Implement MSC3706: partial state in `/send_join` response (#11967)

* Make `get_auth_chain_ids` return a Set

It has a set internally, and a set is often useful where it gets used, so let's
avoid converting to an intermediate list.

* Minor refactors in `on_send_join_request`

A little bit of non-functional groundwork

* Implement MSC3706: partial state in /send_join response
											
										
										
											2022-02-12 11:44:16 +01:00
+								        self.assertEqual(auth_chain_ids, set())
-												Use the chain cover index in get_auth_chain_ids. (#9576)

This uses a simplified version of get_chain_cover_difference to calculate
auth chain of events.
											
										
										
											2021-03-10 15:57:59 +01:00
+								        auth_chain_ids = self.get_success(self.store.get_auth_chain_ids(room_id, ["k"]))
-												Implement MSC3706: partial state in `/send_join` response (#11967)

* Make `get_auth_chain_ids` return a Set

It has a set internally, and a set is often useful where it gets used, so let's
avoid converting to an intermediate list.

* Minor refactors in `on_send_join_request`

A little bit of non-functional groundwork

* Implement MSC3706: partial state in /send_join response
											
										
										
											2022-02-12 11:44:16 +01:00
+								        self.assertEqual(auth_chain_ids, set())
-												Use the chain cover index in get_auth_chain_ids. (#9576)

This uses a simplified version of get_chain_cover_difference to calculate
auth chain of events.
											
										
										
											2021-03-10 15:57:59 +01:00
 								        # More complex input sequences.
 								        auth_chain_ids = self.get_success(
 								            self.store.get_auth_chain_ids(room_id, ["b", "c", "d"])
 								        )
 								        self.assertCountEqual(auth_chain_ids, ["e", "f", "g", "h", "i", "j", "k"])
 								        auth_chain_ids = self.get_success(
 								            self.store.get_auth_chain_ids(room_id, ["h", "i"])
 								        )
 								        self.assertCountEqual(auth_chain_ids, ["k", "j"])
 								        # e gets returned even though include_given is false, but it is in the
 								        # auth chain of b.
 								        auth_chain_ids = self.get_success(
 								            self.store.get_auth_chain_ids(room_id, ["b", "e"])
 								        )
 								        self.assertCountEqual(auth_chain_ids, ["e", "f", "g", "h", "i", "j", "k"])
 								        # Test include_given.
 								        auth_chain_ids = self.get_success(
 								            self.store.get_auth_chain_ids(room_id, ["i"], include_given=True)
 								        )
 								        self.assertCountEqual(auth_chain_ids, ["i", "j"])
 								    @parameterized.expand([(True,), (False,)])
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								    def test_auth_difference(self, use_chain_cover_index: bool) -> None:
-												Use the chain cover index in get_auth_chain_ids. (#9576)

This uses a simplified version of get_chain_cover_difference to calculate
auth chain of events.
											
										
										
											2021-03-10 15:57:59 +01:00
+								        room_id = self._setup_auth_chain(use_chain_cover_index)
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								        # Now actually test that various combinations give the right result:
-												Speed up state res in rare case we don't have all events (#16116)

If we don't have all the auth events in a room then not all state events will have a chain cover index. Even so, we can still use the chain cover index on the events that do have it, rather than bailing and using the slower functions.

This situation should not arise for newly persisted rooms, as we check we have the full auth chain for each event, but can happen for existing rooms.

c.f. #15245
											
										
										
											2023-08-18 16:32:06 +02:00
+								        self.assert_auth_diff_is_expected(room_id)
 								    @parameterized.expand(
 								        [
 								            # One generated test case per subset yielded by the helper below.
 								            [graph_subset]
 								            for graph_subset in get_all_topologically_consistent_subsets(
 								                AUTH_GRAPH, AUTH_GRAPH
 								            )
 								        ]
 								    )
 								    def test_auth_difference_partial(self, graph_subset: Collection[str]) -> None:
 								        """Test that if we only have a chain cover index on a partial subset of
 								        the room we still get the correct auth chain difference.
 								        We do this by removing the chain cover index for every valid subset of the
 								        graph.

 								        Args:
 								            graph_subset: The event IDs whose `event_auth_chains` rows are
 								                deleted before the auth chain difference is checked.
 								        """
 								        # Set up the room with the chain cover index enabled.
 								        room_id = self._setup_auth_chain(True)
 								        for event_id in graph_subset:
 								            # Remove chain cover from that event.
 								            self.get_success(
 								                self.store.db_pool.simple_delete(
 								                    table="event_auth_chains",
 								                    keyvalues={"event_id": event_id},
 								                    desc="test_auth_difference_partial_remove",
 								                )
 								            )
 								            # Record the event in `event_auth_chain_to_calculate` instead.
 								            # NOTE(review): presumably this marks the event as still needing
 								            # its chain cover computed -- confirm against the schema.
 								            self.get_success(
 								                self.store.db_pool.simple_insert(
 								                    table="event_auth_chain_to_calculate",
 								                    values={
 								                        "event_id": event_id,
 								                        "room_id": room_id,
 								                        "type": "",
 								                        "state_key": "",
 								                    },
 								                    desc="test_auth_difference_partial_remove",
 								                )
 								            )
 								        # The expected differences must be unchanged by the missing index rows.
 								        self.assert_auth_diff_is_expected(room_id)
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
-												Speed up state res in rare case we don't have all events (#16116)

If we don't have all the auth events in a room then not all state events will have a chain cover index. Even so, we can still use the chain cover index on the events that do have it, rather than bailing and using the slower functions.

This situation should not arise for newly persisted rooms, as we check we have the full auth chain for each event, but can happen for existing rooms.

c.f. #15245
											
										
										
											2023-08-18 16:32:06 +02:00
+								    def assert_auth_diff_is_expected(self, room_id: str) -> None:
 								        """Assert the auth chain difference returns the correct answers."""
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								        difference = self.get_success(
 								            self.store.get_auth_chain_difference(room_id, [{"a"}, {"b"}])
 								        )
 								        self.assertSetEqual(difference, {"a", "b"})
 								        difference = self.get_success(
 								            self.store.get_auth_chain_difference(room_id, [{"a"}, {"b"}, {"c"}])
 								        )
 								        self.assertSetEqual(difference, {"a", "b", "c", "e", "f"})
 								        difference = self.get_success(
 								            self.store.get_auth_chain_difference(room_id, [{"a", "c"}, {"b"}])
 								        )
 								        self.assertSetEqual(difference, {"a", "b", "c"})
 								        difference = self.get_success(
 								            self.store.get_auth_chain_difference(room_id, [{"a", "c"}, {"b", "c"}])
 								        )
 								        self.assertSetEqual(difference, {"a", "b"})
 								        difference = self.get_success(
 								            self.store.get_auth_chain_difference(room_id, [{"a"}, {"b"}, {"d"}])
 								        )
 								        self.assertSetEqual(difference, {"a", "b", "d", "e"})
 								        difference = self.get_success(
 								            self.store.get_auth_chain_difference(room_id, [{"a"}, {"b"}, {"c"}, {"d"}])
 								        )
 								        self.assertSetEqual(difference, {"a", "b", "c", "d", "e", "f"})
 								        difference = self.get_success(
 								            self.store.get_auth_chain_difference(room_id, [{"a"}, {"b"}, {"e"}])
 								        )
 								        self.assertSetEqual(difference, {"a", "b"})
 								        difference = self.get_success(
 								            self.store.get_auth_chain_difference(room_id, [{"a"}])
 								        )
 								        self.assertSetEqual(difference, set())
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								    def test_auth_difference_partial_cover(self) -> None:
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								        """Test that we correctly handle rooms where not all events have a chain
 								        cover calculated. This can happen in some obscure edge cases, including
 								        during the background update that calculates the chain cover for old
 								        rooms.
 								        """
 								        room_id = "@ROOM:local"
 								        # The silly auth graph we use to test the auth difference algorithm,
 								        # where the top are the most recent events.
 								        #
 								        #   A   B
 								        #    \ /
 								        #  D  E
 								        #  \  |
 								        #   ` F   C
 								        #     |  /|
 								        #     G ´ |
 								        #     | \ |
 								        #     H   I
 								        #     |   |
 								        #     K   J
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								        auth_graph: Dict[str, List[str]] = {
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								            "a": ["e"],
 								            "b": ["e"],
 								            "c": ["g", "i"],
 								            "d": ["f"],
 								            "e": ["f"],
 								            "f": ["g"],
 								            "g": ["h", "i"],
 								            "h": ["k"],
 								            "i": ["j"],
 								            "k": [],
 								            "j": [],
 								        }
 								        depth_map = {
 								            "a": 7,
 								            "b": 7,
 								            "c": 4,
 								            "d": 6,
 								            "e": 6,
 								            "f": 5,
 								            "g": 3,
 								            "h": 2,
 								            "i": 2,
 								            "k": 1,
 								            "j": 1,
 								        }
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								        # We rudely fiddle with the appropriate tables directly, as that's much
 								        # easier than constructing events properly.
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								        def insert_event(txn: LoggingTransaction) -> None:
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								            # First insert the room and mark it as having a chain cover.
-												Rename database classes to make some sense (#8033)


											
										
										
											2020-08-05 22:38:57 +02:00
+								            self.store.db_pool.simple_insert_txn(
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								                txn,
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								                "rooms",
 								                {
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								                    "room_id": room_id,
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								                    "creator": "room_creator_user_id",
 								                    "is_public": True,
 								                    "room_version": "6",
 								                    "has_auth_chain_index": True,
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								                },
 								            )
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								            stream_ordering = 0
 								            for event_id in auth_graph:
 								                stream_ordering += 1
 								                depth = depth_map[event_id]
 								                self.store.db_pool.simple_insert_txn(
 								                    txn,
 								                    table="events",
 								                    values={
 								                        "event_id": event_id,
 								                        "room_id": room_id,
 								                        "depth": depth,
 								                        "topological_ordering": depth,
 								                        "type": "m.test",
 								                        "processed": True,
 								                        "outlier": False,
 								                        "stream_ordering": stream_ordering,
 								                    },
 								                )
 								            # Insert all events apart from 'B'
-												Add final type hint to tests.unittest. (#15072)

Adds a return type to HomeServerTestCase.make_homeserver and deal
with any variables which are no longer Any.
											
										
										
											2023-02-14 20:03:35 +01:00
+								            self.persist_events._persist_event_auth_chain_txn(
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								                txn,
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								                [
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								                    cast(EventBase, FakeEvent(event_id, room_id, auth_graph[event_id]))
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								                    for event_id in auth_graph
 								                    if event_id != "b"
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								                ],
 								            )
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								            # Now we insert the event 'B' without a chain cover, by temporarily
 								            # pretending the room doesn't have a chain cover.
 								            self.store.db_pool.simple_update_txn(
 								                txn,
 								                table="rooms",
 								                keyvalues={"room_id": room_id},
 								                updatevalues={"has_auth_chain_index": False},
 								            )
-												Add final type hint to tests.unittest. (#15072)

Adds a return type to HomeServerTestCase.make_homeserver and deal
with any variables which are no longer Any.
											
										
										
											2023-02-14 20:03:35 +01:00
+								            self.persist_events._persist_event_auth_chain_txn(
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								                txn,
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								                [cast(EventBase, FakeEvent("b", room_id, auth_graph["b"]))],
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								            )
 								            self.store.db_pool.simple_update_txn(
 								                txn,
 								                table="rooms",
 								                keyvalues={"room_id": room_id},
 								                updatevalues={"has_auth_chain_index": True},
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								            )
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								        self.get_success(
 								            self.store.db_pool.runInteraction(
 								                "insert",
 								                insert_event,
 								            )
-												Update black, and run auto formatting over the codebase (#9381)

 - Update black version to the latest
 - Run black auto formatting over the codebase
    - Run autoformatting according to [`docs/code_style.md`](https://github.com/matrix-org/synapse/blob/80d6dc9783aa80886a133756028984dbf8920168/docs/code_style.md)
 - Update `code_style.md` docs around installing black to use the correct version
											
										
										
											2021-02-16 23:32:34 +01:00
+								        )
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								        # Now actually test that various combinations give the right result:
 								        difference = self.get_success(
-												Pass room_id to get_auth_chain_difference (#8879)

This is so that we can choose which algorithm to use based on the room ID.


											
										
										
											2020-12-04 16:52:49 +01:00
+								            self.store.get_auth_chain_difference(room_id, [{"a"}, {"b"}])
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								        )
 								        self.assertSetEqual(difference, {"a", "b"})
 								        difference = self.get_success(
-												Pass room_id to get_auth_chain_difference (#8879)

This is so that we can choose which algorithm to use based on the room ID.


											
										
										
											2020-12-04 16:52:49 +01:00
+								            self.store.get_auth_chain_difference(room_id, [{"a"}, {"b"}, {"c"}])
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								        )
 								        self.assertSetEqual(difference, {"a", "b", "c", "e", "f"})
 								        difference = self.get_success(
-												Pass room_id to get_auth_chain_difference (#8879)

This is so that we can choose which algorithm to use based on the room ID.


											
										
										
											2020-12-04 16:52:49 +01:00
+								            self.store.get_auth_chain_difference(room_id, [{"a", "c"}, {"b"}])
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								        )
 								        self.assertSetEqual(difference, {"a", "b", "c"})
-												Correctly handle unpersisted events when calculating auth chain difference. (#8827)

We do state res with unpersisted events when calculating the new current state of the room, so that should be the only thing impacted. I don't think this is tooooo big of a deal as:

1. the next time a state event happens in the room the current state should correct itself;
2. in the common case all the unpersisted events' auth events will be pulled in by other state, so will still return the correct result (or one which is sufficiently close to not affect the result); and
3. we mostly use the state at an event to do important operations, which isn't affected by this.
											
										
										
											2020-12-02 16:22:37 +01:00
+								        difference = self.get_success(
-												Pass room_id to get_auth_chain_difference (#8879)

This is so that we can choose which algorithm to use based on the room ID.


											
										
										
											2020-12-04 16:52:49 +01:00
+								            self.store.get_auth_chain_difference(room_id, [{"a", "c"}, {"b", "c"}])
-												Correctly handle unpersisted events when calculating auth chain difference. (#8827)

We do state res with unpersisted events when calculating the new current state of the room, so that should be the only thing impacted. I don't think this is tooooo big of a deal as:

1. the next time a state event happens in the room the current state should correct itself;
2. in the common case all the unpersisted events' auth events will be pulled in by other state, so will still return the correct result (or one which is sufficiently close to not affect the result); and
3. we mostly use the state at an event to do important operations, which isn't affected by this.
											
										
										
											2020-12-02 16:22:37 +01:00
+								        )
 								        self.assertSetEqual(difference, {"a", "b"})
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								        difference = self.get_success(
-												Pass room_id to get_auth_chain_difference (#8879)

This is so that we can choose which algorithm to use based on the room ID.


											
										
										
											2020-12-04 16:52:49 +01:00
+								            self.store.get_auth_chain_difference(room_id, [{"a"}, {"b"}, {"d"}])
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								        )
 								        self.assertSetEqual(difference, {"a", "b", "d", "e"})
 								        difference = self.get_success(
-												Pass room_id to get_auth_chain_difference (#8879)

This is so that we can choose which algorithm to use based on the room ID.


											
										
										
											2020-12-04 16:52:49 +01:00
+								            self.store.get_auth_chain_difference(room_id, [{"a"}, {"b"}, {"c"}, {"d"}])
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								        )
 								        self.assertSetEqual(difference, {"a", "b", "c", "d", "e", "f"})
 								        difference = self.get_success(
-												Pass room_id to get_auth_chain_difference (#8879)

This is so that we can choose which algorithm to use based on the room ID.


											
										
										
											2020-12-04 16:52:49 +01:00
+								            self.store.get_auth_chain_difference(room_id, [{"a"}, {"b"}, {"e"}])
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								        )
 								        self.assertSetEqual(difference, {"a", "b"})
-												Pass room_id to get_auth_chain_difference (#8879)

This is so that we can choose which algorithm to use based on the room ID.


											
										
										
											2020-12-04 16:52:49 +01:00
+								        difference = self.get_success(
 								            self.store.get_auth_chain_difference(room_id, [{"a"}])
 								        )
-												Improve get auth chain difference algorithm. (#7095)

It was originally implemented by pulling the full auth chain of all
state sets out of the database and doing set comparison. However, that
can take a lot of work if the state and auth chains are large.

Instead, let's try and fetch the auth chains at the same time and
calculate the difference on the fly, allowing us to bail early if all
the auth chains converge. Assuming that the auth chains do converge more
often than not, this should improve performance. Hopefully.

											
										
										
											2020-03-18 17:46:41 +01:00
+								        self.assertSetEqual(difference, set())
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
-												Fix logic for dropping old events in fed queue (#11806)

Co-authored-by: Brendan Abolivier <babolivier@matrix.org>
Co-authored-by: Richard van der Hoff <richard@matrix.org>
											
										
										
											2022-01-24 13:20:01 +01:00
+								    @parameterized.expand(
 								        [(room_version,) for room_version in KNOWN_ROOM_VERSIONS.values()]
 								    )
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								    def test_prune_inbound_federation_queue(self, room_version: RoomVersion) -> None:
-												Fix logic for dropping old events in fed queue (#11806)

Co-authored-by: Brendan Abolivier <babolivier@matrix.org>
Co-authored-by: Richard van der Hoff <richard@matrix.org>
											
										
										
											2022-01-24 13:20:01 +01:00
+								        """Test that pruning of inbound federation queues works"""
-												Prune inbound federation queues if they get too long (#10390)


											
										
										
											2021-08-02 15:37:25 +02:00
 								        room_id = "some_room_id"
-												Fix logic for dropping old events in fed queue (#11806)

Co-authored-by: Brendan Abolivier <babolivier@matrix.org>
Co-authored-by: Richard van der Hoff <richard@matrix.org>
											
										
										
											2022-01-24 13:20:01 +01:00
+								        def prev_event_format(prev_event_id: str) -> Union[Tuple[str, dict], str]:
 								            """Account for differences in prev_events format across room versions"""
-												Rename the `EventFormatVersions` enum values so that they line up with room version numbers. (#13706)


											
										
										
											2022-09-07 12:08:20 +02:00
+								            if room_version.event_format == EventFormatVersions.ROOM_V1_V2:
-												Fix logic for dropping old events in fed queue (#11806)

Co-authored-by: Brendan Abolivier <babolivier@matrix.org>
Co-authored-by: Richard van der Hoff <richard@matrix.org>
											
										
										
											2022-01-24 13:20:01 +01:00
+								                return prev_event_id, {}
 								            return prev_event_id
-												Prune inbound federation queues if they get too long (#10390)


											
										
										
											2021-08-02 15:37:25 +02:00
+								        # Insert a bunch of events that all reference the previous one.
 								        self.get_success(
 								            self.store.db_pool.simple_insert_many(
 								                table="federation_inbound_events_staging",
-												Replace uses of simple_insert_many with simple_insert_many_values. (#11742)

This should be (slightly) more efficient and it is simpler
to have a single method for inserting multiple values.
											
										
										
											2022-01-14 01:44:18 +01:00
+								                keys=(
 								                    "origin",
 								                    "room_id",
 								                    "received_ts",
 								                    "event_id",
 								                    "event_json",
 								                    "internal_metadata",
 								                ),
-												Prune inbound federation queues if they get too long (#10390)


											
										
										
											2021-08-02 15:37:25 +02:00
+								                values=[
-												Replace uses of simple_insert_many with simple_insert_many_values. (#11742)

This should be (slightly) more efficient and it is simpler
to have a single method for inserting multiple values.
											
										
										
											2022-01-14 01:44:18 +01:00
+								                    (
 								                        "some_origin",
 								                        room_id,
 ,
 								                        f"$fake_event_id_{i + 1}",
-												Fix logic for dropping old events in fed queue (#11806)

Co-authored-by: Brendan Abolivier <babolivier@matrix.org>
Co-authored-by: Richard van der Hoff <richard@matrix.org>
											
										
										
											2022-01-24 13:20:01 +01:00
+								                        json_encoder.encode(
 								                            {"prev_events": [prev_event_format(f"$fake_event_id_{i}")]}
 								                        ),
-												Replace uses of simple_insert_many with simple_insert_many_values. (#11742)

This should be (slightly) more efficient and it is simpler
to have a single method for inserting multiple values.
											
										
										
											2022-01-14 01:44:18 +01:00
+								                        "{}",
 								                    )
-												Prune inbound federation queues if they get too long (#10390)


											
										
										
											2021-08-02 15:37:25 +02:00
+								                    for i in range(500)
 								                ],
 								                desc="test_prune_inbound_federation_queue",
 								            )
 								        )
 								        # Calling prune once should return True, i.e. a prune happened. The second
 								        # time it shouldn't.
 								        pruned = self.get_success(
-												Fix logic for dropping old events in fed queue (#11806)

Co-authored-by: Brendan Abolivier <babolivier@matrix.org>
Co-authored-by: Richard van der Hoff <richard@matrix.org>
											
										
										
											2022-01-24 13:20:01 +01:00
+								            self.store.prune_staged_events_in_room(room_id, room_version)
-												Prune inbound federation queues if they get too long (#10390)


											
										
										
											2021-08-02 15:37:25 +02:00
+								        )
 								        self.assertTrue(pruned)
 								        pruned = self.get_success(
-												Fix logic for dropping old events in fed queue (#11806)

Co-authored-by: Brendan Abolivier <babolivier@matrix.org>
Co-authored-by: Richard van der Hoff <richard@matrix.org>
											
										
										
											2022-01-24 13:20:01 +01:00
+								            self.store.prune_staged_events_in_room(room_id, room_version)
-												Prune inbound federation queues if they get too long (#10390)


											
										
										
											2021-08-02 15:37:25 +02:00
+								        )
 								        self.assertFalse(pruned)
 								        # Assert that we only have a single event left in the queue, and that it
 								        # is the last one.
 								        count = self.get_success(
 								            self.store.db_pool.simple_select_one_onecol(
 								                table="federation_inbound_events_staging",
 								                keyvalues={"room_id": room_id},
-												Remove redundant `COALESCE()`s around `COUNT()`s in database queries (#11570)

`COUNT()` never returns `NULL`. A `COUNT(*)` over 0 rows is 0 and a
`COUNT(NULL)` is also 0.

											
										
										
											2021-12-14 13:34:30 +01:00
+								                retcol="COUNT(*)",
-												Prune inbound federation queues if they get too long (#10390)


											
										
										
											2021-08-02 15:37:25 +02:00
+								                desc="test_prune_inbound_federation_queue",
 								            )
 								        )
 								        self.assertEqual(count, 1)
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								        next_staged_event_info = self.get_success(
-												Prune inbound federation queues if they get too long (#10390)


											
										
										
											2021-08-02 15:37:25 +02:00
+								            self.store.get_next_staged_event_id_for_room(room_id)
 								        )
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								        assert next_staged_event_info
 								        _, event_id = next_staged_event_info
-												Prune inbound federation queues if they get too long (#10390)


											
										
										
											2021-08-02 15:37:25 +02:00
+								        self.assertEqual(event_id, "$fake_event_id_500")
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								    def _setup_room_for_backfill_tests(self) -> _BackfillSetupInfo:
 								        """
 								        Sets up a room with various events and backward extremities to test
 								        backfill functions against.
 								        Returns:
 								            _BackfillSetupInfo including the `room_id` to test against and
 								            `depth_map` of events in the room
 								        """
 								        room_id = "!backfill-room-test:some-host"
 								        # The silly graph we use to test grabbing backward extremities,
 								        # where the top is the oldest events.
 								        #    1 (oldest)
 								        #    |
 								        #    2 ⹁
 								        #    |  \
 								        #    |   [b1, b2, b3]
 								        #    |   |
 								        #    |   A
 								        #    |  /
 								        #    3 {
 								        #    |  \
 								        #    |   [b4, b5, b6]
 								        #    |   |
 								        #    |   B
 								        #    |  /
 								        #    4 ´
 								        #    |
 								        #    5 (newest)
 								        event_graph: Dict[str, List[str]] = {
 								            "1": [],
 								            "2": ["1"],
 								            "3": ["2", "A"],
 								            "4": ["3", "B"],
 								            "5": ["4"],
 								            "A": ["b1", "b2", "b3"],
 								            "b1": ["2"],
 								            "b2": ["2"],
 								            "b3": ["2"],
 								            "B": ["b4", "b5", "b6"],
 								            "b4": ["3"],
 								            "b5": ["3"],
 								            "b6": ["3"],
 								        }
 								        depth_map: Dict[str, int] = {
 								            "1": 1,
 								            "2": 2,
 								            "b1": 3,
 								            "b2": 3,
 								            "b3": 3,
 								            "A": 4,
 								            "3": 5,
 								            "b4": 6,
 								            "b5": 6,
 								            "b6": 6,
 								            "B": 7,
 								            "4": 8,
 								            "5": 9,
 								        }
 								        # The events we have persisted on our server.
 								        # The rest are events in the room but not backfilled yet.
 								        our_server_events = {"5", "4", "B", "3", "A"}
 								        complete_event_dict_map: Dict[str, JsonDict] = {}
 								        stream_ordering = 0
 								        for event_id, prev_event_ids in event_graph.items():
 								            depth = depth_map[event_id]
 								            complete_event_dict_map[event_id] = {
 								                "event_id": event_id,
 								                "type": "test_regular_type",
 								                "room_id": room_id,
 								                "sender": "@sender",
 								                "prev_event_ids": prev_event_ids,
 								                "auth_event_ids": [],
 								                "origin_server_ts": stream_ordering,
 								                "depth": depth,
 								                "stream_ordering": stream_ordering,
 								                "content": {"body": "event" + event_id},
 								            }
 								            stream_ordering += 1
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								        def populate_db(txn: LoggingTransaction) -> None:
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								            # Insert the room to satisfy the foreign key constraint of
 								            # `event_failed_pull_attempts`
 								            self.store.db_pool.simple_insert_txn(
 								                txn,
 								                "rooms",
 								                {
 								                    "room_id": room_id,
 								                    "creator": "room_creator_user_id",
 								                    "is_public": True,
 								                    "room_version": "6",
 								                },
 								            )
 								            # Insert our server events
 								            for event_id in our_server_events:
 								                event_dict = complete_event_dict_map[event_id]
 								                self.store.db_pool.simple_insert_txn(
 								                    txn,
 								                    table="events",
 								                    values={
 								                        "event_id": event_dict.get("event_id"),
 								                        "type": event_dict.get("type"),
 								                        "room_id": event_dict.get("room_id"),
 								                        "depth": event_dict.get("depth"),
 								                        "topological_ordering": event_dict.get("depth"),
 								                        "stream_ordering": event_dict.get("stream_ordering"),
 								                        "processed": True,
 								                        "outlier": False,
 								                    },
 								                )
 								            # Insert the event edges
 								            for event_id in our_server_events:
 								                for prev_event_id in event_graph[event_id]:
 								                    self.store.db_pool.simple_insert_txn(
 								                        txn,
 								                        table="event_edges",
 								                        values={
 								                            "event_id": event_id,
 								                            "prev_event_id": prev_event_id,
 								                            "room_id": room_id,
 								                        },
 								                    )
 								            # Insert the backward extremities
 								            prev_events_of_our_events = {
 								                prev_event_id
 								                for our_server_event in our_server_events
 								                for prev_event_id in complete_event_dict_map[our_server_event][
 								                    "prev_event_ids"
 								                ]
 								            }
 								            backward_extremities = prev_events_of_our_events - our_server_events
 								            for backward_extremity in backward_extremities:
 								                self.store.db_pool.simple_insert_txn(
 								                    txn,
 								                    table="event_backward_extremities",
 								                    values={
 								                        "event_id": backward_extremity,
 								                        "room_id": room_id,
 								                    },
 								                )
 								        self.get_success(
 								            self.store.db_pool.runInteraction(
 								                "_setup_room_for_backfill_tests_populate_db",
 								                populate_db,
 								            )
 								        )
 								        return _BackfillSetupInfo(room_id=room_id, depth_map=depth_map)
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								    def test_get_backfill_points_in_room(self) -> None:
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								        """
-												Limit and filter the number of backfill points to get from the database (#13879)

There is no need to grab thousands of backfill points when we only need 5 to make the `/backfill` request with. We need to grab a few extra in case the first few aren't visible in the history.

Previously, we grabbed thousands of backfill points from the database, then sorted and filtered them in the app. Fetching the 4.6k backfill points for `#matrix:matrix.org` from the database takes ~50ms - ~570ms so it's not like this saves a lot of time 🤷. But it might save us more time now that `get_backfill_points_in_room`/`get_insertion_event_backward_extremities_in_room` are more complicated after https://github.com/matrix-org/synapse/pull/13635 

This PR moves the filtering and limiting to the SQL query so we just have less data to work with in the first place.

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-28 22:26:16 +02:00
+								        Test to make sure only backfill points that are older and come before
 								        the `current_depth` are returned.
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								        """
 								        setup_info = self._setup_room_for_backfill_tests()
 								        room_id = setup_info.room_id
-												Limit and filter the number of backfill points to get from the database (#13879)

There is no need to grab thousands of backfill points when we only need 5 to make the `/backfill` request with. We need to grab a few extra in case the first few aren't visible in the history.

Previously, we grabbed thousands of backfill points from the database, then sorted and filtered them in the app. Fetching the 4.6k backfill points for `#matrix:matrix.org` from the database takes ~50ms - ~570ms so it's not like this saves a lot of time 🤷. But it might save us more time now that `get_backfill_points_in_room`/`get_insertion_event_backward_extremities_in_room` are more complicated after https://github.com/matrix-org/synapse/pull/13635 

This PR moves the filtering and limiting to the SQL query so we just have less data to work with in the first place.

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-28 22:26:16 +02:00
+								        depth_map = setup_info.depth_map
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
-												Limit and filter the number of backfill points to get from the database (#13879)

There is no need to grab thousands of backfill points when we only need 5 to make the `/backfill` request with. We need to grab a few extra in case the first few aren't visible in the history.

Previously, we grabbed thousands of backfill points from the database, then sorted and filtered them in the app. Fetching the 4.6k backfill points for `#matrix:matrix.org` from the database takes ~50ms - ~570ms so it's not like this saves a lot of time 🤷. But it might save us more time now that `get_backfill_points_in_room`/`get_insertion_event_backward_extremities_in_room` are more complicated after https://github.com/matrix-org/synapse/pull/13635 

This PR moves the filtering and limiting to the SQL query so we just have less data to work with in the first place.

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-28 22:26:16 +02:00
+								        # Try at "B"
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								        backfill_points = self.get_success(
-												Limit and filter the number of backfill points to get from the database (#13879)

There is no need to grab thousands of backfill points when we only need 5 to make the `/backfill` request with. We need to grab a few extra in case the first few aren't visible in the history.

Previously, we grabbed thousands of backfill points from the database, then sorted and filtered them in the app. Fetching the 4.6k backfill points for `#matrix:matrix.org` from the database takes ~50ms - ~570ms so it's not like this saves a lot of time 🤷. But it might save us more time now that `get_backfill_points_in_room`/`get_insertion_event_backward_extremities_in_room` are more complicated after https://github.com/matrix-org/synapse/pull/13635 

This PR moves the filtering and limiting to the SQL query so we just have less data to work with in the first place.

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-28 22:26:16 +02:00
+								            self.store.get_backfill_points_in_room(room_id, depth_map["B"], limit=100)
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								        )
 								        backfill_event_ids = [backfill_point[0] for backfill_point in backfill_points]
-												Fix overflows in /messages backfill calculation (#13936)

* Reproduce bug
* Compute `least_function` first
* Substitute `least_function` with an f-string
* Bugfix: avoid overflow

Co-authored-by: Eric Eastwood <erice@element.io>
											
										
										
											2022-09-30 12:54:53 +02:00
+								        self.assertEqual(backfill_event_ids, ["b6", "b5", "b4", "2", "b3", "b2", "b1"])
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
-												Limit and filter the number of backfill points to get from the database (#13879)

There is no need to grab thousands of backfill points when we only need 5 to make the `/backfill` request with. We need to grab a few extra in case the first few aren't visible in the history.

Previously, we grabbed thousands of backfill points from the database, then sorted and filtered them in the app. Fetching the 4.6k backfill points for `#matrix:matrix.org` from the database takes ~50ms - ~570ms so it's not like this saves a lot of time 🤷. But it might save us more time now that `get_backfill_points_in_room`/`get_insertion_event_backward_extremities_in_room` are more complicated after https://github.com/matrix-org/synapse/pull/13635 

This PR moves the filtering and limiting to the SQL query so we just have less data to work with in the first place.

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-28 22:26:16 +02:00
+								        # Try at "A"
 								        backfill_points = self.get_success(
 								            self.store.get_backfill_points_in_room(room_id, depth_map["A"], limit=100)
 								        )
 								        backfill_event_ids = [backfill_point[0] for backfill_point in backfill_points]
 								        # Event "2" has a depth of 2 but is not included here because we only
 								        # know the approximate depth of 5 from our event "3".
 								        self.assertListEqual(backfill_event_ids, ["b3", "b2", "b1"])
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								    def test_get_backfill_points_in_room_excludes_events_we_have_attempted(
 								        self,
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								    ) -> None:
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								        """
 								        Test to make sure that events we have attempted to backfill (and within
 								        backoff timeout duration) do not show up as an event to backfill again.
 								        """
 								        setup_info = self._setup_room_for_backfill_tests()
 								        room_id = setup_info.room_id
-												Limit and filter the number of backfill points to get from the database (#13879)

There is no need to grab thousands of backfill points when we only need 5 to make the `/backfill` request with. We need to grab a few extra in case the first few aren't visible in the history.

Previously, we grabbed thousands of backfill points from the database, then sorted and filtered them in the app. Fetching the 4.6k backfill points for `#matrix:matrix.org` from the database takes ~50ms - ~570ms so it's not like this saves a lot of time 🤷. But it might save us more time now that `get_backfill_points_in_room`/`get_insertion_event_backward_extremities_in_room` are more complicated after https://github.com/matrix-org/synapse/pull/13635 

This PR moves the filtering and limiting to the SQL query so we just have less data to work with in the first place.

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-28 22:26:16 +02:00
+								        depth_map = setup_info.depth_map
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
 								        # Record some attempts to backfill these events which will make
 								        # `get_backfill_points_in_room` exclude them because we
 								        # haven't passed the backoff interval.
 								        self.get_success(
 								            self.store.record_event_failed_pull_attempt(room_id, "b5", "fake cause")
 								        )
 								        self.get_success(
 								            self.store.record_event_failed_pull_attempt(room_id, "b4", "fake cause")
 								        )
 								        self.get_success(
 								            self.store.record_event_failed_pull_attempt(room_id, "b3", "fake cause")
 								        )
 								        self.get_success(
 								            self.store.record_event_failed_pull_attempt(room_id, "b2", "fake cause")
 								        )
 								        # No time has passed since we attempted to backfill ^
-												Limit and filter the number of backfill points to get from the database (#13879)

There is no need to grab thousands of backfill points when we only need 5 to make the `/backfill` request with. We need to grab a few extra in case the first few aren't visible in the history.

Previously, we grabbed thousands of backfill points from the database, then sorted and filtered them in the app. Fetching the 4.6k backfill points for `#matrix:matrix.org` from the database takes ~50ms - ~570ms so it's not like this saves a lot of time 🤷. But it might save us more time now that `get_backfill_points_in_room`/`get_insertion_event_backward_extremities_in_room` are more complicated after https://github.com/matrix-org/synapse/pull/13635 

This PR moves the filtering and limiting to the SQL query so we just have less data to work with in the first place.

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-28 22:26:16 +02:00
+								        # Try at "B"
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								        backfill_points = self.get_success(
-												Limit and filter the number of backfill points to get from the database (#13879)

There is no need to grab thousands of backfill points when we only need 5 to make the `/backfill` request with. We need to grab a few extra in case the first few aren't visible in the history.

Previously, we grabbed thousands of backfill points from the database, then sorted and filtered them in the app. Fetching the 4.6k backfill points for `#matrix:matrix.org` from the database takes ~50ms - ~570ms so it's not like this saves a lot of time 🤷. But it might save us more time now that `get_backfill_points_in_room`/`get_insertion_event_backward_extremities_in_room` are more complicated after https://github.com/matrix-org/synapse/pull/13635 

This PR moves the filtering and limiting to the SQL query so we just have less data to work with in the first place.

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-28 22:26:16 +02:00
+								            self.store.get_backfill_points_in_room(room_id, depth_map["B"], limit=100)
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								        )
 								        backfill_event_ids = [backfill_point[0] for backfill_point in backfill_points]
 								        # Only the backfill points that we didn't record earlier exist here.
-												Fix overflows in /messages backfill calculation (#13936)

* Reproduce bug
* Compute `least_function` first
* Substitute `least_function` with an f-string
* Bugfix: avoid overflow

Co-authored-by: Eric Eastwood <erice@element.io>
											
										
										
											2022-09-30 12:54:53 +02:00
+								        self.assertEqual(backfill_event_ids, ["b6", "2", "b1"])
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
 								    def test_get_backfill_points_in_room_attempted_event_retry_after_backoff_duration(
 								        self,
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								    ) -> None:
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								        """
 								        Test to make sure that after we fake a single failed attempt to backfill
 								        event "b3" and several failed attempts to backfill event "b1", each event
 								        shows up as a backfill point again once its own backoff duration has passed.
 								        """
 								        setup_info = self._setup_room_for_backfill_tests()
 								        room_id = setup_info.room_id
-												Limit and filter the number of backfill points to get from the database (#13879)

There is no need to grab thousands of backfill points when we only need 5 to make the `/backfill` request with. We need to grab a few extra in case the first few aren't visible in the history.

Previously, we grabbed thousands of backfill points from the database, then sorted and filtered them in the app. Fetching the 4.6k backfill points for `#matrix:matrix.org` from the database takes ~50ms - ~570ms so it's not like this saves a lot of time 🤷. But it might save us more time now that `get_backfill_points_in_room`/`get_insertion_event_backward_extremities_in_room` are more complicated after https://github.com/matrix-org/synapse/pull/13635 

This PR moves the filtering and limiting to the SQL query so we just have less data to work with in the first place.

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-28 22:26:16 +02:00
+								        depth_map = setup_info.depth_map
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
 								        # Record some attempts to backfill these events which will make
 								        # `get_backfill_points_in_room` exclude them because we
 								        # haven't passed the backoff interval.
 								        self.get_success(
 								            self.store.record_event_failed_pull_attempt(room_id, "b3", "fake cause")
 								        )
 								        self.get_success(
 								            self.store.record_event_failed_pull_attempt(room_id, "b1", "fake cause")
 								        )
 								        self.get_success(
 								            self.store.record_event_failed_pull_attempt(room_id, "b1", "fake cause")
 								        )
 								        self.get_success(
 								            self.store.record_event_failed_pull_attempt(room_id, "b1", "fake cause")
 								        )
 								        self.get_success(
 								            self.store.record_event_failed_pull_attempt(room_id, "b1", "fake cause")
 								        )
 								        # Now advance time by 2 hours and we should only be able to see "b3"
 								        # because we have waited long enough for the single attempt (2^1 hours)
 								        # but we still shouldn't see "b1" because we haven't waited long enough
 								        # for this many attempts. We didn't do anything to "b2" so it should be
 								        # visible regardless.
 								        self.reactor.advance(datetime.timedelta(hours=2).total_seconds())
-												Limit and filter the number of backfill points to get from the database (#13879)

There is no need to grab thousands of backfill points when we only need 5 to make the `/backfill` request with. We need to grab a few extra in case the first few aren't visible in the history.

Previously, we grabbed thousands of backfill points from the database, then sorted and filtered them in the app. Fetching the 4.6k backfill points for `#matrix:matrix.org` from the database takes ~50ms - ~570ms so it's not like this saves a lot of time 🤷. But it might save us more time now that `get_backfill_points_in_room`/`get_insertion_event_backward_extremities_in_room` are more complicated after https://github.com/matrix-org/synapse/pull/13635 

This PR moves the filtering and limiting to the SQL query so we just have less data to work with in the first place.

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-28 22:26:16 +02:00
+								        # Try at "A" and make sure that "b1" is not in the list because we've
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								        # already attempted many times
 								        backfill_points = self.get_success(
-												Limit and filter the number of backfill points to get from the database (#13879)

There is no need to grab thousands of backfill points when we only need 5 to make the `/backfill` request with. We need to grab a few extra in case the first few aren't visible in the history.

Previously, we grabbed thousands of backfill points from the database, then sorted and filtered them in the app. Fetching the 4.6k backfill points for `#matrix:matrix.org` from the database takes ~50ms - ~570ms so it's not like this saves a lot of time 🤷. But it might save us more time now that `get_backfill_points_in_room`/`get_insertion_event_backward_extremities_in_room` are more complicated after https://github.com/matrix-org/synapse/pull/13635 

This PR moves the filtering and limiting to the SQL query so we just have less data to work with in the first place.

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-28 22:26:16 +02:00
+								            self.store.get_backfill_points_in_room(room_id, depth_map["A"], limit=100)
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								        )
 								        backfill_event_ids = [backfill_point[0] for backfill_point in backfill_points]
-												Fix overflows in /messages backfill calculation (#13936)

* Reproduce bug
* Compute `least_function` first
* Substitute `least_function` with an f-string
* Bugfix: avoid overflow

Co-authored-by: Eric Eastwood <erice@element.io>
											
										
										
											2022-09-30 12:54:53 +02:00
+								        self.assertEqual(backfill_event_ids, ["b3", "b2"])
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
 								        # Now advance time by 20 hours (above 2^4 because we made 4 attempts) and
 								        # see if we can now backfill it
 								        self.reactor.advance(datetime.timedelta(hours=20).total_seconds())
-												Limit and filter the number of backfill points to get from the database (#13879)

There is no need to grab thousands of backfill points when we only need 5 to make the `/backfill` request with. We need to grab a few extra in case the first few aren't visible in the history.

Previously, we grabbed thousands of backfill points from the database, then sorted and filtered them in the app. Fetching the 4.6k backfill points for `#matrix:matrix.org` from the database takes ~50ms - ~570ms so it's not like this saves a lot of time 🤷. But it might save us more time now that `get_backfill_points_in_room`/`get_insertion_event_backward_extremities_in_room` are more complicated after https://github.com/matrix-org/synapse/pull/13635 

This PR moves the filtering and limiting to the SQL query so we just have less data to work with in the first place.

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-28 22:26:16 +02:00
+								        # Try at "A" again after we advanced enough time and we should see "b1" again
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								        backfill_points = self.get_success(
-												Limit and filter the number of backfill points to get from the database (#13879)

There is no need to grab thousands of backfill points when we only need 5 to make the `/backfill` request with. We need to grab a few extra in case the first few aren't visible in the history.

Previously, we grabbed thousands of backfill points from the database, then sorted and filtered them in the app. Fetching the 4.6k backfill points for `#matrix:matrix.org` from the database takes ~50ms - ~570ms so it's not like this saves a lot of time 🤷. But it might save us more time now that `get_backfill_points_in_room`/`get_insertion_event_backward_extremities_in_room` are more complicated after https://github.com/matrix-org/synapse/pull/13635 

This PR moves the filtering and limiting to the SQL query so we just have less data to work with in the first place.

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-28 22:26:16 +02:00
+								            self.store.get_backfill_points_in_room(room_id, depth_map["A"], limit=100)
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
+								        )
 								        backfill_event_ids = [backfill_point[0] for backfill_point in backfill_points]
-												Fix overflows in /messages backfill calculation (#13936)

* Reproduce bug
* Compute `least_function` first
* Substitute `least_function` with an f-string
* Bugfix: avoid overflow

Co-authored-by: Eric Eastwood <erice@element.io>
											
										
										
											2022-09-30 12:54:53 +02:00
+								        self.assertEqual(backfill_event_ids, ["b3", "b2", "b1"])
 								    def test_get_backfill_points_in_room_works_after_many_failed_pull_attempts_that_could_naively_overflow(
 								        self,
 								    ) -> None:
 								        """
-												Use full GitHub links instead of bare issue numbers. (#16637)


											
										
										
											2023-11-15 14:02:11 +01:00
+								        A test that reproduces https://github.com/matrix-org/synapse/issues/13929 (Postgres only).
-												Fix overflows in /messages backfill calculation (#13936)

* Reproduce bug
* Compute `least_function` first
* Substitute `least_function` with an f-string
* Bugfix: avoid overflow

Co-authored-by: Eric Eastwood <erice@element.io>
											
										
										
											2022-09-30 12:54:53 +02:00
 								        Test to make sure we can still get backfill points after many failed pull
 								        attempts that cause us to backoff to the limit. Even if the backoff formula
 								        would tell us to wait for more seconds than can be expressed in a 32 bit
 								        signed int.
 								        """
 								        setup_info = self._setup_room_for_backfill_tests()
 								        room_id = setup_info.room_id
 								        depth_map = setup_info.depth_map
 								        # Pretend that we have tried and failed 10 times to backfill event b1.
 								        for _ in range(10):
 								            self.get_success(
 								                self.store.record_event_failed_pull_attempt(room_id, "b1", "fake cause")
 								            )
 								        # If the backoff periods grow without limit:
 								        # After the first failed attempt, we would have backed off for 1 << 1 = 2 hours.
 								        # After the second failed attempt we would have backed off for 1 << 2 = 4 hours,
 								        # so after the 10th failed attempt we should backoff for 1 << 10 == 1024 hours.
 								        # Wait 1100 hours just so we have a nice round number.
 								        self.reactor.advance(datetime.timedelta(hours=1100).total_seconds())
 								        # 1024 hours in milliseconds is 1024 * 3600000, which exceeds the largest 32 bit
 								        # signed integer. The bug we're reproducing is that this overflow causes an
 								        # error in postgres preventing us from fetching a set of backwards extremities
 								        # to retry fetching.
 								        backfill_points = self.get_success(
 								            self.store.get_backfill_points_in_room(room_id, depth_map["A"], limit=100)
 								        )
 								        # We should aim to fetch all backfill points: b1's latest backoff period has
 								        # expired, and we haven't tried the rest.
 								        backfill_event_ids = [backfill_point[0] for backfill_point in backfill_points]
 								        self.assertEqual(backfill_event_ids, ["b3", "b2", "b1"])
-												Only try to backfill event if we haven't tried before recently (#13635)

Only try to backfill event if we haven't tried before recently (exponential backoff). No need to keep trying the same backfill point that fails over and over.

Fix https://github.com/matrix-org/synapse/issues/13622
Fix https://github.com/matrix-org/synapse/issues/8451

Follow-up to https://github.com/matrix-org/synapse/pull/13589

Part of https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2022-09-23 21:01:29 +02:00
-												Process previously failed backfill events in the background (#15585)

Process previously failed backfill events in the background because they are bound to fail again and we don't need to waste time holding up the request for something that is bound to fail again.

Fix https://github.com/matrix-org/synapse/issues/13623

Follow-up to https://github.com/matrix-org/synapse/issues/13621 and https://github.com/matrix-org/synapse/issues/13622

Part of making `/messages` faster: https://github.com/matrix-org/synapse/issues/13356
											
										
										
											2023-05-25 06:22:24 +02:00
+								    def test_get_event_ids_with_failed_pull_attempts(self) -> None:
 								        """
 								        Test to make sure we properly get event_ids based on whether they have any
 								        failed pull attempts.
 								        """
 								        # Create the room
 								        user_id = self.register_user("alice", "test")
 								        tok = self.login("alice", "test")
 								        room_id = self.helper.create_room_as(room_creator=user_id, tok=tok)
 								        self.get_success(
 								            self.store.record_event_failed_pull_attempt(
 								                room_id, "$failed_event_id1", "fake cause"
 								            )
 								        )
 								        self.get_success(
 								            self.store.record_event_failed_pull_attempt(
 								                room_id, "$failed_event_id2", "fake cause"
 								            )
 								        )
 								        event_ids_with_failed_pull_attempts = self.get_success(
 								            self.store.get_event_ids_with_failed_pull_attempts(
 								                event_ids=[
 								                    "$failed_event_id1",
 								                    "$fresh_event_id1",
 								                    "$failed_event_id2",
 								                    "$fresh_event_id2",
 								                ]
 								            )
 								        )
 								        self.assertEqual(
 								            event_ids_with_failed_pull_attempts,
 								            {"$failed_event_id1", "$failed_event_id2"},
 								        )
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								    def test_get_event_ids_to_not_pull_from_backoff(self) -> None:
-												Stop getting missing `prev_events` after we already know their signature is invalid (#13816)

While https://github.com/matrix-org/synapse/pull/13635 stops us from doing the slow thing after we've already done it once, this PR stops us from doing one of the slow things in the first place.

Related to
 - https://github.com/matrix-org/synapse/issues/13622
    - https://github.com/matrix-org/synapse/pull/13635
 - https://github.com/matrix-org/synapse/issues/13676

Part of https://github.com/matrix-org/synapse/issues/13356

Follow-up to https://github.com/matrix-org/synapse/pull/13815 which tracks event signature failures.

With this PR, we avoid the call to the costly `_get_state_ids_after_missing_prev_event` because the signature failure will count as an attempt before and we filter events based on the backoff before calling `_get_state_ids_after_missing_prev_event` now.

For example, this will save us 156s out of the 185s total that this `matrix.org` `/messages` request. If you want to see the full Jaeger trace of this, you can drag and drop this `trace.json` into your own Jaeger, https://gist.github.com/MadLittleMods/4b12d0d0afe88c2f65ffcc907306b761

To explain this exact scenario around `/messages` -> backfill, we call `/backfill` and first check the signatures of the 100 events. We see bad signature for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` and `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` (both member events). Then we process the 98 events remaining that have valid signatures but one of the events references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event`. So we have to do the whole `_get_state_ids_after_missing_prev_event` rigmarole which pulls in those same events which fail again because the signatures are still invalid.

 - `backfill`
    - `outgoing-federation-request` `/backfill`
    - `_check_sigs_and_hash_and_fetch`
       - `_check_sigs_and_hash_and_fetch_one` for each event received over backfill
          - ❗ `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
          - ❗ `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
   - `_process_pulled_events`
      - `_process_pulled_event` for each validated event
         - ❗ Event `$Q0iMdqtz3IJYfZQU2Xk2WjB5NDF8Gg8cFSYYyKQgKJ0` references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event` which is missing so we try to get it
            - `_get_state_ids_after_missing_prev_event`
               - `outgoing-federation-request` `/state_ids`
               - ❗ `get_pdu` for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` which fails the signature check again
               - ❗ `get_pdu` for `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` which fails the signature check

											
										
										
											2022-10-15 07:36:49 +02:00
+								        """
 								        Test to make sure only event IDs we should backoff from are returned.
 								        """
 								        # Create the room
 								        user_id = self.register_user("alice", "test")
 								        tok = self.login("alice", "test")
 								        room_id = self.helper.create_room_as(room_creator=user_id, tok=tok)
-												Fix spinloop during partial state sync when a prev event is in backoff (#15351)

Previously, we would spin in a tight loop until
`update_state_for_partial_state_event` stopped raising
`FederationPullAttemptBackoffError`s. Replace the spinloop with a wait
until the backoff period has expired.

Signed-off-by: Sean Quah <seanq@matrix.org>
											
										
										
											2023-03-30 14:36:41 +02:00
+								        failure_time = self.clock.time_msec()
-												Stop getting missing `prev_events` after we already know their signature is invalid (#13816)

While https://github.com/matrix-org/synapse/pull/13635 stops us from doing the slow thing after we've already done it once, this PR stops us from doing one of the slow things in the first place.

Related to
 - https://github.com/matrix-org/synapse/issues/13622
    - https://github.com/matrix-org/synapse/pull/13635
 - https://github.com/matrix-org/synapse/issues/13676

Part of https://github.com/matrix-org/synapse/issues/13356

Follow-up to https://github.com/matrix-org/synapse/pull/13815 which tracks event signature failures.

With this PR, we avoid the call to the costly `_get_state_ids_after_missing_prev_event` because the signature failure will count as an attempt before and we filter events based on the backoff before calling `_get_state_ids_after_missing_prev_event` now.

For example, this will save us 156s out of the 185s total that this `matrix.org` `/messages` request. If you want to see the full Jaeger trace of this, you can drag and drop this `trace.json` into your own Jaeger, https://gist.github.com/MadLittleMods/4b12d0d0afe88c2f65ffcc907306b761

To explain this exact scenario around `/messages` -> backfill, we call `/backfill` and first check the signatures of the 100 events. We see bad signature for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` and `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` (both member events). Then we process the 98 events remaining that have valid signatures but one of the events references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event`. So we have to do the whole `_get_state_ids_after_missing_prev_event` rigmarole which pulls in those same events which fail again because the signatures are still invalid.

 - `backfill`
    - `outgoing-federation-request` `/backfill`
    - `_check_sigs_and_hash_and_fetch`
       - `_check_sigs_and_hash_and_fetch_one` for each event received over backfill
          - ❗ `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
          - ❗ `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
   - `_process_pulled_events`
      - `_process_pulled_event` for each validated event
         - ❗ Event `$Q0iMdqtz3IJYfZQU2Xk2WjB5NDF8Gg8cFSYYyKQgKJ0` references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event` which is missing so we try to get it
            - `_get_state_ids_after_missing_prev_event`
               - `outgoing-federation-request` `/state_ids`
               - ❗ `get_pdu` for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` which fails the signature check again
               - ❗ `get_pdu` for `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` which fails the signature check

											
										
										
											2022-10-15 07:36:49 +02:00
+								        self.get_success(
 								            self.store.record_event_failed_pull_attempt(
 								                room_id, "$failed_event_id", "fake cause"
 								            )
 								        )
-												Fix spinloop during partial state sync when a prev event is in backoff (#15351)

Previously, we would spin in a tight loop until
`update_state_for_partial_state_event` stopped raising
`FederationPullAttemptBackoffError`s. Replace the spinloop with a wait
until the backoff period has expired.

Signed-off-by: Sean Quah <seanq@matrix.org>
											
										
										
											2023-03-30 14:36:41 +02:00
+								        event_ids_with_backoff = self.get_success(
-												Stop getting missing `prev_events` after we already know their signature is invalid (#13816)

While https://github.com/matrix-org/synapse/pull/13635 stops us from doing the slow thing after we've already done it once, this PR stops us from doing one of the slow things in the first place.

Related to
 - https://github.com/matrix-org/synapse/issues/13622
    - https://github.com/matrix-org/synapse/pull/13635
 - https://github.com/matrix-org/synapse/issues/13676

Part of https://github.com/matrix-org/synapse/issues/13356

Follow-up to https://github.com/matrix-org/synapse/pull/13815 which tracks event signature failures.

With this PR, we avoid the costly call to `_get_state_ids_after_missing_prev_event`: the signature failure is already counted as a failed pull attempt beforehand, and we now filter out events that are in backoff before calling `_get_state_ids_after_missing_prev_event`.

For example, this will save us 156s out of the 185s total that this `matrix.org` `/messages` request takes. If you want to see the full Jaeger trace of this, you can drag and drop this `trace.json` into your own Jaeger: https://gist.github.com/MadLittleMods/4b12d0d0afe88c2f65ffcc907306b761

To explain this exact scenario around `/messages` -> backfill, we call `/backfill` and first check the signatures of the 100 events. We see bad signature for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` and `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` (both member events). Then we process the 98 events remaining that have valid signatures but one of the events references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event`. So we have to do the whole `_get_state_ids_after_missing_prev_event` rigmarole which pulls in those same events which fail again because the signatures are still invalid.

 - `backfill`
    - `outgoing-federation-request` `/backfill`
    - `_check_sigs_and_hash_and_fetch`
       - `_check_sigs_and_hash_and_fetch_one` for each event received over backfill
          - ❗ `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
          - ❗ `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
   - `_process_pulled_events`
      - `_process_pulled_event` for each validated event
         - ❗ Event `$Q0iMdqtz3IJYfZQU2Xk2WjB5NDF8Gg8cFSYYyKQgKJ0` references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event` which is missing so we try to get it
            - `_get_state_ids_after_missing_prev_event`
               - `outgoing-federation-request` `/state_ids`
               - ❗ `get_pdu` for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` which fails the signature check again
               - ❗ `get_pdu` for `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` which fails the signature check

											
										
										
											2022-10-15 07:36:49 +02:00
+								            self.store.get_event_ids_to_not_pull_from_backoff(
 								                room_id=room_id, event_ids=["$failed_event_id", "$normal_event_id"]
 								            )
 								        )
-												Fix spinloop during partial state sync when a prev event is in backoff (#15351)

Previously, we would spin in a tight loop until
`update_state_for_partial_state_event` stopped raising
`FederationPullAttemptBackoffError`s. Replace the spinloop with a wait
until the backoff period has expired.

Signed-off-by: Sean Quah <seanq@matrix.org>
											
										
										
											2023-03-30 14:36:41 +02:00
+								        self.assertEqual(
 								            event_ids_with_backoff,
 								            # We expect a 2^1 hour backoff after a single failed attempt.
 								            {"$failed_event_id": failure_time + 2 * 60 * 60 * 1000},
 								        )
-												Stop getting missing `prev_events` after we already know their signature is invalid (#13816)

While https://github.com/matrix-org/synapse/pull/13635 stops us from doing the slow thing after we've already done it once, this PR stops us from doing one of the slow things in the first place.

Related to
 - https://github.com/matrix-org/synapse/issues/13622
    - https://github.com/matrix-org/synapse/pull/13635
 - https://github.com/matrix-org/synapse/issues/13676

Part of https://github.com/matrix-org/synapse/issues/13356

Follow-up to https://github.com/matrix-org/synapse/pull/13815 which tracks event signature failures.

With this PR, we avoid the costly call to `_get_state_ids_after_missing_prev_event`: the signature failure is already counted as a failed pull attempt beforehand, and we now filter out events that are in backoff before calling `_get_state_ids_after_missing_prev_event`.

For example, this will save us 156s out of the 185s total that this `matrix.org` `/messages` request takes. If you want to see the full Jaeger trace of this, you can drag and drop this `trace.json` into your own Jaeger: https://gist.github.com/MadLittleMods/4b12d0d0afe88c2f65ffcc907306b761

To explain this exact scenario around `/messages` -> backfill, we call `/backfill` and first check the signatures of the 100 events. We see bad signature for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` and `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` (both member events). Then we process the 98 events remaining that have valid signatures but one of the events references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event`. So we have to do the whole `_get_state_ids_after_missing_prev_event` rigmarole which pulls in those same events which fail again because the signatures are still invalid.

 - `backfill`
    - `outgoing-federation-request` `/backfill`
    - `_check_sigs_and_hash_and_fetch`
       - `_check_sigs_and_hash_and_fetch_one` for each event received over backfill
          - ❗ `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
          - ❗ `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
   - `_process_pulled_events`
      - `_process_pulled_event` for each validated event
         - ❗ Event `$Q0iMdqtz3IJYfZQU2Xk2WjB5NDF8Gg8cFSYYyKQgKJ0` references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event` which is missing so we try to get it
            - `_get_state_ids_after_missing_prev_event`
               - `outgoing-federation-request` `/state_ids`
               - ❗ `get_pdu` for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` which fails the signature check again
               - ❗ `get_pdu` for `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` which fails the signature check

											
										
										
											2022-10-15 07:36:49 +02:00
 								    def test_get_event_ids_to_not_pull_from_backoff_retry_after_backoff_duration(
 								        self,
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								    ) -> None:
-												Stop getting missing `prev_events` after we already know their signature is invalid (#13816)

While https://github.com/matrix-org/synapse/pull/13635 stops us from doing the slow thing after we've already done it once, this PR stops us from doing one of the slow things in the first place.

Related to
 - https://github.com/matrix-org/synapse/issues/13622
    - https://github.com/matrix-org/synapse/pull/13635
 - https://github.com/matrix-org/synapse/issues/13676

Part of https://github.com/matrix-org/synapse/issues/13356

Follow-up to https://github.com/matrix-org/synapse/pull/13815 which tracks event signature failures.

With this PR, we avoid the costly call to `_get_state_ids_after_missing_prev_event`: the signature failure is already counted as a failed pull attempt beforehand, and we now filter out events that are in backoff before calling `_get_state_ids_after_missing_prev_event`.

For example, this will save us 156s out of the 185s total that this `matrix.org` `/messages` request takes. If you want to see the full Jaeger trace of this, you can drag and drop this `trace.json` into your own Jaeger: https://gist.github.com/MadLittleMods/4b12d0d0afe88c2f65ffcc907306b761

To explain this exact scenario around `/messages` -> backfill, we call `/backfill` and first check the signatures of the 100 events. We see bad signature for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` and `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` (both member events). Then we process the 98 events remaining that have valid signatures but one of the events references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event`. So we have to do the whole `_get_state_ids_after_missing_prev_event` rigmarole which pulls in those same events which fail again because the signatures are still invalid.

 - `backfill`
    - `outgoing-federation-request` `/backfill`
    - `_check_sigs_and_hash_and_fetch`
       - `_check_sigs_and_hash_and_fetch_one` for each event received over backfill
          - ❗ `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
          - ❗ `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
   - `_process_pulled_events`
      - `_process_pulled_event` for each validated event
         - ❗ Event `$Q0iMdqtz3IJYfZQU2Xk2WjB5NDF8Gg8cFSYYyKQgKJ0` references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event` which is missing so we try to get it
            - `_get_state_ids_after_missing_prev_event`
               - `outgoing-federation-request` `/state_ids`
               - ❗ `get_pdu` for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` which fails the signature check again
               - ❗ `get_pdu` for `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` which fails the signature check

											
										
										
											2022-10-15 07:36:49 +02:00
+								        """
 								        Test to make sure no event IDs are returned after the backoff duration has
 								        elapsed.
 								        """
 								        # Create the room
 								        user_id = self.register_user("alice", "test")
 								        tok = self.login("alice", "test")
 								        room_id = self.helper.create_room_as(room_creator=user_id, tok=tok)
 								        self.get_success(
 								            self.store.record_event_failed_pull_attempt(
 								                room_id, "$failed_event_id", "fake cause"
 								            )
 								        )
 								        # Now advance time by 2 hours so we wait long enough for the single failed
 								        # attempt (2^1 hours).
 								        self.reactor.advance(datetime.timedelta(hours=2).total_seconds())
-												Fix spinloop during partial state sync when a prev event is in backoff (#15351)

Previously, we would spin in a tight loop until
`update_state_for_partial_state_event` stopped raising
`FederationPullAttemptBackoffError`s. Replace the spinloop with a wait
until the backoff period has expired.

Signed-off-by: Sean Quah <seanq@matrix.org>
											
										
										
											2023-03-30 14:36:41 +02:00
+								        event_ids_with_backoff = self.get_success(
-												Stop getting missing `prev_events` after we already know their signature is invalid (#13816)

While https://github.com/matrix-org/synapse/pull/13635 stops us from doing the slow thing after we've already done it once, this PR stops us from doing one of the slow things in the first place.

Related to
 - https://github.com/matrix-org/synapse/issues/13622
    - https://github.com/matrix-org/synapse/pull/13635
 - https://github.com/matrix-org/synapse/issues/13676

Part of https://github.com/matrix-org/synapse/issues/13356

Follow-up to https://github.com/matrix-org/synapse/pull/13815 which tracks event signature failures.

With this PR, we avoid the costly call to `_get_state_ids_after_missing_prev_event`: the signature failure is already counted as a failed pull attempt beforehand, and we now filter out events that are in backoff before calling `_get_state_ids_after_missing_prev_event`.

For example, this will save us 156s out of the 185s total that this `matrix.org` `/messages` request takes. If you want to see the full Jaeger trace of this, you can drag and drop this `trace.json` into your own Jaeger: https://gist.github.com/MadLittleMods/4b12d0d0afe88c2f65ffcc907306b761

To explain this exact scenario around `/messages` -> backfill, we call `/backfill` and first check the signatures of the 100 events. We see bad signature for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` and `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` (both member events). Then we process the 98 events remaining that have valid signatures but one of the events references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event`. So we have to do the whole `_get_state_ids_after_missing_prev_event` rigmarole which pulls in those same events which fail again because the signatures are still invalid.

 - `backfill`
    - `outgoing-federation-request` `/backfill`
    - `_check_sigs_and_hash_and_fetch`
       - `_check_sigs_and_hash_and_fetch_one` for each event received over backfill
          - ❗ `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
          - ❗ `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
   - `_process_pulled_events`
      - `_process_pulled_event` for each validated event
         - ❗ Event `$Q0iMdqtz3IJYfZQU2Xk2WjB5NDF8Gg8cFSYYyKQgKJ0` references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event` which is missing so we try to get it
            - `_get_state_ids_after_missing_prev_event`
               - `outgoing-federation-request` `/state_ids`
               - ❗ `get_pdu` for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` which fails the signature check again
               - ❗ `get_pdu` for `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` which fails the signature check

											
										
										
											2022-10-15 07:36:49 +02:00
+								            self.store.get_event_ids_to_not_pull_from_backoff(
 								                room_id=room_id, event_ids=["$failed_event_id", "$normal_event_id"]
 								            )
 								        )
 								        # Since this function only returns events we should back off from, and time
 								        # has elapsed past the backoff range, there are no events to back off from.
-												Fix spinloop during partial state sync when a prev event is in backoff (#15351)

Previously, we would spin in a tight loop until
`update_state_for_partial_state_event` stopped raising
`FederationPullAttemptBackoffError`s. Replace the spinloop with a wait
until the backoff period has expired.

Signed-off-by: Sean Quah <seanq@matrix.org>
											
										
										
											2023-03-30 14:36:41 +02:00
+								        self.assertEqual(event_ids_with_backoff, {})
-												Stop getting missing `prev_events` after we already know their signature is invalid (#13816)

While https://github.com/matrix-org/synapse/pull/13635 stops us from doing the slow thing after we've already done it once, this PR stops us from doing one of the slow things in the first place.

Related to
 - https://github.com/matrix-org/synapse/issues/13622
    - https://github.com/matrix-org/synapse/pull/13635
 - https://github.com/matrix-org/synapse/issues/13676

Part of https://github.com/matrix-org/synapse/issues/13356

Follow-up to https://github.com/matrix-org/synapse/pull/13815 which tracks event signature failures.

With this PR, we avoid the costly call to `_get_state_ids_after_missing_prev_event`: the signature failure is already counted as a failed pull attempt beforehand, and we now filter out events that are in backoff before calling `_get_state_ids_after_missing_prev_event`.

For example, this will save us 156s out of the 185s total that this `matrix.org` `/messages` request takes. If you want to see the full Jaeger trace of this, you can drag and drop this `trace.json` into your own Jaeger: https://gist.github.com/MadLittleMods/4b12d0d0afe88c2f65ffcc907306b761

To explain this exact scenario around `/messages` -> backfill, we call `/backfill` and first check the signatures of the 100 events. We see bad signature for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` and `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` (both member events). Then we process the 98 events remaining that have valid signatures but one of the events references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event`. So we have to do the whole `_get_state_ids_after_missing_prev_event` rigmarole which pulls in those same events which fail again because the signatures are still invalid.

 - `backfill`
    - `outgoing-federation-request` `/backfill`
    - `_check_sigs_and_hash_and_fetch`
       - `_check_sigs_and_hash_and_fetch_one` for each event received over backfill
          - ❗ `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
          - ❗ `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` fails with `Signature on retrieved event was invalid.`: `unable to verify signature for sender domain xxx: 401: Failed to find any key to satisfy: _FetchKeyRequest(...)`
   - `_process_pulled_events`
      - `_process_pulled_event` for each validated event
         - ❗ Event `$Q0iMdqtz3IJYfZQU2Xk2WjB5NDF8Gg8cFSYYyKQgKJ0` references `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` as a `prev_event` which is missing so we try to get it
            - `_get_state_ids_after_missing_prev_event`
               - `outgoing-federation-request` `/state_ids`
               - ❗ `get_pdu` for `$luA4l7QHhf_jadH3mI-AyFqho0U2Q-IXXUbGSMq6h6M` which fails the signature check again
               - ❗ `get_pdu` for `$zuOn2Rd2vsC7SUia3Hp3r6JSkSFKcc5j3QTTqW_0jDw` which fails the signature check

											
										
										
											2022-10-15 07:36:49 +02:00
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								@attr.s(auto_attribs=True)
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								class FakeEvent:
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								    event_id: str
 								    room_id: str
 								    auth_events: List[str]
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
 								    type = "foo"
 								    state_key = "foo"
-												Port `EventInternalMetadata` class to Rust (#16782)

There are a couple of things we need to be careful of here:

1. The current python code does no validation when loading from the DB,
so we need to be careful to ignore such errors (at least on jki.re there
are some old events with internal metadata fields of the wrong type).
2. We want to be memory efficient, as we often have many hundreds of
thousands of events in the cache at a time.

---------

Co-authored-by: Quentin Gliech <quenting@element.io>
											
										
										
											2024-01-08 15:06:48 +01:00
+								    internal_metadata = EventInternalMetadata({})
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								    def auth_event_ids(self) -> List[str]:
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								        return self.auth_events
-												Require types in tests.storage. (#14646)

Adds missing type hints to `tests.storage` package
and does not allow untyped definitions.
											
										
										
											2022-12-09 18:36:32 +01:00
+								    def is_state(self) -> bool:
-												Use a chain cover index to efficiently calculate auth chain difference (#8868)


											
										
										
											2021-01-11 17:09:22 +01:00
+								        return True