From dc3d504f9b95d5093c204e39c2ca6fa102a62688 Mon Sep 17 00:00:00 2001 From: David Robertson Date: Wed, 1 Dec 2021 20:06:25 +0000 Subject: [PATCH 01/23] comment wait_for_sync_for_user --- synapse/handlers/sync.py | 15 ++++++++++++++- 1 file changed, 14 insertions(+), 1 deletion(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index 891435c14daf..cddc680a6125 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -334,6 +334,19 @@ async def _wait_for_sync_for_user( full_state: bool, cache_context: ResponseCacheContext[SyncRequestKey], ) -> SyncResult: + """The start of the machinery that produces a /sync response. + + See https://spec.matrix.org/v1.1/client-server-api/#syncing for full details. + + This method does high-level bookkeeping: + - tracking the kind of sync in the logging context + - deleting any to_device messages whose delivery has been acknowledged. + - deciding if we should dispatch an instant or delayed response + - marking the sync as being lazily loaded, if appropriate + + Computing the body of the response beings in the next method, + `current_sync_for_user`. + """ if since_token is None: sync_type = "initial_sync" elif full_state: @@ -363,7 +376,7 @@ async def _wait_for_sync_for_user( sync_config, since_token, full_state=full_state ) else: - + # Otherwise, we wait for something to happen and report it to the user. async def current_sync_callback( before_token: StreamToken, after_token: StreamToken ) -> SyncResult: From 39a376d9128585309729cd1f30e74eb109ca0281 Mon Sep 17 00:00:00 2001 From: David Robertson Date: Wed, 1 Dec 2021 20:06:38 +0000 Subject: [PATCH 02/23] Comment current_sync_for_user --- synapse/handlers/sync.py | 7 ++++++- 1 file changed, 6 insertions(+), 1 deletion(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index cddc680a6125..7a2e646fa0f7 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -415,7 +415,12 @@ async def current_sync_for_user( since_token: Optional[StreamToken] = None, full_state: bool = False, ) -> SyncResult: - """Get the sync for client needed to match what the server has now.""" + """Get the sync for client needed to match what the server has now. + + This is a wrapper around generate_sync_result which starts an open tracing span + to track the sync. Delve to generate_sync_result for the next level of your + indoctrination. + """ with start_active_span("current_sync_for_user"): log_kv({"since_token": since_token}) sync_result = await self.generate_sync_result( From 7da68f701ad4124bba4c86fb027fa39dd4bbf0db Mon Sep 17 00:00:00 2001 From: David Robertson Date: Wed, 1 Dec 2021 20:10:22 +0000 Subject: [PATCH 03/23] Comment generate_sync_result --- synapse/handlers/sync.py | 13 ++++++++++++- 1 file changed, 12 insertions(+), 1 deletion(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index 7a2e646fa0f7..e13355f8cf83 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -1060,7 +1060,18 @@ async def generate_sync_result( since_token: Optional[StreamToken] = None, full_state: bool = False, ) -> SyncResult: - """Generates a sync result.""" + """Generates the response body of a sync result. + + This is represented by a `SyncResult` struct, which is built from small pieces + using a `SyncResultBuilder`. See also + https://spec.matrix.org/v1.1/client-server-api/#get_matrixclientv3sync + the `sync_result_builder` is passed as a mutable ("inout") parameter to various + helper functions. These retrieve and process the data which forms the sync body, + often writing to the `sync_result_builder` to store their output. + + At the end, we transfer data from the `sync_result_builder` to a new `SyncResult` + instance to signify that the sync calculation is complete. + """ # NB: The now_token gets changed by some of the generate_sync_* methods, # this is due to some of the underlying streams not supporting the ability # to query up to a given point. From a91bf8bbd137eee95824f6353021eb06db5b8fd7 Mon Sep 17 00:00:00 2001 From: David Robertson Date: Wed, 1 Dec 2021 20:10:47 +0000 Subject: [PATCH 04/23] Comment _generate_sync_entry_for_to_device --- synapse/handlers/sync.py | 24 ++++++++++++++++-------- 1 file changed, 16 insertions(+), 8 deletions(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index e13355f8cf83..ded006f3c349 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -1373,14 +1373,22 @@ async def _generate_sync_entry_for_to_device( async def _generate_sync_entry_for_account_data( self, sync_result_builder: "SyncResultBuilder" ) -> Dict[str, Dict[str, JsonDict]]: - """Generates the account data portion of the sync response. Populates - `sync_result_builder` with the result. + """Generates the account data portion of the sync response. + + Account data (called "Client Config" in the spec) can be set either globally + or for a specific room. Account data consists of a list of events which + accumulate state, much like a room. + + This function retrieves global and per-room account data. The former is written + to the given `sync_result_builder`. The latter is returned directly, to be + later written to the `sync_result_builder` on a room-by-room basis. Args: sync_result_builder Returns: - A dictionary containing the per room account data. + A dictionary whose keys (room ids) map to the per room account data for that + room. """ sync_config = sync_result_builder.sync_config user_id = sync_result_builder.sync_config.user.to_string() @@ -1388,7 +1396,7 @@ async def _generate_sync_entry_for_account_data( if since_token and not sync_result_builder.full_state: ( - account_data, + global_account_data, account_data_by_room, ) = await self.store.get_updated_account_data_for_user( user_id, since_token.account_data_key @@ -1399,23 +1407,23 @@ async def _generate_sync_entry_for_account_data( ) if push_rules_changed: - account_data["m.push_rules"] = await self.push_rules_for_user( + global_account_data["m.push_rules"] = await self.push_rules_for_user( sync_config.user ) else: ( - account_data, + global_account_data, account_data_by_room, ) = await self.store.get_account_data_for_user(sync_config.user.to_string()) - account_data["m.push_rules"] = await self.push_rules_for_user( + global_account_data["m.push_rules"] = await self.push_rules_for_user( sync_config.user ) account_data_for_user = await sync_config.filter_collection.filter_account_data( [ {"type": account_data_type, "content": content} - for account_data_type, content in account_data.items() + for account_data_type, content in global_account_data.items() ] ) From 326bc742a872448ba8258925e7bd5d1664456e93 Mon Sep 17 00:00:00 2001 From: David Robertson Date: Wed, 1 Dec 2021 20:11:12 +0000 Subject: [PATCH 05/23] Comment _generate_sync_entry_for_rooms --- synapse/handlers/sync.py | 7 ++++++- 1 file changed, 6 insertions(+), 1 deletion(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index ded006f3c349..96879586027f 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -1497,15 +1497,20 @@ async def _generate_sync_entry_for_rooms( """Generates the rooms portion of the sync response. Populates the `sync_result_builder` with the result. + In the response that reaches the client, rooms are divided into four categories: + `invite`, `join`, `knock`, `leave`. These aren't the same as the four sets of + room ids returned by this function. + Args: sync_result_builder account_data_by_room: Dictionary of per room account data Returns: Returns a 4-tuple of - `(newly_joined_rooms, newly_joined_or_invited_users, + `(newly_joined_rooms, newly_joined_or_invited_or_knocked_users, newly_left_rooms, newly_left_users)` """ + # Start by fetching all ephemeral events in rooms we've joined (if required). user_id = sync_result_builder.sync_config.user.to_string() block_all_room_ephemeral = ( sync_result_builder.since_token is None From d107917accabfc9da97d7422ac4fe0d7349c8cf0 Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 10:45:25 +0000 Subject: [PATCH 06/23] Small refactor in _get_all_rooms --- synapse/handlers/sync.py | 10 +--------- 1 file changed, 1 insertion(+), 9 deletions(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index 96879586027f..aa96c5be8544 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -1895,16 +1895,8 @@ async def _get_all_rooms( now_token = sync_result_builder.now_token sync_config = sync_result_builder.sync_config - membership_list = ( - Membership.INVITE, - Membership.KNOCK, - Membership.JOIN, - Membership.LEAVE, - Membership.BAN, - ) - room_list = await self.store.get_rooms_for_local_user_where_membership_is( - user_id=user_id, membership_list=membership_list + user_id=user_id, membership_list=Membership.LIST, ) room_entries = [] From fd66d02d9191de7b5c242389aa091060c6d1fb24 Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 11:00:09 +0000 Subject: [PATCH 07/23] Comment for and rename inside _have_rooms_changed --- synapse/handlers/sync.py | 14 ++++++++++---- 1 file changed, 10 insertions(+), 4 deletions(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index aa96c5be8544..bacdd09d5c53 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -1632,6 +1632,8 @@ async def _have_rooms_changed( ) -> bool: """Returns whether there may be any new events that should be sent down the sync. Returns True if there are. + + Does not modify the `sync_result_builder`. """ user_id = sync_result_builder.sync_config.user.to_string() since_token = sync_result_builder.since_token @@ -1639,12 +1641,13 @@ async def _have_rooms_changed( assert since_token - # Get a list of membership change events that have happened. - rooms_changed = await self.store.get_membership_changes_for_user( + # Get a list of membership change events that have happened to the user + # requesting the sync. + membership_changes = await self.store.get_membership_changes_for_user( user_id, since_token.room_key, now_token.room_key ) - if rooms_changed: + if membership_changes: return True stream_id = since_token.room_key.stream @@ -1656,7 +1659,10 @@ async def _have_rooms_changed( async def _get_rooms_changed( self, sync_result_builder: "SyncResultBuilder", ignored_users: FrozenSet[str] ) -> _RoomChanges: - """Gets the the changes that have happened since the last sync.""" + """Gets the the changes that have happened since the last sync. + + The sync_result_builder is not modified by this function. + """ user_id = sync_result_builder.sync_config.user.to_string() since_token = sync_result_builder.since_token now_token = sync_result_builder.now_token From ef9482aa2e9a335ff045fdfeb2358e3605b591c1 Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 12:21:10 +0000 Subject: [PATCH 08/23] Comments to stream.py --- synapse/storage/databases/main/stream.py | 12 +++++++++--- 1 file changed, 9 insertions(+), 3 deletions(-) diff --git a/synapse/storage/databases/main/stream.py b/synapse/storage/databases/main/stream.py index 42dc807d17ff..a9e56105038f 100644 --- a/synapse/storage/databases/main/stream.py +++ b/synapse/storage/databases/main/stream.py @@ -497,7 +497,7 @@ async def get_room_events_stream_for_room( oldest `limit` events. Returns: - The list of events (in ascending order) and the token from the start + The list of events (in ascending stream order) and the token from the start of the chunk of events returned. """ if from_key == to_key: @@ -510,7 +510,7 @@ async def get_room_events_stream_for_room( if not has_changed: return [], from_key - def f(txn): + def f(txn: LoggingTransaction) -> List[_EventDictReturn]: # To handle tokens with a non-empty instance_map we fetch more # results than necessary and then filter down min_from_id = from_key.stream @@ -565,6 +565,12 @@ def f(txn): async def get_membership_changes_for_user( self, user_id: str, from_key: RoomStreamToken, to_key: RoomStreamToken ) -> List[EventBase]: + """Fetch membership membership events for a given user. + + All such events whose stream ordering lies in the range (from_key, to_key] + are returned. Events are ordered by ascending stream order. + """ + # Start by ruling out cases where a DB query is not necessary. if from_key == to_key: return [] @@ -575,7 +581,7 @@ async def get_membership_changes_for_user( if not has_changed: return [] - def f(txn): + def f(txn: LoggingTransaction) -> List[_EventDictReturn]: # To handle tokens with a non-empty instance_map we fetch more # results than necessary and then filter down min_from_id = from_key.stream From f7fdab3550489518bfd40329d9bb83a67a8d8a12 Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 16:27:01 +0000 Subject: [PATCH 09/23] Typo fix --- synapse/handlers/sync.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index bacdd09d5c53..32b45d339b0c 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -578,7 +578,7 @@ async def _load_filtered_recents( # that have happened since `since_key` up to `end_key`, so we # can just use `get_room_events_stream_for_room`. # Otherwise, we want to return the last N events in the room - # in toplogical ordering. + # in topological ordering. if since_key: events, end_key = await self.store.get_room_events_stream_for_room( room_id, From 9932b6da5b0b810d0ff9bdd5f8c478b043053854 Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 16:27:56 +0000 Subject: [PATCH 10/23] Comment for _get_rooms_changed --- synapse/handlers/sync.py | 21 +++++++++++++++++---- 1 file changed, 17 insertions(+), 4 deletions(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index 32b45d339b0c..8afac7cbde9b 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -1670,13 +1670,21 @@ async def _get_rooms_changed( assert since_token - # Get a list of membership change events that have happened. - rooms_changed = await self.store.get_membership_changes_for_user( + # The spec notes: + # > When a sync is limited, the server MUST return membership events for events + # > in the gap (between since and the start of the returned timeline), regardless + # > as to whether or not they are redundant. + # We fetch such events here, but we only seem to use them for categorising rooms + # as newly joined, newly left, invited or knocked. + # TODO: we've already called this function and ran this query in + # _have_rooms_changed. We could keep the results in memory to avoid a + # second query, at the cost of more complicated source code. + membership_change_events = await self.store.get_membership_changes_for_user( user_id, since_token.room_key, now_token.room_key ) mem_change_events_by_room_id: Dict[str, List[EventBase]] = {} - for event in rooms_changed: + for event in membership_change_events: mem_change_events_by_room_id.setdefault(event.room_id, []).append(event) newly_joined_rooms = [] @@ -1685,6 +1693,9 @@ async def _get_rooms_changed( invited = [] knocked = [] for room_id, events in mem_change_events_by_room_id.items(): + # The body of this loop will add this room to at least one of the five lists + # above. Things get messy if you've e.g. joined, left, joined then left the + # room all in the same sync period. logger.debug( "Membership changes in %s: [%s]", room_id, @@ -1829,7 +1840,9 @@ async def _get_rooms_changed( timeline_limit = sync_config.filter_collection.timeline_limit() - # Get all events for rooms we're currently joined to. + # Get all events since the `from_key` in rooms we're currently joined to. + # If there are too many, we get the most recent events only. This leaves + # a "gap" in the timeline, as described by the spec for /sync. room_to_events = await self.store.get_room_events_stream_for_rooms( room_ids=sync_result_builder.joined_room_ids, from_key=since_token.room_key, From 6a506c4641dcf39fa08a5c8b8d69f38704c365ff Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 16:30:03 +0000 Subject: [PATCH 11/23] Fix URL line break --- synapse/handlers/sync.py | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index 8afac7cbde9b..41f3301b1fbd 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -2265,8 +2265,7 @@ def _calculate_state( # to only include membership events for the senders in the timeline. # In practice, we can do this by removing them from the p_ids list, # which is the list of relevant state we know we have already sent to the client. - # see https://github.com/matrix-org/synapse/pull/2970 - # /files/efcdacad7d1b7f52f879179701c7e0d9b763511f#r204732809 + # see https://github.com/matrix-org/synapse/pull/2970/files/efcdacad7d1b7f52f879179701c7e0d9b763511f#r204732809 if lazy_load_members: p_ids.difference_update( From 4a995ce63f96892f8e0c547d298116a815f6cbb4 Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 16:37:17 +0000 Subject: [PATCH 12/23] Changelog --- changelog.d/11494.misc | 1 + 1 file changed, 1 insertion(+) create mode 100644 changelog.d/11494.misc diff --git a/changelog.d/11494.misc b/changelog.d/11494.misc new file mode 100644 index 000000000000..7afd7d3a0727 --- /dev/null +++ b/changelog.d/11494.misc @@ -0,0 +1 @@ +Add comments to various parts of the `/sync` handler. \ No newline at end of file From 15c022da607b112c1c1ccd9dfd85b447928edbbc Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 18:41:28 +0000 Subject: [PATCH 13/23] linty --- synapse/handlers/sync.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index 41f3301b1fbd..f443df255723 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -1915,7 +1915,8 @@ async def _get_all_rooms( sync_config = sync_result_builder.sync_config room_list = await self.store.get_rooms_for_local_user_where_membership_is( - user_id=user_id, membership_list=Membership.LIST, + user_id=user_id, + membership_list=Membership.LIST, ) room_entries = [] From 3eca8bc0c6ad68afce3c1e1992ac9d3dfacdaee0 Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 19:10:51 +0000 Subject: [PATCH 14/23] Fix a couple of typos Co-authored-by: Patrick Cloke --- synapse/handlers/sync.py | 2 +- synapse/storage/databases/main/stream.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index f443df255723..f23a77e78053 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -344,7 +344,7 @@ async def _wait_for_sync_for_user( - deciding if we should dispatch an instant or delayed response - marking the sync as being lazily loaded, if appropriate - Computing the body of the response beings in the next method, + Computing the body of the response begins in the next method, `current_sync_for_user`. """ if since_token is None: diff --git a/synapse/storage/databases/main/stream.py b/synapse/storage/databases/main/stream.py index a9e56105038f..54b0f5a865f4 100644 --- a/synapse/storage/databases/main/stream.py +++ b/synapse/storage/databases/main/stream.py @@ -565,7 +565,7 @@ def f(txn: LoggingTransaction) -> List[_EventDictReturn]: async def get_membership_changes_for_user( self, user_id: str, from_key: RoomStreamToken, to_key: RoomStreamToken ) -> List[EventBase]: - """Fetch membership membership events for a given user. + """Fetch membership events for a given user. All such events whose stream ordering lies in the range (from_key, to_key] are returned. Events are ordered by ascending stream order. From d9c3c15fff996ae4833e01e1db85be377efce019 Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 19:09:16 +0000 Subject: [PATCH 15/23] Rewrite current_sync_for_user docstring --- synapse/handlers/sync.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index f23a77e78053..a85d106c72e5 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -415,10 +415,10 @@ async def current_sync_for_user( since_token: Optional[StreamToken] = None, full_state: bool = False, ) -> SyncResult: - """Get the sync for client needed to match what the server has now. + """Generates the response body of a sync result, represented as a SyncResult. - This is a wrapper around generate_sync_result which starts an open tracing span - to track the sync. Delve to generate_sync_result for the next level of your + This is a wrapper around `generate_sync_result` which starts an open tracing + span to track the sync. See `generate_sync_result` for the next part of your indoctrination. """ with start_active_span("current_sync_for_user"): From 6908482ada5ce2783c0eba0f99a5e5a0636ce391 Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 19:14:14 +0000 Subject: [PATCH 16/23] Use explicit inequality signs --- synapse/storage/databases/main/stream.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/synapse/storage/databases/main/stream.py b/synapse/storage/databases/main/stream.py index 54b0f5a865f4..cd3b5674de5b 100644 --- a/synapse/storage/databases/main/stream.py +++ b/synapse/storage/databases/main/stream.py @@ -567,8 +567,9 @@ async def get_membership_changes_for_user( ) -> List[EventBase]: """Fetch membership events for a given user. - All such events whose stream ordering lies in the range (from_key, to_key] - are returned. Events are ordered by ascending stream order. + All such events whose stream ordering `s` lies in the range + `from_key < s <= to_key` are returned. Events are ordered by ascending stream + order. """ # Start by ruling out cases where a DB query is not necessary. if from_key == to_key: From 52929d0c3fb981add7b74853b3bfcb1ebfa7942a Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 19:14:37 +0000 Subject: [PATCH 17/23] Itemise the 4-tuple --- synapse/handlers/sync.py | 8 +++++--- 1 file changed, 5 insertions(+), 3 deletions(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index a85d106c72e5..510cad6222f5 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -1506,9 +1506,11 @@ async def _generate_sync_entry_for_rooms( account_data_by_room: Dictionary of per room account data Returns: - Returns a 4-tuple of - `(newly_joined_rooms, newly_joined_or_invited_or_knocked_users, - newly_left_rooms, newly_left_users)` + Returns a 4-tuple whose entries are: + - newly_joined_rooms + - newly_joined_or_invited_or_knocked_users, + - newly_left_rooms + - newly_left_users """ # Start by fetching all ephemeral events in rooms we've joined (if required). user_id = sync_result_builder.sync_config.user.to_string() From 3954082eefba6bf985c74427433e42d4ab195a1a Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 19:35:45 +0000 Subject: [PATCH 18/23] Expand comments in _get_rooms_changed --- synapse/handlers/sync.py | 23 +++++++++++++++++++++-- 1 file changed, 21 insertions(+), 2 deletions(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index 510cad6222f5..2dedcd40b93e 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -1661,7 +1661,22 @@ async def _have_rooms_changed( async def _get_rooms_changed( self, sync_result_builder: "SyncResultBuilder", ignored_users: FrozenSet[str] ) -> _RoomChanges: - """Gets the the changes that have happened since the last sync. + """Determine the changes in rooms to report to the user. + + Ideally, we want to report all events whose stream ordering `s` lies in the + range `since_token < s <= now_token`, where the two tokens are read from the + sync_result_builder. + + If there are too many events in that range to report, things get complicated. + In this situation we return a truncated list of the most recent events, and + indicate in the response that there is a "gap" of omitted events. Additionally: + + - we include a "state_delta", to describethe changes in state over the gap, + - we include all membership events applying to the user making the request, + even those in the gap. + + See the spec for the rationale: + https://spec.matrix.org/v1.1/client-server-api/#syncing The sync_result_builder is not modified by this function. """ @@ -1672,10 +1687,14 @@ async def _get_rooms_changed( assert since_token - # The spec notes: + # The spec + # https://spec.matrix.org/v1.1/client-server-api/#get_matrixclientv3sync + # notes that membership events need special consideration: + # # > When a sync is limited, the server MUST return membership events for events # > in the gap (between since and the start of the returned timeline), regardless # > as to whether or not they are redundant. + # # We fetch such events here, but we only seem to use them for categorising rooms # as newly joined, newly left, invited or knocked. # TODO: we've already called this function and ran this query in From d0c15cc60ad727354bcbd68e732da217cb681caa Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 19:40:19 +0000 Subject: [PATCH 19/23] Comment _get_all_rooms --- synapse/handlers/sync.py | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index 2dedcd40b93e..09b0f9aa814d 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -1924,6 +1924,10 @@ async def _get_all_rooms( ) -> _RoomChanges: """Returns entries for all rooms for the user. + Like `_get_rooms_changed`, but assumes the `since_token` is `None`. + + This function does not modify the sync_result_builder. + Args: sync_result_builder ignored_users: Set of users ignored by user. From a165e27504c4f05c22877973c2bb0c6423b27d2f Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 19:40:32 +0000 Subject: [PATCH 20/23] Explicitly describe order in get_recent_events_for_room --- synapse/storage/databases/main/stream.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/synapse/storage/databases/main/stream.py b/synapse/storage/databases/main/stream.py index cd3b5674de5b..57aab5525937 100644 --- a/synapse/storage/databases/main/stream.py +++ b/synapse/storage/databases/main/stream.py @@ -641,7 +641,7 @@ async def get_recent_events_for_room( Returns: A list of events and a token pointing to the start of the returned - events. The events returned are in ascending order. + events. The events returned are in ascending topological order. """ rows, token = await self.get_recent_event_ids_for_room( From 90dd4dab50fc0ca9a07d2f9e977b5259e48f708d Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 19:41:09 +0000 Subject: [PATCH 21/23] Add type annotations for the five lists I think mypy can deduce these, but I find it helpful as a reader to have them. --- synapse/handlers/sync.py | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index 09b0f9aa814d..17d4d8649813 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -1708,11 +1708,11 @@ async def _get_rooms_changed( for event in membership_change_events: mem_change_events_by_room_id.setdefault(event.room_id, []).append(event) - newly_joined_rooms = [] - newly_left_rooms = [] - room_entries = [] - invited = [] - knocked = [] + newly_joined_rooms: List[str] + newly_left_rooms: List[str] + room_entries: List[RoomSyncResultBuilder] + invited: List[InvitedSyncResult] + knocked: List[KnockedSyncResult] for room_id, events in mem_change_events_by_room_id.items(): # The body of this loop will add this room to at least one of the five lists # above. Things get messy if you've e.g. joined, left, joined then left the From 9a0a16b92aef4ed8c8e12df0a554221a1e3c9bc7 Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 19:46:30 +0000 Subject: [PATCH 22/23] Oops, re-create empty lists! --- synapse/handlers/sync.py | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index 17d4d8649813..703df0634baa 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -1708,11 +1708,11 @@ async def _get_rooms_changed( for event in membership_change_events: mem_change_events_by_room_id.setdefault(event.room_id, []).append(event) - newly_joined_rooms: List[str] - newly_left_rooms: List[str] - room_entries: List[RoomSyncResultBuilder] - invited: List[InvitedSyncResult] - knocked: List[KnockedSyncResult] + newly_joined_rooms: List[str] = [] + newly_left_rooms: List[str] = [] + room_entries: List[RoomSyncResultBuilder] = [] + invited: List[InvitedSyncResult] = [] + knocked: List[KnockedSyncResult] = [] for room_id, events in mem_change_events_by_room_id.items(): # The body of this loop will add this room to at least one of the five lists # above. Things get messy if you've e.g. joined, left, joined then left the From c04d7e27c2467468bc37a3ad95c21dae9ca0f7b5 Mon Sep 17 00:00:00 2001 From: David Robertson Date: Thu, 2 Dec 2021 20:33:10 +0000 Subject: [PATCH 23/23] Typo fixes, thanks Patrick! Co-authored-by: Patrick Cloke --- synapse/handlers/sync.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/synapse/handlers/sync.py b/synapse/handlers/sync.py index 703df0634baa..53d4627147d4 100644 --- a/synapse/handlers/sync.py +++ b/synapse/handlers/sync.py @@ -1508,7 +1508,7 @@ async def _generate_sync_entry_for_rooms( Returns: Returns a 4-tuple whose entries are: - newly_joined_rooms - - newly_joined_or_invited_or_knocked_users, + - newly_joined_or_invited_or_knocked_users - newly_left_rooms - newly_left_users """ @@ -1671,7 +1671,7 @@ async def _get_rooms_changed( In this situation we return a truncated list of the most recent events, and indicate in the response that there is a "gap" of omitted events. Additionally: - - we include a "state_delta", to describethe changes in state over the gap, + - we include a "state_delta", to describe the changes in state over the gap, - we include all membership events applying to the user making the request, even those in the gap.