Skip to content
This repository has been archived by the owner on Apr 26, 2024. It is now read-only.

Replace EventContext fields prev_group and delta_ids with field state_group_deltas #15233

Merged
merged 28 commits into from
Jun 13, 2023
Merged
Show file tree
Hide file tree
Changes from 22 commits
Commits
Show all changes
28 commits
Select commit Hold shift + click to select a range
bbaf807
remove fields prev_group and delta_ids and add field state_group_deltas
H-Shay Mar 9, 2023
e89cbb6
check context.state_group_deltas for possible state delta
H-Shay Mar 9, 2023
82ea621
update tests
H-Shay Mar 9, 2023
e8b8186
newsfragment
H-Shay Mar 9, 2023
d6e858c
fix lints
H-Shay Mar 9, 2023
6486e1f
properly serialize/deserialize context.state_group_deltas
H-Shay Mar 9, 2023
430ea51
lint
H-Shay Mar 9, 2023
59cbe10
fix changelog
H-Shay Mar 15, 2023
1f19617
Merge branch 'develop' into shay/kill_prev_with_fire
H-Shay May 2, 2023
75ad4a1
Merge branch 'develop' into shay/kill_prev_with_fire
H-Shay May 10, 2023
492968c
clarify state_group_deltas and create function to build them
H-Shay May 16, 2023
60765d9
fix mypy
H-Shay May 16, 2023
3a2ea21
remove extraneous space
H-Shay May 16, 2023
10c853e
Update synapse/events/snapshot.py
H-Shay May 17, 2023
0784641
Update synapse/events/snapshot.py
H-Shay May 17, 2023
91504ae
refactors
H-Shay May 17, 2023
839af7a
Merge branch 'shay/kill_prev_with_fire' of https://github.com/matrix-…
H-Shay May 17, 2023
9e9df0c
make state group deltas non-optional
H-Shay May 17, 2023
962ec1c
add upgrade notes about incompatible versions over replication
H-Shay May 17, 2023
effa597
Merge branch 'develop' into shay/kill_prev_with_fire
H-Shay May 17, 2023
28b025b
Update upgrade.md
H-Shay May 17, 2023
6ac912a
Update upgrade.md
H-Shay May 17, 2023
b5ed756
fix stupid errors
H-Shay May 18, 2023
77a58db
formatting/doc change
H-Shay May 18, 2023
5277a75
Merge branch 'develop' into shay/kill_prev_with_fire
H-Shay Jun 6, 2023
fa0a671
fix numbers
H-Shay Jun 6, 2023
49866ea
make serialization backwards/forwards compatible
H-Shay Jun 12, 2023
1b8769a
fix stray space upgrade.md
H-Shay Jun 12, 2023
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions changelog.d/15233.misc
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
Replace `EventContext` fields `prev_group` and `delta_ids` with field `state_group_deltas`.
13 changes: 13 additions & 0 deletions docs/upgrade.md
Original file line number Diff line number Diff line change
Expand Up @@ -88,6 +88,19 @@ process, for example:
dpkg -i matrix-synapse-py3_1.3.0+stretch1_amd64.deb
```

# Upgrading to v1.85.0

## Changes to event replication

Synapse has changed the format of `EventContext` which impacts how events to be persisted
are sent over replication. This is a forwards- and backwards-incompatible change: v1.84.0 and below workers will not be
able to send events to v1.85.0 workers or main process over replication, and vice versa.
If the master is updated to v1.85.0 then the workers must be updated to v1.84.0 for event replication to
function.
This will also require a restart of the upgraded workers.
H-Shay marked this conversation as resolved.
Show resolved Hide resolved

Once all workers are upgraded to v1.85.0 and restarted event replication will be able to resume.
H-Shay marked this conversation as resolved.
Show resolved Hide resolved

# Upgrading to v1.84.0

## Deprecation of `worker_replication_*` configuration settings
Expand Down
197 changes: 147 additions & 50 deletions synapse/events/snapshot.py
Original file line number Diff line number Diff line change
Expand Up @@ -12,7 +12,7 @@
# See the License for the specific language governing permissions and
# limitations under the License.
from abc import ABC, abstractmethod
from typing import TYPE_CHECKING, List, Optional, Tuple
from typing import TYPE_CHECKING, Dict, List, Optional, Tuple

import attr
from immutabledict import immutabledict
Expand Down Expand Up @@ -106,33 +106,32 @@ class EventContext(UnpersistedEventContextBase):
state_delta_due_to_event: If `state_group` and `state_group_before_event` are not None
then this is the delta of the state between the two groups.

prev_group: If it is known, ``state_group``'s prev_group. Note that this being
None does not necessarily mean that ``state_group`` does not have
a prev_group!
state_group_deltas: If not empty, this is a dict collecting a mapping of the state
difference between state groups.

If the event is a state event, this is normally the same as
``state_group_before_event``.
The keys are a tuple of two integers: the initial group and final state group.
The corresponding value is a state map representing the state delta between
these state groups.

If ``state_group`` is None (ie, the event is an outlier), ``prev_group``
will always also be ``None``.
The dictionary is expected to have at most two entries with state groups of:

Note that this *not* (necessarily) the state group associated with
``_prev_state_ids``.
1. The state group before the event and after the event.
2. The state group preceding the state group before the event and the
state group before the event.

delta_ids: If ``prev_group`` is not None, the state delta between ``prev_group``
and ``state_group``.
This information is collected and stored as part of an optimization for persisting
events.

partial_state: if True, we may be storing this event with a temporary,
incomplete state.
"""

_storage: "StorageControllers"
state_group_deltas: Dict[Tuple[int, int], StateMap[str]]
rejected: Optional[str] = None
_state_group: Optional[int] = None
state_group_before_event: Optional[int] = None
_state_delta_due_to_event: Optional[StateMap[str]] = None
prev_group: Optional[int] = None
delta_ids: Optional[StateMap[str]] = None
app_service: Optional[ApplicationService] = None

partial_state: bool = False
Expand All @@ -144,16 +143,14 @@ def with_state(
state_group_before_event: Optional[int],
state_delta_due_to_event: Optional[StateMap[str]],
partial_state: bool,
prev_group: Optional[int] = None,
delta_ids: Optional[StateMap[str]] = None,
state_group_deltas: Dict[Tuple[int, int], StateMap[str]],
) -> "EventContext":
return EventContext(
storage=storage,
state_group=state_group,
state_group_before_event=state_group_before_event,
state_delta_due_to_event=state_delta_due_to_event,
prev_group=prev_group,
delta_ids=delta_ids,
state_group_deltas=state_group_deltas,
partial_state=partial_state,
)

Expand All @@ -162,7 +159,7 @@ def for_outlier(
storage: "StorageControllers",
) -> "EventContext":
"""Return an EventContext instance suitable for persisting an outlier event"""
return EventContext(storage=storage)
return EventContext(storage=storage, state_group_deltas={})

async def persist(self, event: EventBase) -> "EventContext":
return self
Expand All @@ -177,16 +174,14 @@ async def serialize(self, event: EventBase, store: "DataStore") -> JsonDict:
Returns:
The serialized event.
"""

return {
"state_group": self._state_group,
"state_group_before_event": self.state_group_before_event,
"rejected": self.rejected,
"prev_group": self.prev_group,
"state_group_deltas": _encode_state_group_delta(self.state_group_deltas),
"state_delta_due_to_event": _encode_state_dict(
self._state_delta_due_to_event
),
"delta_ids": _encode_state_dict(self.delta_ids),
"app_service_id": self.app_service.id if self.app_service else None,
"partial_state": self.partial_state,
}
Expand All @@ -209,11 +204,10 @@ def deserialize(storage: "StorageControllers", input: JsonDict) -> "EventContext
storage=storage,
state_group=input["state_group"],
state_group_before_event=input["state_group_before_event"],
prev_group=input["prev_group"],
state_group_deltas=_decode_state_group_delta(input["state_group_deltas"]),
clokep marked this conversation as resolved.
Show resolved Hide resolved
state_delta_due_to_event=_decode_state_dict(
input["state_delta_due_to_event"]
),
delta_ids=_decode_state_dict(input["delta_ids"]),
rejected=input["rejected"],
partial_state=input.get("partial_state", False),
)
Expand Down Expand Up @@ -344,7 +338,7 @@ class UnpersistedEventContext(UnpersistedEventContextBase):
_storage: "StorageControllers"
state_group_before_event: Optional[int]
state_group_after_event: Optional[int]
state_delta_due_to_event: Optional[dict]
state_delta_due_to_event: Optional[StateMap[str]]
prev_group_for_state_group_before_event: Optional[int]
delta_ids_to_state_group_before_event: Optional[StateMap[str]]
partial_state: bool
Expand Down Expand Up @@ -375,26 +369,16 @@ async def batch_persist_unpersisted_contexts(

events_and_persisted_context = []
for event, unpersisted_context in amended_events_and_context:
if event.is_state():
context = EventContext(
storage=unpersisted_context._storage,
state_group=unpersisted_context.state_group_after_event,
state_group_before_event=unpersisted_context.state_group_before_event,
state_delta_due_to_event=unpersisted_context.state_delta_due_to_event,
partial_state=unpersisted_context.partial_state,
prev_group=unpersisted_context.state_group_before_event,
delta_ids=unpersisted_context.state_delta_due_to_event,
)
else:
context = EventContext(
storage=unpersisted_context._storage,
state_group=unpersisted_context.state_group_after_event,
state_group_before_event=unpersisted_context.state_group_before_event,
state_delta_due_to_event=unpersisted_context.state_delta_due_to_event,
partial_state=unpersisted_context.partial_state,
prev_group=unpersisted_context.prev_group_for_state_group_before_event,
delta_ids=unpersisted_context.delta_ids_to_state_group_before_event,
)
state_group_deltas = unpersisted_context._build_state_group_deltas()

context = EventContext(
storage=unpersisted_context._storage,
state_group=unpersisted_context.state_group_after_event,
state_group_before_event=unpersisted_context.state_group_before_event,
state_delta_due_to_event=unpersisted_context.state_delta_due_to_event,
partial_state=unpersisted_context.partial_state,
state_group_deltas=state_group_deltas,
)
events_and_persisted_context.append((event, context))
return events_and_persisted_context

Expand Down Expand Up @@ -447,28 +431,97 @@ async def persist(self, event: EventBase) -> EventContext:

# if the event isn't a state event the state group doesn't change
if not self.state_delta_due_to_event:
state_group_after_event = self.state_group_before_event
self.state_group_after_event = self.state_group_before_event

# otherwise if it is a state event we need to get a state group for it
else:
state_group_after_event = await self._storage.state.store_state_group(
self.state_group_after_event = await self._storage.state.store_state_group(
event.event_id,
event.room_id,
prev_group=self.state_group_before_event,
delta_ids=self.state_delta_due_to_event,
current_state_ids=None,
)
H-Shay marked this conversation as resolved.
Show resolved Hide resolved

state_group_deltas = self._build_state_group_deltas()

return EventContext.with_state(
storage=self._storage,
state_group=state_group_after_event,
state_group=self.state_group_after_event,
state_group_before_event=self.state_group_before_event,
state_delta_due_to_event=self.state_delta_due_to_event,
state_group_deltas=state_group_deltas,
partial_state=self.partial_state,
prev_group=self.state_group_before_event,
delta_ids=self.state_delta_due_to_event,
)

def _build_state_group_deltas(
self,
) -> Dict[Tuple[int, int], StateMap]:
H-Shay marked this conversation as resolved.
Show resolved Hide resolved
"""
Internal function to take an UnpersistedEventContext and collect any known deltas
between the state groups associated with the context. This information is used in an
optimization when persisting events.
H-Shay marked this conversation as resolved.
Show resolved Hide resolved
"""
state_group_deltas = {}

# if we know the state group before the event and after the event, add them and the
# state delta between them to state_group_deltas
if self.state_group_before_event and self.state_group_after_event:
# if we have the state groups we should have the delta
assert self.state_delta_due_to_event is not None
state_group_deltas[
(
self.state_group_before_event,
self.state_group_after_event,
)
] = self.state_delta_due_to_event

# the state group before the event may also have a state group which precedes it, if
# we have that and the state group before the event, add them and the state
# delta between them to state_group_deltas
if (
self.prev_group_for_state_group_before_event
and self.state_group_before_event
):
# if we have both state groups we should have the delta between them
assert self.delta_ids_to_state_group_before_event is not None
state_group_deltas[
(
self.prev_group_for_state_group_before_event,
self.state_group_before_event,
)
] = self.delta_ids_to_state_group_before_event

return state_group_deltas


def _encode_state_group_delta(
state_group_delta: Dict[Tuple[int, int], StateMap[str]]
) -> List[Tuple[int, int, Optional[List[Tuple[str, str, str]]]]]:
if not state_group_delta:
return []

state_group_delta_encoded = []
for key, value in state_group_delta.items():
state_group_delta_encoded.append((key[0], key[1], _encode_state_dict(value)))

return state_group_delta_encoded


def _decode_state_group_delta(
input: List[Tuple[int, int, List[Tuple[str, str, str]]]]
) -> Dict[Tuple[int, int], StateMap[str]]:
if not input:
return {}

state_group_deltas = {}
for state_group_1, state_group_2, state_dict in input:
state_map = _decode_state_dict(state_dict)
assert state_map is not None
state_group_deltas[(state_group_1, state_group_2)] = state_map

return state_group_deltas


def _encode_state_dict(
state_dict: Optional[StateMap[str]],
Expand All @@ -490,3 +543,47 @@ def _decode_state_dict(
return None

return immutabledict({(etype, state_key): v for etype, state_key, v in input})


def _build_state_group_deltas(
H-Shay marked this conversation as resolved.
Show resolved Hide resolved
unpersisted_ctx: UnpersistedEventContext,
) -> Dict[Tuple[int, int], StateMap]:
H-Shay marked this conversation as resolved.
Show resolved Hide resolved
"""
Internal function to take an UnpersistedEventContext and collect any known deltas
between the state groups associated with the context. This information is used in an
optimization when persisting events.
"""
state_group_deltas = {}

# if we know the state group before the event and after the event, add them and the
# state delta between them to state_group_deltas
if (
unpersisted_ctx.state_group_before_event
and unpersisted_ctx.state_group_after_event
):
# if we have the state groups we should have the delta
assert unpersisted_ctx.state_delta_due_to_event is not None
state_group_deltas[
(
unpersisted_ctx.state_group_before_event,
unpersisted_ctx.state_group_after_event,
)
] = unpersisted_ctx.state_delta_due_to_event

# the state group before the event may also have a state group which precedes it, if
# we have that and the state group before the event, add them and the state
# delta between them to state_group_deltas
if (
unpersisted_ctx.prev_group_for_state_group_before_event
and unpersisted_ctx.state_group_before_event
):
# if we have both state groups we should have the delta between them
assert unpersisted_ctx.delta_ids_to_state_group_before_event is not None
state_group_deltas[
(
unpersisted_ctx.prev_group_for_state_group_before_event,
unpersisted_ctx.state_group_before_event,
)
] = unpersisted_ctx.delta_ids_to_state_group_before_event

return state_group_deltas
5 changes: 2 additions & 3 deletions synapse/storage/controllers/persist_events.py
Original file line number Diff line number Diff line change
Expand Up @@ -839,9 +839,8 @@ async def _get_new_state_after_events(
"group" % (ev.event_id,)
)
continue

if ctx.prev_group:
state_group_deltas[(ctx.prev_group, ctx.state_group)] = ctx.delta_ids
if ctx.state_group_deltas:
state_group_deltas.update(ctx.state_group_deltas)

# We need to map the event_ids to their state groups. First, let's
# check if the event is one we're persisting, in which case we can
Expand Down
3 changes: 1 addition & 2 deletions tests/events/test_snapshot.py
Original file line number Diff line number Diff line change
Expand Up @@ -101,8 +101,7 @@ def _check_serialize_deserialize(
self.assertEqual(
context.state_group_before_event, d_context.state_group_before_event
)
self.assertEqual(context.prev_group, d_context.prev_group)
self.assertEqual(context.delta_ids, d_context.delta_ids)
self.assertEqual(context.state_group_deltas, d_context.state_group_deltas)
self.assertEqual(context.app_service, d_context.app_service)

self.assertEqual(
Expand Down
5 changes: 4 additions & 1 deletion tests/storage/test_event_chain.py
Original file line number Diff line number Diff line change
Expand Up @@ -401,7 +401,10 @@ def _persist(txn: LoggingTransaction) -> None:
assert persist_events_store is not None
persist_events_store._store_event_txn(
txn,
[(e, EventContext(self.hs.get_storage_controllers())) for e in events],
[
(e, EventContext(self.hs.get_storage_controllers(), {}))
for e in events
],
)

# Actually call the function that calculates the auth chain stuff.
Expand Down
11 changes: 8 additions & 3 deletions tests/test_state.py
Original file line number Diff line number Diff line change
Expand Up @@ -555,10 +555,15 @@ def test_annotate_with_old_state(
(e.event_id for e in old_state + [event]), current_state_ids.values()
)

self.assertIsNotNone(context.state_group_before_event)
assert context.state_group_before_event is not None
assert context.state_group is not None
self.assertEqual(
context.state_group_deltas.get(
(context.state_group_before_event, context.state_group)
),
{(event.type, event.state_key): event.event_id},
)
self.assertNotEqual(context.state_group_before_event, context.state_group)
self.assertEqual(context.state_group_before_event, context.prev_group)
self.assertEqual({("state", ""): event.event_id}, context.delta_ids)

@defer.inlineCallbacks
def test_trivial_annotate_message(
Expand Down