2018-07-25 09:32:05 -06:00
|
|
|
# Copyright 2018 New Vector Ltd
|
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
|
|
|
|
|
|
|
import logging
|
2022-02-08 05:44:39 -07:00
|
|
|
from typing import TYPE_CHECKING, List, Tuple
|
2018-07-25 09:32:05 -06:00
|
|
|
|
2022-02-08 05:44:39 -07:00
|
|
|
from twisted.web.server import Request
|
|
|
|
|
|
|
|
from synapse.api.room_versions import KNOWN_ROOM_VERSIONS, RoomVersion
|
|
|
|
from synapse.events import EventBase, make_event_from_dict
|
2018-07-25 09:32:05 -06:00
|
|
|
from synapse.events.snapshot import EventContext
|
2022-02-08 05:44:39 -07:00
|
|
|
from synapse.http.server import HttpServer
|
2018-07-25 09:32:05 -06:00
|
|
|
from synapse.replication.http._base import ReplicationEndpoint
|
2022-02-08 05:44:39 -07:00
|
|
|
from synapse.types import JsonDict
|
2018-07-25 09:32:05 -06:00
|
|
|
from synapse.util.metrics import Measure
|
|
|
|
|
2021-10-22 11:15:41 -06:00
|
|
|
if TYPE_CHECKING:
|
|
|
|
from synapse.server import HomeServer
|
2022-02-08 05:44:39 -07:00
|
|
|
from synapse.storage.databases.main import DataStore
|
2021-10-22 11:15:41 -06:00
|
|
|
|
2018-07-25 09:32:05 -06:00
|
|
|
# Module-level logger named after this module (via ``__name__``); the servlets
# in this file use it to log the requests they receive.
logger = logging.getLogger(__name__)
|
|
|
|
|
|
|
|
|
|
|
|
class ReplicationFederationSendEventsRestServlet(ReplicationEndpoint):
    """Persists a batch of events received over federation and notifies about
    them, by delegating to the federation event handler's
    `persist_events_and_notify`. The value it returns is sent back as
    `max_stream_id`.

    The API looks like:

        POST /_synapse/replication/fed_send_events/:txn_id

        {
            "events": [{
                "event": { .. serialized event .. },
                "room_version": .., // "1", "2", "3", etc: the version of the room
                                    // containing the event
                "event_format_version": .., // 1,2,3 etc: the event format version
                "internal_metadata": { .. serialized internal_metadata .. },
                "outlier": true|false,
                "rejected_reason": ..,   // The event.rejected_reason field
                "context": { .. serialized event context .. },
            }],
            "backfilled": false,
            "room_id": ..   // the room the events are being persisted to
        }

        200 OK

        {
            "max_stream_id": 32443,
        }

    Responds with a 409 when a `PartialStateConflictError` is raised due to an event
    context that needs to be recomputed due to the un-partial stating of a room.
    (That translation is not performed by the code in this class.)
    """

    NAME = "fed_send_events"
    PATH_ARGS = ()

    def __init__(self, hs: "HomeServer"):
        super().__init__(hs)

        # Collaborators are looked up once, at construction time.
        self.store = hs.get_datastores().main
        # Needed to rebuild `EventContext` objects from their wire form.
        self._storage_controllers = hs.get_storage_controllers()
        self.clock = hs.get_clock()
        self.federation_event_handler = hs.get_federation_event_handler()

    @staticmethod
    async def _serialize_payload(  # type: ignore[override]
        store: "DataStore",
        room_id: str,
        event_and_contexts: List[Tuple[EventBase, EventContext]],
        backfilled: bool,
    ) -> JsonDict:
        """Build the JSON request body for a batch of events.

        Args:
            store: passed through to `EventContext.serialize`
            room_id: the room the events belong to
            event_and_contexts: the events to send, each with its context
            backfilled: Whether or not the events are the result of backfilling

        Returns:
            A dict with the keys "events", "backfilled" and "room_id".
        """

        async def _to_wire(event: EventBase, context: EventContext) -> JsonDict:
            # The context is serialised before the event fields are read,
            # exactly as in the straight-line version of this code.
            context_json = await context.serialize(event, store)
            return {
                "event": event.get_pdu_json(),
                "room_version": event.room_version.identifier,
                "event_format_version": event.format_version,
                "internal_metadata": event.internal_metadata.get_dict(),
                "outlier": event.internal_metadata.is_outlier(),
                "rejected_reason": event.rejected_reason,
                "context": context_json,
            }

        # Events are serialised one after another, in input order.
        wire_events = [await _to_wire(ev, ctx) for ev, ctx in event_and_contexts]

        return {
            "events": wire_events,
            "backfilled": backfilled,
            "room_id": room_id,
        }

    async def _handle_request(  # type: ignore[override]
        self, request: Request, content: JsonDict
    ) -> Tuple[int, JsonDict]:
        """Rebuild the events and contexts from `content`, persist them and
        reply with the resulting maximum stream ID.

        Args:
            request: the incoming HTTP request (not inspected here)
            content: the parsed JSON body, in the shape produced by
                `_serialize_payload`

        Returns:
            A `(200, {"max_stream_id": ...})` tuple.
        """
        # Only the parsing of the request body is timed under this metric.
        with Measure(self.clock, "repl_fed_send_events_parse"):
            room_id = content["room_id"]
            backfilled = content["backfilled"]

            parsed = []
            for item in content["events"]:
                pdu_json = item["event"]
                version = KNOWN_ROOM_VERSIONS[item["room_version"]]
                metadata_dict = item["internal_metadata"]
                rejection = item["rejected_reason"]

                event = make_event_from_dict(
                    pdu_json, version, metadata_dict, rejection
                )
                # The outlier flag travels as its own key, so re-apply it.
                event.internal_metadata.outlier = item["outlier"]

                context = EventContext.deserialize(
                    self._storage_controllers, item["context"]
                )

                parsed.append((event, context))

        logger.info(
            "Got batch of %i events to persist to room %s",
            len(parsed),
            room_id,
        )

        max_stream_id = await self.federation_event_handler.persist_events_and_notify(
            room_id, parsed, backfilled
        )

        return 200, {"max_stream_id": max_stream_id}
|
2018-07-25 09:32:05 -06:00
|
|
|
|
|
|
|
|
|
|
|
class ReplicationFederationSendEduRestServlet(ReplicationEndpoint):
    """Hands an EDU newly received from federation to the federation
    registry's `on_edu` for processing.

    Request format:

        POST /_synapse/replication/fed_send_edu/:edu_type/:txn_id

        {
            "origin": ...,
            "content": { ... }
        }
    """

    NAME = "fed_send_edu"
    PATH_ARGS = ("edu_type",)

    def __init__(self, hs: "HomeServer"):
        super().__init__(hs)

        self.store = hs.get_datastores().main
        self.clock = hs.get_clock()
        # The registry is what actually dispatches the EDU.
        self.registry = hs.get_federation_registry()

    @staticmethod
    async def _serialize_payload(  # type: ignore[override]
        edu_type: str, origin: str, content: JsonDict
    ) -> JsonDict:
        """Build the JSON request body for an EDU.

        Args:
            edu_type: not part of the body (it is listed in `PATH_ARGS`)
            origin: sent under the "origin" key
            content: sent under the "content" key
        """
        return dict(origin=origin, content=content)

    async def _handle_request(  # type: ignore[override]
        self, request: Request, content: JsonDict, edu_type: str
    ) -> Tuple[int, JsonDict]:
        """Pass the received EDU to the registry and reply with an empty body.

        Args:
            request: the incoming HTTP request (not inspected here)
            content: the parsed JSON body; must hold "origin" and "content"
            edu_type: the EDU type taken from the request path

        Returns:
            A `(200, {})` tuple.
        """
        sender = content["origin"]
        edu_body = content["content"]

        logger.info("Got %r edu from %s", edu_type, sender)

        await self.registry.on_edu(edu_type, sender, edu_body)

        return 200, {}
|
2018-07-25 09:32:05 -06:00
|
|
|
|
|
|
|
|
|
|
|
class ReplicationGetQueryRestServlet(ReplicationEndpoint):
    """Handle responding to queries from federation.

    Request format:

        POST /_synapse/replication/fed_query/:query_type

        {
            "args": { ... }
        }

    A top-level "origin" key is also accepted: when present, it is copied
    into "args" before the query is dispatched.
    """

    NAME = "fed_query"
    PATH_ARGS = ("query_type",)

    # This is a query, so let's not bother caching
    CACHE = False

    def __init__(self, hs: "HomeServer"):
        super().__init__(hs)

        self.store = hs.get_datastores().main
        self.clock = hs.get_clock()
        # The registry dispatches the query to its handler via `on_query`.
        self.registry = hs.get_federation_registry()

    @staticmethod
    async def _serialize_payload(query_type: str, args: JsonDict) -> JsonDict:  # type: ignore[override]
        """Build the JSON request body for a query.

        Args:
            query_type: not part of the body (it is listed in `PATH_ARGS`)
            args: The arguments received for the given query type

        Returns:
            A dict with the single key "args".
        """
        return {"args": args}

    async def _handle_request(  # type: ignore[override]
        self, request: Request, content: JsonDict, query_type: str
    ) -> Tuple[int, JsonDict]:
        """Dispatch the query to the federation registry and return its result.

        Args:
            request: the incoming HTTP request (not inspected here)
            content: the parsed JSON body; must hold "args", may hold "origin"
            query_type: the query type taken from the request path

        Returns:
            A `(200, result)` tuple, where `result` is whatever
            `registry.on_query` returned.

        Raises:
            KeyError: if the body has no "args" key.
        """
        args = content["args"]

        # `_serialize_payload` only emits "args", so a top-level "origin" is
        # not guaranteed to be present. Indexing it unconditionally would fail
        # such requests with a KeyError; only override the value carried in
        # `args` when the body actually supplies one.
        if "origin" in content:
            args["origin"] = content["origin"]

        logger.info("Got %r query from %s", query_type, args.get("origin"))

        result = await self.registry.on_query(query_type, args)

        return 200, result
|
2018-07-25 09:32:05 -06:00
|
|
|
|
|
|
|
|
2018-08-09 03:29:48 -06:00
|
|
|
class ReplicationCleanRoomRestServlet(ReplicationEndpoint):
    """Called to clean up any data in DB for a given room, ready for the
    server to join the room. The work is done by the main data store's
    `clean_room_for_join`.

    Request format:

        POST /_synapse/replication/fed_cleanup_room/:room_id/:txn_id

        {}
    """

    NAME = "fed_cleanup_room"
    PATH_ARGS = ("room_id",)

    def __init__(self, hs: "HomeServer"):
        super().__init__(hs)

        self.store = hs.get_datastores().main

    @staticmethod
    async def _serialize_payload(room_id: str) -> JsonDict:  # type: ignore[override]
        """Build the (empty) JSON request body.

        Args:
            room_id: not part of the body (it is listed in `PATH_ARGS`)
        """
        empty_body: JsonDict = {}
        return empty_body

    async def _handle_request(  # type: ignore[override]
        self, request: Request, content: JsonDict, room_id: str
    ) -> Tuple[int, JsonDict]:
        """Clean the room in the data store and reply with an empty body.

        Args:
            request: the incoming HTTP request (not inspected here)
            content: the parsed JSON body (not inspected here)
            room_id: the room to clean, taken from the request path

        Returns:
            A `(200, {})` tuple.
        """
        await self.store.clean_room_for_join(room_id)

        response: Tuple[int, JsonDict] = (200, {})
        return response
|
2018-08-09 03:29:48 -06:00
|
|
|
|
|
|
|
|
2020-11-13 09:24:04 -07:00
|
|
|
class ReplicationStoreRoomOnOutlierMembershipRestServlet(ReplicationEndpoint):
    """Asks the main data store to record a room together with its room
    version, by calling `maybe_store_room_on_outlier_membership`.

    NOTE(review): going by the method name, the store presumably skips rooms
    it already knows about; confirm against the data store.

    Request format:

        POST /_synapse/replication/store_room_on_outlier_membership/:room_id/:txn_id

        {
            "room_version": "1",
        }
    """

    NAME = "store_room_on_outlier_membership"
    PATH_ARGS = ("room_id",)

    def __init__(self, hs: "HomeServer"):
        super().__init__(hs)

        self.store = hs.get_datastores().main

    @staticmethod
    async def _serialize_payload(room_id: str, room_version: RoomVersion) -> JsonDict:  # type: ignore[override]
        """Build the JSON request body.

        Args:
            room_id: not part of the body (it is listed in `PATH_ARGS`)
            room_version: only its `identifier` is sent, under "room_version"
        """
        version_id = room_version.identifier
        return {"room_version": version_id}

    async def _handle_request(  # type: ignore[override]
        self, request: Request, content: JsonDict, room_id: str
    ) -> Tuple[int, JsonDict]:
        """Resolve the room version and pass it to the data store.

        Args:
            request: the incoming HTTP request (not inspected here)
            content: the parsed JSON body; must hold "room_version"
            room_id: the room taken from the request path

        Returns:
            A `(200, {})` tuple.

        Raises:
            KeyError: if "room_version" is missing from the body or is not a
                key of `KNOWN_ROOM_VERSIONS`.
        """
        version_id = content["room_version"]
        # Map the identifier from the wire back to a RoomVersion object.
        resolved_version = KNOWN_ROOM_VERSIONS[version_id]

        await self.store.maybe_store_room_on_outlier_membership(
            room_id, resolved_version
        )

        return 200, {}
|
|
|
|
|
|
|
|
|
2022-02-08 05:44:39 -07:00
|
|
|
def register_servlets(hs: "HomeServer", http_server: HttpServer) -> None:
    """Instantiate every replication servlet defined in this module and
    register it on `http_server`.

    Args:
        hs: passed to each servlet's constructor
        http_server: the server each servlet is registered with
    """
    # Each servlet is built and registered before the next one is built,
    # in this order.
    servlet_classes = (
        ReplicationFederationSendEventsRestServlet,
        ReplicationFederationSendEduRestServlet,
        ReplicationGetQueryRestServlet,
        ReplicationCleanRoomRestServlet,
        ReplicationStoreRoomOnOutlierMembershipRestServlet,
    )
    for servlet_cls in servlet_classes:
        servlet_cls(hs).register(http_server)
|