2016-01-06 21:26:29 -07:00
|
|
|
# Copyright 2015, 2016 OpenMarket Ltd
|
2020-01-31 09:50:13 -07:00
|
|
|
# Copyright 2020 The Matrix.org Foundation C.I.C.
|
2015-02-03 08:00:42 -07:00
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
2017-09-19 05:20:11 -06:00
|
|
|
import logging
|
2022-10-03 13:53:29 -06:00
|
|
|
from typing import TYPE_CHECKING, Awaitable, Callable, Optional
|
2018-07-09 00:09:20 -06:00
|
|
|
|
2021-09-30 09:13:59 -06:00
|
|
|
from synapse.api.constants import MAX_DEPTH, EventContentFields, EventTypes, Membership
|
2018-07-09 00:09:20 -06:00
|
|
|
from synapse.api.errors import Codes, SynapseError
|
2020-03-19 06:22:56 -06:00
|
|
|
from synapse.api.room_versions import EventFormatVersions, RoomVersion
|
2017-09-19 05:20:11 -06:00
|
|
|
from synapse.crypto.event_signing import check_event_content_hash
|
2020-02-28 05:31:07 -07:00
|
|
|
from synapse.crypto.keyring import Keyring
|
2020-02-07 08:30:04 -07:00
|
|
|
from synapse.events import EventBase, make_event_from_dict
|
2020-05-14 11:24:01 -06:00
|
|
|
from synapse.events.utils import prune_event, validate_canonicaljson
|
2018-07-13 13:53:01 -06:00
|
|
|
from synapse.http.servlet import assert_params_in_dict
|
2022-08-23 20:53:37 -06:00
|
|
|
from synapse.logging.opentracing import log_kv, trace
|
2020-01-31 09:50:13 -07:00
|
|
|
from synapse.types import JsonDict, get_domain_from_id
|
2015-02-03 08:00:42 -07:00
|
|
|
|
2021-10-22 11:15:41 -06:00
|
|
|
if TYPE_CHECKING:
|
|
|
|
from synapse.server import HomeServer
|
|
|
|
|
|
|
|
|
2015-02-03 08:00:42 -07:00
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
|
|
|
|
|
2022-05-31 16:32:56 -06:00
|
|
|
class InvalidEventSignatureError(RuntimeError):
    """Signals that the signature on an event could not be verified.

    Converting this exception to a string yields only the error message; the id
    of the offending event is not part of that text and is instead exposed via
    the `event_id` attribute.
    """

    def __init__(self, message: str, event_id: str):
        # Remember which event failed, then let RuntimeError store the message.
        self.event_id = event_id
        super().__init__(message)
|
|
|
|
|
|
|
|
|
2020-09-04 04:54:56 -06:00
|
|
|
class FederationBase:
    """Holds homeserver handles and the signature/hash/spam check run on a PDU."""

    def __init__(self, hs: "HomeServer"):
        self.hs = hs
        self.server_name = hs.hostname

        # Components looked up on the homeserver once, at construction time.
        self.keyring = hs.get_keyring()
        self._spam_checker_module_callbacks = hs.get_module_api_callbacks().spam_checker
        self.store = hs.get_datastores().main
        self._clock = hs.get_clock()
        self._storage_controllers = hs.get_storage_controllers()

    @trace
    async def _check_sigs_and_hash(
        self,
        room_version: RoomVersion,
        pdu: EventBase,
        record_failure_callback: Optional[
            Callable[[EventBase, str], Awaitable[None]]
        ] = None,
    ) -> EventBase:
        """Verify the signatures and content hash of an event, then spam-check it.

        The checks run in order: signatures first, then the content hash, then
        the spam checker. A content hash mismatch or a spam verdict does not
        raise; a pruned (redacted) copy of the event is returned instead.

        Args:
            room_version: The room version of the PDU
            pdu: the event to be checked
            record_failure_callback: Optional coroutine function, awaited with
                the event and a description of the problem when the signature
                check raises, or when the content hash does not match and the
                event does not look like an already-redacted copy.

        Returns:
              * the original event if all of the checks pass
              * a redacted version of the event if the signatures matched but
                the content hash did not. A warning is logged if the event
                looks tampered with; only a debug message if it looks like it
                had simply been redacted already.
              * a redacted version of the event, flagged as soft-failed, if the
                spam checker did not return NOT_SPAM. A warning is logged.

        Raises:
              InvalidEventSignatureError if the signature check failed. This
                  method itself logs nothing in that case.
        """
        try:
            await _check_sigs_on_pdu(self.keyring, room_version, pdu)
        except InvalidEventSignatureError as sig_error:
            if record_failure_callback:
                await record_failure_callback(pdu, str(sig_error))
            raise sig_error

        hash_matches = check_event_content_hash(pdu)
        if not hash_matches:
            # A hash mismatch is somewhat expected when we were handed a copy of
            # the event that had already been redacted, as opposed to one that
            # has actually been tampered with. Telling the two apart is only a
            # heuristic: if pruning the event leaves the same top-level keys and
            # the same content keys, assume it was a redacted copy. Whichever it
            # is, we hand back our *own* pruned copy to be on the safe side.
            pruned = prune_event(pdu)

            looks_redacted = set(pruned.keys()) == set(pdu.keys())
            if looks_redacted:
                looks_redacted = set(pruned.content.keys()) == set(pdu.content.keys())

            if not looks_redacted:
                logger.warning(
                    "Event %s content has been tampered, redacting",
                    pdu.event_id,
                )
                log_kv(
                    {
                        "message": "Event content has been tampered, redacting",
                        "event_id": pdu.event_id,
                    }
                )
                if record_failure_callback:
                    await record_failure_callback(
                        pdu, "Event content has been tampered with"
                    )
            else:
                logger.debug(
                    "Event %s seems to have been redacted; using our redacted copy",
                    pdu.event_id,
                )
                log_kv(
                    {
                        "message": "Event seems to have been redacted; using our redacted copy",
                        "event_id": pdu.event_id,
                    }
                )

            return pruned

        spam_callbacks = self._spam_checker_module_callbacks
        verdict = await spam_callbacks.check_event_for_spam(pdu)

        if verdict != spam_callbacks.NOT_SPAM:
            logger.warning("Event contains spam, soft-failing %s", pdu.event_id)
            log_kv(
                {
                    "message": "Event contains spam, redacting (to save disk space) "
                    "as well as soft-failing (to stop using the event in prev_events)",
                    "event_id": pdu.event_id,
                }
            )
            # Redacting saves disk space; soft-failing stops the event from
            # being used in prev_events.
            spam_redacted = prune_event(pdu)
            spam_redacted.internal_metadata.soft_failed = True
            return spam_redacted

        return pdu
|
2017-12-30 11:40:19 -07:00
|
|
|
|
|
|
|
|
2022-08-23 20:53:37 -06:00
|
|
|
@trace
async def _check_sigs_on_pdu(
    keyring: Keyring, room_version: RoomVersion, pdu: EventBase
) -> None:
    """Check that the given event is correctly signed

    Args:
        keyring: keyring object to do the checks
        room_version: the room version of the PDU
        pdu: the event to be checked

    Raises:
        InvalidEventSignatureError if the event wasn't correctly signed. The
            text of the underlying verification error is included in the
            message; the exception chain itself is suppressed.
    """

    # we want to check that the event is signed by:
    #
    # (a) the sender's server
    #
    #     - except in the case of invites created from a 3pid invite, which are exempt
    #     from this check, because the sender has to match that of the original 3pid
    #     invite, but the event may come from a different HS, for reasons that I don't
    #     entirely grok (why do the senders have to match? and if they do, why doesn't the
    #     joining server ask the inviting server to do the switcheroo with
    #     exchange_third_party_invite?).
    #
    #     That's pretty awful, since redacting such an invite will render it invalid
    #     (because it will then look like a regular invite without a valid signature),
    #     and signatures are *supposed* to be valid whether or not an event has been
    #     redacted. But this isn't the worst of the ways that 3pid invites are broken.
    #
    # (b) for V1 and V2 rooms, the server which created the event_id
    #
    # (c) for joins to rooms with restricted join rules that name an authorising
    #     user, the server of that authorising user

    # First we check that the event is signed by the sender's domain
    # (except if it's a 3pid invite, in which case it may be sent by any server)
    sender_domain = get_domain_from_id(pdu.sender)
    if not _is_invite_via_3pid(pdu):
        try:
            await keyring.verify_event_for_server(
                sender_domain,
                pdu,
                pdu.origin_server_ts if room_version.enforce_key_validity else 0,
            )
        except Exception as e:
            raise InvalidEventSignatureError(
                f"unable to verify signature for sender domain {sender_domain}: {e}",
                pdu.event_id,
            ) from None

    # now let's look for events where the sender's domain is different to the
    # event id's domain (normally only the case for joins/leaves), and add additional
    # checks. Only do this if the room version has a concept of event ID domain
    # (ie, the room version uses old-style non-hash event IDs).
    if room_version.event_format == EventFormatVersions.ROOM_V1_V2:
        event_domain = get_domain_from_id(pdu.event_id)
        if event_domain != sender_domain:
            try:
                await keyring.verify_event_for_server(
                    event_domain,
                    pdu,
                    pdu.origin_server_ts if room_version.enforce_key_validity else 0,
                )
            except Exception as e:
                raise InvalidEventSignatureError(
                    f"unable to verify signature for event domain {event_domain}: {e}",
                    pdu.event_id,
                ) from None

    # If this is a join event for a restricted room it may have been authorised
    # via a different server from the sending server. Check those signatures.
    if (
        room_version.msc3083_join_rules
        and pdu.type == EventTypes.Member
        and pdu.membership == Membership.JOIN
        and EventContentFields.AUTHORISING_USER in pdu.content
    ):
        authorising_server = get_domain_from_id(
            pdu.content[EventContentFields.AUTHORISING_USER]
        )
        try:
            await keyring.verify_event_for_server(
                authorising_server,
                pdu,
                pdu.origin_server_ts if room_version.enforce_key_validity else 0,
            )
        except Exception as e:
            raise InvalidEventSignatureError(
                f"unable to verify signature for authorising server {authorising_server}: {e}",
                pdu.event_id,
            ) from None
|
2021-07-26 10:17:00 -06:00
|
|
|
|
2018-09-03 18:09:12 -06:00
|
|
|
|
2020-02-28 05:31:07 -07:00
|
|
|
def _is_invite_via_3pid(event: EventBase) -> bool:
    """Tell whether an event is a membership invite carrying a third-party invite.

    Args:
        event: the event to inspect

    Returns:
        True only if the event is a membership event, its membership is
        "invite", and its content has a "third_party_invite" key.
    """
    # The checks are ordered so that `membership` is only read on member events.
    if event.type != EventTypes.Member:
        return False
    if event.membership != Membership.INVITE:
        return False
    return "third_party_invite" in event.content
|
|
|
|
|
|
|
|
|
Refactor the way we set `outlier` (#11634)
* `_auth_and_persist_outliers`: mark persisted events as outliers
Mark any events that get persisted via `_auth_and_persist_outliers` as, well,
outliers.
Currently this will be a no-op as everything will already be flagged as an
outlier, but I'm going to change that.
* `process_remote_join`: stop flagging as outlier
The events are now flagged as outliers later on, by `_auth_and_persist_outliers`.
* `send_join`: remove `outlier=True`
The events created here are returned in the result of `send_join` to
`FederationHandler.do_invite_join`. From there they are passed into
`FederationEventHandler.process_remote_join`, which passes them to
`_auth_and_persist_outliers`... which sets the `outlier` flag.
* `get_event_auth`: remove `outlier=True`
stop flagging the events returned by `get_event_auth` as outliers. This method
is only called by `_get_remote_auth_chain_for_event`, which passes the results
into `_auth_and_persist_outliers`, which will flag them as outliers.
* `_get_remote_auth_chain_for_event`: remove `outlier=True`
we pass all the events into `_auth_and_persist_outliers`, which will now flag
the events as outliers.
* `_check_sigs_and_hash_and_fetch`: remove unused `outlier` parameter
This param is now never set to True, so we can remove it.
* `_check_sigs_and_hash_and_fetch_one`: remove unused `outlier` param
This is no longer set anywhere, so we can remove it.
* `get_pdu`: remove unused `outlier` parameter
... and chase it down into `get_pdu_from_destination_raw`.
* `event_from_pdu_json`: remove redundant `outlier` param
This is never set to `True`, so can be removed.
* changelog
* update docstring
2022-01-05 05:26:11 -07:00
|
|
|
def event_from_pdu_json(pdu_json: JsonDict, room_version: RoomVersion) -> EventBase:
    """Construct an EventBase from an event json received over federation

    Args:
        pdu_json: pdu as received over federation. Note that if it has an
            "unsigned" entry, that entry is filtered in place, so the dict
            passed in is mutated.
        room_version: The version of the room this event belongs to

    Raises:
        SynapseError: if the pdu is missing required fields or is otherwise
            not a valid matrix event
    """
    # we could probably enforce a bunch of other fields here (room_id, sender,
    # origin, etc etc)
    assert_params_in_dict(pdu_json, ("type", "depth"))

    # Strip any unauthorized values from "unsigned" if they exist
    if "unsigned" in pdu_json:
        _strip_unsigned_values(pdu_json)

    depth = pdu_json["depth"]
    # Exact type check: unlike isinstance(), this also rejects bool, which is
    # a subclass of int.
    if type(depth) is not int:
        raise SynapseError(400, "Depth %r not an integer" % (depth,), Codes.BAD_JSON)

    if depth < 0:
        raise SynapseError(400, "Depth too small", Codes.BAD_JSON)
    elif depth > MAX_DEPTH:
        raise SynapseError(400, "Depth too large", Codes.BAD_JSON)

    # Validate that the JSON conforms to the specification.
    if room_version.strict_canonicaljson:
        validate_canonicaljson(pdu_json)

    return make_event_from_dict(pdu_json, room_version)
|
2022-01-06 10:09:30 -07:00
|
|
|
|
|
|
|
|
|
|
|
def _strip_unsigned_values(pdu_dict: JsonDict) -> None:
|
|
|
|
"""
|
|
|
|
Strip any unsigned values unless specifically allowed, as defined by the whitelist.
|
|
|
|
|
|
|
|
pdu: the json dict to strip values from. Note that the dict is mutated by this
|
|
|
|
function
|
|
|
|
"""
|
|
|
|
unsigned = pdu_dict["unsigned"]
|
|
|
|
|
|
|
|
if not isinstance(unsigned, dict):
|
|
|
|
pdu_dict["unsigned"] = {}
|
|
|
|
|
|
|
|
if pdu_dict["type"] == "m.room.member":
|
|
|
|
whitelist = ["knock_room_state", "invite_room_state", "age"]
|
|
|
|
else:
|
|
|
|
whitelist = ["age"]
|
|
|
|
|
|
|
|
filtered_unsigned = {k: v for k, v in unsigned.items() if k in whitelist}
|
|
|
|
pdu_dict["unsigned"] = filtered_unsigned
|