federation_base.py 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380
  1. # -*- coding: utf-8 -*-
  2. # Copyright 2015, 2016 OpenMarket Ltd
  3. #
  4. # Licensed under the Apache License, Version 2.0 (the "License");
  5. # you may not use this file except in compliance with the License.
  6. # You may obtain a copy of the License at
  7. #
  8. # http://www.apache.org/licenses/LICENSE-2.0
  9. #
  10. # Unless required by applicable law or agreed to in writing, software
  11. # distributed under the License is distributed on an "AS IS" BASIS,
  12. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. # See the License for the specific language governing permissions and
  14. # limitations under the License.
  15. import logging
  16. from collections import namedtuple
  17. import six
  18. from twisted.internet import defer
  19. from twisted.internet.defer import DeferredList
  20. from synapse.api.constants import MAX_DEPTH, EventTypes, Membership
  21. from synapse.api.errors import Codes, SynapseError
  22. from synapse.api.room_versions import KNOWN_ROOM_VERSIONS, EventFormatVersions
  23. from synapse.crypto.event_signing import check_event_content_hash
  24. from synapse.events import event_type_from_format_version
  25. from synapse.events.utils import prune_event
  26. from synapse.http.servlet import assert_params_in_dict
  27. from synapse.logging.context import (
  28. LoggingContext,
  29. PreserveLoggingContext,
  30. make_deferred_yieldable,
  31. preserve_fn,
  32. )
  33. from synapse.types import get_domain_from_id
  34. from synapse.util import unwrapFirstError
  35. logger = logging.getLogger(__name__)
  36. class FederationBase(object):
  37. def __init__(self, hs):
  38. self.hs = hs
  39. self.server_name = hs.hostname
  40. self.keyring = hs.get_keyring()
  41. self.spam_checker = hs.get_spam_checker()
  42. self.store = hs.get_datastore()
  43. self._clock = hs.get_clock()
  44. @defer.inlineCallbacks
  45. def _check_sigs_and_hash_and_fetch(
  46. self, origin, pdus, room_version, outlier=False, include_none=False
  47. ):
  48. """Takes a list of PDUs and checks the signatures and hashs of each
  49. one. If a PDU fails its signature check then we check if we have it in
  50. the database and if not then request if from the originating server of
  51. that PDU.
  52. If a PDU fails its content hash check then it is redacted.
  53. The given list of PDUs are not modified, instead the function returns
  54. a new list.
  55. Args:
  56. origin (str)
  57. pdu (list)
  58. room_version (str)
  59. outlier (bool): Whether the events are outliers or not
  60. include_none (str): Whether to include None in the returned list
  61. for events that have failed their checks
  62. Returns:
  63. Deferred : A list of PDUs that have valid signatures and hashes.
  64. """
  65. deferreds = self._check_sigs_and_hashes(room_version, pdus)
  66. @defer.inlineCallbacks
  67. def handle_check_result(pdu, deferred):
  68. try:
  69. res = yield make_deferred_yieldable(deferred)
  70. except SynapseError:
  71. res = None
  72. if not res:
  73. # Check local db.
  74. res = yield self.store.get_event(
  75. pdu.event_id, allow_rejected=True, allow_none=True
  76. )
  77. if not res and pdu.origin != origin:
  78. try:
  79. res = yield self.get_pdu(
  80. destinations=[pdu.origin],
  81. event_id=pdu.event_id,
  82. room_version=room_version,
  83. outlier=outlier,
  84. timeout=10000,
  85. )
  86. except SynapseError:
  87. pass
  88. if not res:
  89. logger.warn(
  90. "Failed to find copy of %s with valid signature", pdu.event_id
  91. )
  92. return res
  93. handle = preserve_fn(handle_check_result)
  94. deferreds2 = [handle(pdu, deferred) for pdu, deferred in zip(pdus, deferreds)]
  95. valid_pdus = yield make_deferred_yieldable(
  96. defer.gatherResults(deferreds2, consumeErrors=True)
  97. ).addErrback(unwrapFirstError)
  98. if include_none:
  99. return valid_pdus
  100. else:
  101. return [p for p in valid_pdus if p]
  102. def _check_sigs_and_hash(self, room_version, pdu):
  103. return make_deferred_yieldable(
  104. self._check_sigs_and_hashes(room_version, [pdu])[0]
  105. )
  106. def _check_sigs_and_hashes(self, room_version, pdus):
  107. """Checks that each of the received events is correctly signed by the
  108. sending server.
  109. Args:
  110. room_version (str): The room version of the PDUs
  111. pdus (list[FrozenEvent]): the events to be checked
  112. Returns:
  113. list[Deferred]: for each input event, a deferred which:
  114. * returns the original event if the checks pass
  115. * returns a redacted version of the event (if the signature
  116. matched but the hash did not)
  117. * throws a SynapseError if the signature check failed.
  118. The deferreds run their callbacks in the sentinel
  119. """
  120. deferreds = _check_sigs_on_pdus(self.keyring, room_version, pdus)
  121. ctx = LoggingContext.current_context()
  122. def callback(_, pdu):
  123. with PreserveLoggingContext(ctx):
  124. if not check_event_content_hash(pdu):
  125. # let's try to distinguish between failures because the event was
  126. # redacted (which are somewhat expected) vs actual ball-tampering
  127. # incidents.
  128. #
  129. # This is just a heuristic, so we just assume that if the keys are
  130. # about the same between the redacted and received events, then the
  131. # received event was probably a redacted copy (but we then use our
  132. # *actual* redacted copy to be on the safe side.)
  133. redacted_event = prune_event(pdu)
  134. if set(redacted_event.keys()) == set(pdu.keys()) and set(
  135. six.iterkeys(redacted_event.content)
  136. ) == set(six.iterkeys(pdu.content)):
  137. logger.info(
  138. "Event %s seems to have been redacted; using our redacted "
  139. "copy",
  140. pdu.event_id,
  141. )
  142. else:
  143. logger.warning(
  144. "Event %s content has been tampered, redacting",
  145. pdu.event_id,
  146. )
  147. return redacted_event
  148. if self.spam_checker.check_event_for_spam(pdu):
  149. logger.warn(
  150. "Event contains spam, redacting %s: %s",
  151. pdu.event_id,
  152. pdu.get_pdu_json(),
  153. )
  154. return prune_event(pdu)
  155. return pdu
  156. def errback(failure, pdu):
  157. failure.trap(SynapseError)
  158. with PreserveLoggingContext(ctx):
  159. logger.warn(
  160. "Signature check failed for %s: %s",
  161. pdu.event_id,
  162. failure.getErrorMessage(),
  163. )
  164. return failure
  165. for deferred, pdu in zip(deferreds, pdus):
  166. deferred.addCallbacks(
  167. callback, errback, callbackArgs=[pdu], errbackArgs=[pdu]
  168. )
  169. return deferreds
  170. class PduToCheckSig(
  171. namedtuple(
  172. "PduToCheckSig", ["pdu", "redacted_pdu_json", "sender_domain", "deferreds"]
  173. )
  174. ):
  175. pass
  176. def _check_sigs_on_pdus(keyring, room_version, pdus):
  177. """Check that the given events are correctly signed
  178. Args:
  179. keyring (synapse.crypto.Keyring): keyring object to do the checks
  180. room_version (str): the room version of the PDUs
  181. pdus (Collection[EventBase]): the events to be checked
  182. Returns:
  183. List[Deferred]: a Deferred for each event in pdus, which will either succeed if
  184. the signatures are valid, or fail (with a SynapseError) if not.
  185. """
  186. # we want to check that the event is signed by:
  187. #
  188. # (a) the sender's server
  189. #
  190. # - except in the case of invites created from a 3pid invite, which are exempt
  191. # from this check, because the sender has to match that of the original 3pid
  192. # invite, but the event may come from a different HS, for reasons that I don't
  193. # entirely grok (why do the senders have to match? and if they do, why doesn't the
  194. # joining server ask the inviting server to do the switcheroo with
  195. # exchange_third_party_invite?).
  196. #
  197. # That's pretty awful, since redacting such an invite will render it invalid
  198. # (because it will then look like a regular invite without a valid signature),
  199. # and signatures are *supposed* to be valid whether or not an event has been
  200. # redacted. But this isn't the worst of the ways that 3pid invites are broken.
  201. #
  202. # (b) for V1 and V2 rooms, the server which created the event_id
  203. #
  204. # let's start by getting the domain for each pdu, and flattening the event back
  205. # to JSON.
  206. pdus_to_check = [
  207. PduToCheckSig(
  208. pdu=p,
  209. redacted_pdu_json=prune_event(p).get_pdu_json(),
  210. sender_domain=get_domain_from_id(p.sender),
  211. deferreds=[],
  212. )
  213. for p in pdus
  214. ]
  215. v = KNOWN_ROOM_VERSIONS.get(room_version)
  216. if not v:
  217. raise RuntimeError("Unrecognized room version %s" % (room_version,))
  218. # First we check that the sender event is signed by the sender's domain
  219. # (except if its a 3pid invite, in which case it may be sent by any server)
  220. pdus_to_check_sender = [p for p in pdus_to_check if not _is_invite_via_3pid(p.pdu)]
  221. more_deferreds = keyring.verify_json_objects_for_server(
  222. [
  223. (
  224. p.sender_domain,
  225. p.redacted_pdu_json,
  226. p.pdu.origin_server_ts if v.enforce_key_validity else 0,
  227. p.pdu.event_id,
  228. )
  229. for p in pdus_to_check_sender
  230. ]
  231. )
  232. def sender_err(e, pdu_to_check):
  233. errmsg = "event id %s: unable to verify signature for sender %s: %s" % (
  234. pdu_to_check.pdu.event_id,
  235. pdu_to_check.sender_domain,
  236. e.getErrorMessage(),
  237. )
  238. # XX not really sure if these are the right codes, but they are what
  239. # we've done for ages
  240. raise SynapseError(400, errmsg, Codes.UNAUTHORIZED)
  241. for p, d in zip(pdus_to_check_sender, more_deferreds):
  242. d.addErrback(sender_err, p)
  243. p.deferreds.append(d)
  244. # now let's look for events where the sender's domain is different to the
  245. # event id's domain (normally only the case for joins/leaves), and add additional
  246. # checks. Only do this if the room version has a concept of event ID domain
  247. # (ie, the room version uses old-style non-hash event IDs).
  248. if v.event_format == EventFormatVersions.V1:
  249. pdus_to_check_event_id = [
  250. p
  251. for p in pdus_to_check
  252. if p.sender_domain != get_domain_from_id(p.pdu.event_id)
  253. ]
  254. more_deferreds = keyring.verify_json_objects_for_server(
  255. [
  256. (
  257. get_domain_from_id(p.pdu.event_id),
  258. p.redacted_pdu_json,
  259. p.pdu.origin_server_ts if v.enforce_key_validity else 0,
  260. p.pdu.event_id,
  261. )
  262. for p in pdus_to_check_event_id
  263. ]
  264. )
  265. def event_err(e, pdu_to_check):
  266. errmsg = (
  267. "event id %s: unable to verify signature for event id domain: %s"
  268. % (pdu_to_check.pdu.event_id, e.getErrorMessage())
  269. )
  270. # XX as above: not really sure if these are the right codes
  271. raise SynapseError(400, errmsg, Codes.UNAUTHORIZED)
  272. for p, d in zip(pdus_to_check_event_id, more_deferreds):
  273. d.addErrback(event_err, p)
  274. p.deferreds.append(d)
  275. # replace lists of deferreds with single Deferreds
  276. return [_flatten_deferred_list(p.deferreds) for p in pdus_to_check]
  277. def _flatten_deferred_list(deferreds):
  278. """Given a list of deferreds, either return the single deferred,
  279. combine into a DeferredList, or return an already resolved deferred.
  280. """
  281. if len(deferreds) > 1:
  282. return DeferredList(deferreds, fireOnOneErrback=True, consumeErrors=True)
  283. elif len(deferreds) == 1:
  284. return deferreds[0]
  285. else:
  286. return defer.succeed(None)
  287. def _is_invite_via_3pid(event):
  288. return (
  289. event.type == EventTypes.Member
  290. and event.membership == Membership.INVITE
  291. and "third_party_invite" in event.content
  292. )
  293. def event_from_pdu_json(pdu_json, event_format_version, outlier=False):
  294. """Construct a FrozenEvent from an event json received over federation
  295. Args:
  296. pdu_json (object): pdu as received over federation
  297. event_format_version (int): The event format version
  298. outlier (bool): True to mark this event as an outlier
  299. Returns:
  300. FrozenEvent
  301. Raises:
  302. SynapseError: if the pdu is missing required fields or is otherwise
  303. not a valid matrix event
  304. """
  305. # we could probably enforce a bunch of other fields here (room_id, sender,
  306. # origin, etc etc)
  307. assert_params_in_dict(pdu_json, ("type", "depth"))
  308. depth = pdu_json["depth"]
  309. if not isinstance(depth, six.integer_types):
  310. raise SynapseError(400, "Depth %r not an intger" % (depth,), Codes.BAD_JSON)
  311. if depth < 0:
  312. raise SynapseError(400, "Depth too small", Codes.BAD_JSON)
  313. elif depth > MAX_DEPTH:
  314. raise SynapseError(400, "Depth too large", Codes.BAD_JSON)
  315. event = event_type_from_format_version(event_format_version)(pdu_json)
  316. event.internal_metadata.outlier = outlier
  317. return event