initial_sync.py 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466
  1. # -*- coding: utf-8 -*-
  2. # Copyright 2016 OpenMarket Ltd
  3. #
  4. # Licensed under the Apache License, Version 2.0 (the "License");
  5. # you may not use this file except in compliance with the License.
  6. # You may obtain a copy of the License at
  7. #
  8. # http://www.apache.org/licenses/LICENSE-2.0
  9. #
  10. # Unless required by applicable law or agreed to in writing, software
  11. # distributed under the License is distributed on an "AS IS" BASIS,
  12. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. # See the License for the specific language governing permissions and
  14. # limitations under the License.
  15. import logging
  16. from twisted.internet import defer
  17. from synapse.api.constants import EventTypes, Membership
  18. from synapse.api.errors import AuthError, Codes, SynapseError
  19. from synapse.events.validator import EventValidator
  20. from synapse.handlers.presence import format_user_presence_state
  21. from synapse.logging.context import make_deferred_yieldable, run_in_background
  22. from synapse.streams.config import PaginationConfig
  23. from synapse.types import StreamToken, UserID
  24. from synapse.util import unwrapFirstError
  25. from synapse.util.async_helpers import concurrently_execute
  26. from synapse.util.caches.snapshot_cache import SnapshotCache
  27. from synapse.visibility import filter_events_for_client
  28. from ._base import BaseHandler
  29. logger = logging.getLogger(__name__)
  30. class InitialSyncHandler(BaseHandler):
  31. def __init__(self, hs):
  32. super(InitialSyncHandler, self).__init__(hs)
  33. self.hs = hs
  34. self.state = hs.get_state_handler()
  35. self.clock = hs.get_clock()
  36. self.validator = EventValidator()
  37. self.snapshot_cache = SnapshotCache()
  38. self._event_serializer = hs.get_event_client_serializer()
  39. def snapshot_all_rooms(
  40. self,
  41. user_id=None,
  42. pagin_config=None,
  43. as_client_event=True,
  44. include_archived=False,
  45. ):
  46. """Retrieve a snapshot of all rooms the user is invited or has joined.
  47. This snapshot may include messages for all rooms where the user is
  48. joined, depending on the pagination config.
  49. Args:
  50. user_id (str): The ID of the user making the request.
  51. pagin_config (synapse.api.streams.PaginationConfig): The pagination
  52. config used to determine how many messages *PER ROOM* to return.
  53. as_client_event (bool): True to get events in client-server format.
  54. include_archived (bool): True to get rooms that the user has left
  55. Returns:
  56. A list of dicts with "room_id" and "membership" keys for all rooms
  57. the user is currently invited or joined in on. Rooms where the user
  58. is joined on, may return a "messages" key with messages, depending
  59. on the specified PaginationConfig.
  60. """
  61. key = (
  62. user_id,
  63. pagin_config.from_token,
  64. pagin_config.to_token,
  65. pagin_config.direction,
  66. pagin_config.limit,
  67. as_client_event,
  68. include_archived,
  69. )
  70. now_ms = self.clock.time_msec()
  71. result = self.snapshot_cache.get(now_ms, key)
  72. if result is not None:
  73. return result
  74. return self.snapshot_cache.set(
  75. now_ms,
  76. key,
  77. self._snapshot_all_rooms(
  78. user_id, pagin_config, as_client_event, include_archived
  79. ),
  80. )
  81. @defer.inlineCallbacks
  82. def _snapshot_all_rooms(
  83. self,
  84. user_id=None,
  85. pagin_config=None,
  86. as_client_event=True,
  87. include_archived=False,
  88. ):
  89. memberships = [Membership.INVITE, Membership.JOIN]
  90. if include_archived:
  91. memberships.append(Membership.LEAVE)
  92. room_list = yield self.store.get_rooms_for_user_where_membership_is(
  93. user_id=user_id, membership_list=memberships
  94. )
  95. user = UserID.from_string(user_id)
  96. rooms_ret = []
  97. now_token = yield self.hs.get_event_sources().get_current_token()
  98. presence_stream = self.hs.get_event_sources().sources["presence"]
  99. pagination_config = PaginationConfig(from_token=now_token)
  100. presence, _ = yield presence_stream.get_pagination_rows(
  101. user, pagination_config.get_source_config("presence"), None
  102. )
  103. receipt_stream = self.hs.get_event_sources().sources["receipt"]
  104. receipt, _ = yield receipt_stream.get_pagination_rows(
  105. user, pagination_config.get_source_config("receipt"), None
  106. )
  107. tags_by_room = yield self.store.get_tags_for_user(user_id)
  108. account_data, account_data_by_room = (
  109. yield self.store.get_account_data_for_user(user_id)
  110. )
  111. public_room_ids = yield self.store.get_public_room_ids()
  112. limit = pagin_config.limit
  113. if limit is None:
  114. limit = 10
  115. @defer.inlineCallbacks
  116. def handle_room(event):
  117. d = {
  118. "room_id": event.room_id,
  119. "membership": event.membership,
  120. "visibility": (
  121. "public" if event.room_id in public_room_ids else "private"
  122. ),
  123. }
  124. if event.membership == Membership.INVITE:
  125. time_now = self.clock.time_msec()
  126. d["inviter"] = event.sender
  127. invite_event = yield self.store.get_event(event.event_id)
  128. d["invite"] = yield self._event_serializer.serialize_event(
  129. invite_event, time_now, as_client_event
  130. )
  131. rooms_ret.append(d)
  132. if event.membership not in (Membership.JOIN, Membership.LEAVE):
  133. return
  134. try:
  135. if event.membership == Membership.JOIN:
  136. room_end_token = now_token.room_key
  137. deferred_room_state = run_in_background(
  138. self.state_handler.get_current_state, event.room_id
  139. )
  140. elif event.membership == Membership.LEAVE:
  141. room_end_token = "s%d" % (event.stream_ordering,)
  142. deferred_room_state = run_in_background(
  143. self.store.get_state_for_events, [event.event_id]
  144. )
  145. deferred_room_state.addCallback(
  146. lambda states: states[event.event_id]
  147. )
  148. (messages, token), current_state = yield make_deferred_yieldable(
  149. defer.gatherResults(
  150. [
  151. run_in_background(
  152. self.store.get_recent_events_for_room,
  153. event.room_id,
  154. limit=limit,
  155. end_token=room_end_token,
  156. ),
  157. deferred_room_state,
  158. ]
  159. )
  160. ).addErrback(unwrapFirstError)
  161. messages = yield filter_events_for_client(self.store, user_id, messages)
  162. start_token = now_token.copy_and_replace("room_key", token)
  163. end_token = now_token.copy_and_replace("room_key", room_end_token)
  164. time_now = self.clock.time_msec()
  165. d["messages"] = {
  166. "chunk": (
  167. yield self._event_serializer.serialize_events(
  168. messages, time_now=time_now, as_client_event=as_client_event
  169. )
  170. ),
  171. "start": start_token.to_string(),
  172. "end": end_token.to_string(),
  173. }
  174. d["state"] = yield self._event_serializer.serialize_events(
  175. current_state.values(),
  176. time_now=time_now,
  177. as_client_event=as_client_event,
  178. )
  179. account_data_events = []
  180. tags = tags_by_room.get(event.room_id)
  181. if tags:
  182. account_data_events.append(
  183. {"type": "m.tag", "content": {"tags": tags}}
  184. )
  185. account_data = account_data_by_room.get(event.room_id, {})
  186. for account_data_type, content in account_data.items():
  187. account_data_events.append(
  188. {"type": account_data_type, "content": content}
  189. )
  190. d["account_data"] = account_data_events
  191. except Exception:
  192. logger.exception("Failed to get snapshot")
  193. yield concurrently_execute(handle_room, room_list, 10)
  194. account_data_events = []
  195. for account_data_type, content in account_data.items():
  196. account_data_events.append({"type": account_data_type, "content": content})
  197. now = self.clock.time_msec()
  198. ret = {
  199. "rooms": rooms_ret,
  200. "presence": [
  201. {
  202. "type": "m.presence",
  203. "content": format_user_presence_state(event, now),
  204. }
  205. for event in presence
  206. ],
  207. "account_data": account_data_events,
  208. "receipts": receipt,
  209. "end": now_token.to_string(),
  210. }
  211. return ret
  212. @defer.inlineCallbacks
  213. def room_initial_sync(self, requester, room_id, pagin_config=None):
  214. """Capture the a snapshot of a room. If user is currently a member of
  215. the room this will be what is currently in the room. If the user left
  216. the room this will be what was in the room when they left.
  217. Args:
  218. requester(Requester): The user to get a snapshot for.
  219. room_id(str): The room to get a snapshot of.
  220. pagin_config(synapse.streams.config.PaginationConfig):
  221. The pagination config used to determine how many messages to
  222. return.
  223. Raises:
  224. AuthError if the user wasn't in the room.
  225. Returns:
  226. A JSON serialisable dict with the snapshot of the room.
  227. """
  228. blocked = yield self.store.is_room_blocked(room_id)
  229. if blocked:
  230. raise SynapseError(403, "This room has been blocked on this server")
  231. user_id = requester.user.to_string()
  232. membership, member_event_id = yield self._check_in_room_or_world_readable(
  233. room_id, user_id
  234. )
  235. is_peeking = member_event_id is None
  236. if membership == Membership.JOIN:
  237. result = yield self._room_initial_sync_joined(
  238. user_id, room_id, pagin_config, membership, is_peeking
  239. )
  240. elif membership == Membership.LEAVE:
  241. result = yield self._room_initial_sync_parted(
  242. user_id, room_id, pagin_config, membership, member_event_id, is_peeking
  243. )
  244. account_data_events = []
  245. tags = yield self.store.get_tags_for_room(user_id, room_id)
  246. if tags:
  247. account_data_events.append({"type": "m.tag", "content": {"tags": tags}})
  248. account_data = yield self.store.get_account_data_for_room(user_id, room_id)
  249. for account_data_type, content in account_data.items():
  250. account_data_events.append({"type": account_data_type, "content": content})
  251. result["account_data"] = account_data_events
  252. return result
  253. @defer.inlineCallbacks
  254. def _room_initial_sync_parted(
  255. self, user_id, room_id, pagin_config, membership, member_event_id, is_peeking
  256. ):
  257. room_state = yield self.store.get_state_for_events([member_event_id])
  258. room_state = room_state[member_event_id]
  259. limit = pagin_config.limit if pagin_config else None
  260. if limit is None:
  261. limit = 10
  262. stream_token = yield self.store.get_stream_token_for_event(member_event_id)
  263. messages, token = yield self.store.get_recent_events_for_room(
  264. room_id, limit=limit, end_token=stream_token
  265. )
  266. messages = yield filter_events_for_client(
  267. self.store, user_id, messages, is_peeking=is_peeking
  268. )
  269. start_token = StreamToken.START.copy_and_replace("room_key", token)
  270. end_token = StreamToken.START.copy_and_replace("room_key", stream_token)
  271. time_now = self.clock.time_msec()
  272. return {
  273. "membership": membership,
  274. "room_id": room_id,
  275. "messages": {
  276. "chunk": (
  277. yield self._event_serializer.serialize_events(messages, time_now)
  278. ),
  279. "start": start_token.to_string(),
  280. "end": end_token.to_string(),
  281. },
  282. "state": (
  283. yield self._event_serializer.serialize_events(
  284. room_state.values(), time_now
  285. )
  286. ),
  287. "presence": [],
  288. "receipts": [],
  289. }
  290. @defer.inlineCallbacks
  291. def _room_initial_sync_joined(
  292. self, user_id, room_id, pagin_config, membership, is_peeking
  293. ):
  294. current_state = yield self.state.get_current_state(room_id=room_id)
  295. # TODO: These concurrently
  296. time_now = self.clock.time_msec()
  297. state = yield self._event_serializer.serialize_events(
  298. current_state.values(), time_now
  299. )
  300. now_token = yield self.hs.get_event_sources().get_current_token()
  301. limit = pagin_config.limit if pagin_config else None
  302. if limit is None:
  303. limit = 10
  304. room_members = [
  305. m
  306. for m in current_state.values()
  307. if m.type == EventTypes.Member
  308. and m.content["membership"] == Membership.JOIN
  309. ]
  310. presence_handler = self.hs.get_presence_handler()
  311. @defer.inlineCallbacks
  312. def get_presence():
  313. # If presence is disabled, return an empty list
  314. if not self.hs.config.use_presence:
  315. return []
  316. states = yield presence_handler.get_states(
  317. [m.user_id for m in room_members], as_event=True
  318. )
  319. return states
  320. @defer.inlineCallbacks
  321. def get_receipts():
  322. receipts = yield self.store.get_linearized_receipts_for_room(
  323. room_id, to_key=now_token.receipt_key
  324. )
  325. if not receipts:
  326. receipts = []
  327. return receipts
  328. presence, receipts, (messages, token) = yield make_deferred_yieldable(
  329. defer.gatherResults(
  330. [
  331. run_in_background(get_presence),
  332. run_in_background(get_receipts),
  333. run_in_background(
  334. self.store.get_recent_events_for_room,
  335. room_id,
  336. limit=limit,
  337. end_token=now_token.room_key,
  338. ),
  339. ],
  340. consumeErrors=True,
  341. ).addErrback(unwrapFirstError)
  342. )
  343. messages = yield filter_events_for_client(
  344. self.store, user_id, messages, is_peeking=is_peeking
  345. )
  346. start_token = now_token.copy_and_replace("room_key", token)
  347. end_token = now_token
  348. time_now = self.clock.time_msec()
  349. ret = {
  350. "room_id": room_id,
  351. "messages": {
  352. "chunk": (
  353. yield self._event_serializer.serialize_events(messages, time_now)
  354. ),
  355. "start": start_token.to_string(),
  356. "end": end_token.to_string(),
  357. },
  358. "state": state,
  359. "presence": presence,
  360. "receipts": receipts,
  361. }
  362. if not is_peeking:
  363. ret["membership"] = membership
  364. return ret
  365. @defer.inlineCallbacks
  366. def _check_in_room_or_world_readable(self, room_id, user_id):
  367. try:
  368. # check_user_was_in_room will return the most recent membership
  369. # event for the user if:
  370. # * The user is a non-guest user, and was ever in the room
  371. # * The user is a guest user, and has joined the room
  372. # else it will throw.
  373. member_event = yield self.auth.check_user_was_in_room(room_id, user_id)
  374. return (member_event.membership, member_event.event_id)
  375. return
  376. except AuthError:
  377. visibility = yield self.state_handler.get_current_state(
  378. room_id, EventTypes.RoomHistoryVisibility, ""
  379. )
  380. if (
  381. visibility
  382. and visibility.content["history_visibility"] == "world_readable"
  383. ):
  384. return (Membership.JOIN, None)
  385. return
  386. raise AuthError(
  387. 403, "Guest access not allowed", errcode=Codes.GUEST_ACCESS_FORBIDDEN
  388. )