initial_sync.py 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514
  1. # Copyright 2016 OpenMarket Ltd
  2. #
  3. # Licensed under the Apache License, Version 2.0 (the "License");
  4. # you may not use this file except in compliance with the License.
  5. # You may obtain a copy of the License at
  6. #
  7. # http://www.apache.org/licenses/LICENSE-2.0
  8. #
  9. # Unless required by applicable law or agreed to in writing, software
  10. # distributed under the License is distributed on an "AS IS" BASIS,
  11. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. # See the License for the specific language governing permissions and
  13. # limitations under the License.
  14. import logging
  15. from typing import TYPE_CHECKING, List, Optional, Tuple
  16. from synapse.api.constants import (
  17. AccountDataTypes,
  18. Direction,
  19. EduTypes,
  20. EventTypes,
  21. Membership,
  22. )
  23. from synapse.api.errors import SynapseError
  24. from synapse.events.utils import SerializeEventConfig
  25. from synapse.events.validator import EventValidator
  26. from synapse.handlers.presence import format_user_presence_state
  27. from synapse.handlers.receipts import ReceiptEventSource
  28. from synapse.logging.context import make_deferred_yieldable, run_in_background
  29. from synapse.storage.roommember import RoomsForUser
  30. from synapse.streams.config import PaginationConfig
  31. from synapse.types import (
  32. JsonDict,
  33. JsonMapping,
  34. Requester,
  35. RoomStreamToken,
  36. StreamKeyType,
  37. StreamToken,
  38. UserID,
  39. )
  40. from synapse.util import unwrapFirstError
  41. from synapse.util.async_helpers import concurrently_execute, gather_results
  42. from synapse.util.caches.response_cache import ResponseCache
  43. from synapse.visibility import filter_events_for_client
  44. if TYPE_CHECKING:
  45. from synapse.server import HomeServer
  46. logger = logging.getLogger(__name__)
  47. class InitialSyncHandler:
  48. def __init__(self, hs: "HomeServer"):
  49. self.store = hs.get_datastores().main
  50. self.auth = hs.get_auth()
  51. self.state_handler = hs.get_state_handler()
  52. self.hs = hs
  53. self.state = hs.get_state_handler()
  54. self.clock = hs.get_clock()
  55. self.validator = EventValidator()
  56. self.snapshot_cache: ResponseCache[
  57. Tuple[
  58. str,
  59. Optional[StreamToken],
  60. Optional[StreamToken],
  61. Direction,
  62. int,
  63. bool,
  64. bool,
  65. ]
  66. ] = ResponseCache(hs.get_clock(), "initial_sync_cache")
  67. self._event_serializer = hs.get_event_client_serializer()
  68. self._storage_controllers = hs.get_storage_controllers()
  69. self._state_storage_controller = self._storage_controllers.state
  70. async def snapshot_all_rooms(
  71. self,
  72. user_id: str,
  73. pagin_config: PaginationConfig,
  74. as_client_event: bool = True,
  75. include_archived: bool = False,
  76. ) -> JsonDict:
  77. """Retrieve a snapshot of all rooms the user is invited or has joined.
  78. This snapshot may include messages for all rooms where the user is
  79. joined, depending on the pagination config.
  80. Args:
  81. user_id: The ID of the user making the request.
  82. pagin_config: The pagination config used to determine how many
  83. messages *PER ROOM* to return.
  84. as_client_event: True to get events in client-server format.
  85. include_archived: True to get rooms that the user has left
  86. Returns:
  87. A JsonDict with the same format as the response to `/intialSync`
  88. API
  89. """
  90. key = (
  91. user_id,
  92. pagin_config.from_token,
  93. pagin_config.to_token,
  94. pagin_config.direction,
  95. pagin_config.limit,
  96. as_client_event,
  97. include_archived,
  98. )
  99. return await self.snapshot_cache.wrap(
  100. key,
  101. self._snapshot_all_rooms,
  102. user_id,
  103. pagin_config,
  104. as_client_event,
  105. include_archived,
  106. )
  107. async def _snapshot_all_rooms(
  108. self,
  109. user_id: str,
  110. pagin_config: PaginationConfig,
  111. as_client_event: bool = True,
  112. include_archived: bool = False,
  113. ) -> JsonDict:
  114. memberships = [Membership.INVITE, Membership.JOIN]
  115. if include_archived:
  116. memberships.append(Membership.LEAVE)
  117. room_list = await self.store.get_rooms_for_local_user_where_membership_is(
  118. user_id=user_id, membership_list=memberships
  119. )
  120. user = UserID.from_string(user_id)
  121. rooms_ret = []
  122. now_token = self.hs.get_event_sources().get_current_token()
  123. presence_stream = self.hs.get_event_sources().sources.presence
  124. presence, _ = await presence_stream.get_new_events(
  125. user, from_key=None, include_offline=False
  126. )
  127. joined_rooms = [r.room_id for r in room_list if r.membership == Membership.JOIN]
  128. receipt = await self.store.get_linearized_receipts_for_rooms(
  129. joined_rooms,
  130. to_key=now_token.receipt_key,
  131. )
  132. receipt = ReceiptEventSource.filter_out_private_receipts(receipt, user_id)
  133. tags_by_room = await self.store.get_tags_for_user(user_id)
  134. account_data = await self.store.get_global_account_data_for_user(user_id)
  135. account_data_by_room = await self.store.get_room_account_data_for_user(user_id)
  136. public_room_ids = await self.store.get_public_room_ids()
  137. serializer_options = SerializeEventConfig(as_client_event=as_client_event)
  138. async def handle_room(event: RoomsForUser) -> None:
  139. d: JsonDict = {
  140. "room_id": event.room_id,
  141. "membership": event.membership,
  142. "visibility": (
  143. "public" if event.room_id in public_room_ids else "private"
  144. ),
  145. }
  146. if event.membership == Membership.INVITE:
  147. time_now = self.clock.time_msec()
  148. d["inviter"] = event.sender
  149. invite_event = await self.store.get_event(event.event_id)
  150. d["invite"] = await self._event_serializer.serialize_event(
  151. invite_event,
  152. time_now,
  153. config=serializer_options,
  154. )
  155. rooms_ret.append(d)
  156. if event.membership not in (Membership.JOIN, Membership.LEAVE):
  157. return
  158. try:
  159. if event.membership == Membership.JOIN:
  160. room_end_token = now_token.room_key
  161. deferred_room_state = run_in_background(
  162. self._state_storage_controller.get_current_state, event.room_id
  163. )
  164. elif event.membership == Membership.LEAVE:
  165. room_end_token = RoomStreamToken(
  166. stream=event.stream_ordering,
  167. )
  168. deferred_room_state = run_in_background(
  169. self._state_storage_controller.get_state_for_events,
  170. [event.event_id],
  171. ).addCallback(lambda states: states[event.event_id])
  172. (messages, token), current_state = await make_deferred_yieldable(
  173. gather_results(
  174. (
  175. run_in_background(
  176. self.store.get_recent_events_for_room,
  177. event.room_id,
  178. limit=pagin_config.limit,
  179. end_token=room_end_token,
  180. ),
  181. deferred_room_state,
  182. )
  183. )
  184. ).addErrback(unwrapFirstError)
  185. messages = await filter_events_for_client(
  186. self._storage_controllers, user_id, messages
  187. )
  188. start_token = now_token.copy_and_replace(StreamKeyType.ROOM, token)
  189. end_token = now_token.copy_and_replace(
  190. StreamKeyType.ROOM, room_end_token
  191. )
  192. time_now = self.clock.time_msec()
  193. d["messages"] = {
  194. "chunk": (
  195. await self._event_serializer.serialize_events(
  196. messages,
  197. time_now=time_now,
  198. config=serializer_options,
  199. )
  200. ),
  201. "start": await start_token.to_string(self.store),
  202. "end": await end_token.to_string(self.store),
  203. }
  204. d["state"] = await self._event_serializer.serialize_events(
  205. current_state.values(),
  206. time_now=time_now,
  207. config=serializer_options,
  208. )
  209. account_data_events = []
  210. tags = tags_by_room.get(event.room_id)
  211. if tags:
  212. account_data_events.append(
  213. {"type": AccountDataTypes.TAG, "content": {"tags": tags}}
  214. )
  215. account_data = account_data_by_room.get(event.room_id, {})
  216. for account_data_type, content in account_data.items():
  217. account_data_events.append(
  218. {"type": account_data_type, "content": content}
  219. )
  220. d["account_data"] = account_data_events
  221. except Exception:
  222. logger.exception("Failed to get snapshot")
  223. await concurrently_execute(handle_room, room_list, 10)
  224. account_data_events = []
  225. for account_data_type, content in account_data.items():
  226. account_data_events.append({"type": account_data_type, "content": content})
  227. now = self.clock.time_msec()
  228. ret = {
  229. "rooms": rooms_ret,
  230. "presence": [
  231. {
  232. "type": EduTypes.PRESENCE,
  233. "content": format_user_presence_state(event, now),
  234. }
  235. for event in presence
  236. ],
  237. "account_data": account_data_events,
  238. "receipts": receipt,
  239. "end": await now_token.to_string(self.store),
  240. }
  241. return ret
  242. async def room_initial_sync(
  243. self, requester: Requester, room_id: str, pagin_config: PaginationConfig
  244. ) -> JsonDict:
  245. """Capture the a snapshot of a room. If user is currently a member of
  246. the room this will be what is currently in the room. If the user left
  247. the room this will be what was in the room when they left.
  248. Args:
  249. requester: The user to get a snapshot for.
  250. room_id: The room to get a snapshot of.
  251. pagin_config: The pagination config used to determine how many
  252. messages to return.
  253. Raises:
  254. AuthError if the user wasn't in the room.
  255. Returns:
  256. A JSON serialisable dict with the snapshot of the room.
  257. """
  258. blocked = await self.store.is_room_blocked(room_id)
  259. if blocked:
  260. raise SynapseError(403, "This room has been blocked on this server")
  261. (
  262. membership,
  263. member_event_id,
  264. ) = await self.auth.check_user_in_room_or_world_readable(
  265. room_id,
  266. requester,
  267. allow_departed_users=True,
  268. )
  269. is_peeking = member_event_id is None
  270. if membership == Membership.JOIN:
  271. result = await self._room_initial_sync_joined(
  272. requester, room_id, pagin_config, membership, is_peeking
  273. )
  274. elif membership == Membership.LEAVE:
  275. # The member_event_id will always be available if membership is set
  276. # to leave.
  277. assert member_event_id
  278. result = await self._room_initial_sync_parted(
  279. requester,
  280. room_id,
  281. pagin_config,
  282. membership,
  283. member_event_id,
  284. is_peeking,
  285. )
  286. account_data_events = []
  287. user_id = requester.user.to_string()
  288. tags = await self.store.get_tags_for_room(user_id, room_id)
  289. if tags:
  290. account_data_events.append(
  291. {"type": AccountDataTypes.TAG, "content": {"tags": tags}}
  292. )
  293. account_data = await self.store.get_account_data_for_room(user_id, room_id)
  294. for account_data_type, content in account_data.items():
  295. account_data_events.append({"type": account_data_type, "content": content})
  296. result["account_data"] = account_data_events
  297. return result
  298. async def _room_initial_sync_parted(
  299. self,
  300. requester: Requester,
  301. room_id: str,
  302. pagin_config: PaginationConfig,
  303. membership: str,
  304. member_event_id: str,
  305. is_peeking: bool,
  306. ) -> JsonDict:
  307. room_state = await self._state_storage_controller.get_state_for_event(
  308. member_event_id
  309. )
  310. leave_position = await self.store.get_position_for_event(member_event_id)
  311. stream_token = leave_position.to_room_stream_token()
  312. messages, token = await self.store.get_recent_events_for_room(
  313. room_id, limit=pagin_config.limit, end_token=stream_token
  314. )
  315. messages = await filter_events_for_client(
  316. self._storage_controllers,
  317. requester.user.to_string(),
  318. messages,
  319. is_peeking=is_peeking,
  320. )
  321. start_token = StreamToken.START.copy_and_replace(StreamKeyType.ROOM, token)
  322. end_token = StreamToken.START.copy_and_replace(StreamKeyType.ROOM, stream_token)
  323. time_now = self.clock.time_msec()
  324. serialize_options = SerializeEventConfig(requester=requester)
  325. return {
  326. "membership": membership,
  327. "room_id": room_id,
  328. "messages": {
  329. "chunk": (
  330. # Don't bundle aggregations as this is a deprecated API.
  331. await self._event_serializer.serialize_events(
  332. messages, time_now, config=serialize_options
  333. )
  334. ),
  335. "start": await start_token.to_string(self.store),
  336. "end": await end_token.to_string(self.store),
  337. },
  338. "state": (
  339. # Don't bundle aggregations as this is a deprecated API.
  340. await self._event_serializer.serialize_events(
  341. room_state.values(), time_now, config=serialize_options
  342. )
  343. ),
  344. "presence": [],
  345. "receipts": [],
  346. }
  347. async def _room_initial_sync_joined(
  348. self,
  349. requester: Requester,
  350. room_id: str,
  351. pagin_config: PaginationConfig,
  352. membership: str,
  353. is_peeking: bool,
  354. ) -> JsonDict:
  355. current_state = await self._storage_controllers.state.get_current_state(
  356. room_id=room_id
  357. )
  358. # TODO: These concurrently
  359. time_now = self.clock.time_msec()
  360. serialize_options = SerializeEventConfig(requester=requester)
  361. # Don't bundle aggregations as this is a deprecated API.
  362. state = await self._event_serializer.serialize_events(
  363. current_state.values(),
  364. time_now,
  365. config=serialize_options,
  366. )
  367. now_token = self.hs.get_event_sources().get_current_token()
  368. room_members = [
  369. m
  370. for m in current_state.values()
  371. if m.type == EventTypes.Member
  372. and m.content["membership"] == Membership.JOIN
  373. ]
  374. presence_handler = self.hs.get_presence_handler()
  375. async def get_presence() -> List[JsonDict]:
  376. # If presence is disabled, return an empty list
  377. if not self.hs.config.server.presence_enabled:
  378. return []
  379. states = await presence_handler.get_states(
  380. [m.user_id for m in room_members]
  381. )
  382. return [
  383. {
  384. "type": EduTypes.PRESENCE,
  385. "content": format_user_presence_state(s, time_now),
  386. }
  387. for s in states
  388. ]
  389. async def get_receipts() -> List[JsonMapping]:
  390. receipts = await self.store.get_linearized_receipts_for_room(
  391. room_id, to_key=now_token.receipt_key
  392. )
  393. if not receipts:
  394. return []
  395. return ReceiptEventSource.filter_out_private_receipts(
  396. receipts,
  397. requester.user.to_string(),
  398. )
  399. presence, receipts, (messages, token) = await make_deferred_yieldable(
  400. gather_results(
  401. (
  402. run_in_background(get_presence),
  403. run_in_background(get_receipts),
  404. run_in_background(
  405. self.store.get_recent_events_for_room,
  406. room_id,
  407. limit=pagin_config.limit,
  408. end_token=now_token.room_key,
  409. ),
  410. ),
  411. consumeErrors=True,
  412. ).addErrback(unwrapFirstError)
  413. )
  414. messages = await filter_events_for_client(
  415. self._storage_controllers,
  416. requester.user.to_string(),
  417. messages,
  418. is_peeking=is_peeking,
  419. )
  420. start_token = now_token.copy_and_replace(StreamKeyType.ROOM, token)
  421. end_token = now_token
  422. ret = {
  423. "room_id": room_id,
  424. "messages": {
  425. "chunk": (
  426. # Don't bundle aggregations as this is a deprecated API.
  427. await self._event_serializer.serialize_events(
  428. messages, time_now, config=serialize_options
  429. )
  430. ),
  431. "start": await start_token.to_string(self.store),
  432. "end": await end_token.to_string(self.store),
  433. },
  434. "state": state,
  435. "presence": presence,
  436. "receipts": receipts,
  437. }
  438. if not is_peeking:
  439. ret["membership"] = membership
  440. return ret