initial_sync.py 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455
  1. # -*- coding: utf-8 -*-
  2. # Copyright 2016 OpenMarket Ltd
  3. #
  4. # Licensed under the Apache License, Version 2.0 (the "License");
  5. # you may not use this file except in compliance with the License.
  6. # You may obtain a copy of the License at
  7. #
  8. # http://www.apache.org/licenses/LICENSE-2.0
  9. #
  10. # Unless required by applicable law or agreed to in writing, software
  11. # distributed under the License is distributed on an "AS IS" BASIS,
  12. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. # See the License for the specific language governing permissions and
  14. # limitations under the License.
  15. from twisted.internet import defer
  16. from synapse.api.constants import EventTypes, Membership
  17. from synapse.api.errors import AuthError, Codes
  18. from synapse.events.utils import serialize_event
  19. from synapse.events.validator import EventValidator
  20. from synapse.handlers.presence import format_user_presence_state
  21. from synapse.streams.config import PaginationConfig
  22. from synapse.types import (
  23. UserID, StreamToken,
  24. )
  25. from synapse.util import unwrapFirstError
  26. from synapse.util.async import concurrently_execute
  27. from synapse.util.caches.snapshot_cache import SnapshotCache
  28. from synapse.util.logcontext import make_deferred_yieldable, run_in_background
  29. from synapse.visibility import filter_events_for_client
  30. from ._base import BaseHandler
  31. import logging
  32. logger = logging.getLogger(__name__)
  class InitialSyncHandler(BaseHandler):
      """Builds "initial sync" snapshots for a user.

      Two entry points are offered: snapshot_all_rooms (every room the user is
      invited to / joined in, optionally including rooms they have left) and
      room_initial_sync (a single room).

      NOTE(review): self.store, self.auth and self.state_handler are not set
      in this class; presumably they are provided by BaseHandler - confirm.
      """

      def __init__(self, hs):
          """
          Args:
              hs: The homeserver object. It is kept on the instance and is
                  asked for the state handler and the clock.
          """
          super(InitialSyncHandler, self).__init__(hs)
          self.hs = hs
          self.state = hs.get_state_handler()
          self.clock = hs.get_clock()
          self.validator = EventValidator()
          self.snapshot_cache = SnapshotCache()

      def snapshot_all_rooms(self, user_id=None, pagin_config=None,
                             as_client_event=True, include_archived=False):
          """Retrieve a snapshot of all rooms the user is invited or has joined.

          This snapshot may include messages for all rooms where the user is
          joined, depending on the pagination config.

          The snapshot cache is consulted first, keyed on the user and on every
          request parameter. On a miss, the in-flight result of
          _snapshot_all_rooms is stored in the cache and whatever the cache's
          set() returns is handed back to the caller.

          Args:
              user_id (str): The ID of the user making the request.
              pagin_config (synapse.api.streams.PaginationConfig): The pagination
                  config used to determine how many messages *PER ROOM* to
                  return. Despite the None default it must be supplied: its
                  from_token, to_token, direction and limit attributes are
                  read unconditionally to build the cache key.
              as_client_event (bool): True to get events in client-server format.
              include_archived (bool): True to get rooms that the user has left
          Returns:
              The cached or newly started snapshot. The snapshot itself is a
              dict with "rooms", "presence", "account_data", "receipts" and
              "end" keys; each entry of "rooms" has "room_id", "membership"
              and "visibility" keys and, for joined/left rooms, may also have
              "messages", "state" and "account_data".
          """
          key = (
              user_id,
              pagin_config.from_token,
              pagin_config.to_token,
              pagin_config.direction,
              pagin_config.limit,
              as_client_event,
              include_archived,
          )
          now_ms = self.clock.time_msec()
          result = self.snapshot_cache.get(now_ms, key)
          if result is not None:
              return result

          return self.snapshot_cache.set(now_ms, key, self._snapshot_all_rooms(
              user_id, pagin_config, as_client_event, include_archived
          ))

      @defer.inlineCallbacks
      def _snapshot_all_rooms(self, user_id=None, pagin_config=None,
                              as_client_event=True, include_archived=False):
          """Build the all-rooms snapshot (uncached worker for snapshot_all_rooms).

          Args:
              user_id (str): The ID of the user making the request. Must be
                  supplied: it is parsed with UserID.from_string.
              pagin_config: Pagination config; only its ``limit`` is read here
                  (10 is used when the limit is None). Must not be None.
              as_client_event (bool): Passed through to serialize_event.
              include_archived (bool): True to also include rooms the user has
                  left.
          Returns:
              Deferred[dict]: dict with "rooms", "presence", "account_data",
              "receipts" and "end" keys.
          """
          memberships = [Membership.INVITE, Membership.JOIN]
          if include_archived:
              memberships.append(Membership.LEAVE)

          room_list = yield self.store.get_rooms_for_user_where_membership_is(
              user_id=user_id, membership_list=memberships
          )

          user = UserID.from_string(user_id)

          rooms_ret = []

          now_token = yield self.hs.get_event_sources().get_current_token()

          presence_stream = self.hs.get_event_sources().sources["presence"]
          pagination_config = PaginationConfig(from_token=now_token)
          presence, _ = yield presence_stream.get_pagination_rows(
              user, pagination_config.get_source_config("presence"), None
          )

          receipt_stream = self.hs.get_event_sources().sources["receipt"]
          receipt, _ = yield receipt_stream.get_pagination_rows(
              user, pagination_config.get_source_config("receipt"), None
          )

          tags_by_room = yield self.store.get_tags_for_user(user_id)

          account_data, account_data_by_room = (
              yield self.store.get_account_data_for_user(user_id)
          )

          public_room_ids = yield self.store.get_public_room_ids()

          limit = pagin_config.limit
          if limit is None:
              limit = 10

          @defer.inlineCallbacks
          def handle_room(event):
              """Build the snapshot entry for one room and add it to rooms_ret.

              ``event`` is one row of room_list; its room_id, membership,
              sender, event_id and stream_ordering attributes are read.
              """
              d = {
                  "room_id": event.room_id,
                  "membership": event.membership,
                  "visibility": (
                      "public" if event.room_id in public_room_ids
                      else "private"
                  ),
              }

              if event.membership == Membership.INVITE:
                  time_now = self.clock.time_msec()
                  d["inviter"] = event.sender

                  invite_event = yield self.store.get_event(event.event_id)
                  d["invite"] = serialize_event(
                      invite_event, time_now, as_client_event
                  )

              # The entry is registered before messages/state are fetched; it
              # is filled in below by mutating the same dict, so a failure
              # there still leaves the basic entry in the result.
              rooms_ret.append(d)

              if event.membership not in (Membership.JOIN, Membership.LEAVE):
                  return

              try:
                  # Both state fetches are started via run_in_background, the
                  # same way as the recent-events fetch they are gathered with.
                  if event.membership == Membership.JOIN:
                      room_end_token = now_token.room_key
                      deferred_room_state = run_in_background(
                          self.state_handler.get_current_state,
                          event.room_id,
                      )
                  elif event.membership == Membership.LEAVE:
                      # For a left room, use the state and stream position of
                      # the user's leave event rather than the current ones.
                      room_end_token = "s%d" % (event.stream_ordering,)
                      deferred_room_state = run_in_background(
                          self.store.get_state_for_events,
                          [event.event_id], None,
                      )
                      deferred_room_state.addCallback(
                          lambda states: states[event.event_id]
                      )

                  # consumeErrors=True (as in _room_initial_sync_joined) so
                  # that a failure in one fetch is not additionally reported
                  # as an unhandled error when the other fails as well.
                  (messages, token), current_state = yield make_deferred_yieldable(
                      defer.gatherResults(
                          [
                              run_in_background(
                                  self.store.get_recent_events_for_room,
                                  event.room_id,
                                  limit=limit,
                                  end_token=room_end_token,
                              ),
                              deferred_room_state,
                          ],
                          consumeErrors=True,
                      )
                  ).addErrback(unwrapFirstError)

                  messages = yield filter_events_for_client(
                      self.store, user_id, messages
                  )

                  start_token = now_token.copy_and_replace("room_key", token[0])
                  end_token = now_token.copy_and_replace("room_key", token[1])
                  time_now = self.clock.time_msec()

                  d["messages"] = {
                      "chunk": [
                          serialize_event(m, time_now, as_client_event)
                          for m in messages
                      ],
                      "start": start_token.to_string(),
                      "end": end_token.to_string(),
                  }

                  d["state"] = [
                      serialize_event(c, time_now, as_client_event)
                      for c in current_state.values()
                  ]

                  account_data_events = []
                  tags = tags_by_room.get(event.room_id)
                  if tags:
                      account_data_events.append({
                          "type": "m.tag",
                          "content": {"tags": tags},
                      })

                  # Named distinctly from the enclosing function's global
                  # ``account_data`` so the two are not confused.
                  room_account_data = account_data_by_room.get(event.room_id, {})
                  for account_data_type, content in room_account_data.items():
                      account_data_events.append({
                          "type": account_data_type,
                          "content": content,
                      })

                  d["account_data"] = account_data_events
              except Exception:
                  # Deliberately best-effort: one broken room must not fail
                  # the whole snapshot.
                  logger.exception("Failed to get snapshot")

          # Process the rooms with a concurrency limit of 10.
          yield concurrently_execute(handle_room, room_list, 10)

          account_data_events = [
              {
                  "type": account_data_type,
                  "content": content,
              }
              for account_data_type, content in account_data.items()
          ]

          now = self.clock.time_msec()

          ret = {
              "rooms": rooms_ret,
              "presence": [
                  {
                      "type": "m.presence",
                      "content": format_user_presence_state(state, now),
                  }
                  for state in presence
              ],
              "account_data": account_data_events,
              "receipts": receipt,
              "end": now_token.to_string(),
          }

          defer.returnValue(ret)

      @defer.inlineCallbacks
      def room_initial_sync(self, requester, room_id, pagin_config=None):
          """Capture a snapshot of a room. If user is currently a member of
          the room this will be what is currently in the room. If the user left
          the room this will be what was in the room when they left.

          Args:
              requester(Requester): The user to get a snapshot for.
              room_id(str): The room to get a snapshot of.
              pagin_config(synapse.streams.config.PaginationConfig):
                  The pagination config used to determine how many messages to
                  return.
          Raises:
              AuthError if the user wasn't in the room.
          Returns:
              A JSON serialisable dict with the snapshot of the room.
          """
          user_id = requester.user.to_string()

          membership, member_event_id = yield self._check_in_room_or_world_readable(
              room_id, user_id,
          )
          # No membership event means access was granted only because the room
          # is world readable, i.e. the user is peeking.
          is_peeking = member_event_id is None

          if membership == Membership.JOIN:
              result = yield self._room_initial_sync_joined(
                  user_id, room_id, pagin_config, membership, is_peeking
              )
          elif membership == Membership.LEAVE:
              result = yield self._room_initial_sync_parted(
                  user_id, room_id, pagin_config, membership, member_event_id,
                  is_peeking
              )
          else:
              # Defensive: there is no snapshot to build for any other
              # membership. Fail with the documented AuthError instead of
              # hitting an unbound ``result`` below.
              raise AuthError(
                  403, "User %s not in room %s" % (user_id, room_id)
              )

          account_data_events = []
          tags = yield self.store.get_tags_for_room(user_id, room_id)
          if tags:
              account_data_events.append({
                  "type": "m.tag",
                  "content": {"tags": tags},
              })

          account_data = yield self.store.get_account_data_for_room(user_id, room_id)
          for account_data_type, content in account_data.items():
              account_data_events.append({
                  "type": account_data_type,
                  "content": content,
              })

          result["account_data"] = account_data_events

          defer.returnValue(result)

      @defer.inlineCallbacks
      def _room_initial_sync_parted(self, user_id, room_id, pagin_config,
                                    membership, member_event_id, is_peeking):
          """Snapshot a room as of the given membership event, for a user who
          has left it.

          Args:
              user_id (str): The user the snapshot is for.
              room_id (str): The room to snapshot.
              pagin_config: Pagination config or None; only ``limit`` is read
                  (10 is used when it is absent or None).
              membership: Copied into the result's "membership" key.
              member_event_id (str): The membership event whose state and
                  stream position bound the snapshot.
              is_peeking (bool): Passed to filter_events_for_client.
          Returns:
              Deferred[dict]: dict with "membership", "room_id", "messages",
              "state", "presence" and "receipts" keys; presence and receipts
              are always empty lists here.
          """
          room_state = yield self.store.get_state_for_events(
              [member_event_id], None
          )

          room_state = room_state[member_event_id]

          limit = pagin_config.limit if pagin_config else None
          if limit is None:
              limit = 10

          stream_token = yield self.store.get_stream_token_for_event(
              member_event_id
          )

          messages, token = yield self.store.get_recent_events_for_room(
              room_id,
              limit=limit,
              end_token=stream_token
          )

          messages = yield filter_events_for_client(
              self.store, user_id, messages, is_peeking=is_peeking
          )

          start_token = StreamToken.START.copy_and_replace("room_key", token[0])
          end_token = StreamToken.START.copy_and_replace("room_key", token[1])

          time_now = self.clock.time_msec()

          defer.returnValue({
              "membership": membership,
              "room_id": room_id,
              "messages": {
                  "chunk": [serialize_event(m, time_now) for m in messages],
                  "start": start_token.to_string(),
                  "end": end_token.to_string(),
              },
              "state": [serialize_event(s, time_now) for s in room_state.values()],
              "presence": [],
              "receipts": [],
          })

      @defer.inlineCallbacks
      def _room_initial_sync_joined(self, user_id, room_id, pagin_config,
                                    membership, is_peeking):
          """Snapshot the current contents of a room for a joined (or peeking)
          user.

          Args:
              user_id (str): The user the snapshot is for.
              room_id (str): The room to snapshot.
              pagin_config: Pagination config or None; only ``limit`` is read
                  (10 is used when it is absent or None).
              membership: Copied into the result's "membership" key unless the
                  user is peeking.
              is_peeking (bool): Passed to filter_events_for_client; when True
                  the "membership" key is omitted from the result.
          Returns:
              Deferred[dict]: dict with "room_id", "messages", "state",
              "presence" and "receipts" keys, plus "membership" when not
              peeking.
          """
          current_state = yield self.state.get_current_state(
              room_id=room_id,
          )

          # TODO: These concurrently
          time_now = self.clock.time_msec()
          state = [
              serialize_event(x, time_now)
              for x in current_state.values()
          ]

          now_token = yield self.hs.get_event_sources().get_current_token()

          limit = pagin_config.limit if pagin_config else None
          if limit is None:
              limit = 10

          # Membership events of the users currently joined to the room.
          room_members = [
              m for m in current_state.values()
              if m.type == EventTypes.Member
              and m.content["membership"] == Membership.JOIN
          ]

          presence_handler = self.hs.get_presence_handler()

          @defer.inlineCallbacks
          def get_presence():
              states = yield presence_handler.get_states(
                  [m.user_id for m in room_members],
                  as_event=True,
              )

              defer.returnValue(states)

          @defer.inlineCallbacks
          def get_receipts():
              receipts = yield self.store.get_linearized_receipts_for_room(
                  room_id,
                  to_key=now_token.receipt_key,
              )
              if not receipts:
                  receipts = []
              defer.returnValue(receipts)

          # Wrapped in make_deferred_yieldable, matching how the gathered
          # Deferred is yielded in _snapshot_all_rooms.
          presence, receipts, (messages, token) = yield make_deferred_yieldable(
              defer.gatherResults(
                  [
                      run_in_background(get_presence),
                      run_in_background(get_receipts),
                      run_in_background(
                          self.store.get_recent_events_for_room,
                          room_id,
                          limit=limit,
                          end_token=now_token.room_key,
                      )
                  ],
                  consumeErrors=True,
              )
          ).addErrback(unwrapFirstError)

          messages = yield filter_events_for_client(
              self.store, user_id, messages, is_peeking=is_peeking,
          )

          start_token = now_token.copy_and_replace("room_key", token[0])
          end_token = now_token.copy_and_replace("room_key", token[1])

          # Re-read the clock: the fetches above may have taken a while.
          time_now = self.clock.time_msec()

          ret = {
              "room_id": room_id,
              "messages": {
                  "chunk": [serialize_event(m, time_now) for m in messages],
                  "start": start_token.to_string(),
                  "end": end_token.to_string(),
              },
              "state": state,
              "presence": presence,
              "receipts": receipts,
          }
          if not is_peeking:
              ret["membership"] = membership

          defer.returnValue(ret)

      @defer.inlineCallbacks
      def _check_in_room_or_world_readable(self, room_id, user_id):
          """Check that the user may see the room, either through membership
          or because the room's history is world readable.

          Args:
              room_id (str): The room being accessed.
              user_id (str): The user requesting access.
          Returns:
              Deferred[tuple]: (membership, member_event_id) taken from the
              user's membership event, or (Membership.JOIN, None) when access
              is granted only because the room is world readable.
          Raises:
              AuthError (403, GUEST_ACCESS_FORBIDDEN) if the membership check
              fails and the room is not world readable.
          """
          try:
              # check_user_was_in_room will return the most recent membership
              # event for the user if:
              #  * The user is a non-guest user, and was ever in the room
              #  * The user is a guest user, and has joined the room
              # else it will throw.
              member_event = yield self.auth.check_user_was_in_room(room_id, user_id)
              defer.returnValue((member_event.membership, member_event.event_id))
          except AuthError:
              visibility = yield self.state_handler.get_current_state(
                  room_id, EventTypes.RoomHistoryVisibility, ""
              )
              # .get() rather than indexing: a history visibility event whose
              # content lacks the key must be treated as "not world readable"
              # instead of failing with a KeyError.
              if (
                  visibility and
                  visibility.content.get("history_visibility") == "world_readable"
              ):
                  defer.returnValue((Membership.JOIN, None))
              raise AuthError(
                  403, "Guest access not allowed", errcode=Codes.GUEST_ACCESS_FORBIDDEN
              )