# test_filtering.py
  1. # Copyright 2015, 2016 OpenMarket Ltd
  2. # Copyright 2017 Vector Creations Ltd
  3. # Copyright 2018-2019 New Vector Ltd
  4. # Copyright 2019 The Matrix.org Foundation C.I.C.
  5. #
  6. # Licensed under the Apache License, Version 2.0 (the "License");
  7. # you may not use this file except in compliance with the License.
  8. # You may obtain a copy of the License at
  9. #
  10. # http://www.apache.org/licenses/LICENSE-2.0
  11. #
  12. # Unless required by applicable law or agreed to in writing, software
  13. # distributed under the License is distributed on an "AS IS" BASIS,
  14. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  15. # See the License for the specific language governing permissions and
  16. # limitations under the License.
  17. from unittest.mock import patch
  18. import jsonschema
  19. from frozendict import frozendict
  20. from synapse.api.constants import EduTypes, EventContentFields
  21. from synapse.api.errors import SynapseError
  22. from synapse.api.filtering import Filter
  23. from synapse.events import make_event_from_dict
  24. from tests import unittest
  25. user_localpart = "test_user"
  26. def MockEvent(**kwargs):
  27. if "event_id" not in kwargs:
  28. kwargs["event_id"] = "fake_event_id"
  29. if "type" not in kwargs:
  30. kwargs["type"] = "fake_type"
  31. if "content" not in kwargs:
  32. kwargs["content"] = {}
  33. return make_event_from_dict(kwargs)
  34. class FilteringTestCase(unittest.HomeserverTestCase):
  35. def prepare(self, reactor, clock, hs):
  36. self.filtering = hs.get_filtering()
  37. self.datastore = hs.get_datastores().main
  38. def test_errors_on_invalid_filters(self):
  39. # See USER_FILTER_SCHEMA for the filter schema.
  40. invalid_filters = [
  41. # `account_data` must be a dictionary
  42. {"account_data": "Hello World"},
  43. # `event_fields` entries must not contain backslashes
  44. {"event_fields": [r"\\foo"]},
  45. # `event_format` must be "client" or "federation"
  46. {"event_format": "other"},
  47. # `not_rooms` must contain valid room IDs
  48. {"room": {"not_rooms": ["#foo:pik-test"]}},
  49. # `senders` must contain valid user IDs
  50. {"presence": {"senders": ["@bar;pik.test.com"]}},
  51. ]
  52. for filter in invalid_filters:
  53. with self.assertRaises(SynapseError):
  54. self.filtering.check_valid_filter(filter)
  55. def test_ignores_unknown_filter_fields(self):
  56. # For forward compatibility, we must ignore unknown filter fields.
  57. # See USER_FILTER_SCHEMA for the filter schema.
  58. filters = [
  59. {"org.matrix.msc9999.future_option": True},
  60. {"presence": {"org.matrix.msc9999.future_option": True}},
  61. {"room": {"org.matrix.msc9999.future_option": True}},
  62. {"room": {"timeline": {"org.matrix.msc9999.future_option": True}}},
  63. ]
  64. for filter in filters:
  65. self.filtering.check_valid_filter(filter)
  66. # Must not raise.
  67. def test_valid_filters(self):
  68. valid_filters = [
  69. {
  70. "room": {
  71. "timeline": {"limit": 20},
  72. "state": {"not_types": ["m.room.member"]},
  73. "ephemeral": {"limit": 0, "not_types": ["*"]},
  74. "include_leave": False,
  75. "rooms": ["!dee:pik-test"],
  76. "not_rooms": ["!gee:pik-test"],
  77. "account_data": {"limit": 0, "types": ["*"]},
  78. }
  79. },
  80. {
  81. "room": {
  82. "state": {
  83. "types": ["m.room.*"],
  84. "not_rooms": ["!726s6s6q:example.com"],
  85. },
  86. "timeline": {
  87. "limit": 10,
  88. "types": ["m.room.message"],
  89. "not_rooms": ["!726s6s6q:example.com"],
  90. "not_senders": ["@spam:example.com"],
  91. "org.matrix.labels": ["#fun"],
  92. "org.matrix.not_labels": ["#work"],
  93. },
  94. "ephemeral": {
  95. "types": [EduTypes.RECEIPT, EduTypes.TYPING],
  96. "not_rooms": ["!726s6s6q:example.com"],
  97. "not_senders": ["@spam:example.com"],
  98. },
  99. },
  100. "presence": {
  101. "types": [EduTypes.PRESENCE],
  102. "not_senders": ["@alice:example.com"],
  103. },
  104. "event_format": "client",
  105. "event_fields": ["type", "content", "sender"],
  106. },
  107. # a single backslash should be permitted (though it is debatable whether
  108. # it should be permitted before anything other than `.`, and what that
  109. # actually means)
  110. #
  111. # (note that event_fields is implemented in
  112. # synapse.events.utils.serialize_event, and so whether this actually works
  113. # is tested elsewhere. We just want to check that it is allowed through the
  114. # filter validation)
  115. {"event_fields": [r"foo\.bar"]},
  116. ]
  117. for filter in valid_filters:
  118. try:
  119. self.filtering.check_valid_filter(filter)
  120. except jsonschema.ValidationError as e:
  121. self.fail(e)
  122. def test_limits_are_applied(self):
  123. # TODO
  124. pass
  125. def test_definition_types_works_with_literals(self):
  126. definition = {"types": ["m.room.message", "org.matrix.foo.bar"]}
  127. event = MockEvent(sender="@foo:bar", type="m.room.message", room_id="!foo:bar")
  128. self.assertTrue(Filter(self.hs, definition)._check(event))
  129. def test_definition_types_works_with_wildcards(self):
  130. definition = {"types": ["m.*", "org.matrix.foo.bar"]}
  131. event = MockEvent(sender="@foo:bar", type="m.room.message", room_id="!foo:bar")
  132. self.assertTrue(Filter(self.hs, definition)._check(event))
  133. def test_definition_types_works_with_unknowns(self):
  134. definition = {"types": ["m.room.message", "org.matrix.foo.bar"]}
  135. event = MockEvent(
  136. sender="@foo:bar",
  137. type="now.for.something.completely.different",
  138. room_id="!foo:bar",
  139. )
  140. self.assertFalse(Filter(self.hs, definition)._check(event))
  141. def test_definition_not_types_works_with_literals(self):
  142. definition = {"not_types": ["m.room.message", "org.matrix.foo.bar"]}
  143. event = MockEvent(sender="@foo:bar", type="m.room.message", room_id="!foo:bar")
  144. self.assertFalse(Filter(self.hs, definition)._check(event))
  145. def test_definition_not_types_works_with_wildcards(self):
  146. definition = {"not_types": ["m.room.message", "org.matrix.*"]}
  147. event = MockEvent(
  148. sender="@foo:bar", type="org.matrix.custom.event", room_id="!foo:bar"
  149. )
  150. self.assertFalse(Filter(self.hs, definition)._check(event))
  151. def test_definition_not_types_works_with_unknowns(self):
  152. definition = {"not_types": ["m.*", "org.*"]}
  153. event = MockEvent(sender="@foo:bar", type="com.nom.nom.nom", room_id="!foo:bar")
  154. self.assertTrue(Filter(self.hs, definition)._check(event))
  155. def test_definition_not_types_takes_priority_over_types(self):
  156. definition = {
  157. "not_types": ["m.*", "org.*"],
  158. "types": ["m.room.message", "m.room.topic"],
  159. }
  160. event = MockEvent(sender="@foo:bar", type="m.room.topic", room_id="!foo:bar")
  161. self.assertFalse(Filter(self.hs, definition)._check(event))
  162. def test_definition_senders_works_with_literals(self):
  163. definition = {"senders": ["@flibble:wibble"]}
  164. event = MockEvent(
  165. sender="@flibble:wibble", type="com.nom.nom.nom", room_id="!foo:bar"
  166. )
  167. self.assertTrue(Filter(self.hs, definition)._check(event))
  168. def test_definition_senders_works_with_unknowns(self):
  169. definition = {"senders": ["@flibble:wibble"]}
  170. event = MockEvent(
  171. sender="@challenger:appears", type="com.nom.nom.nom", room_id="!foo:bar"
  172. )
  173. self.assertFalse(Filter(self.hs, definition)._check(event))
  174. def test_definition_not_senders_works_with_literals(self):
  175. definition = {"not_senders": ["@flibble:wibble"]}
  176. event = MockEvent(
  177. sender="@flibble:wibble", type="com.nom.nom.nom", room_id="!foo:bar"
  178. )
  179. self.assertFalse(Filter(self.hs, definition)._check(event))
  180. def test_definition_not_senders_works_with_unknowns(self):
  181. definition = {"not_senders": ["@flibble:wibble"]}
  182. event = MockEvent(
  183. sender="@challenger:appears", type="com.nom.nom.nom", room_id="!foo:bar"
  184. )
  185. self.assertTrue(Filter(self.hs, definition)._check(event))
  186. def test_definition_not_senders_takes_priority_over_senders(self):
  187. definition = {
  188. "not_senders": ["@misspiggy:muppets"],
  189. "senders": ["@kermit:muppets", "@misspiggy:muppets"],
  190. }
  191. event = MockEvent(
  192. sender="@misspiggy:muppets", type="m.room.topic", room_id="!foo:bar"
  193. )
  194. self.assertFalse(Filter(self.hs, definition)._check(event))
  195. def test_definition_rooms_works_with_literals(self):
  196. definition = {"rooms": ["!secretbase:unknown"]}
  197. event = MockEvent(
  198. sender="@foo:bar", type="m.room.message", room_id="!secretbase:unknown"
  199. )
  200. self.assertTrue(Filter(self.hs, definition)._check(event))
  201. def test_definition_rooms_works_with_unknowns(self):
  202. definition = {"rooms": ["!secretbase:unknown"]}
  203. event = MockEvent(
  204. sender="@foo:bar",
  205. type="m.room.message",
  206. room_id="!anothersecretbase:unknown",
  207. )
  208. self.assertFalse(Filter(self.hs, definition)._check(event))
  209. def test_definition_not_rooms_works_with_literals(self):
  210. definition = {"not_rooms": ["!anothersecretbase:unknown"]}
  211. event = MockEvent(
  212. sender="@foo:bar",
  213. type="m.room.message",
  214. room_id="!anothersecretbase:unknown",
  215. )
  216. self.assertFalse(Filter(self.hs, definition)._check(event))
  217. def test_definition_not_rooms_works_with_unknowns(self):
  218. definition = {"not_rooms": ["!secretbase:unknown"]}
  219. event = MockEvent(
  220. sender="@foo:bar",
  221. type="m.room.message",
  222. room_id="!anothersecretbase:unknown",
  223. )
  224. self.assertTrue(Filter(self.hs, definition)._check(event))
  225. def test_definition_not_rooms_takes_priority_over_rooms(self):
  226. definition = {
  227. "not_rooms": ["!secretbase:unknown"],
  228. "rooms": ["!secretbase:unknown"],
  229. }
  230. event = MockEvent(
  231. sender="@foo:bar", type="m.room.message", room_id="!secretbase:unknown"
  232. )
  233. self.assertFalse(Filter(self.hs, definition)._check(event))
  234. def test_definition_combined_event(self):
  235. definition = {
  236. "not_senders": ["@misspiggy:muppets"],
  237. "senders": ["@kermit:muppets"],
  238. "rooms": ["!stage:unknown"],
  239. "not_rooms": ["!piggyshouse:muppets"],
  240. "types": ["m.room.message", "muppets.kermit.*"],
  241. "not_types": ["muppets.misspiggy.*"],
  242. }
  243. event = MockEvent(
  244. sender="@kermit:muppets", # yup
  245. type="m.room.message", # yup
  246. room_id="!stage:unknown", # yup
  247. )
  248. self.assertTrue(Filter(self.hs, definition)._check(event))
  249. def test_definition_combined_event_bad_sender(self):
  250. definition = {
  251. "not_senders": ["@misspiggy:muppets"],
  252. "senders": ["@kermit:muppets"],
  253. "rooms": ["!stage:unknown"],
  254. "not_rooms": ["!piggyshouse:muppets"],
  255. "types": ["m.room.message", "muppets.kermit.*"],
  256. "not_types": ["muppets.misspiggy.*"],
  257. }
  258. event = MockEvent(
  259. sender="@misspiggy:muppets", # nope
  260. type="m.room.message", # yup
  261. room_id="!stage:unknown", # yup
  262. )
  263. self.assertFalse(Filter(self.hs, definition)._check(event))
  264. def test_definition_combined_event_bad_room(self):
  265. definition = {
  266. "not_senders": ["@misspiggy:muppets"],
  267. "senders": ["@kermit:muppets"],
  268. "rooms": ["!stage:unknown"],
  269. "not_rooms": ["!piggyshouse:muppets"],
  270. "types": ["m.room.message", "muppets.kermit.*"],
  271. "not_types": ["muppets.misspiggy.*"],
  272. }
  273. event = MockEvent(
  274. sender="@kermit:muppets", # yup
  275. type="m.room.message", # yup
  276. room_id="!piggyshouse:muppets", # nope
  277. )
  278. self.assertFalse(Filter(self.hs, definition)._check(event))
  279. def test_definition_combined_event_bad_type(self):
  280. definition = {
  281. "not_senders": ["@misspiggy:muppets"],
  282. "senders": ["@kermit:muppets"],
  283. "rooms": ["!stage:unknown"],
  284. "not_rooms": ["!piggyshouse:muppets"],
  285. "types": ["m.room.message", "muppets.kermit.*"],
  286. "not_types": ["muppets.misspiggy.*"],
  287. }
  288. event = MockEvent(
  289. sender="@kermit:muppets", # yup
  290. type="muppets.misspiggy.kisses", # nope
  291. room_id="!stage:unknown", # yup
  292. )
  293. self.assertFalse(Filter(self.hs, definition)._check(event))
  294. def test_filter_labels(self):
  295. definition = {"org.matrix.labels": ["#fun"]}
  296. event = MockEvent(
  297. sender="@foo:bar",
  298. type="m.room.message",
  299. room_id="!secretbase:unknown",
  300. content={EventContentFields.LABELS: ["#fun"]},
  301. )
  302. self.assertTrue(Filter(self.hs, definition)._check(event))
  303. event = MockEvent(
  304. sender="@foo:bar",
  305. type="m.room.message",
  306. room_id="!secretbase:unknown",
  307. content={EventContentFields.LABELS: ["#notfun"]},
  308. )
  309. self.assertFalse(Filter(self.hs, definition)._check(event))
  310. # check it works with frozendicts too
  311. event = MockEvent(
  312. sender="@foo:bar",
  313. type="m.room.message",
  314. room_id="!secretbase:unknown",
  315. content=frozendict({EventContentFields.LABELS: ["#fun"]}),
  316. )
  317. self.assertTrue(Filter(self.hs, definition)._check(event))
  318. def test_filter_not_labels(self):
  319. definition = {"org.matrix.not_labels": ["#fun"]}
  320. event = MockEvent(
  321. sender="@foo:bar",
  322. type="m.room.message",
  323. room_id="!secretbase:unknown",
  324. content={EventContentFields.LABELS: ["#fun"]},
  325. )
  326. self.assertFalse(Filter(self.hs, definition)._check(event))
  327. event = MockEvent(
  328. sender="@foo:bar",
  329. type="m.room.message",
  330. room_id="!secretbase:unknown",
  331. content={EventContentFields.LABELS: ["#notfun"]},
  332. )
  333. self.assertTrue(Filter(self.hs, definition)._check(event))
  334. @unittest.override_config({"experimental_features": {"msc3874_enabled": True}})
  335. def test_filter_rel_type(self):
  336. definition = {"org.matrix.msc3874.rel_types": ["m.thread"]}
  337. event = MockEvent(
  338. sender="@foo:bar",
  339. type="m.room.message",
  340. room_id="!secretbase:unknown",
  341. content={},
  342. )
  343. self.assertFalse(Filter(self.hs, definition)._check(event))
  344. event = MockEvent(
  345. sender="@foo:bar",
  346. type="m.room.message",
  347. room_id="!secretbase:unknown",
  348. content={"m.relates_to": {"event_id": "$abc", "rel_type": "m.reference"}},
  349. )
  350. self.assertFalse(Filter(self.hs, definition)._check(event))
  351. event = MockEvent(
  352. sender="@foo:bar",
  353. type="m.room.message",
  354. room_id="!secretbase:unknown",
  355. content={"m.relates_to": {"event_id": "$abc", "rel_type": "m.thread"}},
  356. )
  357. self.assertTrue(Filter(self.hs, definition)._check(event))
  358. @unittest.override_config({"experimental_features": {"msc3874_enabled": True}})
  359. def test_filter_not_rel_type(self):
  360. definition = {"org.matrix.msc3874.not_rel_types": ["m.thread"]}
  361. event = MockEvent(
  362. sender="@foo:bar",
  363. type="m.room.message",
  364. room_id="!secretbase:unknown",
  365. content={"m.relates_to": {"event_id": "$abc", "rel_type": "m.thread"}},
  366. )
  367. self.assertFalse(Filter(self.hs, definition)._check(event))
  368. event = MockEvent(
  369. sender="@foo:bar",
  370. type="m.room.message",
  371. room_id="!secretbase:unknown",
  372. content={},
  373. )
  374. self.assertTrue(Filter(self.hs, definition)._check(event))
  375. event = MockEvent(
  376. sender="@foo:bar",
  377. type="m.room.message",
  378. room_id="!secretbase:unknown",
  379. content={"m.relates_to": {"event_id": "$abc", "rel_type": "m.reference"}},
  380. )
  381. self.assertTrue(Filter(self.hs, definition)._check(event))
  382. def test_filter_presence_match(self):
  383. user_filter_json = {"presence": {"types": ["m.*"]}}
  384. filter_id = self.get_success(
  385. self.datastore.add_user_filter(
  386. user_localpart=user_localpart, user_filter=user_filter_json
  387. )
  388. )
  389. event = MockEvent(sender="@foo:bar", type="m.profile")
  390. events = [event]
  391. user_filter = self.get_success(
  392. self.filtering.get_user_filter(
  393. user_localpart=user_localpart, filter_id=filter_id
  394. )
  395. )
  396. results = self.get_success(user_filter.filter_presence(events=events))
  397. self.assertEqual(events, results)
  398. def test_filter_presence_no_match(self):
  399. user_filter_json = {"presence": {"types": ["m.*"]}}
  400. filter_id = self.get_success(
  401. self.datastore.add_user_filter(
  402. user_localpart=user_localpart + "2", user_filter=user_filter_json
  403. )
  404. )
  405. event = MockEvent(
  406. event_id="$asdasd:localhost",
  407. sender="@foo:bar",
  408. type="custom.avatar.3d.crazy",
  409. )
  410. events = [event]
  411. user_filter = self.get_success(
  412. self.filtering.get_user_filter(
  413. user_localpart=user_localpart + "2", filter_id=filter_id
  414. )
  415. )
  416. results = self.get_success(user_filter.filter_presence(events=events))
  417. self.assertEqual([], results)
  418. def test_filter_room_state_match(self):
  419. user_filter_json = {"room": {"state": {"types": ["m.*"]}}}
  420. filter_id = self.get_success(
  421. self.datastore.add_user_filter(
  422. user_localpart=user_localpart, user_filter=user_filter_json
  423. )
  424. )
  425. event = MockEvent(sender="@foo:bar", type="m.room.topic", room_id="!foo:bar")
  426. events = [event]
  427. user_filter = self.get_success(
  428. self.filtering.get_user_filter(
  429. user_localpart=user_localpart, filter_id=filter_id
  430. )
  431. )
  432. results = self.get_success(user_filter.filter_room_state(events=events))
  433. self.assertEqual(events, results)
  434. def test_filter_room_state_no_match(self):
  435. user_filter_json = {"room": {"state": {"types": ["m.*"]}}}
  436. filter_id = self.get_success(
  437. self.datastore.add_user_filter(
  438. user_localpart=user_localpart, user_filter=user_filter_json
  439. )
  440. )
  441. event = MockEvent(
  442. sender="@foo:bar", type="org.matrix.custom.event", room_id="!foo:bar"
  443. )
  444. events = [event]
  445. user_filter = self.get_success(
  446. self.filtering.get_user_filter(
  447. user_localpart=user_localpart, filter_id=filter_id
  448. )
  449. )
  450. results = self.get_success(user_filter.filter_room_state(events))
  451. self.assertEqual([], results)
  452. def test_filter_rooms(self):
  453. definition = {
  454. "rooms": ["!allowed:example.com", "!excluded:example.com"],
  455. "not_rooms": ["!excluded:example.com"],
  456. }
  457. room_ids = [
  458. "!allowed:example.com", # Allowed because in rooms and not in not_rooms.
  459. "!excluded:example.com", # Disallowed because in not_rooms.
  460. "!not_included:example.com", # Disallowed because not in rooms.
  461. ]
  462. filtered_room_ids = list(Filter(self.hs, definition).filter_rooms(room_ids))
  463. self.assertEqual(filtered_room_ids, ["!allowed:example.com"])
  464. def test_filter_relations(self):
  465. events = [
  466. # An event without a relation.
  467. MockEvent(
  468. event_id="$no_relation",
  469. sender="@foo:bar",
  470. type="org.matrix.custom.event",
  471. room_id="!foo:bar",
  472. ),
  473. # An event with a relation.
  474. MockEvent(
  475. event_id="$with_relation",
  476. sender="@foo:bar",
  477. type="org.matrix.custom.event",
  478. room_id="!foo:bar",
  479. ),
  480. # Non-EventBase objects get passed through.
  481. {},
  482. ]
  483. # For the following tests we patch the datastore method (intead of injecting
  484. # events). This is a bit cheeky, but tests the logic of _check_event_relations.
  485. # Filter for a particular sender.
  486. definition = {"related_by_senders": ["@foo:bar"]}
  487. async def events_have_relations(*args, **kwargs):
  488. return ["$with_relation"]
  489. with patch.object(
  490. self.datastore, "events_have_relations", new=events_have_relations
  491. ):
  492. filtered_events = list(
  493. self.get_success(
  494. Filter(self.hs, definition)._check_event_relations(events)
  495. )
  496. )
  497. self.assertEqual(filtered_events, events[1:])
  498. def test_add_filter(self):
  499. user_filter_json = {"room": {"state": {"types": ["m.*"]}}}
  500. filter_id = self.get_success(
  501. self.filtering.add_user_filter(
  502. user_localpart=user_localpart, user_filter=user_filter_json
  503. )
  504. )
  505. self.assertEqual(filter_id, 0)
  506. self.assertEqual(
  507. user_filter_json,
  508. (
  509. self.get_success(
  510. self.datastore.get_user_filter(
  511. user_localpart=user_localpart, filter_id=0
  512. )
  513. )
  514. ),
  515. )
  516. def test_get_filter(self):
  517. user_filter_json = {"room": {"state": {"types": ["m.*"]}}}
  518. filter_id = self.get_success(
  519. self.datastore.add_user_filter(
  520. user_localpart=user_localpart, user_filter=user_filter_json
  521. )
  522. )
  523. filter = self.get_success(
  524. self.filtering.get_user_filter(
  525. user_localpart=user_localpart, filter_id=filter_id
  526. )
  527. )
  528. self.assertEqual(filter.get_filter_json(), user_filter_json)
  529. self.assertRegex(repr(filter), r"<FilterCollection \{.*\}>")