mirror of
https://git.anonymousland.org/anonymousland/synapse-product.git
synced 2025-01-25 15:36:19 -05:00
2365 lines
95 KiB
Python
2365 lines
95 KiB
Python
# Copyright 2015-2021 The Matrix.org Foundation C.I.C.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
import itertools
|
|
import logging
|
|
from typing import TYPE_CHECKING, Any, Dict, FrozenSet, List, Optional, Set, Tuple
|
|
|
|
import attr
|
|
from prometheus_client import Counter
|
|
|
|
from synapse.api.constants import EventTypes, Membership
|
|
from synapse.api.filtering import FilterCollection
|
|
from synapse.api.presence import UserPresenceState
|
|
from synapse.api.room_versions import KNOWN_ROOM_VERSIONS
|
|
from synapse.events import EventBase
|
|
from synapse.handlers.relations import BundledAggregations
|
|
from synapse.logging.context import current_context
|
|
from synapse.logging.opentracing import SynapseTags, log_kv, set_tag, start_active_span
|
|
from synapse.push.clientformat import format_push_rules_for_user
|
|
from synapse.storage.databases.main.event_push_actions import NotifCounts
|
|
from synapse.storage.roommember import MemberSummary
|
|
from synapse.storage.state import StateFilter
|
|
from synapse.types import (
|
|
DeviceListUpdates,
|
|
JsonDict,
|
|
MutableStateMap,
|
|
Requester,
|
|
RoomStreamToken,
|
|
StateMap,
|
|
StreamKeyType,
|
|
StreamToken,
|
|
UserID,
|
|
)
|
|
from synapse.util.async_helpers import concurrently_execute
|
|
from synapse.util.caches.expiringcache import ExpiringCache
|
|
from synapse.util.caches.lrucache import LruCache
|
|
from synapse.util.caches.response_cache import ResponseCache, ResponseCacheContext
|
|
from synapse.util.metrics import Measure, measure_func
|
|
from synapse.visibility import filter_events_for_client
|
|
|
|
if TYPE_CHECKING:
|
|
from synapse.server import HomeServer
|
|
|
|
logger = logging.getLogger(__name__)

# Prometheus counter incremented once for every sync response that carried
# data.  Labels:
#   * `type`: "initial_sync", "full_state_sync" or "incremental_sync"
#   * `lazy_loaded`: "true" / "false", according to whether the request asked
#     for lazy-loaded members.
non_empty_sync_counter = Counter(
    "synapse_handlers_sync_nonempty_total",
    "Count of non empty sync responses. "
    "type is initial_sync/full_state_sync/incremental_sync. "
    "lazy_loaded indicates if lazy loaded members were enabled for that request.",
    ["type", "lazy_loaded"],
)

# Expiry (in milliseconds) of the per-client record of which lazy-loaded
# members have already been sent: 30 minutes.
LAZY_LOADED_MEMBERS_CACHE_MAX_AGE = 30 * 60 * 1000

# How many recently-sent members are remembered per client, so that the same
# lazy-loaded members are not sent again redundantly.
LAZY_LOADED_MEMBERS_CACHE_MAX_SIZE = 100


# Key under which the response to a sync request is cached.
SyncRequestKey = Tuple[Any, ...]
|
|
|
|
|
|
@attr.s(auto_attribs=True, frozen=True, slots=True)
class SyncConfig:
    """Immutable parameters describing one sync request."""

    # The user the sync response is being generated for.
    user: UserID
    # The filters (timeline limit, lazy-loading options, ...) to apply.
    filter_collection: FilterCollection
    # Whether the user is a guest; forwarded to the ephemeral event sources.
    is_guest: bool
    # Key used to look the request up in the sync response cache.
    request_key: SyncRequestKey
    # The requesting device, if any; used for to-device message clean-up and
    # as part of the lazy-loaded members cache key.
    device_id: Optional[str]
|
|
|
|
|
|
@attr.s(auto_attribs=True, frozen=True, slots=True)
class TimelineBatch:
    """The timeline section of a single room in a sync response."""

    # Token marking the start of `events`.
    prev_batch: StreamToken
    # The timeline events themselves.
    events: List[EventBase]
    # Whether the timeline was flagged as limited.
    limited: bool
    # Maps event ID -> bundled aggregations for the events above.  Only
    # calculated when `limited` is true.
    bundled_aggregations: Optional[Dict[str, BundledAggregations]] = None

    def __bool__(self) -> bool:
        """A batch is truthy only when it holds at least one event.

        Callers rely on this to decide whether the room needs to be part of
        the sync result at all.
        """
        return True if self.events else False
|
|
|
|
|
|
# This class is deliberately *not* frozen: the unread count of a room is only
# computed once we know the room has updates, and that check happens after the
# instance has been built, so the count has to be written back afterwards.
# (The notification counts are updated after the fact in the same way.)
@attr.s(auto_attribs=True, slots=True)
class JoinedSyncResult:
    """Sync response data for one room the user is joined to."""

    room_id: str
    timeline: TimelineBatch
    state: StateMap[EventBase]
    ephemeral: List[JsonDict]
    account_data: List[JsonDict]
    unread_notifications: JsonDict
    summary: Optional[JsonDict]
    unread_count: int

    def __bool__(self) -> bool:
        """Truthy when the room has something worth sending.

        Used to tell whether the room needs to be part of the sync result.
        Notification counts are intentionally ignored: if nothing else
        changed, there is no need to send them on their own.
        """
        return any(
            (self.timeline, self.state, self.ephemeral, self.account_data)
        )
|
|
|
|
|
|
@attr.s(auto_attribs=True, frozen=True, slots=True)
class ArchivedSyncResult:
    """Sync response data for one archived room."""

    room_id: str
    timeline: TimelineBatch
    state: StateMap[EventBase]
    account_data: List[JsonDict]

    def __bool__(self) -> bool:
        """Truthy when the room has a timeline, state or account data to send.

        Used to tell whether the room needs to be part of the sync result.
        """
        return any((self.timeline, self.state, self.account_data))
|
|
|
|
|
|
@attr.s(auto_attribs=True, frozen=True, slots=True)
class InvitedSyncResult:
    """Sync response data for one room the user has been invited to."""

    room_id: str
    # The invite event for the room.
    invite: EventBase

    def __bool__(self) -> bool:
        """Always truthy: invites must always be reported to the client."""
        return True
|
|
|
|
|
|
@attr.s(auto_attribs=True, frozen=True, slots=True)
class KnockedSyncResult:
    """Sync response data for one room the user has knocked on."""

    room_id: str
    # The knock event for the room.
    knock: EventBase

    def __bool__(self) -> bool:
        """Always truthy: knocks must always be reported to the client."""
        return True
|
|
|
|
|
|
@attr.s(auto_attribs=True, slots=True)
class _RoomChanges:
    """Which rooms to put in the sync, and which were joined/left since last sync."""

    # Builders for the room entries to include in the sync.
    room_entries: List["RoomSyncResultBuilder"]
    invited: List[InvitedSyncResult]
    knocked: List[KnockedSyncResult]
    # IDs of rooms joined since the last sync.
    newly_joined_rooms: List[str]
    # IDs of rooms left since the last sync.
    newly_left_rooms: List[str]
|
|
|
|
|
|
@attr.s(auto_attribs=True, frozen=True, slots=True)
class SyncResult:
    """The complete result of a sync request.

    Attributes:
        next_batch: Token for the next sync.
        presence: Presence events for the user.
        account_data: Account data events for the user.
        joined: One JoinedSyncResult per joined room.
        invited: One InvitedSyncResult per invited room.
        knocked: One KnockedSyncResult per knocked-on room.
        archived: One ArchivedSyncResult per archived room.
        to_device: Direct messages for the device.
        device_lists: Users whose devices have changed.
        device_one_time_keys_count: Maps algorithm to the number of one-time
            keys held for this device.
        device_unused_fallback_key_types: Key types that have an unused
            fallback key.
    """

    next_batch: StreamToken
    presence: List[UserPresenceState]
    account_data: List[JsonDict]
    joined: List[JoinedSyncResult]
    invited: List[InvitedSyncResult]
    knocked: List[KnockedSyncResult]
    archived: List[ArchivedSyncResult]
    to_device: List[JsonDict]
    device_lists: DeviceListUpdates
    device_one_time_keys_count: JsonDict
    device_unused_fallback_key_types: List[str]

    def __bool__(self) -> bool:
        """Truthy when the result carries any update.

        The notifier uses this while polling to decide whether it has to keep
        waiting for more events.  The key-count fields do not take part in the
        check.
        """
        return any(
            (
                self.presence,
                self.joined,
                self.invited,
                self.knocked,
                self.archived,
                self.account_data,
                self.to_device,
                self.device_lists,
            )
        )
|
|
|
|
|
|
class SyncHandler:
|
|
def __init__(self, hs: "HomeServer"):
    """Collect the homeserver components and caches used while syncing.

    Args:
        hs: The homeserver to pull config, stores and handlers from.
    """
    self.hs_config = hs.config
    self.store = hs.get_datastores().main
    self.notifier = hs.get_notifier()
    self.presence_handler = hs.get_presence_handler()
    self._relations_handler = hs.get_relations_handler()
    self.event_sources = hs.get_event_sources()
    self.clock = hs.get_clock()
    self.state = hs.get_state_handler()
    self.auth_blocking = hs.get_auth_blocking()

    storage_controllers = hs.get_storage_controllers()
    self._storage_controllers = storage_controllers
    self._state_storage_controller = storage_controllers.state

    self._device_handler = hs.get_device_handler()

    # Cache of sync responses, keyed on the request key.
    #
    # TODO: flush cache entries on subsequent sync request.
    #    When the next /sync request arrives (ie, one with the same access
    #    token whose 'since' is our 'next_batch'), the device no longer needs
    #    the cached result, so the entry could be dropped to save memory.
    self.response_cache: ResponseCache[SyncRequestKey] = ResponseCache(
        hs.get_clock(),
        "sync",
        timeout_ms=hs.config.caches.sync_response_cache_duration,
    )

    # (user ID, device ID) -> LruCache(user_id => membership event_id): the
    # lazy-loaded members already sent to each client.
    self.lazy_loaded_members_cache: ExpiringCache[
        Tuple[str, Optional[str]], LruCache[str, str]
    ] = ExpiringCache(
        "lazy_loaded_members_cache",
        self.clock,
        max_len=0,
        expiry_ms=LAZY_LOADED_MEMBERS_CACHE_MAX_AGE,
    )

    self.rooms_to_exclude = hs.config.server.rooms_to_exclude_from_sync
|
|
|
|
async def wait_for_sync_for_user(
    self,
    requester: Requester,
    sync_config: SyncConfig,
    since_token: Optional[StreamToken] = None,
    timeout: int = 0,
    full_state: bool = False,
) -> SyncResult:
    """Return the sync for a client, waiting for new data if there is none yet.

    If new data is already available it is returned straight away; otherwise
    we wait for some to arrive on the server.  Should the timeout expire
    first, an empty sync result is returned.

    Responses are served through the response cache, keyed on
    `sync_config.request_key`.
    """
    user_id = sync_config.user.to_string()

    # If the user is not part of the mau group, check that limits have not
    # been exceeded (if they are not part of the group by this point, it is
    # almost certain that auth_blocking will occur).
    await self.auth_blocking.check_auth_blocking(requester=requester)

    sync_result = await self.response_cache.wrap(
        sync_config.request_key,
        self._wait_for_sync_for_user,
        sync_config,
        since_token,
        timeout,
        full_state,
        cache_context=True,
    )
    logger.debug("Returning sync response for %s", user_id)
    return sync_result
|
|
|
|
async def _wait_for_sync_for_user(
    self,
    sync_config: SyncConfig,
    since_token: Optional[StreamToken],
    timeout: int,
    full_state: bool,
    cache_context: ResponseCacheContext[SyncRequestKey],
) -> SyncResult:
    """Entry point of the machinery that produces a /sync response.

    See https://spec.matrix.org/v1.1/client-server-api/#syncing for full details.

    The high-level bookkeeping happens here:
     - recording the kind of sync in the logging context
     - deleting to_device messages whose delivery has been acknowledged
     - choosing between an instant and a delayed response
     - counting non-empty responses, labelled by lazy-loading

    The body of the response is computed by the next method,
    `current_sync_for_user`.
    """
    if since_token is None:
        sync_type = "initial_sync"
    else:
        sync_type = "full_state_sync" if full_state else "incremental_sync"

    logcontext = current_context()
    if logcontext:
        logcontext.tag = sync_type

    # A since token tells us the device has received every to-device message
    # before that token, so those messages can now be deleted.
    if since_token is not None:
        acked_stream_id = since_token.to_device_key
        num_deleted = await self.store.delete_messages_for_device(
            sync_config.user.to_string(), sync_config.device_id, acked_stream_id
        )
        logger.debug(
            "Deleted %d to-device messages up to %d", num_deleted, acked_stream_id
        )

    respond_immediately = timeout == 0 or since_token is None or full_state
    if respond_immediately:
        # No point in going through notifier.wait_for_events: we return
        # straight away.
        result: SyncResult = await self.current_sync_for_user(
            sync_config, since_token, full_state=full_state
        )
    else:
        # Wait for something to happen, then report it to the user.
        async def current_sync_callback(
            before_token: StreamToken, after_token: StreamToken
        ) -> SyncResult:
            return await self.current_sync_for_user(sync_config, since_token)

        result = await self.notifier.wait_for_events(
            sync_config.user.to_string(),
            timeout,
            current_sync_callback,
            from_token=since_token,
        )

        # When nothing has happened in any of the user's rooms since /sync
        # was called, next_batch equals since_token (the result is generated
        # when wait_for_events is first called and is not regenerated when it
        # times out).
        #
        # Such a result must not be cached: otherwise a client coming back
        # with the same cache token would immediately get the same empty
        # result, causing a tightloop. (#8518)
        if result.next_batch == since_token:
            cache_context.should_cache = False

    if result:
        lazy_loaded = (
            "true" if sync_config.filter_collection.lazy_load_members() else "false"
        )
        non_empty_sync_counter.labels(sync_type, lazy_loaded).inc()

    return result
|
|
|
|
async def current_sync_for_user(
    self,
    sync_config: SyncConfig,
    since_token: Optional[StreamToken] = None,
    full_state: bool = False,
) -> SyncResult:
    """Generate the body of a sync response, as a SyncResult.

    Thin wrapper around `generate_sync_result` that runs it inside an
    opentracing span, logging the since token and tagging the span with
    whether the result was non-empty.  `generate_sync_result` is where the
    real work continues.
    """
    with start_active_span("sync.current_sync_for_user"):
        log_kv({"since_token": since_token})
        result = await self.generate_sync_result(
            sync_config, since_token, full_state
        )

        set_tag(SynapseTags.SYNC_RESULT, bool(result))
        return result
|
|
|
|
async def push_rules_for_user(self, user: UserID) -> Dict[str, Dict[str, list]]:
    """Fetch the user's push rules from the store and format them for the client."""
    raw_rules = await self.store.get_push_rules_for_user(user.to_string())
    return format_push_rules_for_user(user, raw_rules)
|
|
|
|
async def ephemeral_by_room(
    self,
    sync_result_builder: "SyncResultBuilder",
    now_token: StreamToken,
    since_token: Optional[StreamToken] = None,
) -> Tuple[StreamToken, Dict[str, List[JsonDict]]]:
    """Get the ephemeral events for each room the user is in.

    Args:
        sync_result_builder
        now_token: Where the server is currently up to.
        since_token: Where the server was when the client last synced.

    Returns:
        A tuple of the now StreamToken, updated to reflect which typing and
        receipt events are included, and a dict mapping from room_id to the
        list of ephemeral events for that room.
    """
    sync_config = sync_result_builder.sync_config

    with Measure(self.clock, "ephemeral_by_room"):
        room_ids = sync_result_builder.joined_room_ids
        events_by_room: JsonDict = {}

        def _file_under_room(events: Any) -> None:
            # The room_id must not appear in the event sent to the client,
            # but the objects handed back by the event source must not be
            # modified either (they might be cached), so copy each one
            # without that key.
            for event in events:
                room_id = event["room_id"]
                stripped = {
                    key: value for key, value in event.items() if key != "room_id"
                }
                events_by_room.setdefault(room_id, []).append(stripped)

        # Typing notifications.
        typing_events, typing_key = (
            await self.event_sources.sources.typing.get_new_events(
                user=sync_config.user,
                from_key=since_token.typing_key if since_token else 0,
                limit=sync_config.filter_collection.ephemeral_limit(),
                room_ids=room_ids,
                is_guest=sync_config.is_guest,
            )
        )
        now_token = now_token.copy_and_replace(StreamKeyType.TYPING, typing_key)
        _file_under_room(typing_events)

        # Read receipts.
        receipts, receipt_key = (
            await self.event_sources.sources.receipt.get_new_events(
                user=sync_config.user,
                from_key=since_token.receipt_key if since_token else 0,
                limit=sync_config.filter_collection.ephemeral_limit(),
                room_ids=room_ids,
                is_guest=sync_config.is_guest,
            )
        )
        now_token = now_token.copy_and_replace(StreamKeyType.RECEIPT, receipt_key)
        _file_under_room(receipts)

    return now_token, events_by_room
|
|
|
|
async def _load_filtered_recents(
    self,
    room_id: str,
    sync_config: SyncConfig,
    now_token: StreamToken,
    since_token: Optional[StreamToken] = None,
    potential_recents: Optional[List[EventBase]] = None,
    newly_joined_room: bool = False,
) -> TimelineBatch:
    """Build the timeline batch for one room.

    `potential_recents` is run through the request's timeline filter and the
    per-user visibility filter.  If the timeline counts as limited, further
    events are loaded from the store (a bounded number of times) until the
    timeline limit is reached or the store has no more to give, and the
    result is trimmed to the newest `timeline_limit` events.

    Args:
        room_id: The room to build the timeline for.
        sync_config: The sync request's config (user and filters).
        now_token: Upper bound when loading events; also the basis of the
            returned `prev_batch` token.
        since_token: If given, and the room is not newly joined, only events
            after this token's room key are loaded from the store.
        potential_recents: Candidate timeline events already loaded by the
            caller.  `None` forces the timeline to be treated as limited.
        newly_joined_room: Forces the timeline to be treated (and reported)
            as limited.

    Returns:
        The filtered timeline, its `prev_batch` token, whether it is limited
        and, for limited timelines only, the bundled aggregations.
    """
    with Measure(self.clock, "load_filtered_recents"):
        timeline_limit = sync_config.filter_collection.timeline_limit()
        block_all_timeline = (
            sync_config.filter_collection.blocks_all_room_timeline()
        )

        limited = (
            potential_recents is None
            or newly_joined_room
            or timeline_limit < len(potential_recents)
        )

        log_kv({"limited": limited})

        if potential_recents:
            recents = await sync_config.filter_collection.filter_room_timeline(
                potential_recents
            )
            log_kv({"recents_after_sync_filtering": len(recents)})

            # We check if there are any state events, if there are then we pass
            # all current state events to the filter_events function. This is to
            # ensure that we always include current state in the timeline
            current_state_ids: FrozenSet[str] = frozenset()
            if any(e.is_state() for e in recents):
                current_state_ids_map = (
                    await self._state_storage_controller.get_current_state_ids(
                        room_id
                    )
                )
                current_state_ids = frozenset(current_state_ids_map.values())

            recents = await filter_events_for_client(
                self._storage_controllers,
                sync_config.user.to_string(),
                recents,
                always_include_ids=current_state_ids,
            )
            log_kv({"recents_after_visibility_filtering": len(recents)})
        else:
            recents = []

        if not limited or block_all_timeline:
            # Nothing more to load: hand back what we have, with prev_batch
            # pointing just before the first event (or at "now" if empty).
            prev_batch_token = now_token
            if recents:
                room_key = recents[0].internal_metadata.before
                prev_batch_token = now_token.copy_and_replace(
                    StreamKeyType.ROOM, room_key
                )

            return TimelineBatch(
                events=recents, prev_batch=prev_batch_token, limited=False
            )

        # Load more than the limit at a time, since some of what we load may
        # be filtered out again.
        filtering_factor = 2
        load_limit = max(timeline_limit * filtering_factor, 10)
        # Only try a few times per room, so the number of store round-trips
        # stays bounded.
        max_repeat = 5
        room_key = now_token.room_key
        end_key = room_key

        since_key = None
        if since_token and not newly_joined_room:
            since_key = since_token.room_key

        while limited and len(recents) < timeline_limit and max_repeat:
            # If we have a since_key then we are trying to get any events
            # that have happened since `since_key` up to `end_key`, so we
            # can just use `get_room_events_stream_for_room`.
            # Otherwise, we want to return the last N events in the room
            # in topological ordering.
            if since_key:
                events, end_key = await self.store.get_room_events_stream_for_room(
                    room_id,
                    limit=load_limit + 1,
                    from_key=since_key,
                    to_key=end_key,
                )
            else:
                events, end_key = await self.store.get_recent_events_for_room(
                    room_id, limit=load_limit + 1, end_token=end_key
                )

            log_kv({"loaded_recents": len(events)})

            loaded_recents = (
                await sync_config.filter_collection.filter_room_timeline(events)
            )

            log_kv({"loaded_recents_after_sync_filtering": len(loaded_recents)})

            # We check if there are any state events, if there are then we pass
            # all current state events to the filter_events function. This is to
            # ensure that we always include current state in the timeline
            current_state_ids = frozenset()
            if any(e.is_state() for e in loaded_recents):
                # FIXME(faster_joins): We use the partial state here as
                # we don't want to block `/sync` on finishing a lazy join.
                # Is this the correct way of doing it?
                current_state_ids_map = (
                    await self.store.get_partial_current_state_ids(room_id)
                )
                current_state_ids = frozenset(current_state_ids_map.values())

            loaded_recents = await filter_events_for_client(
                self._storage_controllers,
                sync_config.user.to_string(),
                loaded_recents,
                always_include_ids=current_state_ids,
            )

            log_kv({"loaded_recents_after_client_filtering": len(loaded_recents)})

            # The newly loaded events are older, so they go in front.
            loaded_recents.extend(recents)
            recents = loaded_recents

            if len(events) <= load_limit:
                # The store returned fewer events than we asked for, so there
                # is nothing further to load.
                limited = False
                break
            max_repeat -= 1

        if len(recents) > timeline_limit:
            limited = True
            # NB: `recents[-0:]` is the *whole* list, so a zero (or negative)
            # limit has to be special-cased to produce an empty timeline.
            recents = recents[-timeline_limit:] if timeline_limit > 0 else []
            if recents:
                room_key = recents[0].internal_metadata.before

        prev_batch_token = now_token.copy_and_replace(StreamKeyType.ROOM, room_key)

    # Don't bother to bundle aggregations if the timeline is unlimited,
    # as clients will have all the necessary information.
    bundled_aggregations = None
    if limited or newly_joined_room:
        bundled_aggregations = (
            await self._relations_handler.get_bundled_aggregations(
                recents, sync_config.user.to_string()
            )
        )

    return TimelineBatch(
        events=recents,
        prev_batch=prev_batch_token,
        limited=limited or newly_joined_room,
        bundled_aggregations=bundled_aggregations,
    )
|
|
|
|
async def get_state_after_event(
    self, event_id: str, state_filter: Optional[StateFilter] = None
) -> StateMap[str]:
    """Get the room state after the given event.

    Args:
        event_id: event of interest
        state_filter: The state filter used to fetch state from the database.

    Returns:
        The state IDs fetched for the event, with the event itself added in
        if it is a non-rejected state event.
    """
    state_ids = await self._state_storage_controller.get_state_ids_for_event(
        event_id, state_filter=state_filter or StateFilter.all()
    )

    # We look at the event's metadata (get_metadata_for_events) rather than
    # fetching the event itself (get_event) to sidestep an issue with
    # redactions: when `event_id` is a redaction whose original we don't have
    # (possibly because it got purged), get_event refuses to return the
    # redaction event, which isn't terribly helpful here.
    #
    # (To be fair, in that case we could assume it is *not* a state event and
    # so needs no special handling, but pulling the metadata seems cleaner.)
    metadata_by_id = await self.store.get_metadata_for_events([event_id])
    metadata = metadata_by_id[event_id]

    if metadata.state_key is None or metadata.rejection_reason is not None:
        # Not a state event, or a rejected one: the state is unaffected.
        return state_ids

    state_after = dict(state_ids)
    state_after[(metadata.event_type, metadata.state_key)] = event_id
    return state_after
|
|
|
|
async def get_state_at(
    self,
    room_id: str,
    stream_position: StreamToken,
    state_filter: Optional[StateFilter] = None,
) -> StateMap[str]:
    """Get the room state at a particular stream position.

    Args:
        room_id: room for which to get state
        stream_position: point at which to get state
        state_filter: The state filter used to fetch state from the database.

    Returns:
        The state after the last event in the room before the stream
        position, or an empty map if there is no such event.
    """
    # FIXME: This gets the state at the latest event before the stream ordering,
    # which might not be the same as the "current state" of the room at the time
    # of the stream token if there were multiple forward extremities at the time.
    last_event_id = await self.store.get_last_event_in_room_before_stream_ordering(
        room_id,
        end_token=stream_position.room_key,
    )

    if not last_event_id:
        # No events in this room, so presumably no state either.
        #
        # (erikj) This should be rarely hit, but we've had some reports that
        # we get more state down gappy syncs than we should, so let's add
        # some logging.
        logger.info(
            "Failed to find any events in room %s at %s",
            room_id,
            stream_position.room_key,
        )
        return {}

    return await self.get_state_after_event(
        last_event_id, state_filter=state_filter or StateFilter.all()
    )
|
|
|
|
async def compute_summary(
    self,
    room_id: str,
    sync_config: SyncConfig,
    batch: TimelineBatch,
    state: MutableStateMap[EventBase],
    now_token: StreamToken,
) -> Optional[JsonDict]:
    """Work out the room summary block for this room.

    The summary carries the joined and invited member counts and, when the
    room has neither a name nor a canonical alias, the 'hero' members so that
    clients can consistently name the room.  When members are lazy-loaded,
    the membership events needed to describe the heroes are added to `state`.

    Args:
        room_id
        sync_config
        batch: The timeline batch for the room that will be sent to the user.
        state: State as returned by compute_state_delta; may be added to.
        now_token: Token of the end of the current batch.

    Returns:
        The summary, or None if no recent event could be found for the room.
    """
    # FIXME: we could/should get this from room_stats when matthew/stats lands

    # FIXME: this promulgates https://github.com/matrix-org/synapse/issues/3305
    last_events, _ = await self.store.get_recent_event_ids_for_room(
        room_id, end_token=now_token.room_key, limit=1
    )
    if not last_events:
        return None

    last_event = last_events[-1]
    naming_filter = StateFilter.from_types(
        [(EventTypes.Name, ""), (EventTypes.CanonicalAlias, "")]
    )
    state_ids = await self._state_storage_controller.get_state_ids_for_event(
        last_event.event_id,
        state_filter=naming_filter,
    )

    # this is heavily cached, thus: fast.
    details = await self.store.get_room_summary(room_id)

    name_id = state_ids.get((EventTypes.Name, ""))
    canonical_alias_id = state_ids.get((EventTypes.CanonicalAlias, ""))

    empty_ms = MemberSummary([], 0)

    def members_of(membership: str) -> Any:
        # (user_id, event_id) pairs recorded in the summary for a membership.
        return details.get(membership, empty_ms).members

    # TODO: only send these when they change.
    summary: JsonDict = {
        "m.joined_member_count": details.get(Membership.JOIN, empty_ms).count,
        "m.invited_member_count": details.get(Membership.INVITE, empty_ms).count,
    }

    # Heroes are only needed for rooms with neither a name nor a canonical
    # alias.  Empty strings are falsey, so an event that is present but has
    # an empty "name"/"alias" value counts as not set.
    if name_id:
        name_event = await self.store.get_event(name_id, allow_none=True)
        if name_event and name_event.content.get("name"):
            return summary

    if canonical_alias_id:
        alias_event = await self.store.get_event(
            canonical_alias_id, allow_none=True
        )
        if alias_event and alias_event.content.get("alias"):
            return summary

    me = sync_config.user.to_string()

    def others_with(membership: str) -> List[str]:
        # User IDs with the given membership, leaving out the syncing user.
        return [entry[0] for entry in members_of(membership) if entry[0] != me]

    joined_user_ids = others_with(Membership.JOIN)
    invited_user_ids = others_with(Membership.INVITE)
    gone_user_ids = others_with(Membership.LEAVE) + others_with(Membership.BAN)

    # FIXME: order by stream ordering rather than as returned by SQL
    if joined_user_ids or invited_user_ids:
        hero_candidates = joined_user_ids + invited_user_ids
    else:
        hero_candidates = gone_user_ids
    summary["m.heroes"] = sorted(hero_candidates)[0:5]

    if not sync_config.filter_collection.lazy_load_members():
        return summary

    # From here on we make sure the membership events of the heroes get sent.

    # FIXME: only build up a member_ids list for our heroes
    member_ids = {}
    for membership in (
        Membership.JOIN,
        Membership.INVITE,
        Membership.LEAVE,
        Membership.BAN,
    ):
        for user_id, event_id in members_of(membership):
            member_ids[user_id] = event_id

    cache_key = (sync_config.user.to_string(), sync_config.device_id)
    cache = self.get_lazy_loaded_members_cache(cache_key)

    # Members the client should already know about via LL: those whose
    # membership is already in state...
    existing_members = {
        state_key
        for (event_type, state_key) in state.keys()
        if event_type == EventTypes.Member
    }
    # ...plus those whose membership appears in the timeline.
    existing_members.update(
        ev.state_key for ev in batch.events if ev.type == EventTypes.Member
    )

    # Any hero who is neither known to the client nor recorded in the cache
    # with their current membership event needs that event adding to state.
    missing_hero_event_ids = []
    for hero_id in summary["m.heroes"]:
        hero_event_id = member_ids[hero_id]
        if cache.get(hero_id) == hero_event_id:
            continue
        if hero_id in existing_members:
            continue
        missing_hero_event_ids.append(hero_event_id)

    missing_hero_state = await self.store.get_events(missing_hero_event_ids)

    for member_event in missing_hero_state.values():
        cache.set(member_event.state_key, member_event.event_id)
        state[(EventTypes.Member, member_event.state_key)] = member_event

    return summary
|
|
|
|
def get_lazy_loaded_members_cache(
    self, cache_key: Tuple[str, Optional[str]]
) -> LruCache[str, str]:
    """Return the lazy-loaded members cache for `cache_key`, creating it if needed.

    Args:
        cache_key: (user ID, device ID) of the client the cache belongs to.

    Returns:
        The client's LruCache; a newly created one is also stored in
        `self.lazy_loaded_members_cache`.
    """
    existing: Optional[LruCache[str, str]] = self.lazy_loaded_members_cache.get(
        cache_key
    )
    if existing is not None:
        logger.debug("found LruCache for %r", cache_key)
        return existing

    logger.debug("creating LruCache for %r", cache_key)
    created: LruCache[str, str] = LruCache(LAZY_LOADED_MEMBERS_CACHE_MAX_SIZE)
    self.lazy_loaded_members_cache[cache_key] = created
    return created
|
|
|
|
async def compute_state_delta(
    self,
    room_id: str,
    batch: TimelineBatch,
    sync_config: SyncConfig,
    since_token: Optional[StreamToken],
    now_token: StreamToken,
    full_state: bool,
) -> MutableStateMap[EventBase]:
    """Works out the difference in state between the start of the timeline
    and the previous sync.

    Three cases are handled, in this order: a full-state sync (`full_state`),
    a "gappy" incremental sync (`batch.limited`), and a non-gappy incremental
    sync. When the filter asks for lazy-loaded members without redundant
    members, the result is additionally de-duplicated against the per-device
    lazy-loaded-members cache, which is updated as a side effect.

    Args:
        room_id: The room to compute the state delta for.
        batch: The timeline batch for the room that will be sent to the user.
        sync_config: The sync configuration; its filter collection decides
            lazy-loading and the final state filtering.
        since_token: Token of the end of the previous batch. May be None.
        now_token: Token of the end of the current batch.
        full_state: Whether to force returning the full state.

    Returns:
        A map from `(event type, state key)` to the state event, containing
        the events that pass `filter_room_state` and are not of type
        `EventTypes.Aliases`.
    """
    # TODO(mjark) Check if the state events were received by the server
    # after the previous sync, since we need to include those state
    # updates even if they occurred logically before the previous event.
    # TODO(mjark) Check for new redactions in the state events.

    with Measure(self.clock, "compute_state_delta"):

        members_to_fetch = None

        lazy_load_members = sync_config.filter_collection.lazy_load_members()
        include_redundant_members = (
            sync_config.filter_collection.include_redundant_members()
        )

        if lazy_load_members:
            # We only request state for the members needed to display the
            # timeline:

            members_to_fetch = {
                event.sender  # FIXME: we also care about invite targets etc.
                for event in batch.events
            }

            if full_state:
                # always make sure we LL ourselves so we know we're in the room
                # (if we are) to fix https://github.com/vector-im/riot-web/issues/7209
                # We only need apply this on full state syncs given we disabled
                # LL for incr syncs in #3840.
                members_to_fetch.add(sync_config.user.to_string())

            state_filter = StateFilter.from_lazy_load_member_list(members_to_fetch)
        else:
            state_filter = StateFilter.all()

        # State events that appear in the timeline itself, keyed by
        # (type, state_key) and mapped to their event IDs.
        timeline_state = {
            (event.type, event.state_key): event.event_id
            for event in batch.events
            if event.is_state()
        }

        if full_state:
            # Full-state sync: there is no previous sync to diff against, so
            # `previous` is passed as an empty map below.
            if batch:
                current_state_ids = (
                    await self._state_storage_controller.get_state_ids_for_event(
                        batch.events[-1].event_id, state_filter=state_filter
                    )
                )

                state_ids = (
                    await self._state_storage_controller.get_state_ids_for_event(
                        batch.events[0].event_id, state_filter=state_filter
                    )
                )

            else:
                current_state_ids = await self.get_state_at(
                    room_id, stream_position=now_token, state_filter=state_filter
                )

                state_ids = current_state_ids

            state_ids = _calculate_state(
                timeline_contains=timeline_state,
                timeline_start=state_ids,
                previous={},
                current=current_state_ids,
                lazy_load_members=lazy_load_members,
            )
        elif batch.limited:
            if batch:
                state_at_timeline_start = (
                    await self._state_storage_controller.get_state_ids_for_event(
                        batch.events[0].event_id, state_filter=state_filter
                    )
                )
            else:
                # We can get here if the user has ignored the senders of all
                # the recent events.
                state_at_timeline_start = await self.get_state_at(
                    room_id, stream_position=now_token, state_filter=state_filter
                )

            # for now, we disable LL for gappy syncs - see
            # https://github.com/vector-im/riot-web/issues/7211#issuecomment-419976346
            # N.B. this slows down incr syncs as we are now processing way
            # more state in the server than if we were LLing.
            #
            # We still have to filter timeline_start to LL entries (above) in order
            # for _calculate_state's LL logic to work, as we have to include LL
            # members for timeline senders in case they weren't loaded in the initial
            # sync. We do this (counterintuitively) by filtering timeline_start
            # members to just be ones which were timeline senders, which then ensures
            # all of the rest get included in the state block (if we need to know
            # about them).
            state_filter = StateFilter.all()

            # If this is an initial sync then full_state should be set, and
            # that case is handled above. We assert here to ensure that this
            # is indeed the case.
            assert since_token is not None
            state_at_previous_sync = await self.get_state_at(
                room_id, stream_position=since_token, state_filter=state_filter
            )

            if batch:
                current_state_ids = (
                    await self._state_storage_controller.get_state_ids_for_event(
                        batch.events[-1].event_id, state_filter=state_filter
                    )
                )
            else:
                # It's not clear how we get here, but empirically we do
                # (#5407). Logging has been added elsewhere to try and
                # figure out where this state comes from.
                current_state_ids = await self.get_state_at(
                    room_id, stream_position=now_token, state_filter=state_filter
                )

            state_ids = _calculate_state(
                timeline_contains=timeline_state,
                timeline_start=state_at_timeline_start,
                previous=state_at_previous_sync,
                current=current_state_ids,
                # we have to include LL members in case LL initial sync missed them
                lazy_load_members=lazy_load_members,
            )
        else:
            state_ids = {}
            if lazy_load_members:
                if members_to_fetch and batch.events:
                    # We're returning an incremental sync, with no
                    # "gap" since the previous sync, so normally there would be
                    # no state to return.
                    # But we're lazy-loading, so the client might need some more
                    # member events to understand the events in this timeline.
                    # So we fish out all the member events corresponding to the
                    # timeline here, and then dedupe any redundant ones below.

                    state_ids = await self._state_storage_controller.get_state_ids_for_event(
                        batch.events[0].event_id,
                        # we only want members!
                        state_filter=StateFilter.from_types(
                            (EventTypes.Member, member)
                            for member in members_to_fetch
                        ),
                    )

        if lazy_load_members and not include_redundant_members:
            # The cache is keyed per (user, device) and maps a member's
            # state key to the membership event ID recorded for it.
            cache_key = (sync_config.user.to_string(), sync_config.device_id)
            cache = self.get_lazy_loaded_members_cache(cache_key)

            # if it's a new sync sequence, then assume the client has had
            # amnesia and doesn't want any recent lazy-loaded members
            # de-duplicated.
            if since_token is None:
                logger.debug("clearing LruCache for %r", cache_key)
                cache.clear()
            else:
                # only send members which aren't in our LruCache (either
                # because they're new to this client or have been pushed out
                # of the cache)
                logger.debug("filtering state from %r...", state_ids)
                state_ids = {
                    t: event_id
                    for t, event_id in state_ids.items()
                    if cache.get(t[1]) != event_id
                }
                logger.debug("...to %r", state_ids)

            # add any member IDs we are about to send into our LruCache
            for t, event_id in itertools.chain(
                state_ids.items(), timeline_state.items()
            ):
                if t[0] == EventTypes.Member:
                    cache.set(t[1], event_id)

        # Resolve the selected event IDs into full events (skipping the
        # lookup entirely when nothing was selected).
        state: Dict[str, EventBase] = {}
        if state_ids:
            state = await self.store.get_events(list(state_ids.values()))

    return {
        (e.type, e.state_key): e
        for e in await sync_config.filter_collection.filter_room_state(
            list(state.values())
        )
        if e.type != EventTypes.Aliases  # until MSC2261 or alternative solution
    }
|
|
|
|
async def unread_notifs_for_room_id(
    self, room_id: str, sync_config: SyncConfig
) -> NotifCounts:
    """Look up the syncing user's unread push-action counts for one room.

    Args:
        room_id: The room to fetch counts for.
        sync_config: The sync configuration; only its `user` is used.

    Returns:
        Whatever the store's
        `get_unread_event_push_actions_by_room_for_user` yields for the
        room and user.
    """
    with Measure(self.clock, "unread_notifs_for_room_id"):
        fetch_counts = self.store.get_unread_event_push_actions_by_room_for_user
        counts = await fetch_counts(room_id, sync_config.user.to_string())
    return counts
|
|
|
|
async def generate_sync_result(
    self,
    sync_config: SyncConfig,
    since_token: Optional[StreamToken] = None,
    full_state: bool = False,
) -> SyncResult:
    """Builds the response body of a sync request.

    The body is assembled piecewise in a `SyncResultBuilder`, which is handed
    as a mutable ("inout") argument to the `_generate_sync_entry_for_*`
    helpers; each helper fetches its part of the data and stores it on the
    builder. Once every helper has run, the builder's contents are copied into
    a fresh `SyncResult` to signal that the calculation is complete. See also
    https://spec.matrix.org/v1.1/client-server-api/#get_matrixclientv3sync

    Args:
        sync_config: Configuration of the sync request (user, device, filter).
        since_token: Token the client is syncing from, or None.
        full_state: Passed through to the `SyncResultBuilder`.

    Returns:
        The completed `SyncResult`, whose `next_batch` is the builder's
        (possibly updated) `now_token`.

    Raises:
        NotImplementedError: if the store reports an application service for
            the syncing user.
    """
    # NB: The now_token gets changed by some of the generate_sync_* methods,
    # this is due to some of the underlying streams not supporting the ability
    # to query up to a given point.
    # Always use the `now_token` in `SyncResultBuilder`
    now_token = self.event_sources.get_current_token()
    log_kv({"now_token": now_token})

    logger.debug(
        "Calculating sync response for %r between %s and %s",
        sync_config.user,
        since_token,
        now_token,
    )

    user_id = sync_config.user.to_string()
    if self.store.get_app_service_by_user_id(user_id):
        # We no longer support AS users using /sync directly.
        # See https://github.com/matrix-org/matrix-doc/issues/1144
        raise NotImplementedError()

    joined_room_ids = await self.get_rooms_for_user_at(user_id, now_token.room_key)
    builder = SyncResultBuilder(
        sync_config,
        full_state,
        since_token=since_token,
        now_token=now_token,
        joined_room_ids=joined_room_ids,
    )

    logger.debug("Fetching account data")
    account_data_by_room = await self._generate_sync_entry_for_account_data(builder)

    logger.debug("Fetching room data")
    (
        newly_joined_rooms,
        newly_joined_or_invited_or_knocked_users,
        newly_left_rooms,
        newly_left_users,
    ) = await self._generate_sync_entry_for_rooms(builder, account_data_by_room)

    # Presence is skipped when this sync has no since token and the filter
    # blocks all presence, or when presence is disabled in the server config.
    skip_presence = (
        since_token is None and sync_config.filter_collection.blocks_all_presence()
    )
    if self.hs_config.server.use_presence and not skip_presence:
        logger.debug("Fetching presence data")
        await self._generate_sync_entry_for_presence(
            builder,
            newly_joined_rooms,
            newly_joined_or_invited_or_knocked_users,
        )

    logger.debug("Fetching to-device data")
    await self._generate_sync_entry_for_to_device(builder)

    device_lists = await self._generate_sync_entry_for_device_list(
        builder,
        newly_joined_rooms=newly_joined_rooms,
        newly_joined_or_invited_or_knocked_users=newly_joined_or_invited_or_knocked_users,
        newly_left_rooms=newly_left_rooms,
        newly_left_users=newly_left_users,
    )

    logger.debug("Fetching OTK data")
    device_id = sync_config.device_id
    one_time_key_counts: JsonDict = {}
    unused_fallback_key_types: List[str] = []
    if device_id:
        # TODO: We should have a way to let clients differentiate between the states of:
        #   * no change in OTK count since the provided since token
        #   * the server has zero OTKs left for this device
        #  Spec issue: https://github.com/matrix-org/matrix-doc/issues/3298
        one_time_key_counts = await self.store.count_e2e_one_time_keys(
            user_id, device_id
        )
        unused_fallback_key_types = (
            await self.store.get_e2e_unused_fallback_key_types(user_id, device_id)
        )

    # debug for https://github.com/matrix-org/synapse/issues/9424
    num_events = sum(
        len(joined_room.timeline.events) for joined_room in builder.joined
    )
    log_kv(
        {
            "joined_rooms_in_result": len(builder.joined),
            "events_in_result": num_events,
        }
    )

    logger.debug("Sync response calculation complete")
    return SyncResult(
        presence=builder.presence,
        account_data=builder.account_data,
        joined=builder.joined,
        invited=builder.invited,
        knocked=builder.knocked,
        archived=builder.archived,
        to_device=builder.to_device,
        device_lists=device_lists,
        device_one_time_keys_count=one_time_key_counts,
        device_unused_fallback_key_types=unused_fallback_key_types,
        next_batch=builder.now_token,
    )
|
|
|
|
@measure_func("_generate_sync_entry_for_device_list")
async def _generate_sync_entry_for_device_list(
    self,
    sync_result_builder: "SyncResultBuilder",
    newly_joined_rooms: Set[str],
    newly_joined_or_invited_or_knocked_users: Set[str],
    newly_left_rooms: Set[str],
    newly_left_users: Set[str],
) -> DeviceListUpdates:
    """Builds the DeviceListUpdates section of the sync response.

    Args:
        sync_result_builder: The builder for the sync in progress; read only.
        newly_joined_rooms: Set of rooms user has joined since previous sync
        newly_joined_or_invited_or_knocked_users: Set of users that have joined,
            been invited to a room or are knocking on a room since
            previous sync.
        newly_left_rooms: Set of rooms user has left since previous sync
        newly_left_users: Set of users that have left a room we're in since
            previous sync

    Returns:
        A `DeviceListUpdates` whose `changed` holds the users the client should
        refetch device keys for and whose `left` holds the users no longer
        tracked. An empty `DeviceListUpdates()` is returned when there is no
        since token or its `device_list_key` is falsy.
    """
    user_id = sync_result_builder.sync_config.user.to_string()
    since_token = sync_result_builder.since_token

    # Both user sets get mutated below, so work on private copies rather than
    # assuming the caller is finished with its own.
    joined_or_invited = set(newly_joined_or_invited_or_knocked_users)
    departed = set(newly_left_users)

    if not (since_token and since_token.device_list_key):
        return DeviceListUpdates()

    # We want to figure out what user IDs the client should refetch
    # device keys for, and which users we aren't going to track changes
    # for anymore.
    #
    # For the first step we check:
    #   a. if any users we share a room with have updated their devices,
    #      and
    #   b. we also check if we've joined any new rooms, or if a user has
    #      joined a room we're in.
    #
    # For the second step we just find any users we no longer share a
    # room with by looking at all users that have left a room plus users
    # that were in a room we've left.
    joined_rooms = sync_result_builder.joined_room_ids

    # Step 1a, check for changes in devices of users we share a room with.
    #
    # We do this in two different ways depending on what we have cached.
    # If we already have a list of all the users that have changed since
    # the last sync then it's likely more efficient to compare the rooms
    # they're in with the rooms the syncing user is in.
    #
    # If we don't have that info cached then we get all the users that
    # share a room with our user and check if those users have changed.
    cached_changes = self.store.get_cached_device_list_changes(
        since_token.device_list_key
    )
    if cached_changes is None:
        changed = await self._device_handler.get_device_changes_in_shared_rooms(
            user_id,
            joined_rooms,
            from_token=since_token,
        )
    else:
        rooms_by_changed_user = (
            await self.store.get_rooms_for_users_with_stream_ordering(
                cached_changes
            )
        )
        # Keep a changed user if they share any room with the syncing user,
        # or if they *are* the syncing user (as we always want to include
        # device list updates of their own devices).
        changed = {
            changed_user_id
            for changed_user_id, entries in rooms_by_changed_user.items()
            if user_id == changed_user_id
            or any(e.room_id in joined_rooms for e in entries)
        }

    # Step 1b, check for newly joined rooms
    for room_id in newly_joined_rooms:
        room_members = await self.store.get_users_in_room(room_id)
        joined_or_invited.update(room_members)

    # TODO: Check that these users are actually new, i.e. either they
    # weren't in the previous sync *or* they left and rejoined.
    changed.update(joined_or_invited)

    signature_changes = await self.store.get_users_whose_signatures_changed(
        user_id, since_token.device_list_key
    )
    changed.update(signature_changes)

    # Now find users that we no longer track
    for room_id in newly_left_rooms:
        room_members = await self.store.get_users_in_room(room_id)
        departed.update(room_members)

    # Remove any users that we still share a room with.
    rooms_by_departed_user = (
        await self.store.get_rooms_for_users_with_stream_ordering(departed)
    )
    departed.difference_update(
        {
            departed_user_id
            for departed_user_id, entries in rooms_by_departed_user.items()
            if any(e.room_id in joined_rooms for e in entries)
        }
    )

    return DeviceListUpdates(changed=changed, left=departed)
|
|
|
|
async def _generate_sync_entry_for_to_device(
    self, sync_result_builder: "SyncResultBuilder"
) -> None:
    """Generates the to-device portion of the sync response. Populates
    `sync_result_builder` with the result.

    When messages are fetched, the builder's `now_token` is also replaced so
    that its to-device key is the stream ID returned by the store.

    Args:
        sync_result_builder: The builder for the sync in progress; its
            `to_device` (and possibly `now_token`) attribute is written.
    """
    sync_config = sync_result_builder.sync_config
    user_id = sync_config.user.to_string()
    device_id = sync_config.device_id
    now_token = sync_result_builder.now_token

    previous_token = sync_result_builder.since_token
    since_stream_id = (
        0 if previous_token is None else int(previous_token.to_device_key)
    )

    # Nothing to fetch without a device, or when the stream has not advanced.
    if device_id is None or since_stream_id == int(now_token.to_device_key):
        sync_result_builder.to_device = []
        return

    messages, stream_id = await self.store.get_messages_for_device(
        user_id, device_id, since_stream_id, now_token.to_device_key
    )

    for message in messages:
        # We pop here as we shouldn't be sending the message ID down
        # `/sync`
        message_id = message.pop("message_id", None)
        if message_id:
            set_tag(SynapseTags.TO_DEVICE_MESSAGE_ID, message_id)

    logger.debug(
        "Returning %d to-device messages between %d and %d (current token: %d)",
        len(messages),
        since_stream_id,
        stream_id,
        now_token.to_device_key,
    )
    sync_result_builder.now_token = now_token.copy_and_replace(
        StreamKeyType.TO_DEVICE, stream_id
    )
    sync_result_builder.to_device = messages
|
|
|
|
async def _generate_sync_entry_for_account_data(
    self, sync_result_builder: "SyncResultBuilder"
) -> Dict[str, Dict[str, JsonDict]]:
    """Generates the account data portion of the sync response.

    Account data (called "Client Config" in the spec) can be set either
    globally or for a specific room. It consists of a list of events which
    accumulate state, much like a room.

    Global account data is filtered and written to `sync_result_builder`;
    per-room account data is handed back to the caller, which writes it to the
    builder later on a room-by-room basis.

    For an incremental sync (a since token and no `full_state`) only updated
    account data is fetched, and push rules are included only if they changed.
    Otherwise all account data and the push rules are included.

    Args:
        sync_result_builder: The builder for the sync in progress; its
            `account_data` attribute is written.

    Returns:
        A dictionary whose keys (room ids) map to the per room account data for
        that room.
    """
    sync_config = sync_result_builder.sync_config
    user_id = sync_config.user.to_string()
    since_token = sync_result_builder.since_token

    if since_token and not sync_result_builder.full_state:
        (
            global_account_data,
            account_data_by_room,
        ) = await self.store.get_updated_account_data_for_user(
            user_id, since_token.account_data_key
        )
        include_push_rules = await self.store.have_push_rules_changed_for_user(
            user_id, int(since_token.push_rules_key)
        )
    else:
        (
            global_account_data,
            account_data_by_room,
        ) = await self.store.get_account_data_for_user(user_id)
        include_push_rules = True

    if include_push_rules:
        global_account_data["m.push_rules"] = await self.push_rules_for_user(
            sync_config.user
        )

    # Reshape {type: content} into the event-like dicts the filter takes.
    global_events = [
        {"type": account_data_type, "content": content}
        for account_data_type, content in global_account_data.items()
    ]
    sync_result_builder.account_data = (
        await sync_config.filter_collection.filter_account_data(global_events)
    )

    return account_data_by_room
|
|
|
|
async def _generate_sync_entry_for_presence(
    self,
    sync_result_builder: "SyncResultBuilder",
    newly_joined_rooms: Set[str],
    newly_joined_or_invited_users: Set[str],
) -> None:
    """Generates the presence portion of the sync response. Populates the
    `sync_result_builder` with the result.

    The builder's `now_token` is also replaced so that its presence key is the
    one returned by the presence event source.

    Args:
        sync_result_builder: The builder for the sync in progress; its
            `presence` and `now_token` attributes are written.
        newly_joined_rooms: Set of rooms that the user has joined since
            the last sync (or empty if an initial sync)
        newly_joined_or_invited_users: Set of users that have joined or
            been invited to rooms since the last sync (or empty if an
            initial sync)
    """
    sync_config = sync_result_builder.sync_config
    user = sync_config.user
    now_token = sync_result_builder.now_token
    since_token = sync_result_builder.since_token

    presence_source = self.event_sources.sources.presence

    # Only an incremental sync resumes from the previous presence key, and
    # only then are offline states requested.
    if since_token and not sync_result_builder.full_state:
        from_key, include_offline = since_token.presence_key, True
    else:
        from_key, include_offline = None, False

    presence, presence_key = await presence_source.get_new_events(
        user=user,
        from_key=from_key,
        is_guest=sync_config.is_guest,
        include_offline=include_offline,
    )
    assert presence_key
    sync_result_builder.now_token = now_token.copy_and_replace(
        StreamKeyType.PRESENCE, presence_key
    )

    # Also fetch current presence for users we have newly come to share a
    # room with, excluding the syncing user.
    extra_users_ids = set(newly_joined_or_invited_users)
    for room_id in newly_joined_rooms:
        room_members = await self.store.get_users_in_room(room_id)
        extra_users_ids.update(room_members)
    extra_users_ids.discard(user.to_string())

    if extra_users_ids:
        extra_states = await self.presence_handler.get_states(extra_users_ids)
        presence.extend(extra_states)

    # Deduplicate the presence entries so that there's at most one per user
    # (for a repeated user the later entry wins).
    latest_by_user = {p.user_id: p for p in presence}
    deduplicated = list(latest_by_user.values())

    sync_result_builder.presence = (
        await sync_config.filter_collection.filter_presence(deduplicated)
    )
|
|
|
|
async def _generate_sync_entry_for_rooms(
    self,
    sync_result_builder: "SyncResultBuilder",
    account_data_by_room: Dict[str, Dict[str, JsonDict]],
) -> Tuple[Set[str], Set[str], Set[str], Set[str]]:
    """Generates the rooms portion of the sync response. Populates the
    `sync_result_builder` with the result.

    In the response that reaches the client, rooms are divided into four
    categories: `invite`, `join`, `knock`, `leave`. These aren't the same as
    the four sets returned by this function.

    Args:
        sync_result_builder: The builder for the sync in progress; mutated.
        account_data_by_room: Dictionary of per room account data

    Returns:
        A 4-tuple describing rooms the user has joined or left, and users
        who've joined or left any rooms the user is in. This gets used later in
        `_generate_sync_entry_for_device_list`.

        Its entries are:
        - newly_joined_rooms
        - newly_joined_or_invited_or_knocked_users
        - newly_left_rooms
        - newly_left_users

        All four are empty sets when the sync is found to be a no-op.
    """
    since_token = sync_result_builder.since_token
    user_id = sync_result_builder.sync_config.user.to_string()

    # 1. Start by fetching all ephemeral events in rooms we've joined (if required).
    skip_ephemeral = (
        since_token is None
        and sync_result_builder.sync_config.filter_collection.blocks_all_room_ephemeral()
    )

    ephemeral_by_room: Dict[str, List[JsonDict]] = {}
    if not skip_ephemeral:
        now_token, ephemeral_by_room = await self.ephemeral_by_room(
            sync_result_builder,
            now_token=sync_result_builder.now_token,
            since_token=sync_result_builder.since_token,
        )
        sync_result_builder.now_token = now_token

    # 2. We check up front if anything has changed, if it hasn't then there is
    # no point in going further.
    if (
        not sync_result_builder.full_state
        and since_token
        and not ephemeral_by_room
        and not account_data_by_room
    ):
        have_changed = await self._have_rooms_changed(sync_result_builder)
        log_kv({"rooms_have_changed": have_changed})
        if not have_changed:
            tags_by_room = await self.store.get_updated_tags(
                user_id, since_token.account_data_key
            )
            if not tags_by_room:
                logger.debug("no-oping sync")
                return set(), set(), set(), set()

    # 3. Work out which rooms need reporting in the sync response.
    ignored_users = await self.store.ignored_users(user_id)
    if since_token:
        room_changes = await self._get_rooms_changed(
            sync_result_builder, ignored_users
        )
        tags_by_room = await self.store.get_updated_tags(
            user_id, since_token.account_data_key
        )
    else:
        room_changes = await self._get_all_rooms(sync_result_builder, ignored_users)
        tags_by_room = await self.store.get_tags_for_user(user_id)

    log_kv({"rooms_changed": len(room_changes.room_entries)})

    room_entries = room_changes.room_entries
    invited = room_changes.invited
    knocked = room_changes.knocked
    newly_joined_rooms = room_changes.newly_joined_rooms
    newly_left_rooms = room_changes.newly_left_rooms

    # 4. We need to apply further processing to `room_entries` (rooms considered
    # joined or archived).
    async def handle_room_entries(room_entry: "RoomSyncResultBuilder") -> None:
        entry_room_id = room_entry.room_id
        logger.debug("Generating room entry for %s", entry_room_id)
        await self._generate_room_entry(
            sync_result_builder,
            room_entry,
            ephemeral=ephemeral_by_room.get(entry_room_id, []),
            tags=tags_by_room.get(entry_room_id),
            account_data=account_data_by_room.get(entry_room_id, {}),
            always_include=sync_result_builder.full_state,
        )
        logger.debug("Generated room entry for %s", entry_room_id)

    with start_active_span("sync.generate_room_entries"):
        await concurrently_execute(handle_room_entries, room_entries, 10)

    sync_result_builder.invited.extend(invited)
    sync_result_builder.knocked.extend(knocked)

    # 5. Work out which users have joined or left rooms we're in. We use this
    # to build the device_list part of the sync response in
    # `_generate_sync_entry_for_device_list`.
    users_joined, users_left = sync_result_builder.calculate_user_changes()

    return (
        set(newly_joined_rooms),
        users_joined,
        set(newly_left_rooms),
        users_left,
    )
|
|
|
|
async def _have_rooms_changed(
    self, sync_result_builder: "SyncResultBuilder"
) -> bool:
    """Reports whether there may be any new events that should be sent down
    the sync.

    Does not modify the `sync_result_builder`. The builder must carry a since
    token (this is asserted).

    Args:
        sync_result_builder: The builder for the sync in progress; read only.

    Returns:
        True if the syncing user has any membership changes between the since
        token and the now token, or if the store reports that any of the
        builder's joined rooms has changed since the since token's room
        stream position. False otherwise.
    """
    since_token = sync_result_builder.since_token
    assert since_token

    # Any membership change events that have happened to the user requesting
    # the sync mean there is something to send.
    membership_changes = await self.store.get_membership_changes_for_user(
        sync_result_builder.sync_config.user.to_string(),
        since_token.room_key,
        sync_result_builder.now_token.room_key,
    )
    if membership_changes:
        return True

    stream_id = since_token.room_key.stream
    return any(
        self.store.has_room_changed_since(room_id, stream_id)
        for room_id in sync_result_builder.joined_room_ids
    )
|
|
|
|
async def _get_rooms_changed(
    self,
    sync_result_builder: "SyncResultBuilder",
    ignored_users: FrozenSet[str],
) -> _RoomChanges:
    """Determine the changes in rooms to report to the user.

    This function is a first pass at generating the rooms part of the sync response.
    It determines which rooms have changed during the sync period, and categorises
    them into four buckets: "knock", "invite", "join" and "leave". It also excludes
    from that list any room that appears in the list of rooms to exclude from sync
    results in the server configuration.

    1. Finds all membership changes for the user in the sync period (from
       `since_token` up to `now_token`).
    2. Uses those to place the room in one of the four categories above.
    3. Builds a `_RoomChanges` struct to record this, and return that struct.

    For rooms classified as "knock", "invite" or "leave", we just need to report
    a single membership event in the eventual /sync response. For "join" we need
    to fetch additional non-membership events, e.g. messages in the room. That is
    more complicated, so instead we report an intermediary `RoomSyncResultBuilder`
    struct, and leave the additional work to `_generate_room_entry`.

    The sync_result_builder is not modified by this function.

    Args:
        sync_result_builder: Read for its `sync_config`, `since_token` (which
            must be set; this is asserted), `now_token` and `joined_room_ids`.
        ignored_users: Invites whose sender is in this set are not reported.

    Returns:
        A `_RoomChanges` built from, in order: the room entries (archived and
        joined), the invites, the knocks, the newly joined room IDs and the
        newly left room IDs.
    """
    user_id = sync_result_builder.sync_config.user.to_string()
    since_token = sync_result_builder.since_token
    now_token = sync_result_builder.now_token
    sync_config = sync_result_builder.sync_config

    assert since_token

    # TODO: we've already called this function and ran this query in
    #       _have_rooms_changed. We could keep the results in memory to avoid a
    #       second query, at the cost of more complicated source code.
    membership_change_events = await self.store.get_membership_changes_for_user(
        user_id, since_token.room_key, now_token.room_key, self.rooms_to_exclude
    )

    # Group the membership events by room, keeping the order in which the store
    # returned them within each room.
    mem_change_events_by_room_id: Dict[str, List[EventBase]] = {}
    for event in membership_change_events:
        mem_change_events_by_room_id.setdefault(event.room_id, []).append(event)

    newly_joined_rooms: List[str] = []
    newly_left_rooms: List[str] = []
    room_entries: List[RoomSyncResultBuilder] = []
    invited: List[InvitedSyncResult] = []
    knocked: List[KnockedSyncResult] = []
    for room_id, events in mem_change_events_by_room_id.items():
        # The body of this loop will add this room to at least one of the five lists
        # above. Things get messy if you've e.g. joined, left, joined then left the
        # room all in the same sync period.
        logger.debug(
            "Membership changes in %s: [%s]",
            room_id,
            ", ".join("%s (%s)" % (e.event_id, e.membership) for e in events),
        )

        non_joins = [e for e in events if e.membership != Membership.JOIN]
        # `non_joins` is a sub-list of `events`, so the lengths differ exactly
        # when at least one of the events is a join.
        has_join = len(non_joins) != len(events)

        # We want to figure out if we joined the room at some point since
        # the last sync (even if we have since left). This is to make sure
        # we do send down the room, and with full state, where necessary

        old_state_ids = None
        if room_id in sync_result_builder.joined_room_ids and non_joins:
            # Always include if the user (re)joined the room, especially
            # important so that device list changes are calculated correctly.
            # If there are non-join member events, but we are still in the room,
            # then the user must have left and joined
            newly_joined_rooms.append(room_id)

            # User is in the room so we don't need to do the invite/leave checks
            continue

        if room_id in sync_result_builder.joined_room_ids or has_join:
            # Look up the user's membership as of the since token: if it was
            # not a join then the room counts as newly joined.
            old_state_ids = await self.get_state_at(room_id, since_token)
            old_mem_ev_id = old_state_ids.get((EventTypes.Member, user_id), None)
            old_mem_ev = None
            if old_mem_ev_id:
                old_mem_ev = await self.store.get_event(
                    old_mem_ev_id, allow_none=True
                )

            if not old_mem_ev or old_mem_ev.membership != Membership.JOIN:
                newly_joined_rooms.append(room_id)

        # If user is in the room then we don't need to do the invite/leave checks
        if room_id in sync_result_builder.joined_room_ids:
            continue

        if not non_joins:
            continue
        last_non_join = non_joins[-1]

        # Check if we have left the room. This can either be because we were
        # joined before *or* that we since joined and then left.
        if events[-1].membership != Membership.JOIN:
            if has_join:
                newly_left_rooms.append(room_id)
            else:
                # Reuse the state fetched above if there is any, otherwise
                # fetch it now.
                if not old_state_ids:
                    old_state_ids = await self.get_state_at(room_id, since_token)
                old_mem_ev_id = old_state_ids.get(
                    (EventTypes.Member, user_id), None
                )
                old_mem_ev = None
                if old_mem_ev_id:
                    old_mem_ev = await self.store.get_event(
                        old_mem_ev_id, allow_none=True
                    )
                if old_mem_ev and old_mem_ev.membership == Membership.JOIN:
                    newly_left_rooms.append(room_id)

        # Only bother if we're still currently invited
        should_invite = last_non_join.membership == Membership.INVITE
        if should_invite:
            if last_non_join.sender not in ignored_users:
                invite_room_sync = InvitedSyncResult(room_id, invite=last_non_join)
                # NOTE(review): relies on the truthiness of `InvitedSyncResult`,
                # which is defined outside this block.
                if invite_room_sync:
                    invited.append(invite_room_sync)

        # Only bother if our latest membership in the room is knock (and we haven't
        # been accepted/rejected in the meantime).
        should_knock = last_non_join.membership == Membership.KNOCK
        if should_knock:
            knock_room_sync = KnockedSyncResult(room_id, knock=last_non_join)
            # NOTE(review): relies on the truthiness of `KnockedSyncResult`,
            # which is defined outside this block.
            if knock_room_sync:
                knocked.append(knock_room_sync)

        # Always include leave/ban events. Just take the last one.
        # TODO: How do we handle ban -> leave in same batch?
        leave_events = [
            e
            for e in non_joins
            if e.membership in (Membership.LEAVE, Membership.BAN)
        ]

        if leave_events:
            leave_event = leave_events[-1]
            leave_position = await self.store.get_position_for_event(
                leave_event.event_id
            )

            # If the leave event happened before the since token then we
            # bail.
            if since_token and not leave_position.persisted_after(
                since_token.room_key
            ):
                continue

            # We can safely convert the position of the leave event into a
            # stream token as it'll only be used in the context of this
            # room. (c.f. the docstring of `to_room_stream_token`).
            leave_token = since_token.copy_and_replace(
                StreamKeyType.ROOM, leave_position.to_room_stream_token()
            )

            # If this is an out of band message, like a remote invite
            # rejection, we include it in the recents batch. Otherwise, we
            # let _load_filtered_recents handle fetching the correct
            # batches.
            #
            # This is all screaming out for a refactor, as the logic here is
            # subtle and the moving parts numerous.
            if leave_event.internal_metadata.is_out_of_band_membership():
                batch_events: Optional[List[EventBase]] = [leave_event]
            else:
                batch_events = None

            room_entries.append(
                RoomSyncResultBuilder(
                    room_id=room_id,
                    rtype="archived",
                    events=batch_events,
                    newly_joined=room_id in newly_joined_rooms,
                    full_state=False,
                    since_token=since_token,
                    upto_token=leave_token,
                    out_of_band=leave_event.internal_metadata.is_out_of_band_membership(),
                )
            )

    timeline_limit = sync_config.filter_collection.timeline_limit()

    # Get all events since the `from_key` in rooms we're currently joined to.
    # If there are too many, we get the most recent events only. This leaves
    # a "gap" in the timeline, as described by the spec for /sync.
    # NOTE(review): presumably one event more than the limit is requested so
    # that later code can tell whether the timeline was truncated - confirm.
    room_to_events = await self.store.get_room_events_stream_for_rooms(
        room_ids=sync_result_builder.joined_room_ids,
        from_key=since_token.room_key,
        to_key=now_token.room_key,
        limit=timeline_limit + 1,
    )

    # We loop through all room ids, even if there are no new events, in case
    # there are non room events that we need to notify about.
    for room_id in sync_result_builder.joined_room_ids:
        room_entry = room_to_events.get(room_id, None)

        newly_joined = room_id in newly_joined_rooms
        if room_entry:
            events, start_key = room_entry

            prev_batch_token = now_token.copy_and_replace(
                StreamKeyType.ROOM, start_key
            )

            # For a newly joined room no lower bound is passed on.
            entry = RoomSyncResultBuilder(
                room_id=room_id,
                rtype="joined",
                events=events,
                newly_joined=newly_joined,
                full_state=False,
                since_token=None if newly_joined else since_token,
                upto_token=prev_batch_token,
            )
        else:
            # No new events for this room: both ends of the range are the
            # since token.
            entry = RoomSyncResultBuilder(
                room_id=room_id,
                rtype="joined",
                events=[],
                newly_joined=newly_joined,
                full_state=False,
                since_token=since_token,
                upto_token=since_token,
            )

        room_entries.append(entry)

    return _RoomChanges(
        room_entries,
        invited,
        knocked,
        newly_joined_rooms,
        newly_left_rooms,
    )
|
|
|
|
async def _get_all_rooms(
    self,
    sync_result_builder: "SyncResultBuilder",
    ignored_users: FrozenSet[str],
) -> _RoomChanges:
    """Build entries for every room the user has a membership in.

    This is the counterpart of `_get_rooms_changed` for the case where the
    `since_token` is `None`.

    Rooms listed in `self.rooms_to_exclude` are excluded by the store query,
    and rooms whose version is not in `KNOWN_ROOM_VERSIONS` are skipped.
    Bans, and leaves sent by somebody else, are always reported as archived
    rooms; a leave sent by the user themselves is only reported when the
    filter's `include_leave` is set.

    This function does not modify the sync_result_builder.

    Args:
        sync_result_builder
        ignored_users: Set of users ignored by user; invites sent by them are
            not reported.

    Returns:
        A `_RoomChanges` holding the room entries, invites and knocks, with
        empty lists of newly joined and newly left rooms.
    """
    sync_config = sync_result_builder.sync_config
    user_id = sync_config.user.to_string()
    since_token = sync_result_builder.since_token
    now_token = sync_result_builder.now_token

    memberships = await self.store.get_rooms_for_local_user_where_membership_is(
        user_id=user_id,
        membership_list=Membership.LIST,
        excluded_rooms=self.rooms_to_exclude,
    )

    room_entries = []
    invited = []
    knocked = []

    for room in memberships:
        if room.room_version_id not in KNOWN_ROOM_VERSIONS:
            continue

        membership = room.membership

        if membership == Membership.JOIN:
            joined_entry = RoomSyncResultBuilder(
                room_id=room.room_id,
                rtype="joined",
                events=None,
                newly_joined=False,
                full_state=True,
                since_token=since_token,
                upto_token=now_token,
            )
            room_entries.append(joined_entry)
            continue

        if membership == Membership.INVITE:
            if room.sender not in ignored_users:
                invite_event = await self.store.get_event(room.event_id)
                invited.append(
                    InvitedSyncResult(room_id=room.room_id, invite=invite_event)
                )
            continue

        if membership == Membership.KNOCK:
            knock_event = await self.store.get_event(room.event_id)
            knocked.append(
                KnockedSyncResult(room_id=room.room_id, knock=knock_event)
            )
            continue

        if membership not in (Membership.LEAVE, Membership.BAN):
            continue

        # Always send down rooms we were banned from or kicked from; only a
        # leave the user sent themselves can be dropped.
        if (
            not sync_config.filter_collection.include_leave
            and membership == Membership.LEAVE
            and user_id == room.sender
        ):
            continue

        leave_token = now_token.copy_and_replace(
            StreamKeyType.ROOM, RoomStreamToken(None, room.stream_ordering)
        )
        archived_entry = RoomSyncResultBuilder(
            room_id=room.room_id,
            rtype="archived",
            events=None,
            newly_joined=False,
            full_state=True,
            since_token=since_token,
            upto_token=leave_token,
        )
        room_entries.append(archived_entry)

    return _RoomChanges(room_entries, invited, knocked, [], [])
|
|
|
|
async def _generate_room_entry(
    self,
    sync_result_builder: "SyncResultBuilder",
    room_builder: "RoomSyncResultBuilder",
    ephemeral: List[JsonDict],
    tags: Optional[Dict[str, Dict[str, Any]]],
    account_data: Dict[str, JsonDict],
    always_include: bool = False,
) -> None:
    """Populates the `joined` and `archived` section of `sync_result_builder`
    based on the `room_builder`.

    Ideally, we want to report all events whose stream ordering `s` lies in the
    range `since_token < s <= now_token`, where the two tokens are read from the
    sync_result_builder.

    If there are too many events in that range to report, things get complicated.
    In this situation we return a truncated list of the most recent events, and
    indicate in the response that there is a "gap" of omitted events. Lots of this
    is handled in `_load_filtered_recents`, but some of it is handled in this method.

    Additionally:
    - we include a "state_delta", to describe the changes in state over the gap,
    - we include all membership events applying to the user making the request,
      even those in the gap.

    See the spec for the rationale:
        https://spec.matrix.org/v1.1/client-server-api/#syncing

    Args:
        sync_result_builder
        room_builder
        ephemeral: List of new ephemeral events for room
        tags: All of the user's tags for the room, or None if there has been
            no change. When full state is being sent this value is replaced
            by the tags fetched from the store.
        account_data: New account data for room, keyed by account data type
        always_include: Always include this room in the sync response,
            even if empty.

    Raises:
        Exception: if `room_builder.rtype` is neither "joined" nor "archived".
    """
    newly_joined = room_builder.newly_joined
    full_state = (
        room_builder.full_state or newly_joined or sync_result_builder.full_state
    )
    events = room_builder.events

    # We want to shortcut out as early as possible.
    if not (always_include or account_data or ephemeral or full_state):
        if events == [] and tags is None:
            return

    now_token = sync_result_builder.now_token
    sync_config = sync_result_builder.sync_config

    room_id = room_builder.room_id
    since_token = room_builder.since_token
    upto_token = room_builder.upto_token

    with start_active_span("sync.generate_room_entry"):
        set_tag("room_id", room_id)
        log_kv({"events": len(events or ())})

        log_kv(
            {
                "since_token": since_token,
                "upto_token": upto_token,
            }
        )

        batch = await self._load_filtered_recents(
            room_id,
            sync_config,
            now_token=upto_token,
            since_token=since_token,
            potential_recents=events,
            newly_joined_room=newly_joined,
        )
        log_kv(
            {
                "batch_events": len(batch.events),
                "prev_batch": batch.prev_batch,
                "batch_limited": batch.limited,
            }
        )

        # Note: `batch` can be both empty and limited here in the case where
        # `_load_filtered_recents` can't find any events the user should see
        # (e.g. due to having ignored the sender of the last 50 events).

        # When we join the room (or the client requests full_state), we should
        # send down any existing tags. Usually the user won't have tags in a
        # newly joined room, unless either a) they've joined before or b) the
        # tag was added by synapse e.g. for server notice rooms.
        if full_state:
            user_id = sync_result_builder.sync_config.user.to_string()
            tags = await self.store.get_tags_for_room(user_id, room_id)

            # If there aren't any tags, don't send the empty tags list down
            # sync
            if not tags:
                tags = None

        account_data_events = []
        if tags is not None:
            account_data_events.append({"type": "m.tag", "content": {"tags": tags}})

        for account_data_type, content in account_data.items():
            account_data_events.append(
                {"type": account_data_type, "content": content}
            )

        account_data_events = (
            await sync_config.filter_collection.filter_room_account_data(
                account_data_events
            )
        )

        ephemeral = await sync_config.filter_collection.filter_room_ephemeral(
            ephemeral
        )

        # Second chance to bail out, now that the timeline has been loaded and
        # the account data and ephemeral events have been filtered.
        if not (
            always_include
            or batch
            or account_data_events
            or ephemeral
            or full_state
        ):
            return

        if not room_builder.out_of_band:
            state = await self.compute_state_delta(
                room_id,
                batch,
                sync_config,
                since_token,
                now_token,
                full_state=full_state,
            )
        else:
            # An out of band room won't have any state changes.
            state = {}

        summary: Optional[JsonDict] = {}

        # we include a summary in room responses when we're lazy loading
        # members (as the client otherwise doesn't have enough info to form
        # the name itself).
        if (
            not room_builder.out_of_band
            and sync_config.filter_collection.lazy_load_members()
            and (
                # we recalculate the summary:
                #   if there are membership changes in the timeline, or
                #   if membership has changed during a gappy sync, or
                #   if this is an initial sync.
                any(ev.type == EventTypes.Member for ev in batch.events)
                or (
                    # XXX: this may include false positives in the form of LL
                    # members which have snuck into state
                    batch.limited
                    and any(t == EventTypes.Member for (t, k) in state)
                )
                or since_token is None
            )
        ):
            summary = await self.compute_summary(
                room_id, sync_config, batch, state, now_token
            )

        if room_builder.rtype == "joined":
            # This dict is shared with `room_sync` and filled in below, once we
            # know the room is going to be included.
            unread_notifications: Dict[str, int] = {}
            room_sync = JoinedSyncResult(
                room_id=room_id,
                timeline=batch,
                state=state,
                ephemeral=ephemeral,
                account_data=account_data_events,
                unread_notifications=unread_notifications,
                summary=summary,
                unread_count=0,
            )

            if room_sync or always_include:
                notifs = await self.unread_notifs_for_room_id(room_id, sync_config)

                unread_notifications["notification_count"] = notifs.notify_count
                unread_notifications["highlight_count"] = notifs.highlight_count

                room_sync.unread_count = notifs.unread_count

                sync_result_builder.joined.append(room_sync)

            if batch.limited and since_token:
                user_id = sync_result_builder.sync_config.user.to_string()
                # Pass the values as logging arguments so the message is only
                # formatted if debug logging is enabled.
                logger.debug(
                    "Incremental gappy sync of %s for user %s with %d state events",
                    room_id,
                    user_id,
                    len(state),
                )
        elif room_builder.rtype == "archived":
            archived_room_sync = ArchivedSyncResult(
                room_id=room_id,
                timeline=batch,
                state=state,
                account_data=account_data_events,
            )
            if archived_room_sync or always_include:
                sync_result_builder.archived.append(archived_room_sync)
        else:
            # Exceptions do not interpolate their arguments the way logging
            # calls do, so format the message explicitly.
            raise Exception("Unrecognized rtype: %r" % (room_builder.rtype,))
|
|
|
|
async def get_rooms_for_user_at(
    self,
    user_id: str,
    room_key: RoomStreamToken,
) -> FrozenSet[str]:
    """Get the set of rooms a user was joined to at the given room stream token.

    The token *must* be recent, otherwise this may throw an exception if it is
    older than a month. (This function is called with the current token, which
    should be perfectly fine).

    Rooms listed in `self.rooms_to_exclude` are never returned.

    Args:
        user_id
        room_key: the position in the room stream to evaluate membership at.

    Returns:
        Set of room_ids the user is in at the given position.
    """
    memberships = await self.store.get_rooms_for_user_with_stream_ordering(user_id)

    rooms_at_token = set()

    for membership in memberships:
        candidate_room_id = membership.room_id

        # Rooms excluded from sync responresponse by the homeserver config are
        # dropped.
        if candidate_room_id in self.rooms_to_exclude:
            continue

        # The join may have been persisted after the requested position, e.g.
        # if the user joined between us getting the current token and calling
        # `get_rooms_for_user_with_stream_ordering`. In that case we need to
        # go and work out whether the user was in the room before.
        if membership.event_pos.persisted_after(room_key):
            logger.info("User joined room after current token: %s", candidate_room_id)

            extremities = (
                await self.store.get_forward_extremities_for_room_at_stream_ordering(
                    candidate_room_id, membership.event_pos.stream
                )
            )
            members_at_extremities = await self.state.get_current_users_in_room(
                candidate_room_id, extremities
            )
            if user_id not in members_at_extremities:
                continue

        rooms_at_token.add(candidate_room_id)

    return frozenset(rooms_at_token)
|
|
|
|
|
|
def _action_has_highlight(actions: List[JsonDict]) -> bool:
    """Report whether a list of push actions asks for a highlight.

    The first action whose "set_tweak" is "highlight" decides the result.

    Args:
        actions: the push actions to inspect. Entries without a `.get` method
            (i.e. that are not dict-like) are skipped.

    Returns:
        The truthiness of the first highlight tweak's "value" (True when no
        "value" is given), or False if no action sets the highlight tweak.
    """
    for action in actions:
        try:
            if action.get("set_tweak", None) == "highlight":
                # "value" is arbitrary JSON; coerce it so that the declared
                # `bool` return type actually holds.
                return bool(action.get("value", True))
        except AttributeError:
            # Not a dict-like action: it cannot carry a tweak.
            pass

    return False
|
|
|
|
|
|
def _calculate_state(
    timeline_contains: StateMap[str],
    timeline_start: StateMap[str],
    previous: StateMap[str],
    current: StateMap[str],
    lazy_load_members: bool,
) -> StateMap[str]:
    """Works out what state to include in a sync response.

    The result holds the events that are in `current` or `timeline_start`,
    minus those in `previous` and those in `timeline_contains`.

    Args:
        timeline_contains: state in the timeline
        timeline_start: state at the start of the timeline
        previous: state at the end of the previous sync (or empty dict
            if this is an initial sync)
        current: state at the end of the timeline
        lazy_load_members: whether to return members from timeline_start
            or not. assumes that timeline_start has already been filtered to
            include only the members the client needs to know about.

    Returns:
        A map from state key to event ID for the state to send.
    """
    # Reverse index from event ID back to its (type, state_key).
    key_for_event_id = {}
    for state_map in (timeline_contains, previous, timeline_start, current):
        for state_key, event_id in state_map.items():
            key_for_event_id[event_id] = state_key

    current_ids = set(current.values())
    timeline_start_ids = set(timeline_start.values())
    already_sent_ids = set(previous.values())
    in_timeline_ids = set(timeline_contains.values())

    # If we are lazyloading room members, we explicitly add the membership events
    # for the senders in the timeline into the state block returned by /sync,
    # as we may not have sent them to the client before. `timeline_start` has
    # already been filtered to only include membership events for the senders in
    # the timeline, so we do this by dropping its membership events from the set
    # of state we believe the client already has.
    # see https://github.com/matrix-org/synapse/pull/2970/files/efcdacad7d1b7f52f879179701c7e0d9b763511f#r204732809
    if lazy_load_members:
        already_sent_ids.difference_update(
            event_id
            for state_key, event_id in timeline_start.items()
            if state_key[0] == EventTypes.Member
        )

    wanted_ids = ((current_ids | timeline_start_ids) - already_sent_ids) - in_timeline_ids

    state_to_send = {}
    for event_id in wanted_ids:
        state_to_send[key_for_event_id[event_id]] = event_id
    return state_to_send
|
|
|
|
|
|
@attr.s(slots=True, auto_attribs=True)
class SyncResultBuilder:
    """Accumulates the pieces of a new SyncResult for a user.

    Attributes:
        sync_config
        full_state: The full_state flag as specified by user
        since_token: The token supplied by user, or None.
        now_token: The token to sync up to.
        joined_room_ids: Set of IDs of the rooms the user is joined to

        # The following mirror the fields in a sync response
        presence
        account_data
        joined
        invited
        knocked
        archived
        to_device
    """

    sync_config: SyncConfig
    full_state: bool
    since_token: Optional[StreamToken]
    now_token: StreamToken
    joined_room_ids: FrozenSet[str]

    presence: List[UserPresenceState] = attr.Factory(list)
    account_data: List[JsonDict] = attr.Factory(list)
    joined: List[JoinedSyncResult] = attr.Factory(list)
    invited: List[InvitedSyncResult] = attr.Factory(list)
    knocked: List[KnockedSyncResult] = attr.Factory(list)
    archived: List[ArchivedSyncResult] = attr.Factory(list)
    to_device: List[JsonDict] = attr.Factory(list)

    def calculate_user_changes(self) -> Tuple[Set[str], Set[str]]:
        """Work out which users have joined or left rooms we are joined to.

        Scans the membership events in the timeline and state of every entry
        in `self.joined`. This data is only useful for an incremental sync:
        without a `since_token` both sets are empty.

        The SyncResultBuilder is not modified by this function.

        Returns:
            A pair of sets of user IDs: the users that joined, were invited or
            knocked, and the users that left. A user in the first set is never
            in the second.
        """
        arrived_users = set()
        departed_users = set()
        if not self.since_token:
            return arrived_users, departed_users

        arriving_memberships = (
            Membership.JOIN,
            Membership.INVITE,
            Membership.KNOCK,
        )
        for room_result in self.joined:
            room_events = itertools.chain(
                room_result.timeline.events, room_result.state.values()
            )
            for event in room_events:
                if event.type != EventTypes.Member:
                    continue

                if event.membership in arriving_memberships:
                    arrived_users.add(event.state_key)
                    continue

                # Any other membership only counts as leaving if the user was
                # joined immediately beforehand.
                previous_content = event.unsigned.get("prev_content", {})
                if previous_content.get("membership", None) == Membership.JOIN:
                    departed_users.add(event.state_key)

        departed_users -= arrived_users
        return arrived_users, departed_users
|
|
|
|
|
|
@attr.s(slots=True, auto_attribs=True)
class RoomSyncResultBuilder:
    """Stores information needed to create either a `JoinedSyncResult` or
    `ArchivedSyncResult`.

    Attributes:
        room_id
        rtype: One of `"joined"` or `"archived"`
        events: List of events to include in the room (more events may be added
            when generating result), or None.
        newly_joined: If the user has newly joined the room
        full_state: Whether the full state should be sent in result
        since_token: Earliest point to return events from, or None
        upto_token: Latest point to return events from.
        out_of_band: whether the events in the room are "out of band" events
            and the server isn't in the room. Defaults to False.
    """

    room_id: str
    rtype: str
    events: Optional[List[EventBase]]
    newly_joined: bool
    full_state: bool
    since_token: Optional[StreamToken]
    upto_token: StreamToken

    # The only field with a default, so it can be omitted when constructing.
    out_of_band: bool = False
|