2267 lines
87 KiB
Python
2267 lines
87 KiB
Python
# Copyright 2014-2016 OpenMarket Ltd
|
|
# Copyright 2020 The Matrix.org Foundation C.I.C.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
|
|
"""This module is responsible for keeping track of presence status of local
|
|
and remote users.
|
|
|
|
The methods that define policy are:
|
|
- PresenceHandler._update_states
|
|
- PresenceHandler._handle_timeouts
|
|
- should_notify
|
|
"""
|
|
import abc
|
|
import contextlib
|
|
import logging
|
|
from bisect import bisect
|
|
from contextlib import contextmanager
|
|
from types import TracebackType
|
|
from typing import (
|
|
TYPE_CHECKING,
|
|
Any,
|
|
Awaitable,
|
|
Callable,
|
|
Collection,
|
|
Dict,
|
|
FrozenSet,
|
|
Generator,
|
|
Iterable,
|
|
List,
|
|
Optional,
|
|
Set,
|
|
Tuple,
|
|
Type,
|
|
Union,
|
|
)
|
|
|
|
from prometheus_client import Counter
|
|
from typing_extensions import ContextManager
|
|
|
|
import synapse.metrics
|
|
from synapse.api.constants import EventTypes, Membership, PresenceState
|
|
from synapse.api.errors import SynapseError
|
|
from synapse.api.presence import UserPresenceState
|
|
from synapse.appservice import ApplicationService
|
|
from synapse.events.presence_router import PresenceRouter
|
|
from synapse.logging.context import run_in_background
|
|
from synapse.metrics import LaterGauge
|
|
from synapse.metrics.background_process_metrics import run_as_background_process
|
|
from synapse.replication.http.presence import (
|
|
ReplicationBumpPresenceActiveTime,
|
|
ReplicationPresenceSetState,
|
|
)
|
|
from synapse.replication.http.streams import ReplicationGetStreamUpdates
|
|
from synapse.replication.tcp.commands import ClearUserSyncsCommand
|
|
from synapse.replication.tcp.streams import PresenceFederationStream, PresenceStream
|
|
from synapse.storage.databases.main import DataStore
|
|
from synapse.streams import EventSource
|
|
from synapse.types import JsonDict, UserID, get_domain_from_id
|
|
from synapse.util.async_helpers import Linearizer
|
|
from synapse.util.caches.descriptors import _CacheContext, cached
|
|
from synapse.util.metrics import Measure
|
|
from synapse.util.wheel_timer import WheelTimer
|
|
|
|
if TYPE_CHECKING:
|
|
from synapse.server import HomeServer
|
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
|
|
notified_presence_counter = Counter("synapse_handler_presence_notified_presence", "")
|
|
federation_presence_out_counter = Counter(
|
|
"synapse_handler_presence_federation_presence_out", ""
|
|
)
|
|
presence_updates_counter = Counter("synapse_handler_presence_presence_updates", "")
|
|
timers_fired_counter = Counter("synapse_handler_presence_timers_fired", "")
|
|
federation_presence_counter = Counter(
|
|
"synapse_handler_presence_federation_presence", ""
|
|
)
|
|
bump_active_time_counter = Counter("synapse_handler_presence_bump_active_time", "")
|
|
|
|
get_updates_counter = Counter("synapse_handler_presence_get_updates", "", ["type"])
|
|
|
|
notify_reason_counter = Counter(
|
|
"synapse_handler_presence_notify_reason", "", ["reason"]
|
|
)
|
|
state_transition_counter = Counter(
|
|
"synapse_handler_presence_state_transition", "", ["from", "to"]
|
|
)
|
|
|
|
|
|
# If a user was last active in the last LAST_ACTIVE_GRANULARITY, consider them
|
|
# "currently_active"
|
|
LAST_ACTIVE_GRANULARITY = 60 * 1000
|
|
|
|
# How long to wait until a new /events or /sync request before assuming
|
|
# the client has gone.
|
|
SYNC_ONLINE_TIMEOUT = 30 * 1000
|
|
|
|
# How long to wait before marking the user as idle. Compared against last active
|
|
IDLE_TIMER = 5 * 60 * 1000
|
|
|
|
# How often we expect remote servers to resend us presence.
|
|
FEDERATION_TIMEOUT = 30 * 60 * 1000
|
|
|
|
# How often to resend presence to remote servers
|
|
FEDERATION_PING_INTERVAL = 25 * 60 * 1000
|
|
|
|
# How long we will wait before assuming that the syncs from an external process
|
|
# are dead.
|
|
EXTERNAL_PROCESS_EXPIRY = 5 * 60 * 1000
|
|
|
|
# Delay before a worker tells the presence handler that a user has stopped
|
|
# syncing.
|
|
UPDATE_SYNCING_USERS_MS = 10 * 1000
|
|
|
|
assert LAST_ACTIVE_GRANULARITY < IDLE_TIMER
|
|
|
|
|
|
class BasePresenceHandler(abc.ABC):
|
|
"""Parts of the PresenceHandler that are shared between workers and presence
|
|
writer"""
|
|
|
|
def __init__(self, hs: "HomeServer"):
|
|
self.clock = hs.get_clock()
|
|
self.store = hs.get_datastore()
|
|
self.presence_router = hs.get_presence_router()
|
|
self.state = hs.get_state_handler()
|
|
self.is_mine_id = hs.is_mine_id
|
|
|
|
self._federation = None
|
|
if hs.should_send_federation():
|
|
self._federation = hs.get_federation_sender()
|
|
|
|
self._federation_queue = PresenceFederationQueue(hs, self)
|
|
|
|
self._busy_presence_enabled = hs.config.experimental.msc3026_enabled
|
|
|
|
active_presence = self.store.take_presence_startup_info()
|
|
self.user_to_current_state = {state.user_id: state for state in active_presence}
|
|
|
|
@abc.abstractmethod
|
|
async def user_syncing(
|
|
self, user_id: str, affect_presence: bool
|
|
) -> ContextManager[None]:
|
|
"""Returns a context manager that should surround any stream requests
|
|
from the user.
|
|
|
|
This allows us to keep track of who is currently streaming and who isn't
|
|
without having to have timers outside of this module to avoid flickering
|
|
when users disconnect/reconnect.
|
|
|
|
Args:
|
|
user_id: the user that is starting a sync
|
|
affect_presence: If false this function will be a no-op.
|
|
Useful for streams that are not associated with an actual
|
|
client that is being used by a user.
|
|
"""
|
|
|
|
@abc.abstractmethod
|
|
def get_currently_syncing_users_for_replication(self) -> Iterable[str]:
|
|
"""Get an iterable of syncing users on this worker, to send to the presence handler
|
|
|
|
This is called when a replication connection is established. It should return
|
|
a list of user ids, which are then sent as USER_SYNC commands to inform the
|
|
process handling presence about those users.
|
|
|
|
Returns:
|
|
An iterable of user_id strings.
|
|
"""
|
|
|
|
async def get_state(self, target_user: UserID) -> UserPresenceState:
|
|
results = await self.get_states([target_user.to_string()])
|
|
return results[0]
|
|
|
|
async def get_states(
|
|
self, target_user_ids: Iterable[str]
|
|
) -> List[UserPresenceState]:
|
|
"""Get the presence state for users."""
|
|
|
|
updates_d = await self.current_state_for_users(target_user_ids)
|
|
updates = list(updates_d.values())
|
|
|
|
for user_id in set(target_user_ids) - {u.user_id for u in updates}:
|
|
updates.append(UserPresenceState.default(user_id))
|
|
|
|
return updates
|
|
|
|
async def current_state_for_users(
|
|
self, user_ids: Iterable[str]
|
|
) -> Dict[str, UserPresenceState]:
|
|
"""Get the current presence state for multiple users.
|
|
|
|
Returns:
|
|
dict: `user_id` -> `UserPresenceState`
|
|
"""
|
|
states = {
|
|
user_id: self.user_to_current_state.get(user_id, None)
|
|
for user_id in user_ids
|
|
}
|
|
|
|
missing = [user_id for user_id, state in states.items() if not state]
|
|
if missing:
|
|
# There are things not in our in memory cache. Lets pull them out of
|
|
# the database.
|
|
res = await self.store.get_presence_for_users(missing)
|
|
states.update(res)
|
|
|
|
missing = [user_id for user_id, state in states.items() if not state]
|
|
if missing:
|
|
new = {
|
|
user_id: UserPresenceState.default(user_id) for user_id in missing
|
|
}
|
|
states.update(new)
|
|
self.user_to_current_state.update(new)
|
|
|
|
return states
|
|
|
|
@abc.abstractmethod
|
|
async def set_state(
|
|
self,
|
|
target_user: UserID,
|
|
state: JsonDict,
|
|
ignore_status_msg: bool = False,
|
|
force_notify: bool = False,
|
|
) -> None:
|
|
"""Set the presence state of the user.
|
|
|
|
Args:
|
|
target_user: The ID of the user to set the presence state of.
|
|
state: The presence state as a JSON dictionary.
|
|
ignore_status_msg: True to ignore the "status_msg" field of the `state` dict.
|
|
If False, the user's current status will be updated.
|
|
force_notify: Whether to force notification of the update to clients.
|
|
"""
|
|
|
|
@abc.abstractmethod
|
|
async def bump_presence_active_time(self, user: UserID) -> None:
|
|
"""We've seen the user do something that indicates they're interacting
|
|
with the app.
|
|
"""
|
|
|
|
async def update_external_syncs_row(
|
|
self, process_id: str, user_id: str, is_syncing: bool, sync_time_msec: int
|
|
) -> None:
|
|
"""Update the syncing users for an external process as a delta.
|
|
|
|
This is a no-op when presence is handled by a different worker.
|
|
|
|
Args:
|
|
process_id: An identifier for the process the users are
|
|
syncing against. This allows synapse to process updates
|
|
as user start and stop syncing against a given process.
|
|
user_id: The user who has started or stopped syncing
|
|
is_syncing: Whether or not the user is now syncing
|
|
sync_time_msec: Time in ms when the user was last syncing
|
|
"""
|
|
pass
|
|
|
|
async def update_external_syncs_clear(self, process_id: str) -> None:
|
|
"""Marks all users that had been marked as syncing by a given process
|
|
as offline.
|
|
|
|
Used when the process has stopped/disappeared.
|
|
|
|
This is a no-op when presence is handled by a different worker.
|
|
"""
|
|
pass
|
|
|
|
async def process_replication_rows(
|
|
self, stream_name: str, instance_name: str, token: int, rows: list
|
|
) -> None:
|
|
"""Process streams received over replication."""
|
|
await self._federation_queue.process_replication_rows(
|
|
stream_name, instance_name, token, rows
|
|
)
|
|
|
|
def get_federation_queue(self) -> "PresenceFederationQueue":
|
|
"""Get the presence federation queue."""
|
|
return self._federation_queue
|
|
|
|
async def maybe_send_presence_to_interested_destinations(
|
|
self, states: List[UserPresenceState]
|
|
) -> None:
|
|
"""If this instance is a federation sender, send the states to all
|
|
destinations that are interested. Filters out any states for remote
|
|
users.
|
|
"""
|
|
|
|
if not self._federation:
|
|
return
|
|
|
|
states = [s for s in states if self.is_mine_id(s.user_id)]
|
|
|
|
if not states:
|
|
return
|
|
|
|
hosts_to_states = await get_interested_remotes(
|
|
self.store,
|
|
self.presence_router,
|
|
states,
|
|
)
|
|
|
|
for destination, host_states in hosts_to_states.items():
|
|
self._federation.send_presence_to_destinations(host_states, [destination])
|
|
|
|
async def send_full_presence_to_users(self, user_ids: Collection[str]) -> None:
|
|
"""
|
|
Adds to the list of users who should receive a full snapshot of presence
|
|
upon their next sync. Note that this only works for local users.
|
|
|
|
Then, grabs the current presence state for a given set of users and adds it
|
|
to the top of the presence stream.
|
|
|
|
Args:
|
|
user_ids: The IDs of the local users to send full presence to.
|
|
"""
|
|
# Retrieve one of the users from the given set
|
|
if not user_ids:
|
|
raise Exception(
|
|
"send_full_presence_to_users must be called with at least one user"
|
|
)
|
|
user_id = next(iter(user_ids))
|
|
|
|
# Mark all users as receiving full presence on their next sync
|
|
await self.store.add_users_to_send_full_presence_to(user_ids)
|
|
|
|
# Add a new entry to the presence stream. Since we use stream tokens to determine whether a
|
|
# local user should receive a full snapshot of presence when they sync, we need to bump the
|
|
# presence stream so that subsequent syncs with no presence activity in between won't result
|
|
# in the client receiving multiple full snapshots of presence.
|
|
#
|
|
# If we bump the stream ID, then the user will get a higher stream token next sync, and thus
|
|
# correctly won't receive a second snapshot.
|
|
|
|
# Get the current presence state for one of the users (defaults to offline if not found)
|
|
current_presence_state = await self.get_state(UserID.from_string(user_id))
|
|
|
|
# Convert the UserPresenceState object into a serializable dict
|
|
state = {
|
|
"presence": current_presence_state.state,
|
|
"status_message": current_presence_state.status_msg,
|
|
}
|
|
|
|
# Copy the presence state to the tip of the presence stream.
|
|
|
|
# We set force_notify=True here so that this presence update is guaranteed to
|
|
# increment the presence stream ID (which resending the current user's presence
|
|
# otherwise would not do).
|
|
await self.set_state(UserID.from_string(user_id), state, force_notify=True)
|
|
|
|
async def is_visible(self, observed_user: UserID, observer_user: UserID) -> bool:
|
|
raise NotImplementedError(
|
|
"Attempting to check presence on a non-presence worker."
|
|
)
|
|
|
|
|
|
class _NullContextManager(ContextManager[None]):
|
|
"""A context manager which does nothing."""
|
|
|
|
def __exit__(
|
|
self,
|
|
exc_type: Optional[Type[BaseException]],
|
|
exc_val: Optional[BaseException],
|
|
exc_tb: Optional[TracebackType],
|
|
) -> None:
|
|
pass
|
|
|
|
|
|
class WorkerPresenceHandler(BasePresenceHandler):
|
|
def __init__(self, hs: "HomeServer"):
|
|
super().__init__(hs)
|
|
self.hs = hs
|
|
|
|
self._presence_writer_instance = hs.config.worker.writers.presence[0]
|
|
|
|
self._presence_enabled = hs.config.server.use_presence
|
|
|
|
# Route presence EDUs to the right worker
|
|
hs.get_federation_registry().register_instances_for_edu(
|
|
"m.presence",
|
|
hs.config.worker.writers.presence,
|
|
)
|
|
|
|
# The number of ongoing syncs on this process, by user id.
|
|
# Empty if _presence_enabled is false.
|
|
self._user_to_num_current_syncs: Dict[str, int] = {}
|
|
|
|
self.notifier = hs.get_notifier()
|
|
self.instance_id = hs.get_instance_id()
|
|
|
|
# user_id -> last_sync_ms. Lists the users that have stopped syncing but
|
|
# we haven't notified the presence writer of that yet
|
|
self.users_going_offline: Dict[str, int] = {}
|
|
|
|
self._bump_active_client = ReplicationBumpPresenceActiveTime.make_client(hs)
|
|
self._set_state_client = ReplicationPresenceSetState.make_client(hs)
|
|
|
|
self._send_stop_syncing_loop = self.clock.looping_call(
|
|
self.send_stop_syncing, UPDATE_SYNCING_USERS_MS
|
|
)
|
|
|
|
self._busy_presence_enabled = hs.config.experimental.msc3026_enabled
|
|
|
|
hs.get_reactor().addSystemEventTrigger(
|
|
"before",
|
|
"shutdown",
|
|
run_as_background_process,
|
|
"generic_presence.on_shutdown",
|
|
self._on_shutdown,
|
|
)
|
|
|
|
async def _on_shutdown(self) -> None:
|
|
if self._presence_enabled:
|
|
self.hs.get_tcp_replication().send_command(
|
|
ClearUserSyncsCommand(self.instance_id)
|
|
)
|
|
|
|
def send_user_sync(self, user_id: str, is_syncing: bool, last_sync_ms: int) -> None:
|
|
if self._presence_enabled:
|
|
self.hs.get_tcp_replication().send_user_sync(
|
|
self.instance_id, user_id, is_syncing, last_sync_ms
|
|
)
|
|
|
|
def mark_as_coming_online(self, user_id: str) -> None:
|
|
"""A user has started syncing. Send a UserSync to the presence writer,
|
|
unless they had recently stopped syncing.
|
|
"""
|
|
going_offline = self.users_going_offline.pop(user_id, None)
|
|
if not going_offline:
|
|
# Safe to skip because we haven't yet told the presence writer they
|
|
# were offline
|
|
self.send_user_sync(user_id, True, self.clock.time_msec())
|
|
|
|
def mark_as_going_offline(self, user_id: str) -> None:
|
|
"""A user has stopped syncing. We wait before notifying the presence
|
|
writer as its likely they'll come back soon. This allows us to avoid
|
|
sending a stopped syncing immediately followed by a started syncing
|
|
notification to the presence writer
|
|
"""
|
|
self.users_going_offline[user_id] = self.clock.time_msec()
|
|
|
|
def send_stop_syncing(self) -> None:
|
|
"""Check if there are any users who have stopped syncing a while ago and
|
|
haven't come back yet. If there are poke the presence writer about them.
|
|
"""
|
|
now = self.clock.time_msec()
|
|
for user_id, last_sync_ms in list(self.users_going_offline.items()):
|
|
if now - last_sync_ms > UPDATE_SYNCING_USERS_MS:
|
|
self.users_going_offline.pop(user_id, None)
|
|
self.send_user_sync(user_id, False, last_sync_ms)
|
|
|
|
async def user_syncing(
|
|
self, user_id: str, affect_presence: bool
|
|
) -> ContextManager[None]:
|
|
"""Record that a user is syncing.
|
|
|
|
Called by the sync and events servlets to record that a user has connected to
|
|
this worker and is waiting for some events.
|
|
"""
|
|
if not affect_presence or not self._presence_enabled:
|
|
return _NullContextManager()
|
|
|
|
curr_sync = self._user_to_num_current_syncs.get(user_id, 0)
|
|
self._user_to_num_current_syncs[user_id] = curr_sync + 1
|
|
|
|
# If we went from no in flight sync to some, notify replication
|
|
if self._user_to_num_current_syncs[user_id] == 1:
|
|
self.mark_as_coming_online(user_id)
|
|
|
|
def _end() -> None:
|
|
# We check that the user_id is in user_to_num_current_syncs because
|
|
# user_to_num_current_syncs may have been cleared if we are
|
|
# shutting down.
|
|
if user_id in self._user_to_num_current_syncs:
|
|
self._user_to_num_current_syncs[user_id] -= 1
|
|
|
|
# If we went from one in flight sync to non, notify replication
|
|
if self._user_to_num_current_syncs[user_id] == 0:
|
|
self.mark_as_going_offline(user_id)
|
|
|
|
@contextlib.contextmanager
|
|
def _user_syncing() -> Generator[None, None, None]:
|
|
try:
|
|
yield
|
|
finally:
|
|
_end()
|
|
|
|
return _user_syncing()
|
|
|
|
async def notify_from_replication(
|
|
self, states: List[UserPresenceState], stream_id: int
|
|
) -> None:
|
|
parties = await get_interested_parties(self.store, self.presence_router, states)
|
|
room_ids_to_states, users_to_states = parties
|
|
|
|
self.notifier.on_new_event(
|
|
"presence_key",
|
|
stream_id,
|
|
rooms=room_ids_to_states.keys(),
|
|
users=users_to_states.keys(),
|
|
)
|
|
|
|
async def process_replication_rows(
|
|
self, stream_name: str, instance_name: str, token: int, rows: list
|
|
) -> None:
|
|
await super().process_replication_rows(stream_name, instance_name, token, rows)
|
|
|
|
if stream_name != PresenceStream.NAME:
|
|
return
|
|
|
|
states = [
|
|
UserPresenceState(
|
|
row.user_id,
|
|
row.state,
|
|
row.last_active_ts,
|
|
row.last_federation_update_ts,
|
|
row.last_user_sync_ts,
|
|
row.status_msg,
|
|
row.currently_active,
|
|
)
|
|
for row in rows
|
|
]
|
|
|
|
# The list of states to notify sync streams and remote servers about.
|
|
# This is calculated by comparing the old and new states for each user
|
|
# using `should_notify(..)`.
|
|
#
|
|
# Note that this is necessary as the presence writer will periodically
|
|
# flush presence state changes that should not be notified about to the
|
|
# DB, and so will be sent over the replication stream.
|
|
state_to_notify = []
|
|
|
|
for new_state in states:
|
|
old_state = self.user_to_current_state.get(new_state.user_id)
|
|
self.user_to_current_state[new_state.user_id] = new_state
|
|
|
|
if not old_state or should_notify(old_state, new_state):
|
|
state_to_notify.append(new_state)
|
|
|
|
stream_id = token
|
|
await self.notify_from_replication(state_to_notify, stream_id)
|
|
|
|
# If this is a federation sender, notify about presence updates.
|
|
await self.maybe_send_presence_to_interested_destinations(state_to_notify)
|
|
|
|
def get_currently_syncing_users_for_replication(self) -> Iterable[str]:
|
|
return [
|
|
user_id
|
|
for user_id, count in self._user_to_num_current_syncs.items()
|
|
if count > 0
|
|
]
|
|
|
|
async def set_state(
|
|
self,
|
|
target_user: UserID,
|
|
state: JsonDict,
|
|
ignore_status_msg: bool = False,
|
|
force_notify: bool = False,
|
|
) -> None:
|
|
"""Set the presence state of the user.
|
|
|
|
Args:
|
|
target_user: The ID of the user to set the presence state of.
|
|
state: The presence state as a JSON dictionary.
|
|
ignore_status_msg: True to ignore the "status_msg" field of the `state` dict.
|
|
If False, the user's current status will be updated.
|
|
force_notify: Whether to force notification of the update to clients.
|
|
"""
|
|
presence = state["presence"]
|
|
|
|
valid_presence = (
|
|
PresenceState.ONLINE,
|
|
PresenceState.UNAVAILABLE,
|
|
PresenceState.OFFLINE,
|
|
PresenceState.BUSY,
|
|
)
|
|
|
|
if presence not in valid_presence or (
|
|
presence == PresenceState.BUSY and not self._busy_presence_enabled
|
|
):
|
|
raise SynapseError(400, "Invalid presence state")
|
|
|
|
user_id = target_user.to_string()
|
|
|
|
# If presence is disabled, no-op
|
|
if not self.hs.config.server.use_presence:
|
|
return
|
|
|
|
# Proxy request to instance that writes presence
|
|
await self._set_state_client(
|
|
instance_name=self._presence_writer_instance,
|
|
user_id=user_id,
|
|
state=state,
|
|
ignore_status_msg=ignore_status_msg,
|
|
force_notify=force_notify,
|
|
)
|
|
|
|
async def bump_presence_active_time(self, user: UserID) -> None:
|
|
"""We've seen the user do something that indicates they're interacting
|
|
with the app.
|
|
"""
|
|
# If presence is disabled, no-op
|
|
if not self.hs.config.server.use_presence:
|
|
return
|
|
|
|
# Proxy request to instance that writes presence
|
|
user_id = user.to_string()
|
|
await self._bump_active_client(
|
|
instance_name=self._presence_writer_instance, user_id=user_id
|
|
)
|
|
|
|
|
|
class PresenceHandler(BasePresenceHandler):
|
|
def __init__(self, hs: "HomeServer"):
|
|
super().__init__(hs)
|
|
self.hs = hs
|
|
self.server_name = hs.hostname
|
|
self.wheel_timer: WheelTimer[str] = WheelTimer()
|
|
self.notifier = hs.get_notifier()
|
|
self._presence_enabled = hs.config.server.use_presence
|
|
|
|
federation_registry = hs.get_federation_registry()
|
|
|
|
federation_registry.register_edu_handler("m.presence", self.incoming_presence)
|
|
|
|
LaterGauge(
|
|
"synapse_handlers_presence_user_to_current_state_size",
|
|
"",
|
|
[],
|
|
lambda: len(self.user_to_current_state),
|
|
)
|
|
|
|
now = self.clock.time_msec()
|
|
for state in self.user_to_current_state.values():
|
|
self.wheel_timer.insert(
|
|
now=now, obj=state.user_id, then=state.last_active_ts + IDLE_TIMER
|
|
)
|
|
self.wheel_timer.insert(
|
|
now=now,
|
|
obj=state.user_id,
|
|
then=state.last_user_sync_ts + SYNC_ONLINE_TIMEOUT,
|
|
)
|
|
if self.is_mine_id(state.user_id):
|
|
self.wheel_timer.insert(
|
|
now=now,
|
|
obj=state.user_id,
|
|
then=state.last_federation_update_ts + FEDERATION_PING_INTERVAL,
|
|
)
|
|
else:
|
|
self.wheel_timer.insert(
|
|
now=now,
|
|
obj=state.user_id,
|
|
then=state.last_federation_update_ts + FEDERATION_TIMEOUT,
|
|
)
|
|
|
|
# Set of users who have presence in the `user_to_current_state` that
|
|
# have not yet been persisted
|
|
self.unpersisted_users_changes: Set[str] = set()
|
|
|
|
hs.get_reactor().addSystemEventTrigger(
|
|
"before",
|
|
"shutdown",
|
|
run_as_background_process,
|
|
"presence.on_shutdown",
|
|
self._on_shutdown,
|
|
)
|
|
|
|
self._next_serial = 1
|
|
|
|
# Keeps track of the number of *ongoing* syncs on this process. While
|
|
# this is non zero a user will never go offline.
|
|
self.user_to_num_current_syncs: Dict[str, int] = {}
|
|
|
|
# Keeps track of the number of *ongoing* syncs on other processes.
|
|
# While any sync is ongoing on another process the user will never
|
|
# go offline.
|
|
# Each process has a unique identifier and an update frequency. If
|
|
# no update is received from that process within the update period then
|
|
# we assume that all the sync requests on that process have stopped.
|
|
# Stored as a dict from process_id to set of user_id, and a dict of
|
|
# process_id to millisecond timestamp last updated.
|
|
self.external_process_to_current_syncs: Dict[str, Set[str]] = {}
|
|
self.external_process_last_updated_ms: Dict[str, int] = {}
|
|
|
|
self.external_sync_linearizer = Linearizer(name="external_sync_linearizer")
|
|
|
|
if self._presence_enabled:
|
|
# Start a LoopingCall in 30s that fires every 5s.
|
|
# The initial delay is to allow disconnected clients a chance to
|
|
# reconnect before we treat them as offline.
|
|
def run_timeout_handler() -> Awaitable[None]:
|
|
return run_as_background_process(
|
|
"handle_presence_timeouts", self._handle_timeouts
|
|
)
|
|
|
|
self.clock.call_later(
|
|
30, self.clock.looping_call, run_timeout_handler, 5000
|
|
)
|
|
|
|
def run_persister() -> Awaitable[None]:
|
|
return run_as_background_process(
|
|
"persist_presence_changes", self._persist_unpersisted_changes
|
|
)
|
|
|
|
self.clock.call_later(60, self.clock.looping_call, run_persister, 60 * 1000)
|
|
|
|
LaterGauge(
|
|
"synapse_handlers_presence_wheel_timer_size",
|
|
"",
|
|
[],
|
|
lambda: len(self.wheel_timer),
|
|
)
|
|
|
|
# Used to handle sending of presence to newly joined users/servers
|
|
if self._presence_enabled:
|
|
self.notifier.add_replication_callback(self.notify_new_event)
|
|
|
|
# Presence is best effort and quickly heals itself, so lets just always
|
|
# stream from the current state when we restart.
|
|
self._event_pos = self.store.get_room_max_stream_ordering()
|
|
self._event_processing = False
|
|
|
|
async def _on_shutdown(self) -> None:
|
|
"""Gets called when shutting down. This lets us persist any updates that
|
|
we haven't yet persisted, e.g. updates that only changes some internal
|
|
timers. This allows changes to persist across startup without having to
|
|
persist every single change.
|
|
|
|
If this does not run it simply means that some of the timers will fire
|
|
earlier than they should when synapse is restarted. This affect of this
|
|
is some spurious presence changes that will self-correct.
|
|
"""
|
|
# If the DB pool has already terminated, don't try updating
|
|
if not self.store.db_pool.is_running():
|
|
return
|
|
|
|
logger.info(
|
|
"Performing _on_shutdown. Persisting %d unpersisted changes",
|
|
len(self.user_to_current_state),
|
|
)
|
|
|
|
if self.unpersisted_users_changes:
|
|
|
|
await self.store.update_presence(
|
|
[
|
|
self.user_to_current_state[user_id]
|
|
for user_id in self.unpersisted_users_changes
|
|
]
|
|
)
|
|
logger.info("Finished _on_shutdown")
|
|
|
|
async def _persist_unpersisted_changes(self) -> None:
|
|
"""We periodically persist the unpersisted changes, as otherwise they
|
|
may stack up and slow down shutdown times.
|
|
"""
|
|
unpersisted = self.unpersisted_users_changes
|
|
self.unpersisted_users_changes = set()
|
|
|
|
if unpersisted:
|
|
logger.info("Persisting %d unpersisted presence updates", len(unpersisted))
|
|
await self.store.update_presence(
|
|
[self.user_to_current_state[user_id] for user_id in unpersisted]
|
|
)
|
|
|
|
async def _update_states(
|
|
self, new_states: Iterable[UserPresenceState], force_notify: bool = False
|
|
) -> None:
|
|
"""Updates presence of users. Sets the appropriate timeouts. Pokes
|
|
the notifier and federation if and only if the changed presence state
|
|
should be sent to clients/servers.
|
|
|
|
Args:
|
|
new_states: The new user presence state updates to process.
|
|
force_notify: Whether to force notifying clients of this presence state update,
|
|
even if it doesn't change the state of a user's presence (e.g online -> online).
|
|
This is currently used to bump the max presence stream ID without changing any
|
|
user's presence (see PresenceHandler.add_users_to_send_full_presence_to).
|
|
"""
|
|
now = self.clock.time_msec()
|
|
|
|
with Measure(self.clock, "presence_update_states"):
|
|
|
|
# NOTE: We purposefully don't await between now and when we've
|
|
# calculated what we want to do with the new states, to avoid races.
|
|
|
|
to_notify = {} # Changes we want to notify everyone about
|
|
to_federation_ping = {} # These need sending keep-alives
|
|
|
|
# Only bother handling the last presence change for each user
|
|
new_states_dict = {}
|
|
for new_state in new_states:
|
|
new_states_dict[new_state.user_id] = new_state
|
|
new_states = new_states_dict.values()
|
|
|
|
for new_state in new_states:
|
|
user_id = new_state.user_id
|
|
|
|
# Its fine to not hit the database here, as the only thing not in
|
|
# the current state cache are OFFLINE states, where the only field
|
|
# of interest is last_active which is safe enough to assume is 0
|
|
# here.
|
|
prev_state = self.user_to_current_state.get(
|
|
user_id, UserPresenceState.default(user_id)
|
|
)
|
|
|
|
new_state, should_notify, should_ping = handle_update(
|
|
prev_state,
|
|
new_state,
|
|
is_mine=self.is_mine_id(user_id),
|
|
wheel_timer=self.wheel_timer,
|
|
now=now,
|
|
)
|
|
|
|
if force_notify:
|
|
should_notify = True
|
|
|
|
self.user_to_current_state[user_id] = new_state
|
|
|
|
if should_notify:
|
|
to_notify[user_id] = new_state
|
|
elif should_ping:
|
|
to_federation_ping[user_id] = new_state
|
|
|
|
# TODO: We should probably ensure there are no races hereafter
|
|
|
|
presence_updates_counter.inc(len(new_states))
|
|
|
|
if to_notify:
|
|
notified_presence_counter.inc(len(to_notify))
|
|
await self._persist_and_notify(list(to_notify.values()))
|
|
|
|
self.unpersisted_users_changes |= {s.user_id for s in new_states}
|
|
self.unpersisted_users_changes -= set(to_notify.keys())
|
|
|
|
# Check if we need to resend any presence states to remote hosts. We
|
|
# only do this for states that haven't been updated in a while to
|
|
# ensure that the remote host doesn't time the presence state out.
|
|
#
|
|
# Note that since these are states that have *not* been updated,
|
|
# they won't get sent down the normal presence replication stream,
|
|
# and so we have to explicitly send them via the federation stream.
|
|
to_federation_ping = {
|
|
user_id: state
|
|
for user_id, state in to_federation_ping.items()
|
|
if user_id not in to_notify
|
|
}
|
|
if to_federation_ping:
|
|
federation_presence_out_counter.inc(len(to_federation_ping))
|
|
|
|
hosts_to_states = await get_interested_remotes(
|
|
self.store,
|
|
self.presence_router,
|
|
list(to_federation_ping.values()),
|
|
)
|
|
|
|
for destination, states in hosts_to_states.items():
|
|
self._federation_queue.send_presence_to_destinations(
|
|
states, [destination]
|
|
)
|
|
|
|
async def _handle_timeouts(self) -> None:
|
|
"""Checks the presence of users that have timed out and updates as
|
|
appropriate.
|
|
"""
|
|
logger.debug("Handling presence timeouts")
|
|
now = self.clock.time_msec()
|
|
|
|
# Fetch the list of users that *may* have timed out. Things may have
|
|
# changed since the timeout was set, so we won't necessarily have to
|
|
# take any action.
|
|
users_to_check = set(self.wheel_timer.fetch(now))
|
|
|
|
# Check whether the lists of syncing processes from an external
|
|
# process have expired.
|
|
expired_process_ids = [
|
|
process_id
|
|
for process_id, last_update in self.external_process_last_updated_ms.items()
|
|
if now - last_update > EXTERNAL_PROCESS_EXPIRY
|
|
]
|
|
for process_id in expired_process_ids:
|
|
# For each expired process drop tracking info and check the users
|
|
# that were syncing on that process to see if they need to be timed
|
|
# out.
|
|
users_to_check.update(
|
|
self.external_process_to_current_syncs.pop(process_id, ())
|
|
)
|
|
self.external_process_last_updated_ms.pop(process_id)
|
|
|
|
states = [
|
|
self.user_to_current_state.get(user_id, UserPresenceState.default(user_id))
|
|
for user_id in users_to_check
|
|
]
|
|
|
|
timers_fired_counter.inc(len(states))
|
|
|
|
syncing_user_ids = {
|
|
user_id
|
|
for user_id, count in self.user_to_num_current_syncs.items()
|
|
if count
|
|
}
|
|
for user_ids in self.external_process_to_current_syncs.values():
|
|
syncing_user_ids.update(user_ids)
|
|
|
|
changes = handle_timeouts(
|
|
states,
|
|
is_mine_fn=self.is_mine_id,
|
|
syncing_user_ids=syncing_user_ids,
|
|
now=now,
|
|
)
|
|
|
|
return await self._update_states(changes)
|
|
|
|
async def bump_presence_active_time(self, user: UserID) -> None:
|
|
"""We've seen the user do something that indicates they're interacting
|
|
with the app.
|
|
"""
|
|
# If presence is disabled, no-op
|
|
if not self.hs.config.server.use_presence:
|
|
return
|
|
|
|
user_id = user.to_string()
|
|
|
|
bump_active_time_counter.inc()
|
|
|
|
prev_state = await self.current_state_for_user(user_id)
|
|
|
|
new_fields: Dict[str, Any] = {"last_active_ts": self.clock.time_msec()}
|
|
if prev_state.state == PresenceState.UNAVAILABLE:
|
|
new_fields["state"] = PresenceState.ONLINE
|
|
|
|
await self._update_states([prev_state.copy_and_replace(**new_fields)])
|
|
|
|
async def user_syncing(
|
|
self, user_id: str, affect_presence: bool = True
|
|
) -> ContextManager[None]:
|
|
"""Returns a context manager that should surround any stream requests
|
|
from the user.
|
|
|
|
This allows us to keep track of who is currently streaming and who isn't
|
|
without having to have timers outside of this module to avoid flickering
|
|
when users disconnect/reconnect.
|
|
|
|
Args:
|
|
user_id
|
|
affect_presence: If false this function will be a no-op.
|
|
Useful for streams that are not associated with an actual
|
|
client that is being used by a user.
|
|
"""
|
|
# Override if it should affect the user's presence, if presence is
|
|
# disabled.
|
|
if not self.hs.config.server.use_presence:
|
|
affect_presence = False
|
|
|
|
if affect_presence:
|
|
curr_sync = self.user_to_num_current_syncs.get(user_id, 0)
|
|
self.user_to_num_current_syncs[user_id] = curr_sync + 1
|
|
|
|
prev_state = await self.current_state_for_user(user_id)
|
|
if prev_state.state == PresenceState.OFFLINE:
|
|
# If they're currently offline then bring them online, otherwise
|
|
# just update the last sync times.
|
|
await self._update_states(
|
|
[
|
|
prev_state.copy_and_replace(
|
|
state=PresenceState.ONLINE,
|
|
last_active_ts=self.clock.time_msec(),
|
|
last_user_sync_ts=self.clock.time_msec(),
|
|
)
|
|
]
|
|
)
|
|
else:
|
|
await self._update_states(
|
|
[
|
|
prev_state.copy_and_replace(
|
|
last_user_sync_ts=self.clock.time_msec()
|
|
)
|
|
]
|
|
)
|
|
|
|
async def _end() -> None:
|
|
try:
|
|
self.user_to_num_current_syncs[user_id] -= 1
|
|
|
|
prev_state = await self.current_state_for_user(user_id)
|
|
await self._update_states(
|
|
[
|
|
prev_state.copy_and_replace(
|
|
last_user_sync_ts=self.clock.time_msec()
|
|
)
|
|
]
|
|
)
|
|
except Exception:
|
|
logger.exception("Error updating presence after sync")
|
|
|
|
@contextmanager
|
|
def _user_syncing() -> Generator[None, None, None]:
|
|
try:
|
|
yield
|
|
finally:
|
|
if affect_presence:
|
|
run_in_background(_end)
|
|
|
|
return _user_syncing()
|
|
|
|
def get_currently_syncing_users_for_replication(self) -> Iterable[str]:
|
|
# since we are the process handling presence, there is nothing to do here.
|
|
return []
|
|
|
|
async def update_external_syncs_row(
|
|
self, process_id: str, user_id: str, is_syncing: bool, sync_time_msec: int
|
|
) -> None:
|
|
"""Update the syncing users for an external process as a delta.
|
|
|
|
Args:
|
|
process_id: An identifier for the process the users are
|
|
syncing against. This allows synapse to process updates
|
|
as user start and stop syncing against a given process.
|
|
user_id: The user who has started or stopped syncing
|
|
is_syncing: Whether or not the user is now syncing
|
|
sync_time_msec: Time in ms when the user was last syncing
|
|
"""
|
|
with (await self.external_sync_linearizer.queue(process_id)):
|
|
prev_state = await self.current_state_for_user(user_id)
|
|
|
|
process_presence = self.external_process_to_current_syncs.setdefault(
|
|
process_id, set()
|
|
)
|
|
|
|
updates = []
|
|
if is_syncing and user_id not in process_presence:
|
|
if prev_state.state == PresenceState.OFFLINE:
|
|
updates.append(
|
|
prev_state.copy_and_replace(
|
|
state=PresenceState.ONLINE,
|
|
last_active_ts=sync_time_msec,
|
|
last_user_sync_ts=sync_time_msec,
|
|
)
|
|
)
|
|
else:
|
|
updates.append(
|
|
prev_state.copy_and_replace(last_user_sync_ts=sync_time_msec)
|
|
)
|
|
process_presence.add(user_id)
|
|
elif user_id in process_presence:
|
|
updates.append(
|
|
prev_state.copy_and_replace(last_user_sync_ts=sync_time_msec)
|
|
)
|
|
|
|
if not is_syncing:
|
|
process_presence.discard(user_id)
|
|
|
|
if updates:
|
|
await self._update_states(updates)
|
|
|
|
self.external_process_last_updated_ms[process_id] = self.clock.time_msec()
|
|
|
|
async def update_external_syncs_clear(self, process_id: str) -> None:
|
|
"""Marks all users that had been marked as syncing by a given process
|
|
as offline.
|
|
|
|
Used when the process has stopped/disappeared.
|
|
"""
|
|
with (await self.external_sync_linearizer.queue(process_id)):
|
|
process_presence = self.external_process_to_current_syncs.pop(
|
|
process_id, set()
|
|
)
|
|
prev_states = await self.current_state_for_users(process_presence)
|
|
time_now_ms = self.clock.time_msec()
|
|
|
|
await self._update_states(
|
|
[
|
|
prev_state.copy_and_replace(last_user_sync_ts=time_now_ms)
|
|
for prev_state in prev_states.values()
|
|
]
|
|
)
|
|
self.external_process_last_updated_ms.pop(process_id, None)
|
|
|
|
async def current_state_for_user(self, user_id: str) -> UserPresenceState:
|
|
"""Get the current presence state for a user."""
|
|
res = await self.current_state_for_users([user_id])
|
|
return res[user_id]
|
|
|
|
async def _persist_and_notify(self, states: List[UserPresenceState]) -> None:
|
|
"""Persist states in the database, poke the notifier and send to
|
|
interested remote servers
|
|
"""
|
|
stream_id, max_token = await self.store.update_presence(states)
|
|
|
|
parties = await get_interested_parties(self.store, self.presence_router, states)
|
|
room_ids_to_states, users_to_states = parties
|
|
|
|
self.notifier.on_new_event(
|
|
"presence_key",
|
|
stream_id,
|
|
rooms=room_ids_to_states.keys(),
|
|
users=[UserID.from_string(u) for u in users_to_states],
|
|
)
|
|
|
|
# We only want to poke the local federation sender, if any, as other
|
|
# workers will receive the presence updates via the presence replication
|
|
# stream (which is updated by `store.update_presence`).
|
|
await self.maybe_send_presence_to_interested_destinations(states)
|
|
|
|
async def incoming_presence(self, origin: str, content: JsonDict) -> None:
|
|
"""Called when we receive a `m.presence` EDU from a remote server."""
|
|
if not self._presence_enabled:
|
|
return
|
|
|
|
now = self.clock.time_msec()
|
|
updates = []
|
|
for push in content.get("push", []):
|
|
# A "push" contains a list of presence that we are probably interested
|
|
# in.
|
|
user_id = push.get("user_id", None)
|
|
if not user_id:
|
|
logger.info(
|
|
"Got presence update from %r with no 'user_id': %r", origin, push
|
|
)
|
|
continue
|
|
|
|
if get_domain_from_id(user_id) != origin:
|
|
logger.info(
|
|
"Got presence update from %r with bad 'user_id': %r",
|
|
origin,
|
|
user_id,
|
|
)
|
|
continue
|
|
|
|
presence_state = push.get("presence", None)
|
|
if not presence_state:
|
|
logger.info(
|
|
"Got presence update from %r with no 'presence_state': %r",
|
|
origin,
|
|
push,
|
|
)
|
|
continue
|
|
|
|
new_fields = {"state": presence_state, "last_federation_update_ts": now}
|
|
|
|
last_active_ago = push.get("last_active_ago", None)
|
|
if last_active_ago is not None:
|
|
new_fields["last_active_ts"] = now - last_active_ago
|
|
|
|
new_fields["status_msg"] = push.get("status_msg", None)
|
|
new_fields["currently_active"] = push.get("currently_active", False)
|
|
|
|
prev_state = await self.current_state_for_user(user_id)
|
|
updates.append(prev_state.copy_and_replace(**new_fields))
|
|
|
|
if updates:
|
|
federation_presence_counter.inc(len(updates))
|
|
await self._update_states(updates)
|
|
|
|
async def set_state(
|
|
self,
|
|
target_user: UserID,
|
|
state: JsonDict,
|
|
ignore_status_msg: bool = False,
|
|
force_notify: bool = False,
|
|
) -> None:
|
|
"""Set the presence state of the user.
|
|
|
|
Args:
|
|
target_user: The ID of the user to set the presence state of.
|
|
state: The presence state as a JSON dictionary.
|
|
ignore_status_msg: True to ignore the "status_msg" field of the `state` dict.
|
|
If False, the user's current status will be updated.
|
|
force_notify: Whether to force notification of the update to clients.
|
|
"""
|
|
status_msg = state.get("status_msg", None)
|
|
presence = state["presence"]
|
|
|
|
valid_presence = (
|
|
PresenceState.ONLINE,
|
|
PresenceState.UNAVAILABLE,
|
|
PresenceState.OFFLINE,
|
|
PresenceState.BUSY,
|
|
)
|
|
|
|
if presence not in valid_presence or (
|
|
presence == PresenceState.BUSY and not self._busy_presence_enabled
|
|
):
|
|
raise SynapseError(400, "Invalid presence state")
|
|
|
|
user_id = target_user.to_string()
|
|
|
|
prev_state = await self.current_state_for_user(user_id)
|
|
|
|
new_fields = {"state": presence}
|
|
|
|
if not ignore_status_msg:
|
|
new_fields["status_msg"] = status_msg
|
|
|
|
if presence == PresenceState.ONLINE or (
|
|
presence == PresenceState.BUSY and self._busy_presence_enabled
|
|
):
|
|
new_fields["last_active_ts"] = self.clock.time_msec()
|
|
|
|
await self._update_states(
|
|
[prev_state.copy_and_replace(**new_fields)], force_notify=force_notify
|
|
)
|
|
|
|
async def is_visible(self, observed_user: UserID, observer_user: UserID) -> bool:
|
|
"""Returns whether a user can see another user's presence."""
|
|
observer_room_ids = await self.store.get_rooms_for_user(
|
|
observer_user.to_string()
|
|
)
|
|
observed_room_ids = await self.store.get_rooms_for_user(
|
|
observed_user.to_string()
|
|
)
|
|
|
|
if observer_room_ids & observed_room_ids:
|
|
return True
|
|
|
|
return False
|
|
|
|
async def get_all_presence_updates(
|
|
self, instance_name: str, last_id: int, current_id: int, limit: int
|
|
) -> Tuple[List[Tuple[int, list]], int, bool]:
|
|
"""
|
|
Gets a list of presence update rows from between the given stream ids.
|
|
Each row has:
|
|
- stream_id(str)
|
|
- user_id(str)
|
|
- state(str)
|
|
- last_active_ts(int)
|
|
- last_federation_update_ts(int)
|
|
- last_user_sync_ts(int)
|
|
- status_msg(int)
|
|
- currently_active(int)
|
|
|
|
Args:
|
|
instance_name: The writer we want to fetch updates from. Unused
|
|
here since there is only ever one writer.
|
|
last_id: The token to fetch updates from. Exclusive.
|
|
current_id: The token to fetch updates up to. Inclusive.
|
|
limit: The requested limit for the number of rows to return. The
|
|
function may return more or fewer rows.
|
|
|
|
Returns:
|
|
A tuple consisting of: the updates, a token to use to fetch
|
|
subsequent updates, and whether we returned fewer rows than exists
|
|
between the requested tokens due to the limit.
|
|
|
|
The token returned can be used in a subsequent call to this
|
|
function to get further updates.
|
|
|
|
The updates are a list of 2-tuples of stream ID and the row data
|
|
"""
|
|
|
|
# TODO(markjh): replicate the unpersisted changes.
|
|
# This could use the in-memory stores for recent changes.
|
|
rows = await self.store.get_all_presence_updates(
|
|
instance_name, last_id, current_id, limit
|
|
)
|
|
return rows
|
|
|
|
def notify_new_event(self) -> None:
|
|
"""Called when new events have happened. Handles users and servers
|
|
joining rooms and require being sent presence.
|
|
"""
|
|
|
|
if self._event_processing:
|
|
return
|
|
|
|
async def _process_presence() -> None:
|
|
assert not self._event_processing
|
|
|
|
self._event_processing = True
|
|
try:
|
|
await self._unsafe_process()
|
|
finally:
|
|
self._event_processing = False
|
|
|
|
run_as_background_process("presence.notify_new_event", _process_presence)
|
|
|
|
async def _unsafe_process(self) -> None:
|
|
# Loop round handling deltas until we're up to date
|
|
while True:
|
|
with Measure(self.clock, "presence_delta"):
|
|
room_max_stream_ordering = self.store.get_room_max_stream_ordering()
|
|
if self._event_pos == room_max_stream_ordering:
|
|
return
|
|
|
|
logger.debug(
|
|
"Processing presence stats %s->%s",
|
|
self._event_pos,
|
|
room_max_stream_ordering,
|
|
)
|
|
max_pos, deltas = await self.store.get_current_state_deltas(
|
|
self._event_pos, room_max_stream_ordering
|
|
)
|
|
|
|
# We may get multiple deltas for different rooms, but we want to
|
|
# handle them on a room by room basis, so we batch them up by
|
|
# room.
|
|
deltas_by_room: Dict[str, List[JsonDict]] = {}
|
|
for delta in deltas:
|
|
deltas_by_room.setdefault(delta["room_id"], []).append(delta)
|
|
|
|
for room_id, deltas_for_room in deltas_by_room.items():
|
|
await self._handle_state_delta(room_id, deltas_for_room)
|
|
|
|
self._event_pos = max_pos
|
|
|
|
# Expose current event processing position to prometheus
|
|
synapse.metrics.event_processing_positions.labels("presence").set(
|
|
max_pos
|
|
)
|
|
|
|
async def _handle_state_delta(self, room_id: str, deltas: List[JsonDict]) -> None:
|
|
"""Process current state deltas for the room to find new joins that need
|
|
to be handled.
|
|
"""
|
|
|
|
# Sets of newly joined users. Note that if the local server is
|
|
# joining a remote room for the first time we'll see both the joining
|
|
# user and all remote users as newly joined.
|
|
newly_joined_users = set()
|
|
|
|
for delta in deltas:
|
|
assert room_id == delta["room_id"]
|
|
|
|
typ = delta["type"]
|
|
state_key = delta["state_key"]
|
|
event_id = delta["event_id"]
|
|
prev_event_id = delta["prev_event_id"]
|
|
|
|
logger.debug("Handling: %r %r, %s", typ, state_key, event_id)
|
|
|
|
# Drop any event that isn't a membership join
|
|
if typ != EventTypes.Member:
|
|
continue
|
|
|
|
if event_id is None:
|
|
# state has been deleted, so this is not a join. We only care about
|
|
# joins.
|
|
continue
|
|
|
|
event = await self.store.get_event(event_id, allow_none=True)
|
|
if not event or event.content.get("membership") != Membership.JOIN:
|
|
# We only care about joins
|
|
continue
|
|
|
|
if prev_event_id:
|
|
prev_event = await self.store.get_event(prev_event_id, allow_none=True)
|
|
if (
|
|
prev_event
|
|
and prev_event.content.get("membership") == Membership.JOIN
|
|
):
|
|
# Ignore changes to join events.
|
|
continue
|
|
|
|
newly_joined_users.add(state_key)
|
|
|
|
if not newly_joined_users:
|
|
# If nobody has joined then there's nothing to do.
|
|
return
|
|
|
|
# We want to send:
|
|
# 1. presence states of all local users in the room to newly joined
|
|
# remote servers
|
|
# 2. presence states of newly joined users to all remote servers in
|
|
# the room.
|
|
#
|
|
# TODO: Only send presence states to remote hosts that don't already
|
|
# have them (because they already share rooms).
|
|
|
|
# Get all the users who were already in the room, by fetching the
|
|
# current users in the room and removing the newly joined users.
|
|
users = await self.store.get_users_in_room(room_id)
|
|
prev_users = set(users) - newly_joined_users
|
|
|
|
# Construct sets for all the local users and remote hosts that were
|
|
# already in the room
|
|
prev_local_users = []
|
|
prev_remote_hosts = set()
|
|
for user_id in prev_users:
|
|
if self.is_mine_id(user_id):
|
|
prev_local_users.append(user_id)
|
|
else:
|
|
prev_remote_hosts.add(get_domain_from_id(user_id))
|
|
|
|
# Similarly, construct sets for all the local users and remote hosts
|
|
# that were *not* already in the room. Care needs to be taken with the
|
|
# calculating the remote hosts, as a host may have already been in the
|
|
# room even if there is a newly joined user from that host.
|
|
newly_joined_local_users = []
|
|
newly_joined_remote_hosts = set()
|
|
for user_id in newly_joined_users:
|
|
if self.is_mine_id(user_id):
|
|
newly_joined_local_users.append(user_id)
|
|
else:
|
|
host = get_domain_from_id(user_id)
|
|
if host not in prev_remote_hosts:
|
|
newly_joined_remote_hosts.add(host)
|
|
|
|
# Send presence states of all local users in the room to newly joined
|
|
# remote servers. (We actually only send states for local users already
|
|
# in the room, as we'll send states for newly joined local users below.)
|
|
if prev_local_users and newly_joined_remote_hosts:
|
|
local_states = await self.current_state_for_users(prev_local_users)
|
|
|
|
# Filter out old presence, i.e. offline presence states where
|
|
# the user hasn't been active for a week. We can change this
|
|
# depending on what we want the UX to be, but at the least we
|
|
# should filter out offline presence where the state is just the
|
|
# default state.
|
|
now = self.clock.time_msec()
|
|
states = [
|
|
state
|
|
for state in local_states.values()
|
|
if state.state != PresenceState.OFFLINE
|
|
or now - state.last_active_ts < 7 * 24 * 60 * 60 * 1000
|
|
or state.status_msg is not None
|
|
]
|
|
|
|
self._federation_queue.send_presence_to_destinations(
|
|
destinations=newly_joined_remote_hosts,
|
|
states=states,
|
|
)
|
|
|
|
# Send presence states of newly joined users to all remote servers in
|
|
# the room
|
|
if newly_joined_local_users and (
|
|
prev_remote_hosts or newly_joined_remote_hosts
|
|
):
|
|
local_states = await self.current_state_for_users(newly_joined_local_users)
|
|
self._federation_queue.send_presence_to_destinations(
|
|
destinations=prev_remote_hosts | newly_joined_remote_hosts,
|
|
states=list(local_states.values()),
|
|
)
|
|
|
|
|
|
def should_notify(old_state: UserPresenceState, new_state: UserPresenceState) -> bool:
|
|
"""Decides if a presence state change should be sent to interested parties."""
|
|
if old_state == new_state:
|
|
return False
|
|
|
|
if old_state.status_msg != new_state.status_msg:
|
|
notify_reason_counter.labels("status_msg_change").inc()
|
|
return True
|
|
|
|
if old_state.state != new_state.state:
|
|
notify_reason_counter.labels("state_change").inc()
|
|
state_transition_counter.labels(old_state.state, new_state.state).inc()
|
|
return True
|
|
|
|
if old_state.state == PresenceState.ONLINE:
|
|
if new_state.currently_active != old_state.currently_active:
|
|
notify_reason_counter.labels("current_active_change").inc()
|
|
return True
|
|
|
|
if (
|
|
new_state.last_active_ts - old_state.last_active_ts
|
|
> LAST_ACTIVE_GRANULARITY
|
|
):
|
|
# Only notify about last active bumps if we're not currently active
|
|
if not new_state.currently_active:
|
|
notify_reason_counter.labels("last_active_change_online").inc()
|
|
return True
|
|
|
|
elif new_state.last_active_ts - old_state.last_active_ts > LAST_ACTIVE_GRANULARITY:
|
|
# Always notify for a transition where last active gets bumped.
|
|
notify_reason_counter.labels("last_active_change_not_online").inc()
|
|
return True
|
|
|
|
return False
|
|
|
|
|
|
def format_user_presence_state(
|
|
state: UserPresenceState, now: int, include_user_id: bool = True
|
|
) -> JsonDict:
|
|
"""Convert UserPresenceState to a JSON format that can be sent down to clients
|
|
and to other servers.
|
|
|
|
Args:
|
|
state: The user presence state to format.
|
|
now: The current timestamp since the epoch in ms.
|
|
include_user_id: Whether to include `user_id` in the returned dictionary.
|
|
As this function can be used both to format presence updates for client /sync
|
|
responses and for federation /send requests, only the latter needs the include
|
|
the `user_id` field.
|
|
|
|
Returns:
|
|
A JSON dictionary with the following keys:
|
|
* presence: The presence state as a str.
|
|
* user_id: Optional. Included if `include_user_id` is truthy. The canonical
|
|
Matrix ID of the user.
|
|
* last_active_ago: Optional. Included if `last_active_ts` is set on `state`.
|
|
The timestamp that the user was last active.
|
|
* status_msg: Optional. Included if `status_msg` is set on `state`. The user's
|
|
status.
|
|
* currently_active: Optional. Included only if `state.state` is "online".
|
|
|
|
Example:
|
|
|
|
{
|
|
"presence": "online",
|
|
"user_id": "@alice:example.com",
|
|
"last_active_ago": 16783813918,
|
|
"status_msg": "Hello world!",
|
|
"currently_active": True
|
|
}
|
|
"""
|
|
content: JsonDict = {"presence": state.state}
|
|
if include_user_id:
|
|
content["user_id"] = state.user_id
|
|
if state.last_active_ts:
|
|
content["last_active_ago"] = now - state.last_active_ts
|
|
if state.status_msg:
|
|
content["status_msg"] = state.status_msg
|
|
if state.state == PresenceState.ONLINE:
|
|
content["currently_active"] = state.currently_active
|
|
|
|
return content
|
|
|
|
|
|
class PresenceEventSource(EventSource[int, UserPresenceState]):
|
|
def __init__(self, hs: "HomeServer"):
|
|
# We can't call get_presence_handler here because there's a cycle:
|
|
#
|
|
# Presence -> Notifier -> PresenceEventSource -> Presence
|
|
#
|
|
# Same with get_presence_router:
|
|
#
|
|
# AuthHandler -> Notifier -> PresenceEventSource -> ModuleApi -> AuthHandler
|
|
self.get_presence_handler = hs.get_presence_handler
|
|
self.get_presence_router = hs.get_presence_router
|
|
self.clock = hs.get_clock()
|
|
self.store = hs.get_datastore()
|
|
|
|
async def get_new_events(
|
|
self,
|
|
user: UserID,
|
|
from_key: Optional[int],
|
|
limit: Optional[int] = None,
|
|
room_ids: Optional[Collection[str]] = None,
|
|
is_guest: bool = False,
|
|
explicit_room_id: Optional[str] = None,
|
|
include_offline: bool = True,
|
|
service: Optional[ApplicationService] = None,
|
|
) -> Tuple[List[UserPresenceState], int]:
|
|
# The process for getting presence events are:
|
|
# 1. Get the rooms the user is in.
|
|
# 2. Get the list of user in the rooms.
|
|
# 3. Get the list of users that are in the user's presence list.
|
|
# 4. If there is a from_key set, cross reference the list of users
|
|
# with the `presence_stream_cache` to see which ones we actually
|
|
# need to check.
|
|
# 5. Load current state for the users.
|
|
#
|
|
# We don't try and limit the presence updates by the current token, as
|
|
# sending down the rare duplicate is not a concern.
|
|
|
|
user_id = user.to_string()
|
|
stream_change_cache = self.store.presence_stream_cache
|
|
|
|
with Measure(self.clock, "presence.get_new_events"):
|
|
if from_key is not None:
|
|
from_key = int(from_key)
|
|
|
|
# Check if this user should receive all current, online user presence. We only
|
|
# bother to do this if from_key is set, as otherwise the user will receive all
|
|
# user presence anyways.
|
|
if await self.store.should_user_receive_full_presence_with_token(
|
|
user_id, from_key
|
|
):
|
|
# This user has been specified by a module to receive all current, online
|
|
# user presence. Removing from_key and setting include_offline to false
|
|
# will do effectively this.
|
|
from_key = None
|
|
include_offline = False
|
|
|
|
max_token = self.store.get_current_presence_token()
|
|
if from_key == max_token:
|
|
# This is necessary as due to the way stream ID generators work
|
|
# we may get updates that have a stream ID greater than the max
|
|
# token (e.g. max_token is N but stream generator may return
|
|
# results for N+2, due to N+1 not having finished being
|
|
# persisted yet).
|
|
#
|
|
# This is usually fine, as it just means that we may send down
|
|
# some presence updates multiple times. However, we need to be
|
|
# careful that the sync stream either actually does make some
|
|
# progress or doesn't return, otherwise clients will end up
|
|
# tight looping calling /sync due to it immediately returning
|
|
# the same token repeatedly.
|
|
#
|
|
# Hence this guard where we just return nothing so that the sync
|
|
# doesn't return. C.f. #5503.
|
|
return [], max_token
|
|
|
|
# Figure out which other users this user should receive updates for
|
|
users_interested_in = await self._get_interested_in(user, explicit_room_id)
|
|
|
|
# We have a set of users that we're interested in the presence of. We want to
|
|
# cross-reference that with the users that have actually changed their presence.
|
|
|
|
# Check whether this user should see all user updates
|
|
|
|
if users_interested_in == PresenceRouter.ALL_USERS:
|
|
# Provide presence state for all users
|
|
presence_updates = await self._filter_all_presence_updates_for_user(
|
|
user_id, include_offline, from_key
|
|
)
|
|
|
|
return presence_updates, max_token
|
|
|
|
# Make mypy happy. users_interested_in should now be a set
|
|
assert not isinstance(users_interested_in, str)
|
|
|
|
# The set of users that we're interested in and that have had a presence update.
|
|
# We'll actually pull the presence updates for these users at the end.
|
|
interested_and_updated_users: Union[Set[str], FrozenSet[str]] = set()
|
|
|
|
if from_key:
|
|
# First get all users that have had a presence update
|
|
updated_users = stream_change_cache.get_all_entities_changed(from_key)
|
|
|
|
# Cross-reference users we're interested in with those that have had updates.
|
|
# Use a slightly-optimised method for processing smaller sets of updates.
|
|
if updated_users is not None and len(updated_users) < 500:
|
|
# For small deltas, it's quicker to get all changes and then
|
|
# cross-reference with the users we're interested in
|
|
get_updates_counter.labels("stream").inc()
|
|
for other_user_id in updated_users:
|
|
if other_user_id in users_interested_in:
|
|
# mypy thinks this variable could be a FrozenSet as it's possibly set
|
|
# to one in the `get_entities_changed` call below, and `add()` is not
|
|
# method on a FrozenSet. That doesn't affect us here though, as
|
|
# `interested_and_updated_users` is clearly a set() above.
|
|
interested_and_updated_users.add(other_user_id) # type: ignore
|
|
else:
|
|
# Too many possible updates. Find all users we can see and check
|
|
# if any of them have changed.
|
|
get_updates_counter.labels("full").inc()
|
|
|
|
interested_and_updated_users = (
|
|
stream_change_cache.get_entities_changed(
|
|
users_interested_in, from_key
|
|
)
|
|
)
|
|
else:
|
|
# No from_key has been specified. Return the presence for all users
|
|
# this user is interested in
|
|
interested_and_updated_users = users_interested_in
|
|
|
|
# Retrieve the current presence state for each user
|
|
users_to_state = await self.get_presence_handler().current_state_for_users(
|
|
interested_and_updated_users
|
|
)
|
|
presence_updates = list(users_to_state.values())
|
|
|
|
if not include_offline:
|
|
# Filter out offline presence states
|
|
presence_updates = self._filter_offline_presence_state(presence_updates)
|
|
|
|
return presence_updates, max_token
|
|
|
|
async def _filter_all_presence_updates_for_user(
|
|
self,
|
|
user_id: str,
|
|
include_offline: bool,
|
|
from_key: Optional[int] = None,
|
|
) -> List[UserPresenceState]:
|
|
"""
|
|
Computes the presence updates a user should receive.
|
|
|
|
First pulls presence updates from the database. Then consults PresenceRouter
|
|
for whether any updates should be excluded by user ID.
|
|
|
|
Args:
|
|
user_id: The User ID of the user to compute presence updates for.
|
|
include_offline: Whether to include offline presence states from the results.
|
|
from_key: The minimum stream ID of updates to pull from the database
|
|
before filtering.
|
|
|
|
Returns:
|
|
A list of presence states for the given user to receive.
|
|
"""
|
|
if from_key:
|
|
# Only return updates since the last sync
|
|
updated_users = self.store.presence_stream_cache.get_all_entities_changed(
|
|
from_key
|
|
)
|
|
if not updated_users:
|
|
updated_users = []
|
|
|
|
# Get the actual presence update for each change
|
|
users_to_state = await self.get_presence_handler().current_state_for_users(
|
|
updated_users
|
|
)
|
|
presence_updates = list(users_to_state.values())
|
|
|
|
if not include_offline:
|
|
# Filter out offline states
|
|
presence_updates = self._filter_offline_presence_state(presence_updates)
|
|
else:
|
|
users_to_state = await self.store.get_presence_for_all_users(
|
|
include_offline=include_offline
|
|
)
|
|
|
|
presence_updates = list(users_to_state.values())
|
|
|
|
# TODO: This feels wildly inefficient, and it's unfortunate we need to ask the
|
|
# module for information on a number of users when we then only take the info
|
|
# for a single user
|
|
|
|
# Filter through the presence router
|
|
users_to_state_set = await self.get_presence_router().get_users_for_states(
|
|
presence_updates
|
|
)
|
|
|
|
# We only want the mapping for the syncing user
|
|
presence_updates = list(users_to_state_set[user_id])
|
|
|
|
# Return presence information for all users
|
|
return presence_updates
|
|
|
|
def _filter_offline_presence_state(
|
|
self, presence_updates: Iterable[UserPresenceState]
|
|
) -> List[UserPresenceState]:
|
|
"""Given an iterable containing user presence updates, return a list with any offline
|
|
presence states removed.
|
|
|
|
Args:
|
|
presence_updates: Presence states to filter
|
|
|
|
Returns:
|
|
A new list with any offline presence states removed.
|
|
"""
|
|
return [
|
|
update
|
|
for update in presence_updates
|
|
if update.state != PresenceState.OFFLINE
|
|
]
|
|
|
|
def get_current_key(self) -> int:
|
|
return self.store.get_current_presence_token()
|
|
|
|
@cached(num_args=2, cache_context=True)
|
|
async def _get_interested_in(
|
|
self,
|
|
user: UserID,
|
|
explicit_room_id: Optional[str] = None,
|
|
cache_context: Optional[_CacheContext] = None,
|
|
) -> Union[Set[str], str]:
|
|
"""Returns the set of users that the given user should see presence
|
|
updates for.
|
|
|
|
Args:
|
|
user: The user to retrieve presence updates for.
|
|
explicit_room_id: The users that are in the room will be returned.
|
|
|
|
Returns:
|
|
A set of user IDs to return presence updates for, or "ALL" to return all
|
|
known updates.
|
|
"""
|
|
user_id = user.to_string()
|
|
users_interested_in = set()
|
|
users_interested_in.add(user_id) # So that we receive our own presence
|
|
|
|
# cache_context isn't likely to ever be None due to the @cached decorator,
|
|
# but we can't have a non-optional argument after the optional argument
|
|
# explicit_room_id either. Assert cache_context is not None so we can use it
|
|
# without mypy complaining.
|
|
assert cache_context
|
|
|
|
# Check with the presence router whether we should poll additional users for
|
|
# their presence information
|
|
additional_users = await self.get_presence_router().get_interested_users(
|
|
user.to_string()
|
|
)
|
|
if additional_users == PresenceRouter.ALL_USERS:
|
|
# If the module requested that this user see the presence updates of *all*
|
|
# users, then simply return that instead of calculating what rooms this
|
|
# user shares
|
|
return PresenceRouter.ALL_USERS
|
|
|
|
# Add the additional users from the router
|
|
users_interested_in.update(additional_users)
|
|
|
|
# Find the users who share a room with this user
|
|
users_who_share_room = await self.store.get_users_who_share_room_with_user(
|
|
user_id, on_invalidate=cache_context.invalidate
|
|
)
|
|
users_interested_in.update(users_who_share_room)
|
|
|
|
if explicit_room_id:
|
|
user_ids = await self.store.get_users_in_room(
|
|
explicit_room_id, on_invalidate=cache_context.invalidate
|
|
)
|
|
users_interested_in.update(user_ids)
|
|
|
|
return users_interested_in
|
|
|
|
|
|
def handle_timeouts(
|
|
user_states: List[UserPresenceState],
|
|
is_mine_fn: Callable[[str], bool],
|
|
syncing_user_ids: Set[str],
|
|
now: int,
|
|
) -> List[UserPresenceState]:
|
|
"""Checks the presence of users that have timed out and updates as
|
|
appropriate.
|
|
|
|
Args:
|
|
user_states: List of UserPresenceState's to check.
|
|
is_mine_fn: Function that returns if a user_id is ours
|
|
syncing_user_ids: Set of user_ids with active syncs.
|
|
now: Current time in ms.
|
|
|
|
Returns:
|
|
List of UserPresenceState updates
|
|
"""
|
|
changes = {} # Actual changes we need to notify people about
|
|
|
|
for state in user_states:
|
|
is_mine = is_mine_fn(state.user_id)
|
|
|
|
new_state = handle_timeout(state, is_mine, syncing_user_ids, now)
|
|
if new_state:
|
|
changes[state.user_id] = new_state
|
|
|
|
return list(changes.values())
|
|
|
|
|
|
def handle_timeout(
|
|
state: UserPresenceState, is_mine: bool, syncing_user_ids: Set[str], now: int
|
|
) -> Optional[UserPresenceState]:
|
|
"""Checks the presence of the user to see if any of the timers have elapsed
|
|
|
|
Args:
|
|
state
|
|
is_mine: Whether the user is ours
|
|
syncing_user_ids: Set of user_ids with active syncs.
|
|
now: Current time in ms.
|
|
|
|
Returns:
|
|
A UserPresenceState update or None if no update.
|
|
"""
|
|
if state.state == PresenceState.OFFLINE:
|
|
# No timeouts are associated with offline states.
|
|
return None
|
|
|
|
changed = False
|
|
user_id = state.user_id
|
|
|
|
if is_mine:
|
|
if state.state == PresenceState.ONLINE:
|
|
if now - state.last_active_ts > IDLE_TIMER:
|
|
# Currently online, but last activity ages ago so auto
|
|
# idle
|
|
state = state.copy_and_replace(state=PresenceState.UNAVAILABLE)
|
|
changed = True
|
|
elif now - state.last_active_ts > LAST_ACTIVE_GRANULARITY:
|
|
# So that we send down a notification that we've
|
|
# stopped updating.
|
|
changed = True
|
|
|
|
if now - state.last_federation_update_ts > FEDERATION_PING_INTERVAL:
|
|
# Need to send ping to other servers to ensure they don't
|
|
# timeout and set us to offline
|
|
changed = True
|
|
|
|
# If there are have been no sync for a while (and none ongoing),
|
|
# set presence to offline
|
|
if user_id not in syncing_user_ids:
|
|
# If the user has done something recently but hasn't synced,
|
|
# don't set them as offline.
|
|
sync_or_active = max(state.last_user_sync_ts, state.last_active_ts)
|
|
if now - sync_or_active > SYNC_ONLINE_TIMEOUT:
|
|
state = state.copy_and_replace(state=PresenceState.OFFLINE)
|
|
changed = True
|
|
else:
|
|
# We expect to be poked occasionally by the other side.
|
|
# This is to protect against forgetful/buggy servers, so that
|
|
# no one gets stuck online forever.
|
|
if now - state.last_federation_update_ts > FEDERATION_TIMEOUT:
|
|
# The other side seems to have disappeared.
|
|
state = state.copy_and_replace(state=PresenceState.OFFLINE)
|
|
changed = True
|
|
|
|
return state if changed else None
|
|
|
|
|
|
def handle_update(
|
|
prev_state: UserPresenceState,
|
|
new_state: UserPresenceState,
|
|
is_mine: bool,
|
|
wheel_timer: WheelTimer,
|
|
now: int,
|
|
) -> Tuple[UserPresenceState, bool, bool]:
|
|
"""Given a presence update:
|
|
1. Add any appropriate timers.
|
|
2. Check if we should notify anyone.
|
|
|
|
Args:
|
|
prev_state
|
|
new_state
|
|
is_mine: Whether the user is ours
|
|
wheel_timer
|
|
now: Time now in ms
|
|
|
|
Returns:
|
|
3-tuple: `(new_state, persist_and_notify, federation_ping)` where:
|
|
- new_state: is the state to actually persist
|
|
- persist_and_notify: whether to persist and notify people
|
|
- federation_ping: whether we should send a ping over federation
|
|
"""
|
|
user_id = new_state.user_id
|
|
|
|
persist_and_notify = False
|
|
federation_ping = False
|
|
|
|
# If the users are ours then we want to set up a bunch of timers
|
|
# to time things out.
|
|
if is_mine:
|
|
if new_state.state == PresenceState.ONLINE:
|
|
# Idle timer
|
|
wheel_timer.insert(
|
|
now=now, obj=user_id, then=new_state.last_active_ts + IDLE_TIMER
|
|
)
|
|
|
|
active = now - new_state.last_active_ts < LAST_ACTIVE_GRANULARITY
|
|
new_state = new_state.copy_and_replace(currently_active=active)
|
|
|
|
if active:
|
|
wheel_timer.insert(
|
|
now=now,
|
|
obj=user_id,
|
|
then=new_state.last_active_ts + LAST_ACTIVE_GRANULARITY,
|
|
)
|
|
|
|
if new_state.state != PresenceState.OFFLINE:
|
|
# User has stopped syncing
|
|
wheel_timer.insert(
|
|
now=now,
|
|
obj=user_id,
|
|
then=new_state.last_user_sync_ts + SYNC_ONLINE_TIMEOUT,
|
|
)
|
|
|
|
last_federate = new_state.last_federation_update_ts
|
|
if now - last_federate > FEDERATION_PING_INTERVAL:
|
|
# Been a while since we've poked remote servers
|
|
new_state = new_state.copy_and_replace(last_federation_update_ts=now)
|
|
federation_ping = True
|
|
|
|
else:
|
|
wheel_timer.insert(
|
|
now=now,
|
|
obj=user_id,
|
|
then=new_state.last_federation_update_ts + FEDERATION_TIMEOUT,
|
|
)
|
|
|
|
# Check whether the change was something worth notifying about
|
|
if should_notify(prev_state, new_state):
|
|
new_state = new_state.copy_and_replace(last_federation_update_ts=now)
|
|
persist_and_notify = True
|
|
|
|
return new_state, persist_and_notify, federation_ping
|
|
|
|
|
|
async def get_interested_parties(
|
|
store: DataStore, presence_router: PresenceRouter, states: List[UserPresenceState]
|
|
) -> Tuple[Dict[str, List[UserPresenceState]], Dict[str, List[UserPresenceState]]]:
|
|
"""Given a list of states return which entities (rooms, users)
|
|
are interested in the given states.
|
|
|
|
Args:
|
|
store: The homeserver's data store.
|
|
presence_router: A module for augmenting the destinations for presence updates.
|
|
states: A list of incoming user presence updates.
|
|
|
|
Returns:
|
|
A 2-tuple of `(room_ids_to_states, users_to_states)`,
|
|
with each item being a dict of `entity_name` -> `[UserPresenceState]`
|
|
"""
|
|
room_ids_to_states: Dict[str, List[UserPresenceState]] = {}
|
|
users_to_states: Dict[str, List[UserPresenceState]] = {}
|
|
for state in states:
|
|
room_ids = await store.get_rooms_for_user(state.user_id)
|
|
for room_id in room_ids:
|
|
room_ids_to_states.setdefault(room_id, []).append(state)
|
|
|
|
# Always notify self
|
|
users_to_states.setdefault(state.user_id, []).append(state)
|
|
|
|
# Ask a presence routing module for any additional parties if one
|
|
# is loaded.
|
|
router_users_to_states = await presence_router.get_users_for_states(states)
|
|
|
|
# Update the dictionaries with additional destinations and state to send
|
|
for user_id, user_states in router_users_to_states.items():
|
|
users_to_states.setdefault(user_id, []).extend(user_states)
|
|
|
|
return room_ids_to_states, users_to_states
|
|
|
|
|
|
async def get_interested_remotes(
|
|
store: DataStore,
|
|
presence_router: PresenceRouter,
|
|
states: List[UserPresenceState],
|
|
) -> Dict[str, Set[UserPresenceState]]:
|
|
"""Given a list of presence states figure out which remote servers
|
|
should be sent which.
|
|
|
|
All the presence states should be for local users only.
|
|
|
|
Args:
|
|
store: The homeserver's data store.
|
|
presence_router: A module for augmenting the destinations for presence updates.
|
|
states: A list of incoming user presence updates.
|
|
|
|
Returns:
|
|
A map from destinations to presence states to send to that destination.
|
|
"""
|
|
hosts_and_states: Dict[str, Set[UserPresenceState]] = {}
|
|
|
|
# First we look up the rooms each user is in (as well as any explicit
|
|
# subscriptions), then for each distinct room we look up the remote
|
|
# hosts in those rooms.
|
|
room_ids_to_states, users_to_states = await get_interested_parties(
|
|
store, presence_router, states
|
|
)
|
|
|
|
for room_id, states in room_ids_to_states.items():
|
|
user_ids = await store.get_users_in_room(room_id)
|
|
hosts = {get_domain_from_id(user_id) for user_id in user_ids}
|
|
for host in hosts:
|
|
hosts_and_states.setdefault(host, set()).update(states)
|
|
|
|
for user_id, states in users_to_states.items():
|
|
host = get_domain_from_id(user_id)
|
|
hosts_and_states.setdefault(host, set()).update(states)
|
|
|
|
return hosts_and_states
|
|
|
|
|
|
class PresenceFederationQueue:
|
|
"""Handles sending ad hoc presence updates over federation, which are *not*
|
|
due to state updates (that get handled via the presence stream), e.g.
|
|
federation pings and sending existing present states to newly joined hosts.
|
|
|
|
Only the last N minutes will be queued, so if a federation sender instance
|
|
is down for longer then some updates will be dropped. This is OK as presence
|
|
is ephemeral, and so it will self correct eventually.
|
|
|
|
On workers the class tracks the last received position of the stream from
|
|
replication, and handles querying for missed updates over HTTP replication,
|
|
c.f. `get_current_token` and `get_replication_rows`.
|
|
"""
|
|
|
|
# How long to keep entries in the queue for. Workers that are down for
|
|
# longer than this duration will miss out on older updates.
|
|
_KEEP_ITEMS_IN_QUEUE_FOR_MS = 5 * 60 * 1000
|
|
|
|
# How often to check if we can expire entries from the queue.
|
|
_CLEAR_ITEMS_EVERY_MS = 60 * 1000
|
|
|
|
def __init__(self, hs: "HomeServer", presence_handler: BasePresenceHandler):
|
|
self._clock = hs.get_clock()
|
|
self._notifier = hs.get_notifier()
|
|
self._instance_name = hs.get_instance_name()
|
|
self._presence_handler = presence_handler
|
|
self._repl_client = ReplicationGetStreamUpdates.make_client(hs)
|
|
|
|
# Should we keep a queue of recent presence updates? We only bother if
|
|
# another process may be handling federation sending.
|
|
self._queue_presence_updates = True
|
|
|
|
# Whether this instance is a presence writer.
|
|
self._presence_writer = self._instance_name in hs.config.worker.writers.presence
|
|
|
|
# The FederationSender instance, if this process sends federation traffic directly.
|
|
self._federation = None
|
|
|
|
if hs.should_send_federation():
|
|
self._federation = hs.get_federation_sender()
|
|
|
|
# We don't bother queuing up presence states if only this instance
|
|
# is sending federation.
|
|
if hs.config.worker.federation_shard_config.instances == [
|
|
self._instance_name
|
|
]:
|
|
self._queue_presence_updates = False
|
|
|
|
# The queue of recently queued updates as tuples of: `(timestamp,
|
|
# stream_id, destinations, user_ids)`. We don't store the full states
|
|
# for efficiency, and remote workers will already have the full states
|
|
# cached.
|
|
self._queue: List[Tuple[int, int, Collection[str], Set[str]]] = []
|
|
|
|
self._next_id = 1
|
|
|
|
# Map from instance name to current token
|
|
self._current_tokens: Dict[str, int] = {}
|
|
|
|
if self._queue_presence_updates:
|
|
self._clock.looping_call(self._clear_queue, self._CLEAR_ITEMS_EVERY_MS)
|
|
|
|
def _clear_queue(self) -> None:
|
|
"""Clear out older entries from the queue."""
|
|
clear_before = self._clock.time_msec() - self._KEEP_ITEMS_IN_QUEUE_FOR_MS
|
|
|
|
# The queue is sorted by timestamp, so we can bisect to find the right
|
|
# place to purge before. Note that we are searching using a 1-tuple with
|
|
# the time, which does The Right Thing since the queue is a tuple where
|
|
# the first item is a timestamp.
|
|
index = bisect(self._queue, (clear_before,))
|
|
self._queue = self._queue[index:]
|
|
|
|
def send_presence_to_destinations(
|
|
self, states: Collection[UserPresenceState], destinations: Collection[str]
|
|
) -> None:
|
|
"""Send the presence states to the given destinations.
|
|
|
|
Will forward to the local federation sender (if there is one) and queue
|
|
to send over replication (if there are other federation sender instances.).
|
|
|
|
Must only be called on the presence writer process.
|
|
"""
|
|
|
|
# This should only be called on a presence writer.
|
|
assert self._presence_writer
|
|
|
|
if self._federation:
|
|
self._federation.send_presence_to_destinations(
|
|
states=states,
|
|
destinations=destinations,
|
|
)
|
|
|
|
if not self._queue_presence_updates:
|
|
return
|
|
|
|
now = self._clock.time_msec()
|
|
|
|
stream_id = self._next_id
|
|
self._next_id += 1
|
|
|
|
self._queue.append((now, stream_id, destinations, {s.user_id for s in states}))
|
|
|
|
self._notifier.notify_replication()
|
|
|
|
def get_current_token(self, instance_name: str) -> int:
|
|
"""Get the current position of the stream.
|
|
|
|
On workers this returns the last stream ID received from replication.
|
|
"""
|
|
if instance_name == self._instance_name:
|
|
return self._next_id - 1
|
|
else:
|
|
return self._current_tokens.get(instance_name, 0)
|
|
|
|
async def get_replication_rows(
|
|
self,
|
|
instance_name: str,
|
|
from_token: int,
|
|
upto_token: int,
|
|
target_row_count: int,
|
|
) -> Tuple[List[Tuple[int, Tuple[str, str]]], int, bool]:
|
|
"""Get all the updates between the two tokens.
|
|
|
|
We return rows in the form of `(destination, user_id)` to keep the size
|
|
of each row bounded (rather than returning the sets in a row).
|
|
|
|
On workers this will query the presence writer process via HTTP replication.
|
|
"""
|
|
if instance_name != self._instance_name:
|
|
# If not local we query over http replication from the presence
|
|
# writer
|
|
result = await self._repl_client(
|
|
instance_name=instance_name,
|
|
stream_name=PresenceFederationStream.NAME,
|
|
from_token=from_token,
|
|
upto_token=upto_token,
|
|
)
|
|
return result["updates"], result["upto_token"], result["limited"]
|
|
|
|
# If the from_token is the current token then there's nothing to return
|
|
# and we can trivially no-op.
|
|
if from_token == self._next_id - 1:
|
|
return [], upto_token, False
|
|
|
|
# We can find the correct position in the queue by noting that there is
|
|
# exactly one entry per stream ID, and that the last entry has an ID of
|
|
# `self._next_id - 1`, so we can count backwards from the end.
|
|
#
|
|
# Since we are returning all states in the range `from_token < stream_id
|
|
# <= upto_token` we look for the index with a `stream_id` of `from_token
|
|
# + 1`.
|
|
#
|
|
# Since the start of the queue is periodically truncated we need to
|
|
# handle the case where `from_token` stream ID has already been dropped.
|
|
start_idx = max(from_token + 1 - self._next_id, -len(self._queue))
|
|
|
|
to_send: List[Tuple[int, Tuple[str, str]]] = []
|
|
limited = False
|
|
new_id = upto_token
|
|
for _, stream_id, destinations, user_ids in self._queue[start_idx:]:
|
|
if stream_id <= from_token:
|
|
# Paranoia check that we are actually only sending states that
|
|
# are have stream_id strictly greater than from_token. We should
|
|
# never hit this.
|
|
logger.warning(
|
|
"Tried returning presence federation stream ID: %d less than from_token: %d (next_id: %d, len: %d)",
|
|
stream_id,
|
|
from_token,
|
|
self._next_id,
|
|
len(self._queue),
|
|
)
|
|
continue
|
|
|
|
if stream_id > upto_token:
|
|
break
|
|
|
|
new_id = stream_id
|
|
|
|
to_send.extend(
|
|
(stream_id, (destination, user_id))
|
|
for destination in destinations
|
|
for user_id in user_ids
|
|
)
|
|
|
|
if len(to_send) > target_row_count:
|
|
limited = True
|
|
break
|
|
|
|
return to_send, new_id, limited
|
|
|
|
async def process_replication_rows(
|
|
self, stream_name: str, instance_name: str, token: int, rows: list
|
|
) -> None:
|
|
if stream_name != PresenceFederationStream.NAME:
|
|
return
|
|
|
|
# We keep track of the current tokens (so that we can catch up with anything we missed after a disconnect)
|
|
self._current_tokens[instance_name] = token
|
|
|
|
# If we're a federation sender we pull out the presence states to send
|
|
# and forward them on.
|
|
if not self._federation:
|
|
return
|
|
|
|
hosts_to_users: Dict[str, Set[str]] = {}
|
|
for row in rows:
|
|
hosts_to_users.setdefault(row.destination, set()).add(row.user_id)
|
|
|
|
for host, user_ids in hosts_to_users.items():
|
|
states = await self._presence_handler.current_state_for_users(user_ids)
|
|
self._federation.send_presence_to_destinations(
|
|
states=states.values(),
|
|
destinations=[host],
|
|
)
|