# Copyright 2014-2016 OpenMarket Ltd # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. import json import logging import re import typing from typing import Any, Callable, Dict, Generator, Pattern import attr from frozendict import frozendict from twisted.internet import defer, task from twisted.internet.defer import Deferred from twisted.internet.interfaces import IDelayedCall, IReactorTime from twisted.internet.task import LoopingCall from twisted.python.failure import Failure from synapse.logging import context if typing.TYPE_CHECKING: pass logger = logging.getLogger(__name__) _WILDCARD_RUN = re.compile(r"([\?\*]+)") def _reject_invalid_json(val: Any) -> None: """Do not allow Infinity, -Infinity, or NaN values in JSON.""" raise ValueError("Invalid JSON value: '%s'" % val) def _handle_frozendict(obj: Any) -> Dict[Any, Any]: """Helper for json_encoder. Makes frozendicts serializable by returning the underlying dict """ if type(obj) is frozendict: # fishing the protected dict out of the object is a bit nasty, # but we don't really want the overhead of copying the dict. return obj._dict raise TypeError( "Object of type %s is not JSON serializable" % obj.__class__.__name__ ) # A custom JSON encoder which: # * handles frozendicts # * produces valid JSON (no NaNs etc) # * reduces redundant whitespace json_encoder = json.JSONEncoder( allow_nan=False, separators=(",", ":"), default=_handle_frozendict ) # Create a custom decoder to reject Python extensions to JSON. json_decoder = json.JSONDecoder(parse_constant=_reject_invalid_json) def unwrapFirstError(failure: Failure) -> Failure: # defer.gatherResults and DeferredLists wrap failures. failure.trap(defer.FirstError) return failure.value.subFailure # type: ignore[union-attr] # Issue in Twisted's annotations @attr.s(slots=True) class Clock: """ A Clock wraps a Twisted reactor and provides utilities on top of it. Args: reactor: The Twisted reactor to use. """ _reactor: IReactorTime = attr.ib() @defer.inlineCallbacks # type: ignore[arg-type] # Issue in Twisted's type annotations def sleep(self, seconds: float) -> "Generator[Deferred[float], Any, Any]": d: defer.Deferred[float] = defer.Deferred() with context.PreserveLoggingContext(): self._reactor.callLater(seconds, d.callback, seconds) res = yield d return res def time(self) -> float: """Returns the current system time in seconds since epoch.""" return self._reactor.seconds() def time_msec(self) -> int: """Returns the current system time in milliseconds since epoch.""" return int(self.time() * 1000) def looping_call(self, f: Callable, msec: float, *args, **kwargs) -> LoopingCall: """Call a function repeatedly. Waits `msec` initially before calling `f` for the first time. Note that the function will be called with no logcontext, so if it is anything other than trivial, you probably want to wrap it in run_as_background_process. Args: f: The function to call repeatedly. msec: How long to wait between calls in milliseconds. *args: Postional arguments to pass to function. **kwargs: Key arguments to pass to function. """ call = task.LoopingCall(f, *args, **kwargs) call.clock = self._reactor d = call.start(msec / 1000.0, now=False) d.addErrback(log_failure, "Looping call died", consumeErrors=False) return call def call_later(self, delay, callback, *args, **kwargs) -> IDelayedCall: """Call something later Note that the function will be called with no logcontext, so if it is anything other than trivial, you probably want to wrap it in run_as_background_process. Args: delay(float): How long to wait in seconds. callback(function): Function to call *args: Postional arguments to pass to function. **kwargs: Key arguments to pass to function. """ def wrapped_callback(*args, **kwargs): with context.PreserveLoggingContext(): callback(*args, **kwargs) with context.PreserveLoggingContext(): return self._reactor.callLater(delay, wrapped_callback, *args, **kwargs) def cancel_call_later(self, timer: IDelayedCall, ignore_errs: bool = False) -> None: try: timer.cancel() except Exception: if not ignore_errs: raise def log_failure(failure, msg, consumeErrors=True): """Creates a function suitable for passing to `Deferred.addErrback` that logs any failures that occur. Args: msg (str): Message to log consumeErrors (bool): If true consumes the failure, otherwise passes on down the callback chain Returns: func(Failure) """ logger.error( msg, exc_info=(failure.type, failure.value, failure.getTracebackObject()) ) if not consumeErrors: return failure def glob_to_regex(glob: str, word_boundary: bool = False) -> Pattern: """Converts a glob to a compiled regex object. Args: glob: pattern to match word_boundary: If True, the pattern will be allowed to match at word boundaries anywhere in the string. Otherwise, the pattern is anchored at the start and end of the string. Returns: compiled regex pattern """ # Patterns with wildcards must be simplified to avoid performance cliffs # - The glob `?**?**?` is equivalent to the glob `???*` # - The glob `???*` is equivalent to the regex `.{3,}` chunks = [] for chunk in _WILDCARD_RUN.split(glob): # No wildcards? re.escape() if not _WILDCARD_RUN.match(chunk): chunks.append(re.escape(chunk)) continue # Wildcards? Simplify. qmarks = chunk.count("?") if "*" in chunk: chunks.append(".{%d,}" % qmarks) else: chunks.append(".{%d}" % qmarks) res = "".join(chunks) if word_boundary: res = re_word_boundary(res) else: # \A anchors at start of string, \Z at end of string res = r"\A" + res + r"\Z" return re.compile(res, re.IGNORECASE) def re_word_boundary(r: str) -> str: """ Adds word boundary characters to the start and end of an expression to require that the match occur as a whole word, but do so respecting the fact that strings starting or ending with non-word characters will change word boundaries. """ # we can't use \b as it chokes on unicode. however \W seems to be okay # as shorthand for [^0-9A-Za-z_]. return r"(^|\W)%s(\W|$)" % (r,)