2016-01-07 05:26:29 +01:00
|
|
|
# Copyright 2014-2016 OpenMarket Ltd
|
2014-08-12 16:10:52 +02:00
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
|
|
|
|
2020-09-08 13:33:48 +02:00
|
|
|
import json
|
2015-02-11 17:48:05 +01:00
|
|
|
import logging
|
2018-10-17 17:14:04 +02:00
|
|
|
import re
|
2021-05-11 11:47:23 +02:00
|
|
|
from typing import Pattern
|
2018-04-29 13:54:38 +02:00
|
|
|
|
2018-06-22 10:37:10 +02:00
|
|
|
import attr
|
2020-10-28 16:51:15 +01:00
|
|
|
from frozendict import frozendict
|
2018-07-09 08:09:20 +02:00
|
|
|
|
2018-06-22 10:37:10 +02:00
|
|
|
from twisted.internet import defer, task
|
|
|
|
|
2019-07-04 18:32:02 +02:00
|
|
|
from synapse.logging import context
|
2018-06-22 10:37:10 +02:00
|
|
|
|
2015-02-11 17:48:05 +01:00
|
|
|
logger = logging.getLogger(__name__)


# Matches a run of one or more glob wildcard characters (`?` and/or `*`).
# The pattern is wrapped in a capturing group so that `_WILDCARD_RUN.split()`
# keeps the wildcard runs in its result, interleaved with the literal text
# found between them.
_WILDCARD_RUN = re.compile(r"([\?\*]+)")
|
|
|
|
|
|
|
|
|
2020-08-19 13:26:03 +02:00
|
|
|
def _reject_invalid_json(val):
|
|
|
|
"""Do not allow Infinity, -Infinity, or NaN values in JSON."""
|
2020-09-10 20:55:25 +02:00
|
|
|
raise ValueError("Invalid JSON value: '%s'" % val)
|
2020-08-19 13:26:03 +02:00
|
|
|
|
|
|
|
|
2020-10-28 16:51:15 +01:00
|
|
|
def _handle_frozendict(obj):
    """Helper for json_encoder. Makes frozendicts serializable by returning
    a plain dict with the same contents.

    Args:
        obj: the object the JSON encoder could not serialize by itself.

    Returns:
        A dict holding the frozendict's items. Where the frozendict exposes
        its backing dict this is that very dict (no copy is made); otherwise
        it is a fresh copy.

    Raises:
        TypeError: if `obj` is not exactly a `frozendict`.
    """
    if type(obj) is frozendict:
        try:
            # fishing the protected dict out of the object is a bit nasty,
            # but we don't really want the overhead of copying the dict.
            return obj._dict
        except AttributeError:
            # Not every frozendict implementation keeps its data in a
            # `_dict` attribute (the C implementation does not), so fall
            # back to copying the mapping rather than failing to encode.
            return dict(obj)
    raise TypeError(
        "Object of type %s is not JSON serializable" % obj.__class__.__name__
    )
|
|
|
|
|
|
|
|
|
|
|
|
# A custom JSON encoder which:
#   * handles frozendicts (via the `default` hook, `_handle_frozendict`)
#   * produces valid JSON (no NaNs etc): `allow_nan=False` makes the encoder
#     raise rather than emit NaN/Infinity
#   * reduces redundant whitespace: the separators carry no trailing spaces
json_encoder = json.JSONEncoder(
    allow_nan=False, separators=(",", ":"), default=_handle_frozendict
)
|
2020-08-19 13:26:03 +02:00
|
|
|
|
|
|
|
# Create a custom decoder to reject Python extensions to JSON.
#
# `parse_constant` is the hook the decoder calls when it meets `NaN`,
# `Infinity` or `-Infinity`; `_reject_invalid_json` raises for all of them.
json_decoder = json.JSONDecoder(parse_constant=_reject_invalid_json)
|
2020-08-07 14:02:55 +02:00
|
|
|
|
2014-08-12 16:10:52 +02:00
|
|
|
|
2015-05-12 14:14:29 +02:00
|
|
|
def unwrapFirstError(failure):
    """Errback which extracts the underlying failure from a `FirstError`.

    defer.gatherResults and DeferredLists wrap failures in a
    `defer.FirstError`; this unwraps them again.

    Args:
        failure: the failure passed to the errback.

    Returns:
        The `subFailure` carried by the `FirstError`. Any failure which is
        not a `FirstError` is re-raised by `failure.trap`.
    """
    failure.trap(defer.FirstError)
    first_error = failure.value
    return first_error.subFailure
|
|
|
|
|
|
|
|
|
2020-09-14 18:50:06 +02:00
|
|
|
@attr.s(slots=True)
class Clock:
    """
    A Clock wraps a Twisted reactor and provides time and scheduling
    utilities on top of it.

    Args:
        reactor: The Twisted reactor to use.
    """

    _reactor = attr.ib()

    @defer.inlineCallbacks
    def sleep(self, seconds):
        """Wait for the given number of seconds.

        Args:
            seconds: How long to wait, in seconds.

        Returns:
            A Deferred which fires, with the value `seconds`, once the
            reactor's timer has gone off.
        """
        wakeup = defer.Deferred()
        with context.PreserveLoggingContext():
            self._reactor.callLater(seconds, wakeup.callback, seconds)
            result = yield wakeup
        return result

    def time(self):
        """Returns the current system time in seconds since epoch."""
        now = self._reactor.seconds()
        return now

    def time_msec(self):
        """Returns the current system time in milliseconds since epoch."""
        seconds = self.time()
        return int(seconds * 1000)

    def looping_call(self, f, msec, *args, **kwargs):
        """Call a function repeatedly.

        Waits `msec` initially before calling `f` for the first time.

        Note that the function will be called with no logcontext, so if it is
        anything other than trivial, you probably want to wrap it in
        run_as_background_process.

        Args:
            f(function): The function to call repeatedly.
            msec(float): How long to wait between calls in milliseconds.
            *args: Positional arguments to pass to function.
            **kwargs: Keyword arguments to pass to function.

        Returns:
            The `task.LoopingCall` which was started.
        """
        looper = task.LoopingCall(f, *args, **kwargs)
        # Drive the loop from our reactor rather than the default one.
        looper.clock = self._reactor
        # now=False: do not run `f` immediately, wait one interval first.
        finished = looper.start(msec / 1000.0, now=False)
        # Log the failure if the loop dies, but leave it in the Deferred.
        finished.addErrback(log_failure, "Looping call died", consumeErrors=False)
        return looper

    def call_later(self, delay, callback, *args, **kwargs):
        """Call something later

        Note that the function will be called with no logcontext, so if it is
        anything other than trivial, you probably want to wrap it in
        run_as_background_process.

        Args:
            delay(float): How long to wait in seconds.
            callback(function): Function to call
            *args: Positional arguments to pass to function.
            **kwargs: Keyword arguments to pass to function.

        Returns:
            Whatever the reactor's `callLater` returns; it can be handed to
            `cancel_call_later`.
        """

        def run_without_logcontext(*cb_args, **cb_kwargs):
            with context.PreserveLoggingContext():
                callback(*cb_args, **cb_kwargs)

        with context.PreserveLoggingContext():
            return self._reactor.callLater(
                delay, run_without_logcontext, *args, **kwargs
            )

    def cancel_call_later(self, timer, ignore_errs=False):
        """Cancel a timer previously returned by `call_later`.

        Args:
            timer: The object to cancel; its `cancel()` method is called.
            ignore_errs (bool): If true, any exception raised by `cancel()`
                is swallowed; otherwise it propagates to the caller.
        """
        try:
            timer.cancel()
        except Exception:
            if ignore_errs:
                return
            raise
|
2018-04-29 13:54:38 +02:00
|
|
|
|
|
|
|
|
2018-10-08 15:06:19 +02:00
|
|
|
def log_failure(failure, msg, consumeErrors=True):
    """Logs a failure at error level, including its traceback.

    Suitable for passing to `Deferred.addErrback` with `msg` (and optionally
    `consumeErrors`) supplied as extra errback arguments.

    Args:
        failure (Failure): The failure to log.
        msg (str): Message to log
        consumeErrors (bool): If true consumes the failure, otherwise passes
            on down the callback chain

    Returns:
        None if `consumeErrors` is true, otherwise the `failure` that was
        passed in.
    """
    exc_info = (failure.type, failure.value, failure.getTracebackObject())
    logger.error(msg, exc_info=exc_info)

    if consumeErrors:
        return None
    return failure
|
2018-10-17 17:14:04 +02:00
|
|
|
|
|
|
|
|
2021-05-11 11:47:23 +02:00
|
|
|
def glob_to_regex(glob: str, word_boundary: bool = False) -> Pattern:
    """Converts a glob to a compiled, case-insensitive regex object.

    Args:
        glob: pattern to match
        word_boundary: If True, the pattern will be allowed to match at word
            boundaries anywhere in the string. Otherwise, the pattern is
            anchored at the start and end of the string.

    Returns:
        compiled regex pattern
    """
    # Runs of wildcards are collapsed into a single quantifier to avoid
    # performance cliffs:
    # - The glob `?**?**?` is equivalent to the glob `???*`
    # - The glob `???*` is equivalent to the regex `.{3,}`
    pieces = []
    for part in _WILDCARD_RUN.split(glob):
        if _WILDCARD_RUN.match(part):
            # A wildcard run: each `?` requires one character, and any `*`
            # makes the upper bound open-ended.
            min_chars = part.count("?")
            quantifier = ".{%d,}" if "*" in part else ".{%d}"
            pieces.append(quantifier % min_chars)
        else:
            # Literal text: match it verbatim.
            pieces.append(re.escape(part))

    body = "".join(pieces)

    if not word_boundary:
        # \A anchors at start of string, \Z at end of string
        return re.compile(r"\A" + body + r"\Z", re.IGNORECASE)

    return re.compile(re_word_boundary(body), re.IGNORECASE)
|
|
|
|
|
|
|
|
|
|
|
|
def re_word_boundary(r: str) -> str:
    """
    Wraps a regex so that it only matches as a whole word.

    The expression must be preceded by either the start of the input or a
    non-word character, and followed by either a non-word character or the
    end of the input. This respects the fact that strings starting or ending
    with non-word characters will change word boundaries.

    Args:
        r: the regex source to wrap.

    Returns:
        The wrapped regex source.
    """
    # we can't use \b as it chokes on unicode. however \W seems to be okay
    # as shorthand for [^0-9A-Za-z_].
    return rf"(^|\W){r}(\W|$)"
|