2016-01-06 23:26:29 -05:00
|
|
|
# Copyright 2014-2016 OpenMarket Ltd
|
2014-08-12 10:10:52 -04:00
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
|
|
|
|
2020-09-08 07:33:48 -04:00
|
|
|
import json
|
2015-02-11 11:48:05 -05:00
|
|
|
import logging
|
2018-10-17 11:14:04 -04:00
|
|
|
import re
|
2021-09-10 12:03:18 -04:00
|
|
|
import typing
|
2021-11-12 08:43:06 -05:00
|
|
|
from typing import Any, Callable, Dict, Generator, Optional, Pattern
|
2018-04-29 07:54:38 -04:00
|
|
|
|
2018-06-22 04:37:10 -04:00
|
|
|
import attr
|
2020-10-28 11:51:15 -04:00
|
|
|
from frozendict import frozendict
|
2018-07-09 02:09:20 -04:00
|
|
|
|
2018-06-22 04:37:10 -04:00
|
|
|
from twisted.internet import defer, task
|
2021-09-10 12:03:18 -04:00
|
|
|
from twisted.internet.defer import Deferred
|
|
|
|
from twisted.internet.interfaces import IDelayedCall, IReactorTime
|
|
|
|
from twisted.internet.task import LoopingCall
|
|
|
|
from twisted.python.failure import Failure
|
2018-06-22 04:37:10 -04:00
|
|
|
|
2019-07-04 12:32:02 -04:00
|
|
|
from synapse.logging import context
|
2018-06-22 04:37:10 -04:00
|
|
|
|
2021-09-10 12:03:18 -04:00
|
|
|
if typing.TYPE_CHECKING:
|
|
|
|
pass
|
|
|
|
|
2015-02-11 11:48:05 -05:00
|
|
|
logger = logging.getLogger(__name__)
|
2014-08-12 10:10:52 -04:00
|
|
|
|
2020-08-19 07:26:03 -04:00
|
|
|
|
2021-05-11 05:47:23 -04:00
|
|
|
# Matches a run of one or more consecutive glob wildcard characters (`?` and/or
# `*`). The group is capturing so that `_WILDCARD_RUN.split(...)` keeps each
# wildcard run in its result, interleaved with the literal text around it.
_WILDCARD_RUN = re.compile(r"([\?\*]+)")
|
|
|
|
|
|
|
|
|
2021-09-10 12:03:18 -04:00
|
|
|
def _reject_invalid_json(val: Any) -> None:
    """Do not allow Infinity, -Infinity, or NaN values in JSON.

    Intended for use as the `parse_constant` hook of a `json.JSONDecoder`:
    it unconditionally rejects whatever value it is handed.

    Args:
        val: The offending constant (or any other value) to report.

    Raises:
        ValueError: always, with the rejected value included in the message.
    """
    # Wrap `val` in a 1-tuple so that a tuple argument is formatted as a single
    # value rather than being unpacked as multiple format arguments (which
    # would raise a TypeError instead of the intended ValueError).
    raise ValueError("Invalid JSON value: '%s'" % (val,))
|
2020-08-19 07:26:03 -04:00
|
|
|
|
|
|
|
|
2021-09-10 12:03:18 -04:00
|
|
|
def _handle_frozendict(obj: Any) -> Dict[Any, Any]:
    """Fallback serialiser for json_encoder that makes frozendicts encodable.

    Args:
        obj: The object the JSON encoder could not serialise by itself.

    Returns:
        A plain dict with the frozendict's contents: the frozendict's own
        `_dict` attribute when it exists, otherwise a copy.

    Raises:
        TypeError: if `obj` is not exactly of type frozendict.
    """
    if type(obj) is not frozendict:
        raise TypeError(
            "Object of type %s is not JSON serializable" % obj.__class__.__name__
        )

    # Reaching into the object for its protected dict is a bit nasty, but it
    # avoids the overhead of copying the dict.
    try:
        # Safety: the AttributeError is caught immediately below.
        # See https://github.com/matrix-org/python-canonicaljson/issues/36#issuecomment-927816293
        # for discussion on how frozendict's internals have changed over time.
        return obj._dict  # type: ignore[attr-defined]
    except AttributeError:
        # With the C implementation of frozendict there is no `_dict`
        # attribute holding a dict, so fall back to copying the frozendict.
        return dict(obj)
|
|
|
|
|
|
|
|
|
|
|
|
# A custom JSON encoder which:
#   * handles frozendicts
#   * produces valid JSON (no NaNs etc)
#   * reduces redundant whitespace
#
# How each argument achieves that:
#   * `default=_handle_frozendict` is the hook the encoder calls for objects it
#     cannot serialise natively.
#   * `allow_nan=False` makes the encoder raise rather than emit NaN/Infinity.
#   * `separators=(",", ":")` drops the spaces after item and key separators.
json_encoder = json.JSONEncoder(
    allow_nan=False, separators=(",", ":"), default=_handle_frozendict
)
|
2020-08-19 07:26:03 -04:00
|
|
|
|
|
|
|
# Create a custom decoder to reject Python extensions to JSON.
# The stdlib decoder calls `parse_constant` for the non-standard literals
# `NaN`, `Infinity` and `-Infinity`; pointing it at `_reject_invalid_json`
# (which always raises ValueError) turns those into decoding errors.
json_decoder = json.JSONDecoder(parse_constant=_reject_invalid_json)
|
2020-08-07 08:02:55 -04:00
|
|
|
|
2014-08-12 10:10:52 -04:00
|
|
|
|
2021-09-10 12:03:18 -04:00
|
|
|
def unwrapFirstError(failure: Failure) -> Failure:
    """Unwrap the underlying failure from a `defer.FirstError`.

    defer.gatherResults and DeferredLists wrap failures in a FirstError; this
    helper digs the original failure back out.

    Args:
        failure: A Failure expected to wrap a `defer.FirstError`. Anything else
            is handed to `Failure.trap`, which per Twisted's API re-raises it.

    Returns:
        The `subFailure` carried by the FirstError.
    """
    failure.trap(defer.FirstError)
    first_error = failure.value
    return first_error.subFailure  # type: ignore[union-attr]  # Issue in Twisted's annotations
|
2015-05-12 08:14:29 -04:00
|
|
|
|
|
|
|
|
2020-09-14 12:50:06 -04:00
|
|
|
@attr.s(slots=True)
class Clock:
    """
    Convenience wrapper around a Twisted reactor's time-related facilities.

    Args:
        reactor: The Twisted reactor to use.
    """

    _reactor: IReactorTime = attr.ib()

    @defer.inlineCallbacks  # type: ignore[arg-type]  # Issue in Twisted's type annotations
    def sleep(self, seconds: float) -> "Generator[Deferred[float], Any, Any]":
        """Wait for `seconds` seconds.

        Args:
            seconds: How long to wait, in seconds.

        Returns:
            (via the inlineCallbacks Deferred) the value of `seconds`, which is
            what the reactor fires the internal Deferred with.
        """
        wakeup: defer.Deferred[float] = defer.Deferred()
        # Both the scheduling and the wait happen inside PreserveLoggingContext.
        with context.PreserveLoggingContext():
            self._reactor.callLater(seconds, wakeup.callback, seconds)
            slept_for = yield wakeup
        return slept_for

    def time(self) -> float:
        """Returns the current time in seconds, as reported by the reactor."""
        return self._reactor.seconds()

    def time_msec(self) -> int:
        """Returns the current time in milliseconds, truncated to an int."""
        now_seconds = self.time()
        return int(now_seconds * 1000)

    def looping_call(
        self, f: Callable, msec: float, *args: Any, **kwargs: Any
    ) -> LoopingCall:
        """Call a function repeatedly.

        Waits `msec` initially before calling `f` for the first time.

        Note that the function will be called with no logcontext, so if it is anything
        other than trivial, you probably want to wrap it in run_as_background_process.

        Args:
            f: The function to call repeatedly.
            msec: How long to wait between calls in milliseconds.
            *args: Positional arguments to pass to function.
            **kwargs: Keyword arguments to pass to function.

        Returns:
            The started LoopingCall.
        """
        looper = task.LoopingCall(f, *args, **kwargs)
        # Drive the loop from our reactor rather than LoopingCall's default.
        looper.clock = self._reactor
        # LoopingCall works in seconds; now=False defers the first invocation
        # until one interval has passed.
        finished = looper.start(msec / 1000.0, now=False)
        # Log if the loop dies, but pass the failure on down the chain.
        finished.addErrback(log_failure, "Looping call died", consumeErrors=False)
        return looper

    def call_later(
        self, delay: float, callback: Callable, *args: Any, **kwargs: Any
    ) -> IDelayedCall:
        """Call something later

        Note that the function will be called with no logcontext, so if it is anything
        other than trivial, you probably want to wrap it in run_as_background_process.

        Args:
            delay: How long to wait in seconds.
            callback: Function to call
            *args: Positional arguments to pass to function.
            **kwargs: Keyword arguments to pass to function.

        Returns:
            The reactor's handle for the scheduled call.
        """

        def wrapped_callback(*cb_args: Any, **cb_kwargs: Any) -> None:
            # Invoke the real callback inside PreserveLoggingContext.
            with context.PreserveLoggingContext():
                callback(*cb_args, **cb_kwargs)

        with context.PreserveLoggingContext():
            return self._reactor.callLater(delay, wrapped_callback, *args, **kwargs)

    def cancel_call_later(self, timer: IDelayedCall, ignore_errs: bool = False) -> None:
        """Cancel a call previously scheduled on the reactor.

        Args:
            timer: The delayed call to cancel.
            ignore_errs: If true, any Exception raised while cancelling is
                swallowed; otherwise it propagates to the caller.
        """
        try:
            timer.cancel()
        except Exception:
            if ignore_errs:
                return
            raise
|
2018-04-29 07:54:38 -04:00
|
|
|
|
|
|
|
|
2021-11-12 08:43:06 -05:00
|
|
|
def log_failure(
    failure: Failure, msg: str, consumeErrors: bool = True
) -> Optional[Failure]:
    """Errback that logs a failure, suitable for `Deferred.addErrback`.

    Args:
        failure: The Failure to log
        msg: Message to log
        consumeErrors: If true consumes the failure, otherwise passes on down
            the callback chain

    Returns:
        The Failure if consumeErrors is false. None, otherwise.
    """
    # Hand the logger an exc_info triple built from the Failure so that the
    # traceback is included in the log output.
    exc_details = (failure.type, failure.value, failure.getTracebackObject())
    logger.error(msg, exc_info=exc_details)  # type: ignore[arg-type]

    return None if consumeErrors else failure
|
2018-10-17 11:14:04 -04:00
|
|
|
|
|
|
|
|
2021-05-11 05:47:23 -04:00
|
|
|
def glob_to_regex(glob: str, word_boundary: bool = False) -> Pattern:
    """Converts a glob to a compiled, case-insensitive regex object.

    Args:
        glob: pattern to match
        word_boundary: If True, the pattern will be allowed to match at word boundaries
            anywhere in the string. Otherwise, the pattern is anchored at the start and
            end of the string.

    Returns:
        compiled regex pattern
    """

    def translate(piece: str) -> str:
        """Turn one piece of the split glob into its regex equivalent."""
        # Literal text carries no wildcards: escape it verbatim.
        if _WILDCARD_RUN.match(piece) is None:
            return re.escape(piece)

        # Runs of wildcards must be simplified to avoid performance cliffs:
        #  - The glob `?**?**?` is equivalent to the glob `???*`
        #  - The glob `???*` is equivalent to the regex `.{3,}`
        min_chars = piece.count("?")
        template = ".{%d,}" if "*" in piece else ".{%d}"
        return template % min_chars

    body = "".join(translate(piece) for piece in _WILDCARD_RUN.split(glob))

    if word_boundary:
        pattern = re_word_boundary(body)
    else:
        # \A anchors at start of string, \Z at end of string
        pattern = r"\A" + body + r"\Z"

    return re.compile(pattern, re.IGNORECASE)
|
|
|
|
|
|
|
|
|
|
|
|
def re_word_boundary(r: str) -> str:
    """
    Wraps a regex fragment so that it only matches as a whole word.

    The fragment is surrounded by "start of string or non-word character"
    and "non-word character or end of string", which keeps working when the
    fragment itself starts or ends with non-word characters.

    Args:
        r: The regex source to wrap.

    Returns:
        The wrapped regex source (not compiled).
    """
    # \b is avoided because it chokes on unicode; \W appears to be fine as a
    # shorthand for [^0-9A-Za-z_].
    template = r"(^|\W)%s(\W|$)"
    return template % (r,)
|