2015-08-11 12:59:32 -04:00
|
|
|
# -*- coding: utf-8 -*-
|
2016-01-06 23:26:29 -05:00
|
|
|
# Copyright 2015, 2016 OpenMarket Ltd
|
2018-04-05 11:24:04 -04:00
|
|
|
# Copyright 2018 New Vector Ltd
|
2015-08-11 12:59:32 -04:00
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
2020-05-11 13:45:23 -04:00
|
|
|
|
2018-07-09 02:09:20 -04:00
|
|
|
import functools
|
|
|
|
import inspect
|
2015-08-11 12:59:32 -04:00
|
|
|
import logging
|
2018-07-09 02:09:20 -04:00
|
|
|
import threading
|
2020-09-03 10:38:32 -04:00
|
|
|
from typing import Any, Callable, Generic, Optional, Tuple, TypeVar, Union, cast
|
2019-11-07 04:43:51 -05:00
|
|
|
from weakref import WeakValueDictionary
|
2015-08-11 12:59:32 -04:00
|
|
|
|
2019-07-24 06:33:13 -04:00
|
|
|
from prometheus_client import Gauge
|
|
|
|
|
2018-07-09 02:09:20 -04:00
|
|
|
from twisted.internet import defer
|
|
|
|
|
2019-07-03 10:07:04 -04:00
|
|
|
from synapse.logging.context import make_deferred_yieldable, preserve_fn
|
|
|
|
from synapse.util import unwrapFirstError
|
2018-08-10 09:50:21 -04:00
|
|
|
from synapse.util.async_helpers import ObservableDeferred
|
2015-08-11 12:59:32 -04:00
|
|
|
from synapse.util.caches.lrucache import LruCache
|
2017-01-17 06:44:57 -05:00
|
|
|
from synapse.util.caches.treecache import TreeCache, iterate_tree_cache_entry
|
2015-08-12 05:13:35 -04:00
|
|
|
|
2017-04-25 05:23:11 -04:00
|
|
|
from . import register_cache
|
2015-08-11 12:59:32 -04:00
|
|
|
|
|
|
|
# Module-level logger, named after this module.
logger = logging.getLogger(__name__)

# A cache key is either a tuple of the keyed arguments or, when only a single
# argument is keyed on, that bare argument (see CacheDescriptor.__get__).
CacheKey = Union[Tuple, Any]

# Type variable for the signature of a function decorated with @cached.
F = TypeVar("F", bound=Callable[..., Any])
|
2015-08-11 12:59:32 -04:00
|
|
|
|
2020-09-03 10:38:32 -04:00
|
|
|
|
|
|
|
class _CachedFunction(Generic[F]):
    """Typing-only description of the wrapper built by `CacheDescriptor`.

    `CacheDescriptor.__get__` casts its wrapper function to this type and then
    assigns the attributes declared below, so the `None` values here are just
    placeholders that give the type checker something to see.
    """

    # Cache-management helpers attached to the wrapper by
    # CacheDescriptor.__get__ (invalidate_many only when num_args is not 1).
    invalidate = None  # type: Any
    invalidate_all = None  # type: Any
    invalidate_many = None  # type: Any
    prefill = None  # type: Any
    # The Cache instance behind the wrapper, and the number of keyed arguments.
    cache = None  # type: Any
    num_args = None  # type: Any

    __name__ = None  # type: str

    # Note: This function signature is actually fiddled with by the synapse mypy
    # plugin to a) make it a bound method, and b) remove any `cache_context` arg.
    __call__ = None  # type: F
|
2019-10-02 08:29:01 -04:00
|
|
|
|
|
|
|
|
2019-07-24 06:33:13 -04:00
|
|
|
# Prometheus gauge, labelled by cache name, reporting how many lookups are
# still pending. It is updated from Cache._metrics_collection_callback.
cache_pending_metric = Gauge(
    "synapse_util_caches_cache_pending",
    "Number of lookups currently pending for this cache",
    ["name"],
)

# Unique marker used as the "nothing found / nothing supplied" default in cache
# lookups; it is compared by identity, so it cannot collide with a real value.
_CacheSentinel = object()
|
|
|
|
|
|
|
|
|
2020-09-04 06:54:56 -04:00
|
|
|
class CacheEntry:
    """Book-keeping for one lookup together with its invalidation callbacks.

    Attributes are declared via ``__slots__``:
        deferred: whatever the creator stored as the lookup's result holder.
        callbacks: set of zero-argument callables to run on invalidation.
        invalidated: True once `invalidate` has run.
    """

    __slots__ = ["deferred", "callbacks", "invalidated"]

    def __init__(self, deferred, callbacks):
        """
        Args:
            deferred: the object to hand back to callers looking this entry up
            callbacks: iterable of callables; duplicates are collapsed
        """
        self.deferred = deferred
        # A set, so registering the same callback twice only fires it once.
        self.callbacks = set(callbacks)
        self.invalidated = False

    def invalidate(self):
        """Fire every registered callback once; later calls do nothing."""
        if self.invalidated:
            return

        # Flag first, so a callback that re-enters invalidate() is a no-op.
        self.invalidated = True
        for on_invalidate in self.callbacks:
            on_invalidate()
        self.callbacks.clear()
|
2017-01-13 12:46:17 -05:00
|
|
|
|
|
|
|
|
2020-09-04 06:54:56 -04:00
|
|
|
class Cache:
    """Cache of pending and completed lookups for a single cached function.

    Completed values are kept in an `LruCache` (`self.cache`). Lookups whose
    Deferred has not fired yet are kept in `_pending_deferred_cache` as
    `CacheEntry` objects; `set` moves them into the `LruCache` once they
    resolve successfully.
    """

    __slots__ = (
        "cache",
        "name",
        "keylen",
        "thread",
        "metrics",
        "_pending_deferred_cache",
    )

    def __init__(
        self,
        name: str,
        max_entries: int = 1000,
        keylen: int = 1,
        tree: bool = False,
        iterable: bool = False,
        apply_cache_factor_from_config: bool = True,
    ):
        """
        Args:
            name: The name of the cache
            max_entries: Maximum amount of entries that the cache will hold
            keylen: The length of the tuple used as the cache key
            tree: Use a TreeCache instead of a dict as the underlying cache type
            iterable: If True, count each item in the cached object as an entry,
                rather than each cached object
            apply_cache_factor_from_config: Whether cache factors specified in the
                config file affect `max_entries`
        """
        cache_type = TreeCache if tree else dict
        self._pending_deferred_cache = cache_type()

        self.cache = LruCache(
            max_size=max_entries,
            keylen=keylen,
            cache_type=cache_type,
            size_callback=(lambda d: len(d)) if iterable else None,
            evicted_callback=self._on_evicted,
            apply_cache_factor_from_config=apply_cache_factor_from_config,
        )

        self.name = name
        self.keylen = keylen
        # Set by the first call to check_thread().
        self.thread = None  # type: Optional[threading.Thread]
        self.metrics = register_cache(
            "cache",
            name,
            self.cache,
            collect_callback=self._metrics_collection_callback,
        )

    @property
    def max_entries(self):
        """The `max_size` of the underlying LruCache."""
        return self.cache.max_size

    def _on_evicted(self, evicted_count):
        """Eviction hook passed to the LruCache: records the eviction count."""
        self.metrics.inc_evictions(evicted_count)

    def _metrics_collection_callback(self):
        """Publish the number of pending lookups to `cache_pending_metric`."""
        cache_pending_metric.labels(self.name).set(len(self._pending_deferred_cache))

    def check_thread(self):
        """Pin the cache to the first thread that calls this.

        Raises:
            ValueError: if called from a different thread than the first call.
        """
        expected_thread = self.thread
        if expected_thread is None:
            self.thread = threading.current_thread()
        else:
            if expected_thread is not threading.current_thread():
                raise ValueError(
                    "Cache objects can only be accessed from the main thread"
                )

    def get(self, key, default=_CacheSentinel, callback=None, update_metrics=True):
        """Looks the key up in the caches.

        Args:
            key(tuple)
            default: What is returned if key is not in the caches. If not
                specified then function throws KeyError instead
            callback(fn): Gets called when the entry in the cache is invalidated
            update_metrics (bool): whether to update the cache hit rate metrics

        Returns:
            Either an ObservableDeferred or the raw result

        Raises:
            KeyError: if the key is in neither cache and no default was given.
        """
        callbacks = [callback] if callback else []

        # In-flight lookups take priority over completed ones.
        val = self._pending_deferred_cache.get(key, _CacheSentinel)
        if val is not _CacheSentinel:
            val.callbacks.update(callbacks)
            if update_metrics:
                self.metrics.inc_hits()
            return val.deferred

        val = self.cache.get(key, _CacheSentinel, callbacks=callbacks)
        if val is not _CacheSentinel:
            # Honour update_metrics here too, as the pending-hit and miss
            # paths already do.
            if update_metrics:
                self.metrics.inc_hits()
            return val

        if update_metrics:
            self.metrics.inc_misses()

        if default is _CacheSentinel:
            raise KeyError()
        else:
            return default

    def set(self, key, value, callback=None):
        """Register a pending lookup and cache its result once it resolves.

        Any pending entry already stored under `key` is invalidated and
        replaced.

        Args:
            key: the cache key
            value (Deferred): the in-flight lookup
            callback(fn): Gets called when the entry in the cache is invalidated

        Returns:
            ObservableDeferred wrapping `value`.

        Raises:
            TypeError: if `value` is not a Deferred.
        """
        if not isinstance(value, defer.Deferred):
            raise TypeError("not a Deferred")

        callbacks = [callback] if callback else []
        self.check_thread()
        observable = ObservableDeferred(value, consumeErrors=True)
        observer = observable.observe()
        entry = CacheEntry(deferred=observable, callbacks=callbacks)

        existing_entry = self._pending_deferred_cache.pop(key, None)
        if existing_entry:
            existing_entry.invalidate()

        self._pending_deferred_cache[key] = entry

        def compare_and_pop():
            """Check if our entry is still the one in _pending_deferred_cache, and
            if so, pop it.

            Returns true if the entries matched.
            """
            existing_entry = self._pending_deferred_cache.pop(key, None)
            if existing_entry is entry:
                return True

            # oops, the _pending_deferred_cache has been updated since
            # we started our query, so we are out of date.
            #
            # Better put back whatever we took out. (We do it this way
            # round, rather than peeking into the _pending_deferred_cache
            # and then removing on a match, to make the common case faster)
            if existing_entry is not None:
                self._pending_deferred_cache[key] = existing_entry

            return False

        def cb(result):
            if compare_and_pop():
                self.cache.set(key, result, entry.callbacks)
            else:
                # we're not going to put this entry into the cache, so need
                # to make sure that the invalidation callbacks are called.
                # That was probably done when _pending_deferred_cache was
                # updated, but it's possible that `set` was called without
                # `invalidate` being previously called, in which case it may
                # not have been. Either way, let's double-check now.
                entry.invalidate()

        def eb(_fail):
            compare_and_pop()
            entry.invalidate()

        # once the deferred completes, we can move the entry from the
        # _pending_deferred_cache to the real cache.
        #
        observer.addCallbacks(cb, eb)
        return observable

    def prefill(self, key, value, callback=None):
        """Store an already-computed value directly in the completed cache."""
        callbacks = [callback] if callback else []
        self.cache.set(key, value, callbacks=callbacks)

    def invalidate(self, key):
        """Drop `key` from both caches and run its invalidation callbacks."""
        self.check_thread()
        self.cache.pop(key, None)

        # if we have a pending lookup for this key, remove it from the
        # _pending_deferred_cache, which will (a) stop it being returned
        # for future queries and (b) stop it being persisted as a proper entry
        # in self.cache.
        entry = self._pending_deferred_cache.pop(key, None)

        # run the invalidation callbacks now, rather than waiting for the
        # deferred to resolve.
        if entry:
            entry.invalidate()

    def invalidate_many(self, key):
        """Drop every entry stored under the given (tuple) key.

        Raises:
            TypeError: if `key` is not a tuple.
        """
        self.check_thread()
        if not isinstance(key, tuple):
            raise TypeError("The cache key must be a tuple not %r" % (type(key),))
        self.cache.del_multi(key)

        # if we have a pending lookup for this key, remove it from the
        # _pending_deferred_cache, as above
        entry_dict = self._pending_deferred_cache.pop(key, None)
        if entry_dict is not None:
            for entry in iterate_tree_cache_entry(entry_dict):
                entry.invalidate()

    def invalidate_all(self):
        """Empty both caches, running the callbacks of every pending entry."""
        self.check_thread()
        self.cache.clear()
        for entry in self._pending_deferred_cache.values():
            entry.invalidate()
        self._pending_deferred_cache.clear()
|
2015-08-11 12:59:32 -04:00
|
|
|
|
|
|
|
|
2020-09-04 06:54:56 -04:00
|
|
|
class _CacheDescriptorBase:
|
2020-08-19 07:09:07 -04:00
|
|
|
def __init__(self, orig: _CachedFunction, num_args, cache_context=False):
|
2017-03-22 09:54:20 -04:00
|
|
|
self.orig = orig
|
|
|
|
|
2019-12-12 12:03:28 -05:00
|
|
|
arg_spec = inspect.getfullargspec(orig)
|
2017-03-22 09:54:20 -04:00
|
|
|
all_args = arg_spec.args
|
|
|
|
|
|
|
|
if "cache_context" in all_args:
|
|
|
|
if not cache_context:
|
|
|
|
raise ValueError(
|
|
|
|
"Cannot have a 'cache_context' arg without setting"
|
|
|
|
" cache_context=True"
|
|
|
|
)
|
|
|
|
elif cache_context:
|
|
|
|
raise ValueError(
|
|
|
|
"Cannot have cache_context=True without having an arg"
|
|
|
|
" named `cache_context`"
|
|
|
|
)
|
|
|
|
|
|
|
|
if num_args is None:
|
|
|
|
num_args = len(all_args) - 1
|
|
|
|
if cache_context:
|
|
|
|
num_args -= 1
|
|
|
|
|
|
|
|
if len(all_args) < num_args + 1:
|
|
|
|
raise Exception(
|
|
|
|
"Not enough explicit positional arguments to key off for %r: "
|
|
|
|
"got %i args, but wanted %i. (@cached cannot key off *args or "
|
2019-06-20 05:32:02 -04:00
|
|
|
"**kwargs)" % (orig.__name__, len(all_args), num_args)
|
2017-03-22 09:54:20 -04:00
|
|
|
)
|
|
|
|
|
|
|
|
self.num_args = num_args
|
2017-03-30 09:19:10 -04:00
|
|
|
|
|
|
|
# list of the names of the args used as the cache key
|
2019-06-20 05:32:02 -04:00
|
|
|
self.arg_names = all_args[1 : num_args + 1]
|
2017-03-22 09:54:20 -04:00
|
|
|
|
2017-03-30 09:19:10 -04:00
|
|
|
# self.arg_defaults is a map of arg name to its default value for each
|
|
|
|
# argument that has a default value
|
2017-03-28 06:14:15 -04:00
|
|
|
if arg_spec.defaults:
|
2019-06-20 05:32:02 -04:00
|
|
|
self.arg_defaults = dict(
|
|
|
|
zip(all_args[-len(arg_spec.defaults) :], arg_spec.defaults)
|
|
|
|
)
|
2017-03-28 06:14:15 -04:00
|
|
|
else:
|
|
|
|
self.arg_defaults = {}
|
|
|
|
|
2017-03-22 09:54:20 -04:00
|
|
|
if "cache_context" in self.arg_names:
|
2019-06-20 05:32:02 -04:00
|
|
|
raise Exception("cache_context arg cannot be included among the cache keys")
|
2017-03-22 09:54:20 -04:00
|
|
|
|
|
|
|
self.add_cache_context = cache_context
|
|
|
|
|
|
|
|
|
|
|
|
class CacheDescriptor(_CacheDescriptorBase):
    """A method decorator that puts a memoizing cache in front of the method.

    What is cached is the Deferred for a call rather than the bare result; a
    Deferred that fails is removed from the cache again.

    The keyed arguments of the call are used as the cache key (as a tuple, or
    as the bare value when only one argument is keyed on). Hits are answered
    from the cache; on a miss the wrapped method is called to produce the value.

    The wrapper carries extra callables: "invalidate", which removes a single
    entry from the cache, and "prefill", which inserts a value into the cache
    without running the wrapped method.

    Cached functions can be "chained" (i.e. a cached function can call other
    cached functions and be invalidated when the caches it called are
    invalidated) by adding a special "cache_context" argument to the function
    and passing its `invalidate` as a kwarg to all caches called. For example::

        @cached(cache_context=True)
        def foo(self, key, cache_context):
            r1 = yield self.bar1(key, on_invalidate=cache_context.invalidate)
            r2 = yield self.bar2(key, on_invalidate=cache_context.invalidate)
            return r1 + r2

    Args:
        num_args (int): number of positional arguments (excluding ``self`` and
            ``cache_context``) to use as cache keys. Defaults to all named
            args of the function.
    """

    def __init__(
        self,
        orig,
        max_entries=1000,
        num_args=None,
        tree=False,
        cache_context=False,
        iterable=False,
    ):
        super().__init__(orig, num_args=num_args, cache_context=cache_context)

        # Remembered so that __get__ can build the per-object Cache.
        self.max_entries = max_entries
        self.tree = tree
        self.iterable = iterable

    def __get__(self, obj, owner):
        """Build the caching wrapper for `obj` and store it on the instance."""
        cache = Cache(
            name=self.orig.__name__,
            max_entries=self.max_entries,
            keylen=self.num_args,
            tree=self.tree,
            iterable=self.iterable,
        )

        # By default our cache key is a tuple, but if there is only one item
        # then don't bother wrapping in a tuple. This is to save memory.
        if self.num_args == 1:
            sole_arg_name = self.arg_names[0]

            def get_cache_key(args, kwargs):
                if sole_arg_name in kwargs:
                    return kwargs[sole_arg_name]
                if len(args):
                    return args[0]
                return self.arg_defaults[sole_arg_name]

        else:

            def get_cache_key(args, kwargs):
                """Resolve each keyed argument in turn: first from `kwargs`,
                otherwise from the next unused entry of `args`, and finally
                from the function's defaults.
                """
                key_parts = []
                next_positional = 0
                for arg_name in self.arg_names:
                    if arg_name in kwargs:
                        key_parts.append(kwargs[arg_name])
                    elif next_positional < len(args):
                        key_parts.append(args[next_positional])
                        next_positional += 1
                    else:
                        key_parts.append(self.arg_defaults[arg_name])
                return tuple(key_parts)

        @functools.wraps(self.orig)
        def _wrapped(*args, **kwargs):
            # If we're passed a cache_context then we'll want to call its
            # invalidate() whenever we are invalidated
            on_invalidate = kwargs.pop("on_invalidate", None)

            cache_key = get_cache_key(args, kwargs)

            # Add our own `cache_context` to argument list if the wrapped
            # function has asked for one
            if self.add_cache_context:
                kwargs["cache_context"] = _CacheContext.get_instance(cache, cache_key)

            try:
                hit = cache.get(cache_key, callback=on_invalidate)
                if isinstance(hit, ObservableDeferred):
                    observer = hit.observe()
                else:
                    observer = defer.succeed(hit)
            except KeyError:

                def drop_failed_entry(failure):
                    # Failed lookups must not stay in the cache.
                    cache.invalidate(cache_key)
                    return failure

                pending = defer.maybeDeferred(
                    preserve_fn(self.orig), obj, *args, **kwargs
                )
                pending.addErrback(drop_failed_entry)

                stored = cache.set(cache_key, pending, callback=on_invalidate)
                observer = stored.observe()

            return make_deferred_yieldable(observer)

        wrapped = cast(_CachedFunction, _wrapped)

        if self.num_args == 1:
            # Callers always pass a tuple; the cache itself keys on the bare value.
            wrapped.invalidate = lambda key: cache.invalidate(key[0])
            wrapped.prefill = lambda key, val: cache.prefill(key[0], val)
        else:
            wrapped.invalidate = cache.invalidate
            wrapped.invalidate_many = cache.invalidate_many
            wrapped.prefill = cache.prefill

        wrapped.invalidate_all = cache.invalidate_all
        wrapped.cache = cache
        wrapped.num_args = self.num_args

        # Shadow the descriptor on the instance with the finished wrapper.
        obj.__dict__[self.orig.__name__] = wrapped

        return wrapped
|
|
|
|
|
|
|
|
|
2017-03-22 09:54:20 -04:00
|
|
|
class CacheListDescriptor(_CacheDescriptorBase):
    """Wraps an existing cache to support bulk fetching of keys.

    Given a list of keys it looks in the cache to find any hits, then passes
    the list of missing keys to the wrapped function.

    Once wrapped, the function returns a Deferred which resolves to a dict
    mapping each entry of the list to its result.
    """

    def __init__(self, orig, cached_method_name, list_name, num_args=None):
        """
        Args:
            orig (function)
            cached_method_name (str): The name of the cached method.
            list_name (str): Name of the argument which is the bulk lookup list
            num_args (int): number of positional arguments (excluding ``self``,
                but including list_name) to use as cache keys. Defaults to all
                named args of the function.

        Raises:
            ValueError: if `list_name` is not one of the keyed arguments.
        """
        super().__init__(orig, num_args=num_args)

        self.list_name = list_name

        # Validate before calling .index(), which would otherwise raise its
        # own uninformative ValueError and make this check unreachable.
        # ValueError is kept as the type so the exception class that escapes
        # is unchanged.
        if self.list_name not in self.arg_names:
            raise ValueError(
                "Couldn't see arguments %r for %r."
                % (self.list_name, cached_method_name)
            )

        self.list_pos = self.arg_names.index(self.list_name)
        self.cached_method_name = cached_method_name

        self.sentinel = object()

    def __get__(self, obj, objtype=None):
        """Build the bulk-lookup wrapper for `obj` and store it on the instance."""
        # Reuse the cache of the single-item method named at decoration time.
        cached_method = getattr(obj, self.cached_method_name)
        cache = cached_method.cache
        num_args = cached_method.num_args

        @functools.wraps(self.orig)
        def wrapped(*args, **kwargs):
            # If we're passed a cache_context then we'll want to call its
            # invalidate() whenever we are invalidated
            invalidate_callback = kwargs.pop("on_invalidate", None)

            arg_dict = inspect.getcallargs(self.orig, obj, *args, **kwargs)
            keyargs = [arg_dict[arg_nm] for arg_nm in self.arg_names]
            list_args = arg_dict[self.list_name]

            # Maps each entry of the list argument to its result.
            results = {}

            def update_results_dict(res, arg):
                results[arg] = res

            # list of deferreds to wait for
            cached_defers = []

            # Entries of the list argument that were not found in the cache.
            missing = set()

            # If the cache takes a single arg then that is used as the key,
            # otherwise a tuple is used.
            if num_args == 1:

                def arg_to_cache_key(arg):
                    return arg

            else:
                keylist = list(keyargs)

                def arg_to_cache_key(arg):
                    # Substitute this entry into the list argument's position.
                    keylist[self.list_pos] = arg
                    return tuple(keylist)

            for arg in list_args:
                try:
                    res = cache.get(arg_to_cache_key(arg), callback=invalidate_callback)
                    if not isinstance(res, ObservableDeferred):
                        results[arg] = res
                    elif not res.has_succeeded():
                        res = res.observe()
                        res.addCallback(update_results_dict, arg)
                        cached_defers.append(res)
                    else:
                        results[arg] = res.get_result()
                except KeyError:
                    missing.add(arg)

            if missing:
                # we need a deferred for each entry in the list,
                # which we put in the cache. Each deferred resolves with the
                # relevant result for that key.
                deferreds_map = {}
                for arg in missing:
                    deferred = defer.Deferred()
                    deferreds_map[arg] = deferred
                    key = arg_to_cache_key(arg)
                    cache.set(key, deferred, callback=invalidate_callback)

                def complete_all(res):
                    # the wrapped function has completed. It returns
                    # a dict. We can now resolve the observable deferreds in
                    # the cache and update our own result map.
                    for e in missing:
                        val = res.get(e, None)
                        deferreds_map[e].callback(val)
                        results[e] = val

                def errback(f):
                    # the wrapped function has failed. Invalidate any cache
                    # entries we're supposed to be populating, and fail
                    # their deferreds.
                    for e in missing:
                        key = arg_to_cache_key(e)
                        cache.invalidate(key)
                        deferreds_map[e].errback(f)

                    # return the failure, to propagate to our caller.
                    return f

                # Call the wrapped function with only the missing entries.
                args_to_call = dict(arg_dict)
                args_to_call[self.list_name] = list(missing)

                cached_defers.append(
                    defer.maybeDeferred(
                        preserve_fn(self.orig), **args_to_call
                    ).addCallbacks(complete_all, errback)
                )

            if cached_defers:
                d = defer.gatherResults(cached_defers, consumeErrors=True).addCallbacks(
                    lambda _: results, unwrapFirstError
                )
                return make_deferred_yieldable(d)
            else:
                return defer.succeed(results)

        # Shadow the descriptor on the instance with the finished wrapper.
        obj.__dict__[self.orig.__name__] = wrapped

        return wrapped
|
|
|
|
|
|
|
|
|
2019-11-07 04:43:51 -05:00
|
|
|
class _CacheContext:
|
|
|
|
"""Holds cache information from the cached function higher in the calling order.
|
|
|
|
|
|
|
|
Can be used to invalidate the higher level cache entry if something changes
|
|
|
|
on a lower level.
|
|
|
|
"""
|
|
|
|
|
|
|
|
_cache_context_objects = (
|
|
|
|
WeakValueDictionary()
|
|
|
|
) # type: WeakValueDictionary[Tuple[Cache, CacheKey], _CacheContext]
|
|
|
|
|
|
|
|
def __init__(self, cache, cache_key): # type: (Cache, CacheKey) -> None
|
|
|
|
self._cache = cache
|
|
|
|
self._cache_key = cache_key
|
|
|
|
|
|
|
|
def invalidate(self): # type: () -> None
|
|
|
|
"""Invalidates the cache entry referred to by the context."""
|
|
|
|
self._cache.invalidate(self._cache_key)
|
|
|
|
|
|
|
|
@classmethod
|
|
|
|
def get_instance(cls, cache, cache_key): # type: (Cache, CacheKey) -> _CacheContext
|
|
|
|
"""Returns an instance constructed with the given arguments.
|
|
|
|
|
|
|
|
A new instance is only created if none already exists.
|
|
|
|
"""
|
|
|
|
|
|
|
|
# We make sure there are no identical _CacheContext instances. This is
|
|
|
|
# important in particular to dedupe when we add callbacks to lru cache
|
|
|
|
# nodes, otherwise the number of callbacks would grow.
|
|
|
|
return cls._cache_context_objects.setdefault(
|
|
|
|
(cache, cache_key), cls(cache, cache_key)
|
|
|
|
)
|
2016-08-19 06:18:26 -04:00
|
|
|
|
|
|
|
|
2019-06-20 05:32:02 -04:00
|
|
|
def cached(
    max_entries: int = 1000,
    num_args: Optional[int] = None,
    tree: bool = False,
    cache_context: bool = False,
    iterable: bool = False,
) -> Callable[[F], _CachedFunction[F]]:
    """Create a decorator that wraps a method in a `CacheDescriptor`.

    Every argument is forwarded unchanged to `CacheDescriptor`.

    Args:
        max_entries: forwarded as the descriptor's `max_entries`.
        num_args: forwarded as the descriptor's `num_args`.
        tree: forwarded as the descriptor's `tree`.
        cache_context: forwarded as the descriptor's `cache_context`.
        iterable: forwarded as the descriptor's `iterable`.

    Returns:
        A callable taking the function to wrap and returning the descriptor.
    """
    # The cast only informs the type checker; at runtime this is the lambda.
    return cast(
        Callable[[F], _CachedFunction[F]],
        lambda orig: CacheDescriptor(
            orig,
            max_entries=max_entries,
            num_args=num_args,
            tree=tree,
            cache_context=cache_context,
            iterable=iterable,
        ),
    )
|
2015-08-11 12:59:32 -04:00
|
|
|
|
2020-09-03 10:38:32 -04:00
|
|
|
|
|
|
|
def cachedList(
    cached_method_name: str, list_name: str, num_args: Optional[int] = None
) -> Callable[[F], _CachedFunction[F]]:
    """Creates a descriptor that wraps a function in a `CacheListDescriptor`.

    Used to do batch lookups for an already created cache. A single argument
    is specified as a list that is iterated through to lookup keys in the
    original cache. A new list consisting of the keys that weren't in the cache
    gets passed to the original function, the result of which is stored in the
    cache.

    Args:
        cached_method_name: The name of the single-item lookup method.
            This is only used to find the cache to use.
        list_name: The name of the argument that is the list to use to
            do batch lookups in the cache.
        num_args: Number of arguments to use as the key in the cache
            (including list_name). Defaults to all named parameters.

    Example:

        class Example:
            @cached(num_args=2)
            def do_something(self, first_arg, second_arg):
                ...

            @cachedList(
                cached_method_name="do_something",
                list_name="second_args",
                num_args=2,
            )
            def batch_do_something(self, first_arg, second_args):
                ...
    """
    # The cast only informs the type checker; at runtime this is the lambda.
    return cast(
        Callable[[F], _CachedFunction[F]],
        lambda orig: CacheListDescriptor(
            orig,
            cached_method_name=cached_method_name,
            list_name=list_name,
            num_args=num_args,
        ),
    )
|