2016-03-24 11:47:31 -06:00
|
|
|
# Copyright 2016 OpenMarket Ltd
|
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
2018-04-12 05:08:59 -06:00
|
|
|
import logging
|
2021-12-20 11:12:08 -07:00
|
|
|
from typing import (
|
|
|
|
TYPE_CHECKING,
|
|
|
|
Any,
|
|
|
|
Awaitable,
|
|
|
|
Callable,
|
|
|
|
Dict,
|
|
|
|
Generic,
|
|
|
|
Iterable,
|
|
|
|
Optional,
|
|
|
|
TypeVar,
|
|
|
|
)
|
2021-06-14 03:26:09 -06:00
|
|
|
|
|
|
|
import attr
|
2016-03-24 11:47:31 -06:00
|
|
|
|
2018-04-13 00:32:29 -06:00
|
|
|
from twisted.internet import defer
|
|
|
|
|
2019-07-03 08:07:04 -06:00
|
|
|
from synapse.logging.context import make_deferred_yieldable, run_in_background
|
2021-12-20 11:12:08 -07:00
|
|
|
from synapse.logging.opentracing import (
|
|
|
|
active_span,
|
|
|
|
start_active_span,
|
|
|
|
start_active_span_follows_from,
|
|
|
|
)
|
2021-03-08 12:00:07 -07:00
|
|
|
from synapse.util import Clock
|
2021-12-20 11:12:08 -07:00
|
|
|
from synapse.util.async_helpers import AbstractObservableDeferred, ObservableDeferred
|
2018-05-21 18:47:37 -06:00
|
|
|
from synapse.util.caches import register_cache
|
2018-04-12 05:08:59 -06:00
|
|
|
|
|
|
|
logger = logging.getLogger(__name__)

if TYPE_CHECKING:
    # Only needed for type annotations, so it is imported solely while
    # type-checking.
    import opentracing

# Type variable for the keys under which responses are cached.
KV = TypeVar("KV")

# Type variable for the value which a cached operation produces.
RV = TypeVar("RV")
|
|
|
|
|
2020-10-09 09:35:11 -06:00
|
|
|
|
2021-06-14 03:26:09 -06:00
|
|
|
@attr.s(auto_attribs=True)
class ResponseCacheContext(Generic[KV]):
    """Details of a ResponseCache lookup which missed.

    The callback computing the response may be handed this object, giving it
    a channel to feed information back to the cache.
    """

    cache_key: KV = attr.ib()
    """The key whose lookup resulted in the cache miss.

    Treat this as read-only.

    TODO: in attrs 20.1, make it frozen with an on_setattr.
    """

    should_cache: bool = attr.ib(default=True)
    """Whether to keep the result in the cache after the request completes.

    The callback may change this if it decides that its result should not be
    cached.
    """
|
|
|
|
|
|
|
|
|
2021-12-20 11:12:08 -07:00
|
|
|
@attr.s(auto_attribs=True)
class ResponseCacheEntry:
    """What is stored against a single key: the result, plus tracing info."""

    result: AbstractObservableDeferred = attr.ib()
    """The outcome of the operation, which may not have completed yet.

    An ObservableDeferred is kept here even once the operation has finished
    (instead of being swapped for an immediate value), because that makes
    Failure results easier to cache.
    """

    opentracing_span_context: "Optional[opentracing.SpanContext]" = attr.ib()
    """Context of the opentracing span which produced/is producing the result"""
|
|
|
|
|
|
|
|
|
2021-06-14 03:26:09 -06:00
|
|
|
class ResponseCache(Generic[KV]):
    """
    A cache of deferred responses.

    For as long as a deferred has not completed, lookups for its key are
    served from the cache. So a client which retries a request while the
    response is still being computed shares the original computation rather
    than kicking off a new one.
    """

    def __init__(self, clock: Clock, name: str, timeout_ms: float = 0):
        self._result_cache: Dict[KV, ResponseCacheEntry] = {}

        self._name = name
        self.clock = clock
        self.timeout_sec = timeout_ms / 1000.0

        self._metrics = register_cache("response_cache", name, self, resizable=False)

    def size(self) -> int:
        """Return the number of entries currently held in the result cache."""
        return len(self._result_cache)

    def __len__(self) -> int:
        """Return the same count as `size()`."""
        return self.size()

    def keys(self) -> Iterable[KV]:
        """List the keys which currently have an entry in the result cache

        This covers entries which are still being computed and, when this
        cache has a non-zero timeout, finished entries which have not yet
        been removed.

        The returned iterable must not be used across concurrent execution:
        behaviour is undefined if `wrap` is called during iteration.
        """
        return self._result_cache.keys()

    def _get(self, key: KV) -> Optional[ResponseCacheEntry]:
        """Fetch the entry stored for a key, recording a hit or a miss.

        Args:
            key: key to look for in the cache

        Returns:
            The entry stored for this key, or None if there is none.
        """
        cached = self._result_cache.get(key)
        if cached is None:
            self._metrics.inc_misses()
            return None

        self._metrics.inc_hits()
        return cached

    def _set(
        self,
        context: ResponseCacheContext[KV],
        deferred: "defer.Deferred[RV]",
        opentracing_span_context: "Optional[opentracing.SpanContext]",
    ) -> ResponseCacheEntry:
        """Store the given deferred as the entry for the context's key.

        *deferred* should run its callbacks in the sentinel logcontext (ie,
        you should wrap normal synapse deferreds with
        synapse.logging.context.run_in_background).

        Args:
            context: Information about the cache miss
            deferred: The deferred which resolves to the result.
            opentracing_span_context: An opentracing span wrapping the calculation

        Returns:
            The newly-created cache entry.
        """
        observable = ObservableDeferred(deferred, consumeErrors=True)
        cache_key = context.cache_key
        new_entry = ResponseCacheEntry(observable, opentracing_span_context)
        self._result_cache[cache_key] = new_entry

        def on_complete(outcome: RV) -> RV:
            # Without a timeout on this cache, or if the callback cleared the
            # should_cache bit, the entry is dropped straight away.
            if not (self.timeout_sec and context.should_cache):
                self._result_cache.pop(cache_key, None)
                return outcome

            # Otherwise the entry stays put for now, and we schedule its
            # removal for later.
            self.clock.call_later(
                self.timeout_sec, self._result_cache.pop, cache_key, None
            )
            return outcome

        # This must come *after* the entry is stored in the result cache: the
        # result may already be complete, and doing it the other way around
        # would leave a stuck entry behind.
        observable.addBoth(on_complete)
        return new_entry

    async def wrap(
        self,
        key: KV,
        callback: Callable[..., Awaitable[RV]],
        *args: Any,
        cache_context: bool = False,
        **kwargs: Any,
    ) -> RV:
        """Combine a *get* and a *set*, looking after logcontexts along the way

        If the key is already in the cache, the cached result is made to
        follow the synapse logcontext rules and is returned.

        If not, *callback(*args, **kwargs)* is called (it should follow the
        synapse logcontext rules) and its result is added to the cache.

        Example usage:

            async def handle_request(request):
                # etc
                return result

            result = await response_cache.wrap(
                key,
                handle_request,
                request,
            )

        Args:
            key: key to get/set in the cache

            callback: function to call if the key is not found in
                the cache

            *args: positional parameters to pass to the callback, if it is used

            cache_context: if set, the callback will be given a `cache_context` kw arg,
                which will be a ResponseCacheContext object.

            **kwargs: named parameters to pass to the callback, if it is used

        Returns:
            The callback's result, whether cached or freshly calculated
        """
        entry = self._get(key)
        if entry:
            # Cache hit: wait on whatever is already stored for this key.
            observer = entry.result.observe()
            if observer.called:
                logger.info(
                    "[%s]: using completed cached result for [%s]", self._name, key
                )
            else:
                logger.info(
                    "[%s]: using incomplete cached result for [%s]", self._name, key
                )

            parent_context = entry.opentracing_span_context
            follows = (parent_context,) if parent_context else ()
            with start_active_span_follows_from(
                f"ResponseCache[{self._name}].wait",
                contexts=follows,
            ):
                return await make_deferred_yieldable(observer)

        # Cache miss: start the calculation and store it for later callers.
        logger.debug(
            "[%s]: no cached result for [%s], calculating new one", self._name, key
        )
        context = ResponseCacheContext(cache_key=key)
        if cache_context:
            kwargs["cache_context"] = context

        span_context: Optional[opentracing.SpanContext] = None

        async def cb() -> RV:
            # NB span_context has to be set before the first `await`: it is
            # read as soon as run_in_background returns.
            nonlocal span_context
            with start_active_span(f"ResponseCache[{self._name}].calculate"):
                current_span = active_span()
                if current_span:
                    span_context = current_span.context
                return await callback(*args, **kwargs)

        pending = run_in_background(cb)
        entry = self._set(context, pending, span_context)
        return await make_deferred_yieldable(entry.result.observe())
|