2020-05-11 11:45:23 -06:00
|
|
|
# -*- coding: utf-8 -*-
|
|
|
|
# Copyright 2019 Matrix.org Foundation C.I.C.
|
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
|
|
|
|
|
|
|
import os
|
2020-05-27 06:17:01 -06:00
|
|
|
import re
|
2020-06-10 11:27:49 -06:00
|
|
|
import threading
|
2020-05-11 11:45:23 -06:00
|
|
|
from typing import Callable, Dict
|
|
|
|
|
|
|
|
from ._base import Config, ConfigError
|
|
|
|
|
|
|
|
# The prefix for all cache factor-related environment variables
|
|
|
|
_CACHE_PREFIX = "SYNAPSE_CACHE_FACTOR"
|
2020-05-27 06:17:01 -06:00
|
|
|
|
|
|
|
# Map from canonicalised cache name to cache.
|
|
|
|
_CACHES = {}
|
|
|
|
|
2020-06-10 11:27:49 -06:00
|
|
|
# a lock on the contents of _CACHES
|
|
|
|
_CACHES_LOCK = threading.Lock()
|
|
|
|
|
2020-05-11 11:45:23 -06:00
|
|
|
_DEFAULT_FACTOR_SIZE = 0.5
|
|
|
|
_DEFAULT_EVENT_CACHE_SIZE = "10K"
|
|
|
|
|
|
|
|
|
|
|
|
class CacheProperties(object):
|
|
|
|
def __init__(self):
|
|
|
|
# The default factor size for all caches
|
|
|
|
self.default_factor_size = float(
|
|
|
|
os.environ.get(_CACHE_PREFIX, _DEFAULT_FACTOR_SIZE)
|
|
|
|
)
|
|
|
|
self.resize_all_caches_func = None
|
|
|
|
|
|
|
|
|
|
|
|
properties = CacheProperties()
|
|
|
|
|
|
|
|
|
2020-05-27 06:17:01 -06:00
|
|
|
def _canonicalise_cache_name(cache_name: str) -> str:
|
|
|
|
"""Gets the canonical form of the cache name.
|
|
|
|
|
|
|
|
Since we specify cache names in config and environment variables we need to
|
|
|
|
ignore case and special characters. For example, some caches have asterisks
|
2020-05-27 06:34:46 -06:00
|
|
|
in their name to denote that they're not attached to a particular database
|
2020-05-27 06:17:01 -06:00
|
|
|
function, and these asterisks need to be stripped out
|
|
|
|
"""
|
|
|
|
|
|
|
|
cache_name = re.sub(r"[^A-Za-z_1-9]", "", cache_name)
|
|
|
|
|
|
|
|
return cache_name.lower()
|
|
|
|
|
|
|
|
|
2020-05-11 11:45:23 -06:00
|
|
|
def add_resizable_cache(cache_name: str, cache_resize_callback: Callable):
|
|
|
|
"""Register a cache that's size can dynamically change
|
|
|
|
|
|
|
|
Args:
|
|
|
|
cache_name: A reference to the cache
|
|
|
|
cache_resize_callback: A callback function that will be ran whenever
|
|
|
|
the cache needs to be resized
|
|
|
|
"""
|
2020-05-27 06:17:01 -06:00
|
|
|
# Some caches have '*' in them which we strip out.
|
|
|
|
cache_name = _canonicalise_cache_name(cache_name)
|
|
|
|
|
2020-06-10 11:27:49 -06:00
|
|
|
# sometimes caches are initialised from background threads, so we need to make
|
|
|
|
# sure we don't conflict with another thread running a resize operation
|
|
|
|
with _CACHES_LOCK:
|
|
|
|
_CACHES[cache_name] = cache_resize_callback
|
2020-05-11 11:45:23 -06:00
|
|
|
|
|
|
|
# Ensure all loaded caches are sized appropriately
|
|
|
|
#
|
|
|
|
# This method should only run once the config has been read,
|
|
|
|
# as it uses values read from it
|
|
|
|
if properties.resize_all_caches_func:
|
|
|
|
properties.resize_all_caches_func()
|
|
|
|
|
|
|
|
|
|
|
|
class CacheConfig(Config):
|
|
|
|
section = "caches"
|
|
|
|
_environ = os.environ
|
|
|
|
|
|
|
|
@staticmethod
|
|
|
|
def reset():
|
|
|
|
"""Resets the caches to their defaults. Used for tests."""
|
|
|
|
properties.default_factor_size = float(
|
|
|
|
os.environ.get(_CACHE_PREFIX, _DEFAULT_FACTOR_SIZE)
|
|
|
|
)
|
|
|
|
properties.resize_all_caches_func = None
|
2020-06-10 11:27:49 -06:00
|
|
|
with _CACHES_LOCK:
|
|
|
|
_CACHES.clear()
|
2020-05-11 11:45:23 -06:00
|
|
|
|
|
|
|
def generate_config_section(self, **kwargs):
|
|
|
|
return """\
|
|
|
|
## Caching ##
|
|
|
|
|
|
|
|
# Caching can be configured through the following options.
|
|
|
|
#
|
|
|
|
# A cache 'factor' is a multiplier that can be applied to each of
|
|
|
|
# Synapse's caches in order to increase or decrease the maximum
|
|
|
|
# number of entries that can be stored.
|
|
|
|
|
|
|
|
# The number of events to cache in memory. Not affected by
|
|
|
|
# caches.global_factor.
|
|
|
|
#
|
|
|
|
#event_cache_size: 10K
|
|
|
|
|
|
|
|
caches:
|
|
|
|
# Controls the global cache factor, which is the default cache factor
|
|
|
|
# for all caches if a specific factor for that cache is not otherwise
|
|
|
|
# set.
|
|
|
|
#
|
|
|
|
# This can also be set by the "SYNAPSE_CACHE_FACTOR" environment
|
|
|
|
# variable. Setting by environment variable takes priority over
|
|
|
|
# setting through the config file.
|
|
|
|
#
|
|
|
|
# Defaults to 0.5, which will half the size of all caches.
|
|
|
|
#
|
|
|
|
#global_factor: 1.0
|
|
|
|
|
|
|
|
# A dictionary of cache name to cache factor for that individual
|
|
|
|
# cache. Overrides the global cache factor for a given cache.
|
|
|
|
#
|
|
|
|
# These can also be set through environment variables comprised
|
|
|
|
# of "SYNAPSE_CACHE_FACTOR_" + the name of the cache in capital
|
|
|
|
# letters and underscores. Setting by environment variable
|
|
|
|
# takes priority over setting through the config file.
|
|
|
|
# Ex. SYNAPSE_CACHE_FACTOR_GET_USERS_WHO_SHARE_ROOM_WITH_USER=2.0
|
|
|
|
#
|
2020-05-27 06:17:01 -06:00
|
|
|
# Some caches have '*' and other characters that are not
|
|
|
|
# alphanumeric or underscores. These caches can be named with or
|
|
|
|
# without the special characters stripped. For example, to specify
|
|
|
|
# the cache factor for `*stateGroupCache*` via an environment
|
2020-05-27 06:34:46 -06:00
|
|
|
# variable would be `SYNAPSE_CACHE_FACTOR_STATEGROUPCACHE=2.0`.
|
2020-05-27 06:17:01 -06:00
|
|
|
#
|
2020-05-11 11:45:23 -06:00
|
|
|
per_cache_factors:
|
|
|
|
#get_users_who_share_room_with_user: 2.0
|
|
|
|
"""
|
|
|
|
|
|
|
|
def read_config(self, config, **kwargs):
|
|
|
|
self.event_cache_size = self.parse_size(
|
|
|
|
config.get("event_cache_size", _DEFAULT_EVENT_CACHE_SIZE)
|
|
|
|
)
|
|
|
|
self.cache_factors = {} # type: Dict[str, float]
|
|
|
|
|
|
|
|
cache_config = config.get("caches") or {}
|
|
|
|
self.global_factor = cache_config.get(
|
|
|
|
"global_factor", properties.default_factor_size
|
|
|
|
)
|
|
|
|
if not isinstance(self.global_factor, (int, float)):
|
|
|
|
raise ConfigError("caches.global_factor must be a number.")
|
|
|
|
|
|
|
|
# Set the global one so that it's reflected in new caches
|
|
|
|
properties.default_factor_size = self.global_factor
|
|
|
|
|
|
|
|
# Load cache factors from the config
|
|
|
|
individual_factors = cache_config.get("per_cache_factors") or {}
|
|
|
|
if not isinstance(individual_factors, dict):
|
|
|
|
raise ConfigError("caches.per_cache_factors must be a dictionary")
|
|
|
|
|
2020-05-27 06:17:01 -06:00
|
|
|
# Canonicalise the cache names *before* updating with the environment
|
|
|
|
# variables.
|
|
|
|
individual_factors = {
|
|
|
|
_canonicalise_cache_name(key): val
|
|
|
|
for key, val in individual_factors.items()
|
|
|
|
}
|
|
|
|
|
2020-05-11 11:45:23 -06:00
|
|
|
# Override factors from environment if necessary
|
|
|
|
individual_factors.update(
|
|
|
|
{
|
2020-05-27 06:17:01 -06:00
|
|
|
_canonicalise_cache_name(key[len(_CACHE_PREFIX) + 1 :]): float(val)
|
2020-05-11 11:45:23 -06:00
|
|
|
for key, val in self._environ.items()
|
|
|
|
if key.startswith(_CACHE_PREFIX + "_")
|
|
|
|
}
|
|
|
|
)
|
|
|
|
|
|
|
|
for cache, factor in individual_factors.items():
|
|
|
|
if not isinstance(factor, (int, float)):
|
|
|
|
raise ConfigError(
|
2020-05-27 06:17:01 -06:00
|
|
|
"caches.per_cache_factors.%s must be a number" % (cache,)
|
2020-05-11 11:45:23 -06:00
|
|
|
)
|
2020-05-27 06:17:01 -06:00
|
|
|
self.cache_factors[cache] = factor
|
2020-05-11 11:45:23 -06:00
|
|
|
|
|
|
|
# Resize all caches (if necessary) with the new factors we've loaded
|
|
|
|
self.resize_all_caches()
|
|
|
|
|
|
|
|
# Store this function so that it can be called from other classes without
|
|
|
|
# needing an instance of Config
|
|
|
|
properties.resize_all_caches_func = self.resize_all_caches
|
|
|
|
|
|
|
|
def resize_all_caches(self):
|
|
|
|
"""Ensure all cache sizes are up to date
|
|
|
|
|
|
|
|
For each cache, run the mapped callback function with either
|
|
|
|
a specific cache factor or the default, global one.
|
|
|
|
"""
|
2020-06-10 11:27:49 -06:00
|
|
|
# block other threads from modifying _CACHES while we iterate it.
|
|
|
|
with _CACHES_LOCK:
|
|
|
|
for cache_name, callback in _CACHES.items():
|
|
|
|
new_factor = self.cache_factors.get(cache_name, self.global_factor)
|
|
|
|
callback(new_factor)
|