2014-08-12 08:10:52 -06:00
|
|
|
# -*- coding: utf-8 -*-
|
2016-01-06 21:26:29 -07:00
|
|
|
# Copyright 2014-2016 OpenMarket Ltd
|
2014-08-12 08:10:52 -06:00
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
|
|
|
|
2014-08-14 11:40:50 -06:00
|
|
|
from twisted.internet import defer
|
2015-03-09 11:01:19 -06:00
|
|
|
from .appservice import (
|
|
|
|
ApplicationServiceStore, ApplicationServiceTransactionStore
|
|
|
|
)
|
2015-03-20 11:08:15 -06:00
|
|
|
from ._base import Cache
|
2014-08-12 08:10:52 -06:00
|
|
|
from .directory import DirectoryStore
|
2015-03-20 07:52:56 -06:00
|
|
|
from .events import EventsStore
|
2016-02-15 10:10:40 -07:00
|
|
|
from .presence import PresenceStore, UserPresenceState
|
2014-08-12 08:10:52 -06:00
|
|
|
from .profile import ProfileStore
|
|
|
|
from .registration import RegistrationStore
|
|
|
|
from .room import RoomStore
|
|
|
|
from .roommember import RoomMemberStore
|
|
|
|
from .stream import StreamStore
|
|
|
|
from .transactions import TransactionStore
|
2014-08-28 11:19:47 -06:00
|
|
|
from .keys import KeyStore
|
2014-10-28 10:42:35 -06:00
|
|
|
from .event_federation import EventFederationStore
|
2014-11-19 11:20:59 -07:00
|
|
|
from .pusher import PusherStore
|
2015-01-22 10:38:53 -07:00
|
|
|
from .push_rule import PushRuleStore
|
2014-12-02 12:51:47 -07:00
|
|
|
from .media_repository import MediaRepositoryStore
|
2015-01-22 08:50:17 -07:00
|
|
|
from .rejections import RejectionsStore
|
2016-01-04 07:05:37 -07:00
|
|
|
from .event_push_actions import EventPushActionsStore
|
2014-10-27 05:58:32 -06:00
|
|
|
|
2014-10-14 09:59:51 -06:00
|
|
|
from .state import StateStore
|
2014-10-15 10:09:04 -06:00
|
|
|
from .signatures import SignatureStore
|
2015-01-27 10:48:13 -07:00
|
|
|
from .filtering import FilteringStore
|
2015-07-06 11:46:47 -06:00
|
|
|
from .end_to_end_keys import EndToEndKeyStore
|
2014-10-15 10:09:04 -06:00
|
|
|
|
2015-07-07 03:55:31 -06:00
|
|
|
from .receipts import ReceiptsStore
|
2015-10-09 08:48:31 -06:00
|
|
|
from .search import SearchStore
|
2015-10-28 10:06:57 -06:00
|
|
|
from .tags import TagsStore
|
2015-12-01 11:41:32 -07:00
|
|
|
from .account_data import AccountDataStore
|
2015-07-07 03:55:31 -06:00
|
|
|
|
2016-03-08 04:45:50 -07:00
|
|
|
from .util.id_generators import IdGenerator, StreamIdGenerator, ChainedIdGenerator
|
2016-01-26 08:51:06 -07:00
|
|
|
|
2016-02-15 10:10:40 -07:00
|
|
|
from synapse.api.constants import PresenceState
|
2016-01-29 07:37:59 -07:00
|
|
|
from synapse.util.caches.stream_change_cache import StreamChangeCache
|
|
|
|
|
2016-01-26 08:51:06 -07:00
|
|
|
|
2014-08-19 07:20:03 -06:00
|
|
|
import logging
|
2014-08-12 08:10:52 -06:00
|
|
|
|
|
|
|
|
2014-08-19 07:20:03 -06:00
|
|
|
# Module-level logger, named after this module.
logger = logging.getLogger(__name__)
|
|
|
|
|
2014-09-10 08:42:15 -06:00
|
|
|
|
2015-03-20 11:08:15 -06:00
|
|
|
# Number of msec of granularity to store the user IP 'last seen' time. Smaller
|
|
|
|
# times give more inserts into the database even for readonly API hits
|
|
|
|
# 120 seconds == 2 minutes
|
2016-02-02 10:18:50 -07:00
|
|
|
LAST_SEEN_GRANULARITY = 2 * 60 * 1000
|
2014-08-19 07:20:03 -06:00
|
|
|
|
2014-09-10 08:42:15 -06:00
|
|
|
|
2014-08-14 10:34:37 -06:00
|
|
|
class DataStore(RoomMemberStore, RoomStore,
                RegistrationStore, StreamStore, ProfileStore,
                PresenceStore, TransactionStore,
                DirectoryStore, KeyStore, StateStore, SignatureStore,
                ApplicationServiceStore,
                EventFederationStore,
                MediaRepositoryStore,
                RejectionsStore,
                FilteringStore,
                PusherStore,
                PushRuleStore,
                ApplicationServiceTransactionStore,
                EventsStore,
                ReceiptsStore,
                EndToEndKeyStore,
                SearchStore,
                TagsStore,
                AccountDataStore,
                EventPushActionsStore
                ):
    """Aggregate store combining every per-feature store listed in the bases.

    On construction it reads stream positions through ``db_conn``, builds the
    ID generators and the prefilled stream-change caches, and only then calls
    the base-class initialisers.
    """

    def __init__(self, db_conn, hs):
        """Set up ID generators and stream caches, then initialise the bases.

        Args:
            db_conn: database connection. ``cursor()`` is called on it here,
                and it is also handed to the ID generators.
            hs: object providing ``database_engine``. It is stored as
                ``self.hs`` and passed on to the base-class ``__init__``.
        """
        self.hs = hs
        # Must be set before _get_cache_dict/_get_active_presence are called
        # below, since both read self.database_engine.
        self.database_engine = hs.database_engine

        cur = db_conn.cursor()
        try:
            cur.execute("SELECT MIN(stream_ordering) FROM events")
            rows = cur.fetchall()
            # Falls back to -1 when there is no (truthy) minimum...
            self.min_stream_token = rows[0][0] if rows and rows[0] and rows[0][0] else -1
            # ...and is clamped so that it is never greater than -1.
            self.min_stream_token = min(self.min_stream_token, -1)
        finally:
            cur.close()

        self.client_ip_last_seen = Cache(
            name="client_ip_last_seen",
            keylen=4,
        )

        self._stream_id_gen = StreamIdGenerator(
            db_conn, "events", "stream_ordering"
        )
        self._receipts_id_gen = StreamIdGenerator(
            db_conn, "receipts_linearized", "stream_id"
        )
        self._account_data_id_gen = StreamIdGenerator(
            db_conn, "account_data_max_stream_id", "stream_id"
        )
        self._presence_id_gen = StreamIdGenerator(
            db_conn, "presence_stream", "stream_id"
        )

        self._transaction_id_gen = IdGenerator(db_conn, "sent_transactions", "id")
        self._state_groups_id_gen = IdGenerator(db_conn, "state_groups", "id")
        self._access_tokens_id_gen = IdGenerator(db_conn, "access_tokens", "id")
        self._refresh_tokens_id_gen = IdGenerator(db_conn, "refresh_tokens", "id")
        self._pushers_id_gen = IdGenerator(db_conn, "pushers", "id")
        self._push_rule_id_gen = IdGenerator(db_conn, "push_rules", "id")
        self._push_rules_enable_id_gen = IdGenerator(db_conn, "push_rules_enable", "id")
        self._push_rules_stream_id_gen = ChainedIdGenerator(
            self._stream_id_gen, db_conn, "push_rules_stream", "stream_id"
        )

        events_max = self._stream_id_gen.get_max_token()
        event_cache_prefill, min_event_val = self._get_cache_dict(
            db_conn, "events",
            entity_column="room_id",
            stream_column="stream_ordering",
            max_value=events_max,
        )
        self._events_stream_cache = StreamChangeCache(
            "EventsRoomStreamChangeCache", min_event_val,
            prefilled_cache=event_cache_prefill,
        )

        self._membership_stream_cache = StreamChangeCache(
            "MembershipStreamChangeCache", events_max,
        )

        account_max = self._account_data_id_gen.get_max_token()
        self._account_data_stream_cache = StreamChangeCache(
            "AccountDataAndTagsChangeCache", account_max,
        )

        # Held until take_presence_startup_info() hands it over.
        self.__presence_on_startup = self._get_active_presence(db_conn)

        presence_cache_prefill, min_presence_val = self._get_cache_dict(
            db_conn, "presence_stream",
            entity_column="user_id",
            stream_column="stream_id",
            max_value=self._presence_id_gen.get_max_token(),
        )
        self.presence_stream_cache = StreamChangeCache(
            "PresenceStreamChangeCache", min_presence_val,
            prefilled_cache=presence_cache_prefill
        )

        # get_max_token() on the chained generator is indexed here; only its
        # first element is used as the push-rules stream position.
        push_rules_prefill, push_rules_id = self._get_cache_dict(
            db_conn, "push_rules_stream",
            entity_column="user_id",
            stream_column="stream_id",
            max_value=self._push_rules_stream_id_gen.get_max_token()[0],
        )

        self.push_rules_stream_cache = StreamChangeCache(
            "PushRulesStreamChangeCache", push_rules_id,
            prefilled_cache=push_rules_prefill,
        )

        # Called last, after the generators and caches above exist.
        super(DataStore, self).__init__(hs)

    def take_presence_startup_info(self):
        """Return the presence states loaded in ``__init__`` and forget them.

        The stored value is replaced with ``None``, so a second call returns
        ``None``.
        """
        active_on_startup = self.__presence_on_startup
        self.__presence_on_startup = None
        return active_on_startup

    def _get_cache_dict(self, db_conn, table, entity_column, stream_column, max_value):
        """Build the prefill data for a stream change cache.

        Args:
            db_conn: database connection used to open a cursor.
            table (str): table to read from.
            entity_column (str): column identifying the entity (callers in
                this class pass ``room_id`` or ``user_id``).
            stream_column (str): column holding the stream position.
            max_value: current maximum stream position; only rows with a
                position greater than ``max_value - 100000`` are considered.

        Returns:
            tuple: ``(cache, min_val)``. ``cache`` maps each entity to the
            largest stream position (as ``int``) among the considered rows.
            ``min_val`` is the smallest value in ``cache``, or ``max_value``
            itself when no rows matched.
        """
        # Fetch a mapping of entity -> max stream position for "recent"
        # entities. It doesn't really matter how many we get, the
        # StreamChangeCache will do the right thing to ensure it respects the
        # max size of cache.
        #
        # The table and column names are interpolated straight into the SQL,
        # so they must be trusted identifiers; only max_value is bound as a
        # query parameter.
        sql = (
            "SELECT %(entity)s, MAX(%(stream)s) FROM %(table)s"
            " WHERE %(stream)s > ? - 100000"
            " GROUP BY %(entity)s"
        ) % {
            "table": table,
            "entity": entity_column,
            "stream": stream_column,
        }

        sql = self.database_engine.convert_param_style(sql)

        txn = db_conn.cursor()
        try:
            txn.execute(sql, (int(max_value),))
            rows = txn.fetchall()
        finally:
            # Release the cursor even if the query fails, as __init__ does.
            txn.close()

        cache = {
            row[0]: int(row[1])
            for row in rows
        }

        if cache:
            min_val = min(cache.values())
        else:
            min_val = max_value

        return cache, min_val

    def _get_active_presence(self, db_conn):
        """Fetch non-offline presence from the database so that we can register
        the appropriate time outs.

        Args:
            db_conn: database connection used to open a cursor.

        Returns:
            list: one ``UserPresenceState`` per row of ``presence_stream``
            whose state is not ``PresenceState.OFFLINE``.
        """

        sql = (
            "SELECT user_id, state, last_active_ts, last_federation_update_ts,"
            " last_user_sync_ts, status_msg, currently_active FROM presence_stream"
            " WHERE state != ?"
        )
        sql = self.database_engine.convert_param_style(sql)

        txn = db_conn.cursor()
        try:
            txn.execute(sql, (PresenceState.OFFLINE,))
            rows = self.cursor_to_dict(txn)
        finally:
            # Release the cursor even if the query fails, as __init__ does.
            txn.close()

        # Coerce the stored value to a real bool before building the states.
        for row in rows:
            row["currently_active"] = bool(row["currently_active"])

        return [UserPresenceState(**row) for row in rows]

    @defer.inlineCallbacks
    def insert_client_ip(self, user, access_token, ip, user_agent):
        """Record that ``user`` was seen from ``ip``, at most once per
        ``LAST_SEEN_GRANULARITY`` msec for a given (user, token, ip).

        Args:
            user: object with a ``to_string()`` method giving the user ID.
            access_token: access token used for the request.
            ip: client IP address.
            user_agent: client user agent. It is stored in the row but is not
                part of the rate-limiting key.
        """
        now = int(self._clock.time_msec())
        # NOTE(review): the cache is created with keylen=4 but this key has
        # three components -- confirm against Cache's keylen semantics.
        key = (user.to_string(), access_token, ip)

        try:
            last_seen = self.client_ip_last_seen.get(key)
        except KeyError:
            last_seen = None

        # Rate-limited inserts
        if last_seen is not None and (now - last_seen) < LAST_SEEN_GRANULARITY:
            defer.returnValue(None)

        self.client_ip_last_seen.prefill(key, now)

        # It's safe not to lock here: a) no unique constraint,
        # b) LAST_SEEN_GRANULARITY makes concurrent updates incredibly unlikely
        yield self._simple_upsert(
            "user_ips",
            keyvalues={
                "user_id": user.to_string(),
                "access_token": access_token,
                "ip": ip,
                "user_agent": user_agent,
            },
            values={
                "last_seen": now,
            },
            desc="insert_client_ip",
            lock=False,
        )

    @defer.inlineCallbacks
    def count_daily_users(self):
        """
        Counts the number of users who used this homeserver in the last 24 hours.

        Returns:
            Deferred: resolves to the number of distinct ``user_id`` values in
            ``user_ips`` with ``last_seen`` in the past 24 hours (0 if the
            query yields no rows).
        """
        def _count_users(txn):
            txn.execute(
                "SELECT COUNT(DISTINCT user_id) AS users"
                " FROM user_ips"
                " WHERE last_seen > ?",
                # This is close enough to a day for our purposes.
                (int(self._clock.time_msec()) - (1000 * 60 * 60 * 24),)
            )
            rows = self.cursor_to_dict(txn)
            if rows:
                return rows[0]["users"]
            return 0

        ret = yield self.runInteraction("count_users", _count_users)
        defer.returnValue(ret)

    def get_user_ip_and_agents(self, user):
        """Look up the ``user_ips`` rows recorded for ``user``.

        Args:
            user: object with a ``to_string()`` method giving the user ID.

        Returns:
            Whatever ``_simple_select_list`` returns for the columns
            ``access_token``, ``ip``, ``user_agent`` and ``last_seen``.
        """
        return self._simple_select_list(
            table="user_ips",
            keyvalues={"user_id": user.to_string()},
            retcols=[
                "access_token", "ip", "user_agent", "last_seen"
            ],
            desc="get_user_ip_and_agents",
        )
|
|
|
|
|
2014-08-22 10:00:10 -06:00
|
|
|
|
2015-04-28 06:39:42 -06:00
|
|
|
def are_all_users_on_domain(txn, database_engine, domain):
    """Report whether every name in ``users`` matches ``%:<domain>``.

    Args:
        txn: cursor-like object providing ``execute`` and ``fetchall``.
        database_engine: object whose ``convert_param_style`` adapts the
            ``?`` placeholder in the query.
        domain (str): domain the user names are expected to end with.

    Returns:
        bool: True when no row's name fails the ``LIKE`` match against
        ``"%:" + domain``, False otherwise.
    """
    query = database_engine.convert_param_style(
        "SELECT COUNT(*) FROM users WHERE name NOT LIKE ?"
    )
    suffix_pattern = "%:" + domain
    txn.execute(query, (suffix_pattern,))
    mismatched = txn.fetchall()[0][0]
    return mismatched == 0
|