2019-03-27 04:06:21 -06:00
|
|
|
# -*- coding: utf-8 -*-
|
|
|
|
# Copyright 2017 Vector Creations Ltd
|
|
|
|
# Copyright 2019 New Vector Ltd
|
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
2020-01-14 07:08:06 -07:00
|
|
|
|
2019-03-27 10:15:59 -06:00
|
|
|
import heapq
|
2020-01-14 07:08:06 -07:00
|
|
|
from typing import Tuple, Type
|
2019-03-27 09:18:28 -06:00
|
|
|
|
|
|
|
import attr
|
|
|
|
|
2020-03-25 08:54:01 -06:00
|
|
|
from ._base import Stream, db_query_to_update_function
|
2019-03-27 04:06:21 -06:00
|
|
|
|
2019-03-27 09:18:28 -06:00
|
|
|
|
|
|
|
"""Handling of the 'events' replication stream
|
|
|
|
|
|
|
|
This stream contains rows of various types. Each row therefore contains a 'type'
|
|
|
|
identifier before the real data. For example::
|
|
|
|
|
2019-03-27 10:15:59 -06:00
|
|
|
RDATA events batch ["state", ["!room:id", "m.type", "", "$event:id"]]
|
2019-03-27 09:18:28 -06:00
|
|
|
RDATA events 12345 ["ev", ["$event:id", "!room:id", "m.type", null, null, null]]
|
|
|
|
|
|
|
|
An "ev" row is sent for each new event. The fields in the data part are:
|
|
|
|
|
|
|
|
* The new event id
|
|
|
|
* The room id for the event
|
|
|
|
* The type of the new event
|
|
|
|
* The state key of the event, for state events
|
|
|
|
* The event id of an event which is redacted by this event.
* The "relates_to" value of the event, if any.
|
|
|
|
|
2019-03-27 10:15:59 -06:00
|
|
|
A "state" row is sent whenever the "current state" in a room changes. The fields in the
|
|
|
|
data part are:
|
|
|
|
|
|
|
|
* The room id for the state change
|
|
|
|
* The event type of the state which has changed
|
|
|
|
* The state_key of the state which has changed
|
|
|
|
* The event id of the new state
|
|
|
|
|
2019-03-27 09:18:28 -06:00
|
|
|
"""
|
|
|
|
|
|
|
|
|
|
|
|
@attr.s(slots=True, frozen=True)
class EventsStreamRow(object):
    """A parsed row from the events replication stream.

    Pairs the row's type identifier with the row object parsed from the
    data part of the stream entry.
    """

    # str: the TypeId of one of the *EventsStreamRows
    type = attr.ib()

    # BaseEventsStreamRow: the parsed row itself
    data = attr.ib()
|
|
|
|
|
|
|
|
|
|
|
|
class BaseEventsStreamRow(object):
    """Base class for rows to be sent in the events stream.

    Specifies how to identify, serialize and deserialize the different types.
    """

    # Unique string that ids the type. Must be overridden in sub classes.
    TypeId = None  # type: str

    @classmethod
    def from_data(cls, data):
        """Parse the data from the replication stream into a row.

        By default we just call the constructor with the data list as
        positional arguments, so the order of the entries in `data` must
        match the order of the constructor's parameters.

        Args:
            data: The value of the data object from the replication stream

        Returns:
            A new instance of `cls` built from `data`.
        """
        return cls(*data)
|
|
|
|
|
|
|
|
|
|
|
|
@attr.s(slots=True, frozen=True)
class EventsStreamEventRow(BaseEventsStreamRow):
    """An "ev" row: sent for each new event.

    The attribute order below is the order of the fields in the data part of
    the row, since rows are built by passing that list positionally to the
    constructor.
    """

    TypeId = "ev"

    event_id = attr.ib()  # str: the new event id
    room_id = attr.ib()  # str: the room id for the event
    type = attr.ib()  # str: the type of the new event
    state_key = attr.ib()  # str, optional: the state key, for state events
    redacts = attr.ib()  # str, optional: id of an event redacted by this event
    # str, optional
    # NOTE(review): presumably identifies the event this one relates to;
    # confirm against the store query that produces these rows.
    relates_to = attr.ib()
|
2019-03-27 09:18:28 -06:00
|
|
|
|
|
|
|
|
2019-03-27 10:15:59 -06:00
|
|
|
@attr.s(slots=True, frozen=True)
class EventsStreamCurrentStateRow(BaseEventsStreamRow):
    """A "state" row: sent whenever the "current state" in a room changes.

    The attribute order below is the order of the fields in the data part of
    the row, since rows are built by passing that list positionally to the
    constructor.
    """

    TypeId = "state"

    room_id = attr.ib()  # str: the room id for the state change
    type = attr.ib()  # str: the event type of the state which has changed
    state_key = attr.ib()  # str: the state_key of the state which has changed
    event_id = attr.ib()  # str, optional: the event id of the new state
|
2019-03-27 10:15:59 -06:00
|
|
|
|
|
|
|
|
2020-01-14 07:08:06 -07:00
|
|
|
# Every row class that may appear in the events stream.
_EventRows = (
    EventsStreamEventRow,
    EventsStreamCurrentStateRow,
)  # type: Tuple[Type[BaseEventsStreamRow], ...]

# Lookup from a row's TypeId string to the class used to parse its data.
TypeToRow = {Row.TypeId: Row for Row in _EventRows}
|
2019-03-27 04:06:21 -06:00
|
|
|
|
|
|
|
|
|
|
|
class EventsStream(Stream):
    """We received a new event, or an event went from being an outlier to not
    being one.

    Rows on this stream are of several kinds; each carries a type identifier
    (a `TypeId` from one of the row classes) ahead of its data.
    """

    NAME = "events"

    def __init__(self, hs):
        """Wire the stream up to the datastore obtained from `hs`.

        Args:
            hs: object providing `get_datastore()`; also passed on to the
                `Stream` constructor.
        """
        self._store = hs.get_datastore()
        # These attributes are assigned before the base-class constructor is
        # invoked.
        self.current_token = self._store.get_current_events_token  # type: ignore
        self.update_function = db_query_to_update_function(self._update_function)  # type: ignore

        super(EventsStream, self).__init__(hs)

    async def _update_function(self, from_token, current_token, limit=None):
        """Fetch "ev" and "state" updates and merge them into one sequence.

        Args:
            from_token: passed through to both store queries.
            current_token: passed through to both store queries.
            limit: passed through, unchanged, to both store queries.

        Returns:
            An iterator of `(row[0], TypeId, row[1:])` tuples, produced by
            merging the event updates with the current-state updates.
        """
        event_rows = await self._store.get_all_new_forward_event_rows(
            from_token, current_token, limit
        )
        event_updates = (
            (row[0], EventsStreamEventRow.TypeId, row[1:]) for row in event_rows
        )

        # NOTE(review): the same `limit` is applied to each query separately.
        # If one query is truncated and the other is not, the merged output
        # may not be a contiguous prefix of the stream - confirm how the
        # caller handles this.
        state_rows = await self._store.get_all_updated_current_state_deltas(
            from_token, current_token, limit
        )
        state_updates = (
            (row[0], EventsStreamCurrentStateRow.TypeId, row[1:]) for row in state_rows
        )

        # heapq.merge only yields sorted output when each input is already
        # sorted; this assumes both store queries return rows ordered by
        # their first column (TODO confirm).
        all_updates = heapq.merge(event_updates, state_updates)

        return all_updates

    @classmethod
    def parse_row(cls, row):
        """Turn a `(type, data)` pair from the stream into an EventsStreamRow.

        Args:
            row: a two-element sequence of the row's type identifier and its
                data list.

        Returns:
            An `EventsStreamRow` holding the type identifier and the row
            object built by the matching row class's `from_data`.

        Raises:
            KeyError: if the type identifier is not a key of `TypeToRow`.
        """
        (typ, data) = row
        data = TypeToRow[typ].from_data(data)
        return EventsStreamRow(typ, data)
|