1
0

Cache event creation info and context

~1.3s to ~1.1s time savings by re-using some calculations
that will be the same for every event type in the batch

TODO: Find a way to make store_state_group_id_for_event_id batch persist
in the db which brings it down to about 0.8s
This commit is contained in:
Eric Eastwood
2022-01-19 17:42:02 -06:00
parent cc4eb72f2e
commit 491e91dd40
4 changed files with 68 additions and 17 deletions

View File

@@ -69,4 +69,4 @@ fi
# Run the tests!
echo "Images built; running complement"
go test -v -tags synapse_blacklist,msc2403,msc2716 -count=1 $EXTRA_COMPLEMENT_ARGS ./tests/...
go test -v -tags synapse_blacklist,msc2403,msc2716 -count=1 $EXTRA_COMPLEMENT_ARGS ./tests/

View File

@@ -991,6 +991,8 @@ class EventCreationHandler:
and full_state_ids_at_event
and builder.internal_metadata.is_historical()
):
# Add explicit state to the insertion event so the rest of the batch
# can inherit the same state and `state_group`
old_state = await self.store.get_events_as_list(full_state_ids_at_event)
context = await self.state.compute_event_context(event, old_state=old_state)
else:

View File

@@ -1,8 +1,11 @@
import logging
from typing import TYPE_CHECKING, List, Tuple
from typing import TYPE_CHECKING, Dict, List, NamedTuple, Tuple
from synapse.api.constants import EventContentFields, EventTypes
from synapse.appservice import ApplicationService
from synapse.events import EventBase
from synapse.events.snapshot import EventContext
from synapse.events.validator import EventValidator
from synapse.http.servlet import assert_params_in_dict
from synapse.types import JsonDict, Requester, UserID, create_requester
from synapse.util.stringutils import random_string
@@ -13,6 +16,11 @@ if TYPE_CHECKING:
logger = logging.getLogger(__name__)
class EventCreationCacheItem(NamedTuple):
event: EventBase
context: EventContext
class RoomBatchHandler:
def __init__(self, hs: "HomeServer"):
self.hs = hs
@@ -20,6 +28,8 @@ class RoomBatchHandler:
self.state_store = hs.get_storage().state
self.event_creation_handler = hs.get_event_creation_handler()
self.room_member_handler = hs.get_room_member_handler()
self.validator = EventValidator()
self.event_builder_factory = hs.get_event_builder_factory()
self.auth = hs.get_auth()
async def inherit_depth_from_prev_ids(self, prev_event_ids: List[str]) -> int:
@@ -290,6 +300,12 @@ class RoomBatchHandler:
"""
assert app_service_requester.app_service
room_version_obj = await self.store.get_room_version(room_id)
# Map from event type to the shared info to re-use and create another
# event in the batch with the same type
event_type_creation_cache: Dict[str, EventCreationCacheItem] = {}
# Make the historical event chain float off on its own by specifying no
# prev_events for the first event in the chain which causes the HS to
# ask for the state at the start of the batch later.
@@ -309,28 +325,60 @@ class RoomBatchHandler:
"origin_server_ts": ev["origin_server_ts"],
"content": ev["content"],
"room_id": room_id,
"sender": ev["sender"], # requester.user.to_string(),
"sender": ev["sender"],
"prev_events": prev_event_ids.copy(),
}
# Mark all events as historical
event_dict["content"][EventContentFields.MSC2716_HISTORICAL] = True
event, context = await self.event_creation_handler.create_event(
await self.create_requester_for_user_id_from_app_service(
ev["sender"], app_service_requester.app_service
),
event_dict,
# Only the first event in the chain should be floating.
# The rest should hang off each other in a chain.
allow_no_prev_events=index == 0,
prev_event_ids=event_dict.get("prev_events"),
auth_event_ids=auth_event_ids,
historical=True,
depth=inherited_depth,
)
# We can skip a bunch of context and state calculations if we
# already have an event with the same type to base off of.
cached_creation_info = event_type_creation_cache.get(ev["type"])
assert context._state_group
if cached_creation_info is None:
event, context = await self.event_creation_handler.create_event(
await self.create_requester_for_user_id_from_app_service(
ev["sender"], app_service_requester.app_service
),
event_dict,
# Only the first event in the chain should be floating.
# The rest should hang off each other in a chain.
allow_no_prev_events=index == 0,
prev_event_ids=event_dict.get("prev_events"),
auth_event_ids=auth_event_ids,
historical=True,
depth=inherited_depth,
)
event_type_creation_cache[event.type] = EventCreationCacheItem(
event=event, context=context
)
else:
builder = self.event_builder_factory.for_room_version(
room_version_obj, event_dict
)
builder.internal_metadata.historical = True
# TODO: Can we get away without this? Does it validate on persist?
# self.validator.validate_builder(builder)
shared_event, shared_context = cached_creation_info
event = await builder.build(
prev_event_ids=prev_event_ids,
auth_event_ids=shared_event.auth_event_ids().copy(),
depth=inherited_depth,
)
# We can re-use the context per-event type because it will
# calculate out to be the same for all events in the batch. We
# also get the benefit of sharing the same state_group.
context = shared_context
# TODO: Do we need to check `third_party_event_rules.check_event_allowed(...)`?
# TODO: Can we get away without this?
# self.validator.validate_new(event, self.config)
# Normally this is done when persisting the event but we have to
# pre-emptively do it here because we create all the events first,

View File

@@ -14,6 +14,7 @@
from typing import Optional
from typing import List
from synapse.storage._base import SQLBaseStore