2018-07-31 13:52:49 +01:00
|
|
|
# Copyright 2018 New Vector Ltd
|
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
|
|
|
|
|
|
|
import abc
import hmac
import logging
import re
import urllib
import urllib.parse
from inspect import signature
from typing import TYPE_CHECKING, Dict, List, Tuple

from prometheus_client import Counter, Gauge

from synapse.api.errors import HttpResponseException, SynapseError
from synapse.http import RequestTimedOutError
from synapse.logging.opentracing import inject_active_span_byte_dict, trace
from synapse.util.caches.response_cache import ResponseCache
from synapse.util.stringutils import random_string

if TYPE_CHECKING:
    from synapse.server import HomeServer
|
|
|
|
|
2018-07-31 13:52:49 +01:00
|
|
|
logger = logging.getLogger(__name__)

# In-flight outgoing replication requests, labelled by the endpoint NAME.
_pending_outgoing_requests = Gauge(
    "synapse_pending_outgoing_replication_requests",
    "Number of active outgoing replication requests, by replication method name",
    labelnames=["name"],
)

# Completed outgoing replication requests, labelled by the endpoint NAME and
# by the outcome recorded for the request.
_outgoing_request_counter = Counter(
    "synapse_outgoing_replication_requests",
    "Number of outgoing replication requests, by replication method name and result",
    labelnames=["name", "code"],
)
|
|
|
|
|
2018-07-31 13:52:49 +01:00
|
|
|
|
2020-09-16 21:15:55 +02:00
|
|
|
class ReplicationEndpoint(metaclass=abc.ABCMeta):
    """Helper base class for defining new replication HTTP endpoints.

    This creates an endpoint under `/_synapse/replication/:NAME/:PATH_ARGS..`
    (with a `/:txn_id` suffix for cached requests), where NAME is a name,
    PATH_ARGS are a tuple of parameters to be encoded in the URL.

    For example, if `NAME` is "send_event" and `PATH_ARGS` is `("event_id",)`,
    with `CACHE` set to true then this generates an endpoint:

        /_synapse/replication/send_event/:event_id/:txn_id

    For POST/PUT requests the payload is serialized to json and sent as the
    body, while for GET requests the payload is added as query parameters. See
    `_serialize_payload` for details.

    Incoming requests are handled by overriding `_handle_request`. Servers
    must call `register` to register the path with the HTTP server.

    Requests can be sent by calling the client returned by `make_client`.
    Requests are sent to master process by default, but can be sent to other
    named processes by specifying an `instance_name` keyword argument.

    Attributes:
        NAME (str): A name for the endpoint, added to the path as well as used
            in logging and metrics.
        PATH_ARGS (tuple[str]): A list of parameters to be added to the path.
            Adding parameters to the path (rather than payload) can make it
            easier to follow along in the log files.
        METHOD (str): The method of the HTTP request, defaults to POST. Can be
            one of POST, PUT or GET. If GET then the payload is sent as query
            parameters rather than a JSON body.
        CACHE (bool): Whether server should cache the result of the request.
            If true then transparently adds a txn_id to all requests, and
            `_handle_request` must return a Deferred.
        RETRY_ON_TIMEOUT(bool): Whether or not to retry the request when it
            times out (i.e. a `RequestTimedOutError` is raised by the client).
    """

    NAME = abc.abstractproperty()  # type: str  # type: ignore
    PATH_ARGS = abc.abstractproperty()  # type: Tuple[str, ...]  # type: ignore
    METHOD = "POST"
    CACHE = True
    RETRY_ON_TIMEOUT = True

    def __init__(self, hs: "HomeServer"):
        """Set up the server-side state for this endpoint.

        Args:
            hs: The homeserver; its clock is used for the response cache and
                its worker config supplies the optional replication secret.
        """
        if self.CACHE:
            # Responses are cached per txn_id for 30 minutes.
            self.response_cache = ResponseCache(
                hs.get_clock(), "repl." + self.NAME, timeout_ms=30 * 60 * 1000
            )  # type: ResponseCache[str]

        # We reserve `instance_name` as a parameter to sending requests, so we
        # assert here that sub classes don't try and use the name.
        assert (
            "instance_name" not in self.PATH_ARGS
        ), "`instance_name` is a reserved parameter name"
        assert (
            "instance_name"
            not in signature(self.__class__._serialize_payload).parameters
        ), "`instance_name` is a reserved parameter name"

        assert self.METHOD in ("PUT", "POST", "GET")

        # A falsy (unset/empty) secret disables the authorization check.
        self._replication_secret = None
        if hs.config.worker.worker_replication_secret:
            self._replication_secret = hs.config.worker.worker_replication_secret

    def _check_auth(self, request) -> None:
        """Validate the `Authorization` header of an incoming request.

        The request is accepted only if it carries exactly one header of the
        form `Bearer <secret>` whose secret matches the configured
        replication secret.

        Args:
            request: The incoming request; only `requestHeaders` is read.

        Raises:
            RuntimeError: If the header is missing, duplicated, malformed or
                carries the wrong secret.
        """
        # Get the authorization header. `getRawHeaders` yields None when the
        # header is absent, so that case must be handled before using len().
        auth_headers = request.requestHeaders.getRawHeaders(b"Authorization")

        if not auth_headers:
            raise RuntimeError("Missing Authorization header.")
        if len(auth_headers) > 1:
            raise RuntimeError("Too many Authorization headers.")

        parts = auth_headers[0].split(b" ")
        expected_secret = self._replication_secret
        if (
            expected_secret is not None
            and len(parts) == 2
            and parts[0] == b"Bearer"
        ):
            # Compare as bytes (so undecodable tokens are simply rejected) and
            # in constant time (so the secret is not leaked through timing).
            if hmac.compare_digest(parts[1], expected_secret.encode("utf-8")):
                # Success!
                return

        raise RuntimeError("Invalid Authorization header.")

    @abc.abstractmethod
    async def _serialize_payload(**kwargs):
        """Static method that is called when creating a request.

        Concrete implementations should have explicit parameters (rather than
        kwargs) so that an appropriate exception is raised if the client is
        called with unexpected parameters. All PATH_ARGS must appear in
        argument list.

        The client invokes this on the class with keyword arguments only, so
        implementations must be callable without an instance.

        Returns:
            dict: If POST/PUT request then dictionary must be JSON serialisable,
            otherwise must be appropriate for adding as query args.
        """
        return {}

    @abc.abstractmethod
    async def _handle_request(self, request, **kwargs):
        """Handle incoming request.

        This is called with the request object and PATH_ARGS.

        Returns:
            tuple[int, dict]: HTTP status code and a JSON serialisable dict
            to be used as response body of request.
        """
        pass

    @classmethod
    def make_client(cls, hs):
        """Create a client that makes requests.

        Returns a callable that accepts the same parameters as
        `_serialize_payload`, and also accepts an optional `instance_name`
        parameter to specify which instance to hit (the instance must be in
        the `instance_map` config).
        """
        clock = hs.get_clock()
        client = hs.get_simple_http_client()
        local_instance_name = hs.get_instance_name()

        master_host = hs.config.worker_replication_host
        master_port = hs.config.worker_replication_http_port

        instance_map = hs.config.worker.instance_map

        outgoing_gauge = _pending_outgoing_requests.labels(cls.NAME)

        replication_secret = None
        if hs.config.worker.worker_replication_secret:
            replication_secret = hs.config.worker.worker_replication_secret.encode(
                "ascii"
            )

        # Name of the HTTP client method used for each supported METHOD.
        client_method_names = {
            "POST": "post_json_get_json",
            "PUT": "put_json",
            "GET": "get_json",
        }

        @trace(opname="outgoing_replication_request")
        @outgoing_gauge.track_inprogress()
        async def send_request(*, instance_name="master", **kwargs):
            """Send one replication request and return the decoded response.

            Args:
                instance_name: The instance to send the request to.
                **kwargs: Passed to `_serialize_payload`; the PATH_ARGS values
                    are also URL-encoded into the request path.

            Raises:
                SynapseError: The error reported by the remote process, or a
                    502 if the request failed for any other reason.
                Exception: If the target is this process, is not in the
                    `instance_map` config, or METHOD is unknown.
            """
            if instance_name == local_instance_name:
                raise Exception("Trying to send HTTP request to self")

            # Work out where the target instance is listening.
            if instance_name == "master":
                host = master_host
                port = master_port
            elif instance_name in instance_map:
                target = instance_map[instance_name]
                host = target.host
                port = target.port
            else:
                raise Exception(
                    "Instance %r not in 'instance_map' config" % (instance_name,)
                )

            data = await cls._serialize_payload(**kwargs)

            # Nothing is treated as URL-safe, so "/" in a value cannot add
            # extra path segments.
            url_args = [
                urllib.parse.quote(kwargs[name], safe="") for name in cls.PATH_ARGS
            ]

            if cls.CACHE:
                # A fresh txn_id per logical request; retries below reuse it.
                txn_id = random_string(10)
                url_args.append(txn_id)

            client_method_name = client_method_names.get(cls.METHOD)
            if client_method_name is None:
                # We have already asserted in the constructor that a
                # compatible was picked, but lets be paranoid.
                raise Exception(
                    "Unknown METHOD on %s replication endpoint" % (cls.NAME,)
                )
            request_func = getattr(client, client_method_name)

            uri = "http://%s:%s/_synapse/replication/%s/%s" % (
                host,
                port,
                cls.NAME,
                "/".join(url_args),
            )

            try:
                # We keep retrying the same request for timeouts. This is so that we
                # have a good idea that the request has either succeeded or failed on
                # the master, and so whether we should clean up or not.
                while True:
                    headers = {}  # type: Dict[bytes, List[bytes]]
                    # Add an authorization header, if configured.
                    if replication_secret:
                        headers[b"Authorization"] = [b"Bearer " + replication_secret]
                    inject_active_span_byte_dict(headers, None, check_destination=False)
                    try:
                        result = await request_func(uri, data, headers=headers)
                        break
                    except RequestTimedOutError:
                        if not cls.RETRY_ON_TIMEOUT:
                            raise

                    logger.warning("%s request timed out; retrying", cls.NAME)

                    # If we timed out we probably don't need to worry about backing
                    # off too much, but lets just wait a little anyway.
                    await clock.sleep(1)
            except HttpResponseException as e:
                # We convert to SynapseError as we know that it was a SynapseError
                # on the main process that we should send to the client. (And
                # importantly, not stack traces everywhere)
                _outgoing_request_counter.labels(cls.NAME, e.code).inc()
                raise e.to_synapse_error()
            except Exception as e:
                _outgoing_request_counter.labels(cls.NAME, "ERR").inc()
                raise SynapseError(502, "Failed to talk to main process") from e

            _outgoing_request_counter.labels(cls.NAME, 200).inc()
            return result

        return send_request

    def register(self, http_server):
        """Called by the server to register this as a handler to the
        appropriate path.

        Args:
            http_server: Object whose `register_paths` is called with the
                HTTP method, the compiled path pattern, the request handler
                and this class's name.
        """
        url_args = list(self.PATH_ARGS)
        method = self.METHOD

        if self.CACHE:
            url_args.append("txn_id")

        # One named group per path argument; each matches a single segment.
        args = "/".join("(?P<%s>[^/]+)" % (arg,) for arg in url_args)
        pattern = re.compile("^/_synapse/replication/%s/%s$" % (self.NAME, args))

        http_server.register_paths(
            method,
            [pattern],
            self._check_auth_and_handle,
            self.__class__.__name__,
        )

    def _check_auth_and_handle(self, request, **kwargs):
        """Called on new incoming requests.

        Checks the authorization header when a replication secret is
        configured. Then, if caching is enabled, the call to
        `_handle_request` is routed through the response cache keyed on the
        request's txn_id; otherwise `_handle_request` is called directly.

        Args:
            request: The incoming request.
            **kwargs: The values captured from the path (PATH_ARGS, plus
                `txn_id` when CACHE is set).

        Raises:
            RuntimeError: If a replication secret is configured and the
                request is not correctly authorized.
        """
        # Check the authorization headers before handling the request.
        if self._replication_secret:
            self._check_auth(request)

        if self.CACHE:
            # We just use the txn_id here, but we probably also want to use the
            # other PATH_ARGS as well.
            txn_id = kwargs.pop("txn_id")

            return self.response_cache.wrap(
                txn_id, self._handle_request, request, **kwargs
            )

        return self._handle_request(request, **kwargs)
|