2014-12-02 10:09:51 -05:00
|
|
|
#
|
2023-11-21 15:29:58 -05:00
|
|
|
# This file is licensed under the Affero General Public License (AGPL) version 3.
|
|
|
|
#
|
2024-01-23 06:26:48 -05:00
|
|
|
# Copyright 2020-2021 The Matrix.org Foundation C.I.C.
|
|
|
|
# Copyright 2014-2016 OpenMarket Ltd
|
2023-11-21 15:29:58 -05:00
|
|
|
# Copyright (C) 2023 New Vector, Ltd
|
|
|
|
#
|
|
|
|
# This program is free software: you can redistribute it and/or modify
|
|
|
|
# it under the terms of the GNU Affero General Public License as
|
|
|
|
# published by the Free Software Foundation, either version 3 of the
|
|
|
|
# License, or (at your option) any later version.
|
|
|
|
#
|
|
|
|
# See the GNU Affero General Public License for more details:
|
|
|
|
# <https://www.gnu.org/licenses/agpl-3.0.html>.
|
|
|
|
#
|
|
|
|
# Originally licensed under the Apache License, Version 2.0:
|
|
|
|
# <http://www.apache.org/licenses/LICENSE-2.0>.
|
|
|
|
#
|
|
|
|
# [This file includes modifications made by New Vector Limited]
|
2014-12-02 10:09:51 -05:00
|
|
|
#
|
|
|
|
#
|
|
|
|
|
2018-05-10 07:10:27 -04:00
|
|
|
import logging
|
2023-10-06 07:22:55 -04:00
|
|
|
import re
|
2023-11-15 09:19:24 -05:00
|
|
|
from typing import IO, TYPE_CHECKING, Dict, List, Optional, Tuple
|
2021-01-15 10:57:37 -05:00
|
|
|
|
2019-10-08 08:55:16 -04:00
|
|
|
from synapse.api.errors import Codes, SynapseError
|
2023-10-06 07:22:55 -04:00
|
|
|
from synapse.http.server import respond_with_json
|
|
|
|
from synapse.http.servlet import RestServlet, parse_bytes_from_args
|
2021-03-12 11:37:57 -05:00
|
|
|
from synapse.http.site import SynapseRequest
|
2023-02-27 08:26:05 -05:00
|
|
|
from synapse.media.media_storage import SpamMediaException
|
2014-12-02 10:09:51 -05:00
|
|
|
|
2021-01-15 10:57:37 -05:00
|
|
|
if TYPE_CHECKING:
|
2023-02-27 08:26:05 -05:00
|
|
|
from synapse.media.media_repository import MediaRepository
|
2021-03-23 07:12:48 -04:00
|
|
|
from synapse.server import HomeServer
|
2021-01-15 10:57:37 -05:00
|
|
|
|
2014-12-02 10:09:51 -05:00
|
|
|
# Module-level logger, named after this module via `__name__`.
logger = logging.getLogger(__name__)
|
|
|
|
|
2023-11-15 09:19:24 -05:00
|
|
|
# The name of the lock to use when uploading media.
|
|
|
|
# Passed as the lock name, together with the media ID, to
# `try_acquire_lock` in `AsyncUploadServlet.on_PUT`.
_UPLOAD_MEDIA_LOCK_NAME = "upload_media"
|
2014-12-02 14:55:18 -05:00
|
|
|
|
2016-04-19 06:24:59 -04:00
|
|
|
|
2023-11-15 09:19:24 -05:00
|
|
|
class BaseUploadServlet(RestServlet):
    """Common base class for the media upload servlets.

    Keeps references to the media repository, main datastore, auth handler,
    local server name and configured upload size limit, and provides
    `_get_file_metadata` for validating an upload request before its body is
    handed to the media repository.
    """

    def __init__(self, hs: "HomeServer", media_repo: "MediaRepository"):
        """
        Args:
            hs: The homeserver; supplies the main datastore, hostname, auth
                handler and the `media.max_upload_size` config value.
            media_repo: The media repository that uploads are passed to.
        """
        super().__init__()

        self.media_repo = media_repo
        self.filepaths = media_repo.filepaths
        self.store = hs.get_datastores().main
        self.server_name = hs.hostname
        self.auth = hs.get_auth()
        self.max_upload_size = hs.config.media.max_upload_size

    def _get_file_metadata(
        self, request: SynapseRequest
    ) -> Tuple[int, Optional[str], str]:
        """Validate an upload request and extract the metadata of the upload.

        Args:
            request: The incoming upload request.

        Returns:
            A tuple of `(content_length, upload_name, media_type)`, where
            `upload_name` is None if no non-empty `filename` argument was
            given and `media_type` falls back to "application/octet-stream"
            when the request has no Content-Type header.

        Raises:
            SynapseError: with code 400 if the Content-Length header is
                missing or not an integer, if the `filename` argument is not
                valid UTF-8, or if the Content-Type header is not ASCII; with
                code 413 if Content-Length exceeds `self.max_upload_size`.
        """
        raw_content_length = request.getHeader("Content-Length")
        if raw_content_length is None:
            raise SynapseError(msg="Request must specify a Content-Length", code=400)
        try:
            content_length = int(raw_content_length)
        except ValueError:
            raise SynapseError(msg="Content-Length value is invalid", code=400)
        if content_length > self.max_upload_size:
            raise SynapseError(
                msg="Upload request body is too large",
                code=413,
                errcode=Codes.TOO_LARGE,
            )

        args: Dict[bytes, List[bytes]] = request.args  # type: ignore
        upload_name_bytes = parse_bytes_from_args(args, "filename")

        # If the name is falsey (e.g. an empty byte string) it stays None.
        upload_name: Optional[str] = None
        if upload_name_bytes:
            try:
                upload_name = upload_name_bytes.decode("utf8")
            except UnicodeDecodeError:
                raise SynapseError(
                    msg="Invalid UTF-8 filename parameter: %r" % (upload_name_bytes,),
                    code=400,
                )

        headers = request.requestHeaders

        if headers.hasHeader(b"Content-Type"):
            content_type_headers = headers.getRawHeaders(b"Content-Type")
            assert content_type_headers  # for mypy
            try:
                media_type = content_type_headers[0].decode("ascii")
            except UnicodeDecodeError:
                # The header value is raw bytes from the client, so reject
                # non-ASCII input as a bad request rather than letting the
                # decode error propagate as an unhandled exception.
                raise SynapseError(
                    msg="Content-Type header must be ASCII",
                    code=400,
                )
        else:
            media_type = "application/octet-stream"

        # TODO(markjh): parse the Content-Disposition header, e.g.
        #     if headers.hasHeader(b"Content-Disposition"):
        #         disposition = headers.getRawHeaders(b"Content-Disposition")[0]

        return content_length, upload_name, media_type
|
|
|
|
|
|
|
|
|
|
|
|
class UploadServlet(BaseUploadServlet):
    """Servlet that accepts a media upload via POST and creates new content."""

    PATTERNS = [re.compile("/_matrix/media/(r0|v3|v1)/upload$")]

    async def on_POST(self, request: SynapseRequest) -> None:
        """Store the request body as new media and reply with its content URI.

        Authenticates the requester, validates the upload metadata, passes the
        body to the media repository's `create_content`, and responds with a
        200 JSON object containing `content_uri`.

        Raises:
            SynapseError: with code 400 if the media repository raises
                `SpamMediaException`, plus anything raised by
                `_get_file_metadata`.
        """
        uploader = await self.auth.get_user_by_req(request)
        size, filename, mime_type = self._get_file_metadata(request)

        body: IO = request.content  # type: ignore
        try:
            uri = await self.media_repo.create_content(
                mime_type, filename, body, size, uploader.user
            )
        except SpamMediaException:
            # For uploading of media we want to respond with a 400, instead of
            # the default 404, as that would just be confusing.
            raise SynapseError(400, "Bad content")

        logger.info("Uploaded content with URI '%s'", uri)

        response_body = {"content_uri": str(uri)}
        respond_with_json(request, 200, response_body, send_cors=True)
|
2023-11-15 09:19:24 -05:00
|
|
|
|
|
|
|
|
|
|
|
class AsyncUploadServlet(BaseUploadServlet):
    """Servlet that accepts a PUT upload of content for a given media ID."""

    PATTERNS = [
        re.compile(
            "/_matrix/media/v3/upload/(?P<server_name>[^/]*)/(?P<media_id>[^/]*)$"
        )
    ]

    async def on_PUT(
        self, request: SynapseRequest, server_name: str, media_id: str
    ) -> None:
        """Upload the request body as the content of `media_id`.

        Args:
            request: The incoming upload request.
            server_name: Server name from the URL; must equal
                `self.server_name`.
            media_id: Media ID from the URL whose content is being uploaded.

        Raises:
            SynapseError: with code 404 if `server_name` is not this server's
                name; 409 if the per-media upload lock could not be acquired;
                400 if the media repository raises `SpamMediaException`; plus
                anything raised by `_get_file_metadata`.
        """
        uploader = await self.auth.get_user_by_req(request)

        if server_name != self.server_name:
            raise SynapseError(
                404, "Non-local server name specified", errcode=Codes.NOT_FOUND
            )

        # A falsey result means the lock for this media ID was not obtained.
        upload_lock = await self.store.try_acquire_lock(
            _UPLOAD_MEDIA_LOCK_NAME, media_id
        )
        if not upload_lock:
            raise SynapseError(
                409,
                "Media ID cannot be overwritten",
                errcode=Codes.CANNOT_OVERWRITE_MEDIA,
            )

        async with upload_lock:
            await self.media_repo.verify_can_upload(media_id, uploader.user)
            size, filename, mime_type = self._get_file_metadata(request)

            body: IO = request.content  # type: ignore
            try:
                await self.media_repo.update_content(
                    media_id, mime_type, filename, body, size, uploader.user
                )
            except SpamMediaException:
                # For uploading of media we want to respond with a 400, instead of
                # the default 404, as that would just be confusing.
                raise SynapseError(400, "Bad content")

            logger.info("Uploaded content for media ID %r", media_id)
            respond_with_json(request, 200, {}, send_cors=True)
|