Merge pull request #259 from matrix-org/markjh/unicode_content_disposition

Support Unicode attachment filenames
This commit is contained in:
Erik Johnston 2015-08-27 10:03:58 +01:00
commit e330c802e4
3 changed files with 43 additions and 12 deletions

View File

@ -33,6 +33,8 @@ import os
import cgi import cgi
import logging import logging
import urllib
import urlparse
logger = logging.getLogger(__name__) logger = logging.getLogger(__name__)
@ -42,10 +44,13 @@ def parse_media_id(request):
# This allows users to append e.g. /test.png to the URL. Useful for # This allows users to append e.g. /test.png to the URL. Useful for
# clients that parse the URL to see content type. # clients that parse the URL to see content type.
server_name, media_id = request.postpath[:2] server_name, media_id = request.postpath[:2]
if len(request.postpath) > 2 and is_ascii(request.postpath[-1]): file_name = None
return server_name, media_id, request.postpath[-1] if len(request.postpath) > 2:
else: try:
return server_name, media_id, None file_name = urlparse.unquote(request.postpath[-1]).decode("utf-8")
except UnicodeDecodeError:
pass
return server_name, media_id, file_name
except: except:
raise SynapseError( raise SynapseError(
404, 404,
@ -143,6 +148,16 @@ class BaseMediaResource(Resource):
upload_name = params.get("filename", None) upload_name = params.get("filename", None)
if upload_name and not is_ascii(upload_name): if upload_name and not is_ascii(upload_name):
upload_name = None upload_name = None
else:
upload_name_utf8 = params.get("filename*", None)
if upload_name_utf8.lower().startswith("utf-8''"):
upload_name = upload_name_utf8[7:]
if upload_name:
upload_name = urlparse.unquote(upload_name)
try:
upload_name = upload_name.decode("utf-8")
except UnicodeDecodeError:
upload_name = None
else: else:
upload_name = None upload_name = None
@ -181,9 +196,19 @@ class BaseMediaResource(Resource):
if os.path.isfile(file_path): if os.path.isfile(file_path):
request.setHeader(b"Content-Type", media_type.encode("UTF-8")) request.setHeader(b"Content-Type", media_type.encode("UTF-8"))
if upload_name: if upload_name:
if is_ascii(upload_name):
request.setHeader( request.setHeader(
b"Content-Disposition", b"Content-Disposition",
b"inline; filename=%s" % (upload_name.encode("utf-8"),), b"inline; filename=%s" % (
urllib.quote(upload_name.encode("utf-8")),
),
)
else:
request.setHeader(
b"Content-Disposition",
b"inline; filename*=utf-8''%s" % (
urllib.quote(upload_name.encode("utf-8")),
),
) )
# cache for at least a day. # cache for at least a day.

View File

@ -15,7 +15,7 @@
from synapse.http.server import respond_with_json, request_handler from synapse.http.server import respond_with_json, request_handler
from synapse.util.stringutils import random_string, is_ascii from synapse.util.stringutils import random_string
from synapse.api.errors import SynapseError from synapse.api.errors import SynapseError
from twisted.web.server import NOT_DONE_YET from twisted.web.server import NOT_DONE_YET
@ -86,9 +86,13 @@ class UploadResource(BaseMediaResource):
upload_name = request.args.get("filename", None) upload_name = request.args.get("filename", None)
if upload_name: if upload_name:
upload_name = upload_name[0] try:
if upload_name and not is_ascii(upload_name): upload_name = upload_name[0].decode('UTF-8')
raise SynapseError(400, "filename must be ascii") except UnicodeDecodeError:
raise SynapseError(
msg="Invalid UTF-8 filename parameter: %r" % (upload_name),
code=400,
)
headers = request.requestHeaders headers = request.requestHeaders

View File

@ -38,6 +38,8 @@ def random_string_with_symbols(length):
def is_ascii(s): def is_ascii(s):
try: try:
s.encode("ascii") s.encode("ascii")
except UnicodeEncodeError:
return False
except UnicodeDecodeError: except UnicodeDecodeError:
return False return False
else: else: