2014-08-12 15:10:52 +01:00
|
|
|
# -*- coding: utf-8 -*-
|
2016-01-07 04:26:29 +00:00
|
|
|
# Copyright 2014-2016 OpenMarket Ltd
|
2014-08-12 15:10:52 +01:00
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
2014-08-13 03:14:34 +01:00
|
|
|
|
2014-08-12 15:10:52 +01:00
|
|
|
import random
|
|
|
|
import string
|
2018-07-09 16:09:20 +10:00
|
|
|
|
2018-12-04 11:55:52 +01:00
|
|
|
import six
|
|
|
|
from six import PY2, PY3
|
2018-04-28 13:57:00 +02:00
|
|
|
from six.moves import range
|
2014-08-12 15:10:52 +01:00
|
|
|
|
2019-06-20 19:32:02 +10:00
|
|
|
_string_with_symbols = string.digits + string.ascii_letters + ".,;:^&*-_+=#~@"
|
2015-03-13 15:23:37 +00:00
|
|
|
|
2019-05-03 12:38:03 +01:00
|
|
|
# random_string and random_string_with_symbols are used for a range of things,
|
|
|
|
# some cryptographically important, some less so. We use SystemRandom to make sure
|
|
|
|
# we get cryptographically-secure randoms.
|
|
|
|
rand = random.SystemRandom()
|
|
|
|
|
2014-08-12 15:10:52 +01:00
|
|
|
|
|
|
|
def random_string(length):
|
2019-06-20 19:32:02 +10:00
|
|
|
return "".join(rand.choice(string.ascii_letters) for _ in range(length))
|
2015-03-13 15:23:37 +00:00
|
|
|
|
|
|
|
|
|
|
|
def random_string_with_symbols(length):
|
2019-06-20 19:32:02 +10:00
|
|
|
return "".join(rand.choice(_string_with_symbols) for _ in range(length))
|
2015-06-30 10:31:59 +01:00
|
|
|
|
|
|
|
|
|
|
|
def is_ascii(s):
|
2018-08-20 23:54:49 +10:00
|
|
|
|
|
|
|
if PY3:
|
|
|
|
if isinstance(s, bytes):
|
|
|
|
try:
|
2019-06-20 19:32:02 +10:00
|
|
|
s.decode("ascii").encode("ascii")
|
2018-08-20 23:54:49 +10:00
|
|
|
except UnicodeDecodeError:
|
|
|
|
return False
|
|
|
|
except UnicodeEncodeError:
|
|
|
|
return False
|
|
|
|
return True
|
|
|
|
|
2015-06-30 10:31:59 +01:00
|
|
|
try:
|
|
|
|
s.encode("ascii")
|
2015-08-26 16:26:37 +01:00
|
|
|
except UnicodeEncodeError:
|
|
|
|
return False
|
2015-06-30 10:31:59 +01:00
|
|
|
except UnicodeDecodeError:
|
|
|
|
return False
|
|
|
|
else:
|
|
|
|
return True
|
2017-04-25 14:38:51 +01:00
|
|
|
|
|
|
|
|
|
|
|
def to_ascii(s):
|
|
|
|
"""Converts a string to ascii if it is ascii, otherwise leave it alone.
|
|
|
|
|
|
|
|
If given None then will return None.
|
|
|
|
"""
|
2018-08-20 23:54:49 +10:00
|
|
|
if PY3:
|
|
|
|
return s
|
|
|
|
|
2017-04-25 14:38:51 +01:00
|
|
|
if s is None:
|
|
|
|
return None
|
|
|
|
|
|
|
|
try:
|
|
|
|
return s.encode("ascii")
|
|
|
|
except UnicodeEncodeError:
|
|
|
|
return s
|
2018-12-04 11:55:52 +01:00
|
|
|
|
|
|
|
|
|
|
|
def exception_to_unicode(e):
|
|
|
|
"""Helper function to extract the text of an exception as a unicode string
|
|
|
|
|
|
|
|
Args:
|
|
|
|
e (Exception): exception to be stringified
|
|
|
|
|
|
|
|
Returns:
|
|
|
|
unicode
|
|
|
|
"""
|
|
|
|
# urgh, this is a mess. The basic problem here is that psycopg2 constructs its
|
|
|
|
# exceptions with PyErr_SetString, with a (possibly non-ascii) argument. str() will
|
|
|
|
# then produce the raw byte sequence. Under Python 2, this will then cause another
|
|
|
|
# error if it gets mixed with a `unicode` object, as per
|
|
|
|
# https://github.com/matrix-org/synapse/issues/4252
|
|
|
|
|
|
|
|
# First of all, if we're under python3, everything is fine because it will sort this
|
|
|
|
# nonsense out for us.
|
|
|
|
if not PY2:
|
|
|
|
return str(e)
|
|
|
|
|
|
|
|
# otherwise let's have a stab at decoding the exception message. We'll circumvent
|
|
|
|
# Exception.__str__(), which would explode if someone raised Exception(u'non-ascii')
|
|
|
|
# and instead look at what is in the args member.
|
|
|
|
|
|
|
|
if len(e.args) == 0:
|
2019-06-20 19:32:02 +10:00
|
|
|
return ""
|
2018-12-04 11:55:52 +01:00
|
|
|
elif len(e.args) > 1:
|
|
|
|
return six.text_type(repr(e.args))
|
|
|
|
|
|
|
|
msg = e.args[0]
|
|
|
|
if isinstance(msg, bytes):
|
2019-06-20 19:32:02 +10:00
|
|
|
return msg.decode("utf-8", errors="replace")
|
2018-12-04 11:55:52 +01:00
|
|
|
else:
|
|
|
|
return msg
|