synapse-product/synapse/push/push_rule_evaluator.py

232 lines
6.9 KiB
Python
Raw Normal View History

# -*- coding: utf-8 -*-
2016-01-06 23:26:29 -05:00
# Copyright 2015, 2016 OpenMarket Ltd
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import logging
import re
2016-01-18 09:09:47 -05:00
from synapse.types import UserID
from synapse.util.caches import CACHE_SIZE_FACTOR, register_cache
from synapse.util.caches.lrucache import LruCache
2016-01-18 09:09:47 -05:00
# Module-level logger, named after this module's import path.
logger = logging.getLogger(__name__)
2016-01-18 09:09:47 -05:00
# Matches a backslash-escaped bracket expression, i.e. a literal "\[" ... "\]"
# pair. Group 1 is an optional backslash-escaped "!" directly after the opening
# bracket; group 2 is everything up to the (last) closing "\]".
GLOB_REGEX = re.compile(r'\\\[(\\\!|)(.*)\\\]')
# Matches any one of the characters "?", "*", "[" or "]".
IS_GLOB = re.compile(r'[\?\*\[\]]')
# A (possibly empty) run of "=", "<" and ">" characters followed by a
# (possibly empty) run of ASCII digits, e.g. ">=10", "==2" or "5".
INEQUALITY_EXPR = re.compile("^([=<>]*)([0-9]*)$")
# Match when a string begins / ends with a word (\w) character.
STARTS_WITH_WORD_CHAR_REGEX = re.compile(r"^\w")
ENDS_WITH_WORD_CHAR_REGEX = re.compile(r"\w$")
2016-01-18 09:09:47 -05:00
def _room_member_count(ev, condition, room_member_count):
    """Evaluates a `room_member_count` condition.

    Args:
        ev: The event being evaluated (not used by this check).
        condition (dict): The condition; its 'is' entry holds an expression
            such as "2", "==2", "<10" or ">=3".
        room_member_count (int): The number to compare against the
            expression.

    Returns:
        bool: Result of the comparison. False if 'is' is absent, cannot be
        parsed, has no number, or uses an unrecognised operator.
    """
    if 'is' not in condition:
        return False

    parsed = INEQUALITY_EXPR.match(condition['is'])
    if parsed is None:
        return False

    operator_text, digits = parsed.group(1), parsed.group(2)
    # The pattern allows an empty number, so reject that explicitly.
    if not digits.isdigit():
        return False
    threshold = int(digits)

    # A bare number is treated the same as "==".
    comparisons = {
        '': lambda count: count == threshold,
        '==': lambda count: count == threshold,
        '<': lambda count: count < threshold,
        '>': lambda count: count > threshold,
        '>=': lambda count: count >= threshold,
        '<=': lambda count: count <= threshold,
    }
    compare = comparisons.get(operator_text)
    if compare is None:
        return False
    return compare(room_member_count)
def tweaks_for_actions(actions):
    """Collects the tweaks set by a list of push rule actions.

    Args:
        actions (list): Push rule actions. Entries that are not dicts
            (e.g. the string "notify") are ignored.

    Returns:
        dict: Maps each tweak name (the action's 'set_tweak' entry) to its
        value. If several actions set the same tweak, the last one wins.
    """
    tweaks = {}
    for action in actions:
        if not isinstance(action, dict):
            continue
        if 'set_tweak' in action:
            # 'value' is allowed to be absent, in which case the tweak is
            # taken to be True rather than being silently dropped.
            tweaks[action['set_tweak']] = action.get('value', True)
    return tweaks
2016-01-18 09:09:47 -05:00
try:
    # Python 2: covers both `str` and `unicode`.
    _TEXT_TYPES = basestring  # noqa: F821
except NameError:
    # Python 3
    _TEXT_TYPES = str


class PushRuleEvaluatorForEvent(object):
    """Evaluates individual push rule conditions against a single event.

    Args:
        event: The event to evaluate. It is read via `event["content"]` and
            flattened with `_flatten_dict`, so it must behave like a mapping.
        room_member_count (int): Number used when evaluating
            `room_member_count` conditions.
    """

    def __init__(self, event, room_member_count):
        self._event = event
        self._room_member_count = room_member_count

        # Maps strings of e.g. 'content.body' -> event["content"]["body"]
        self._value_cache = _flatten_dict(event)

    def matches(self, condition, user_id, display_name):
        """Tests whether a single condition matches the event.

        Args:
            condition (dict): The condition; its 'kind' entry selects the
                check to perform.
            user_id (str): Used for `event_match` conditions that have a
                'pattern_type' instead of a 'pattern'.
            display_name (str|None): Used for `contains_display_name`
                conditions.

        Returns:
            A truthy value if the condition matches, a falsy one otherwise.
        """
        kind = condition['kind']
        if kind == 'event_match':
            return self._event_match(condition, user_id)
        elif kind == 'contains_display_name':
            return self._contains_display_name(display_name)
        elif kind == 'room_member_count':
            return _room_member_count(
                self._event, condition, self._room_member_count
            )
        else:
            # NOTE: condition kinds that are not recognised are treated as
            # matching.
            return True

    def _event_match(self, condition, user_id):
        """Evaluates an `event_match` condition (glob match on one field)."""
        pattern = condition.get('pattern', None)

        if not pattern:
            # No explicit pattern: it may be derived from the user's ID.
            pattern_type = condition.get('pattern_type', None)
            if pattern_type == "user_id":
                pattern = user_id
            elif pattern_type == "user_localpart":
                pattern = UserID.from_string(user_id).localpart

        if not pattern:
            logger.warning("event_match condition with no pattern")
            return False

        if condition['key'] == 'content.body':
            # The body is matched on word boundaries rather than as a whole.
            body = self._get_body()
            if body is None:
                return False
            return _glob_matches(pattern, body, word_boundary=True)

        haystack = self._get_value(condition['key'])
        if haystack is None:
            return False
        return _glob_matches(pattern, haystack)

    def _contains_display_name(self, display_name):
        """Tests whether the event body contains `display_name` as a word."""
        if not display_name:
            return False

        body = self._get_body()
        if body is None:
            return False

        return _glob_matches(display_name, body, word_boundary=True)

    def _get_body(self):
        """Returns the event's content body, or None if it is unusable.

        The body comes straight from the event content, so it is not
        guaranteed to be a string. Anything that is empty or not a string
        cannot be searched with a regex and is reported as None.
        """
        body = self._event["content"].get("body", None)
        if not body or not isinstance(body, _TEXT_TYPES):
            return None
        return body

    def _get_value(self, dotted_key):
        """Looks up a flattened key such as 'content.body'; None if absent."""
        return self._value_cache.get(dotted_key, None)
# Caches (glob, word_boundary) -> compiled regex for push rule evaluation, so
# that each glob is only converted to a regex once. See _glob_matches.
# The size is 50000 entries scaled by CACHE_SIZE_FACTOR.
regex_cache = LruCache(50000 * CACHE_SIZE_FACTOR)
# Registered under the name "regex_push_cache" (presumably so that the cache
# shows up in cache metrics -- confirm against register_cache).
register_cache("regex_push_cache", regex_cache)
def _glob_matches(glob, value, word_boundary=False):
    """Tests if value matches glob.

    Compiled regexes are kept in `regex_cache`, keyed on
    (glob, word_boundary), so each glob is only converted once.

    Args:
        glob (string)
        value (string): String to test against glob.
        word_boundary (bool): Whether to match against word boundaries or entire
            string. Defaults to False.

    Returns:
        bool: True if the value matches. False if it does not, or if the
        glob could not be converted into a valid regex.
    """
    cache_key = (glob, word_boundary)

    regex = regex_cache.get(cache_key, None)
    if regex is None:
        # Only the conversion can raise re.error, so only that is guarded.
        try:
            regex = _glob_to_re(glob, word_boundary)
        except re.error:
            logger.warning("Failed to parse glob to regex: %r", glob)
            return False
        regex_cache[cache_key] = regex

    # Return a real bool, as documented, rather than leaking the match object.
    return bool(regex.search(value))
2016-01-18 09:09:47 -05:00
def _glob_to_re(glob, word_boundary):
    """Generates regex for a given glob.

    Supports `*` (any run of characters), `?` (any single character) and
    `[abc]`, `[a-z]`, `[!a-z]` style character sets. Matching is always
    case-insensitive.

    Args:
        glob (string)
        word_boundary (bool): Whether to match against word boundaries or entire
            string.

    Returns:
        regex object

    Raises:
        re.error: If the resulting expression is not a valid regex.
    """
    r = re.escape(glob)

    if IS_GLOB.search(glob):
        # re.escape has backslash-escaped the glob metacharacters, so the
        # replacements below operate on their escaped forms.
        r = r.replace(r'\*', '.*?')
        r = r.replace(r'\?', '.')

        def _bracket_to_class(m):
            negate = '^' if m.group(1) else ''
            # re.escape turns "-" into "\-", which inside a character class
            # means a literal dash. Undo that so "[a-z]" is a range again.
            members = m.group(2).replace(r'\-', '-')
            return '[%s%s]' % (negate, members)

        # handle [abc], [a-z] and [!a-z] style ranges.
        r = GLOB_REGEX.sub(_bracket_to_class, r)

    if word_boundary:
        r = _re_word_boundary(r)
    else:
        # Not matching on word boundaries: the whole string must match.
        r = "^" + r + "$"

    return re.compile(r, flags=re.IGNORECASE)
def _re_word_boundary(r):
    """Wraps a regex string so that it only matches whole words.

    A `\\b` is added at each end of the expression, but only at an end
    where the expression itself has a word character. `\\b` is by
    definition the boundary between a \\w and a \\W, so adding it next to
    a non-word character would change what the expression matches.

    Args:
        r (string): The regex source to wrap.

    Returns:
        string: The regex source with `\\b` added where applicable.
    """
    # This matches a regex string against a regex, looking only at the
    # first and last characters of the expression text. It will therefore
    # miss expressions such as "[dl]og", which start with a word character
    # when matched but not as written.
    leading = r"\b" if STARTS_WITH_WORD_CHAR_REGEX.search(r) else ""
    trailing = r"\b" if ENDS_WITH_WORD_CHAR_REGEX.search(r) else ""
    return leading + r + trailing
def _flatten_dict(d, prefix=[], result=None):
if result is None:
result = {}
2016-01-18 09:09:47 -05:00
for key, value in d.items():
if isinstance(value, basestring):
result[".".join(prefix + [key])] = value.lower()
elif hasattr(value, "items"):
2016-02-02 12:18:50 -05:00
_flatten_dict(value, prefix=(prefix + [key]), result=result)
2016-01-18 09:09:47 -05:00
return result