From a1e2e41e5a134336786a5ae298088118569822b1 Mon Sep 17 00:00:00 2001 From: tdurieux Date: Wed, 8 Aug 2018 11:10:22 +0200 Subject: [PATCH] fix: add word boundary around anonymized term --- server.py | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/server.py b/server.py index 0c60cf9..96bc133 100644 --- a/server.py +++ b/server.py @@ -86,7 +86,7 @@ class Anonymous_Github: application.jinja_env.add_extension('jinja2.ext.do') @application.template_filter('remove_terms', ) - def remove_terms(content, repository_configuration): + def remove_terms(content, repository_configuration, word_boundaries=True): """ remove the blacklisted terms from the content :param content: the content to anonymize @@ -100,7 +100,10 @@ class Anonymous_Github: "%s/repository/%s" % (self.public_url, repository_configuration["id"]), content) content = re.compile(repo, re.IGNORECASE).sub("%s/repository/%s" % (self.public_url, repository_configuration["id"]), content) for term in repository_configuration['terms']: - content = re.compile(term, re.IGNORECASE).sub("XXX", content) + if word_boundaries: + content = re.compile(r'\b%s\b' % term, re.IGNORECASE).sub("XXX", content) + else: + content = re.compile(term, re.IGNORECASE).sub("XXX", content) return content @application.template_filter('file_render', )