Merge "Strip unsafe chars from author email"

This commit is contained in:
Jenkins
2015-01-15 13:33:36 +00:00
committed by Gerrit Code Review
3 changed files with 13 additions and 0 deletions

View File

@@ -234,6 +234,10 @@ def safe_encode(s):
return six.moves.urllib.parse.quote(s.encode('utf-8'))
def keep_safe_chars(s):
return re.sub(r'[^\x21-\x7e\x80-\xff]+', '', s)
def make_module_group(module_group_id, name=None, modules=None, tag='module'):
return {'id': module_group_id,
'module_group_name': name or module_group_id,

View File

@@ -211,6 +211,9 @@ class Git(Vcs):
# ignore commits with empty email (there are some < Essex)
continue
commit['author_email'] = utils.keep_safe_chars(
commit['author_email'])
diff_stat_str = rec.group('diff_stat')
diff_rec = re.search(DIFF_STAT_PATTERN, diff_stat_str)

View File

@@ -78,6 +78,12 @@ class TestUtils(testtools.TestCase):
self.assertEqual(expected, utils.add_index(
sequence, start=0, item_filter=lambda x: x['name'] != 'B'))
def test_keep_safe_chars(self):
self.assertEqual('somemoretext',
utils.keep_safe_chars('some more text'))
self.assertEqual(u'(unicode)',
utils.keep_safe_chars(u'(unicode \u0423) '))
def test_normalize_company_name(self):
company_names = ['EMC Corporation', 'Abc, corp..', 'Mirantis IT.',
'Red Hat, Inc.', 'abc s.r.o. ABC', '2s.r.o. co',