From ed38bfde4e1eaddd6d710802b6f372c7b0aab26b Mon Sep 17 00:00:00 2001 From: Bryan Newbold Date: Fri, 14 Feb 2020 00:07:56 -0800 Subject: ES updates: fix tests to accept archive.org in host/domain --- python/tests/transform_elasticsearch.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/python/tests/transform_elasticsearch.py b/python/tests/transform_elasticsearch.py index c94ab375..a954fc4d 100644 --- a/python/tests/transform_elasticsearch.py +++ b/python/tests/transform_elasticsearch.py @@ -110,9 +110,10 @@ def test_elasticsearch_file_transform(matched_importer): assert 'web' in es['rels'] assert 'www.zhros.ru' in es['hosts'] assert 'zhros.ru' in es['domains'] + assert 'archive.org' in (es['hosts'] + es['domains']) + assert 'web.archive.org' in (es['hosts'] + es['domains']) + # old regression assert not '.archive.org' in (es['hosts'] + es['domains']) - assert not 'archive.org' in (es['hosts'] + es['domains']) - assert not 'web.archive.org' in (es['hosts'] + es['domains']) def test_elasticsearch_changelog_transform(matched_importer): ce = entity_from_json(open('./tests/files/changelog_3469683.json', 'r').read(), ChangelogEntry) -- cgit v1.2.3