about | summary | refs | log | tree | commit | diff | stats
path: root/tests/test_matching.py
diff options
context:
space:
mode:
Diffstat (limited to 'tests/test_matching.py')
-rw-r--r-- tests/test_matching.py 82
1 files changed, 1 insertions, 81 deletions
diff --git a/tests/test_matching.py b/tests/test_matching.py
index ca94c2a..a7754ee 100644
--- a/tests/test_matching.py
+++ b/tests/test_matching.py
@@ -8,12 +8,11 @@ import requests
from fatcat_openapi_client import ReleaseEntity, ReleaseContrib
from fuzzycat.entities import entity_from_dict, entity_from_json
-from fuzzycat.matching import anything_to_entity, match_release_fuzzy, FuzzyReleaseMatcher
+from fuzzycat.matching import anything_to_entity, FuzzyReleaseMatcher
warnings.filterwarnings(
"ignore") # InsecureRequestWarning: Unverified HTTPS request is being made to host ...
-from fuzzycat.matching import anything_to_entity, match_release_fuzzy
from fuzzycat.config import settings
from fatcat_openapi_client import ReleaseEntity
import pytest
@@ -30,20 +29,6 @@ logger.setLevel(logging.DEBUG)
FATCAT_SEARCH_URL = settings.get("FATCAT_SEARCH_URL", "https://search.fatcat.wiki:443")
-def is_not_reachable(url, timeout=3):
- return not is_reachable(url)
-
-
-def is_reachable(url, timeout=3):
- """
- Return true, if URL is reachable and returns HTTP 200.
- """
- try:
- return requests.get(url, verify=False, timeout=timeout).ok
- except Exception:
- return False
-
-
def yaml_to_cases(klass,
files="tests/files/fuzzy_release_match_release_exact_title_exact_contrib/*.yaml"):
"""
@@ -63,71 +48,6 @@ def es_client():
return elasticsearch.Elasticsearch([FATCAT_SEARCH_URL])
-# @pytest.mark.skipif(
-# is_not_reachable(FATCAT_SEARCH_URL),
-# reason="{} not reachable, use e.g. FUZZYCAT_FATCAT_SEARCH_URL=localhost:9200 to override".
-# format(FATCAT_SEARCH_URL))
-def test_match_release_fuzzy(es_client, caplog):
- """
- This test is tied to the current index contents, so if that changes, this
- test may fail as well.
-
- Note: Deprecated. We want to get rid of this.
- """
- cases = (
- ("wtv64ahbdzgwnan7rllwr3nurm", 1),
- ("eqcgtpav3na5jh56o5vjsvb4ei", 1),
- )
- for i, (ident, count) in enumerate(cases):
- entity = anything_to_entity(ident, ReleaseEntity)
-
- result = match_release_fuzzy(entity, es=es_client)
- logger.info("[{}] given {}, found {}".format(i, entity.title, len(result)))
- assert len(result) == count
-
- # Partial data.
- cases = (
- ({
- "title": "digital libraries",
- "ext_ids": {}
- }, 5),
- ({
- "title": "unlikelytitle",
- "ext_ids": {}
- }, 0),
- ({
- "title": "Imminent dystopia",
- "ext_ids": {}
- }, 2),
- ({
- "title": "",
- "contribs": [{
- "raw_name": "Aristoteles"
- }],
- "ext_ids": {}
- }, 5),
- # ({
- # "title": "Letter",
- # "contribs": [{"raw_name": "Claudel"}],
- # "ext_ids": {}
- # }, 1),
- # ({
- # "title": "The Future of Digital Scholarship",
- # "contribs": [{
- # "raw_name": "Costantino Thanos"
- # }],
- # "ext_ids": {}
- # }, 5),
- )
- for i, (doc, count) in enumerate(cases):
- entity = entity_from_dict(doc, ReleaseEntity)
- result = match_release_fuzzy(entity, es=es_client)
- with caplog.at_level(logging.INFO):
- logging.info("[{}] given title '{}', found {}, {}".format(i, entity.title, len(result),
- [v.title for v in result]))
- assert len(result) == count, doc
-
-
def test_matcher_match_release(es_client, caplog):
cases = (
("wtv64ahbdzgwnan7rllwr3nurm", 1),