aboutsummaryrefslogtreecommitdiffstats
path: root/tests/test_parse.py
diff options
context:
space:
mode:
Diffstat (limited to 'tests/test_parse.py')
-rw-r--r-- tests/test_parse.py 30
1 files changed, 30 insertions, 0 deletions
diff --git a/tests/test_parse.py b/tests/test_parse.py
index 203c960..9d8f4ff 100644
--- a/tests/test_parse.py
+++ b/tests/test_parse.py
@@ -410,3 +410,33 @@ def test_citation_multiple_editors() -> None:
assert ref.publisher == "Williams and Wilkins"
assert ref.date == "1996"
assert ref.note == "12th ed. Baltimore"
+
+
+def test_author_email() -> None:
+    """Check first-author fields (incl. email) and metadata of a parsed fixture."""
+    # Explicit encoding so decoding does not depend on the locale default.
+    with open("tests/files/document/author_email.tei.xml", encoding="utf-8") as f:
+        doc = parse_document_xml(f.read())
+    biblio = doc.header
+    assert biblio
+    assert biblio.title == "Task-Based Intelligent Retrieval and Recommendation"
+    assert biblio.authors
+    assert biblio.authors[0].given_name == "Chirag"
+    assert biblio.authors[0].surname == "Shah"
+    assert biblio.authors[0].email == "redacted@example.com"
+    assert biblio.authors[0].affiliation
+    assert biblio.authors[0].affiliation.institution == "University of Washington"
+    assert biblio.authors[0].affiliation.address
+    assert biblio.authors[0].affiliation.address.settlement == "Seattle"
+    assert biblio.authors[0].affiliation.address.country == "USA"
+
+    assert doc.pdf_md5 == "6C18173427FE3FAD756BB2F4F7665855"
+    assert doc.grobid_version == "0.7.1-SNAPSHOT"
+    assert doc.grobid_timestamp == "2021-11-02T09:03+0000"
+    assert doc.language_code == "en"
+    assert doc.abstract
+    assert doc.abstract[:50] == "While the act of looking for information happens within a"[:50]
+    assert doc.citations == []
+    assert doc.body is None
+    assert doc.acknowledgement is None
+    assert doc.annex is None