summary | refs | log | tree | commit | diff | stats
path: root/fatcat_scholar/grobid2json.py
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@archive.org> 2020-09-04 17:52:01 -0700
committer Bryan Newbold <bnewbold@archive.org> 2020-09-04 17:52:01 -0700
commit 3bf706f07d68aaacebcbf08d21c7b4c4f91856ea (patch)
tree b32bd11d7fb5091567c179877f9f5784c595faca /fatcat_scholar/grobid2json.py
parent 8ef87c02693a51b319249632e3219d8414ce8c13 (diff)
download fatcat-scholar-3bf706f07d68aaacebcbf08d21c7b4c4f91856ea.tar.gz
fatcat-scholar-3bf706f07d68aaacebcbf08d21c7b4c4f91856ea.zip
heavy to refs command
Diffstat (limited to 'fatcat_scholar/grobid2json.py')
-rwxr-xr-x fatcat_scholar/grobid2json.py 6
1 files changed, 6 insertions, 0 deletions
diff --git a/fatcat_scholar/grobid2json.py b/fatcat_scholar/grobid2json.py
index 979a794..fc19036 100755
--- a/fatcat_scholar/grobid2json.py
+++ b/fatcat_scholar/grobid2json.py
@@ -97,6 +97,12 @@ def journal_info(elem: ET.Element) -> Dict[str, Any]:
def biblio_info(elem: ET.Element) -> Dict[str, Any]:
+ """
+ TODO for references:
+ - pages
+ - locator
+ - doi, pmid, pmcid, arxiv_id, isbn
+ """
ref: Dict[str, Any] = dict()
ref["id"] = elem.attrib.get("{http://www.w3.org/XML/1998/namespace}id")
# Title stuff is messy in references...