about | summary | refs | log | tree | commit | diff | stats
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@archive.org> 2021-11-10 16:47:03 -0800
committer Bryan Newbold <bnewbold@archive.org> 2021-11-10 16:47:03 -0800
commit c164970449a392b5165d903d213c2bb51f2a187f (patch)
tree 917de69bef051e211c38018e8d91950d7cae2f71
parent 36ddc22358614be5c38f230594f6f83e19f4ad96 (diff)
download fatcat-scholar-c164970449a392b5165d903d213c2bb51f2a187f.tar.gz
fatcat-scholar-c164970449a392b5165d903d213c2bb51f2a187f.zip
pull GROBID refs along with crossref records into bundles
-rw-r--r-- fatcat_scholar/sandcrawler.py 4
-rw-r--r-- fatcat_scholar/work_pipeline.py 1
-rw-r--r-- tests/test_work_pipeline.py 3
3 files changed, 6 insertions, 2 deletions
diff --git a/fatcat_scholar/sandcrawler.py b/fatcat_scholar/sandcrawler.py
index 087cdc6..9b016f5 100644
--- a/fatcat_scholar/sandcrawler.py
+++ b/fatcat_scholar/sandcrawler.py
@@ -40,7 +40,9 @@ class SandcrawlerPostgrestClient:
return None
def get_crossref(self, doi: str) -> Optional[Dict[str, Any]]:
- resp = requests.get(self.api_url + "/crossref", params=dict(doi="eq." + doi))
+ resp = requests.get(
+ self.api_url + "/crossref_with_refs", params=dict(doi="eq." + doi)
+ )
resp.raise_for_status()
resp_json = resp.json()
if resp_json:
diff --git a/fatcat_scholar/work_pipeline.py b/fatcat_scholar/work_pipeline.py
index 5c32767..ea4b0a4 100644
--- a/fatcat_scholar/work_pipeline.py
+++ b/fatcat_scholar/work_pipeline.py
@@ -252,6 +252,7 @@ class WorkPipeline:
release_ident=re.ident,
doi=doi,
record=crossref_meta["record"],
+ grobid_refs=crossref_meta["refs_json"],
)
def lookup_sim(self, release: ReleaseEntity) -> Optional[SimIssueRow]:
diff --git a/tests/test_work_pipeline.py b/tests/test_work_pipeline.py
index 55cc7d8..554cc07 100644
--- a/tests/test_work_pipeline.py
+++ b/tests/test_work_pipeline.py
@@ -71,7 +71,7 @@ def test_run_transform(mocker: Any) -> None:
responses.add(
responses.GET,
- "http://disabled-during-tests-bogus.xyz:3333/crossref?doi=eq.10.7717%2Fpeerj.4375",
+ "http://disabled-during-tests-bogus.xyz:3333/crossref_with_refs?doi=eq.10.7717%2Fpeerj.4375",
status=200,
json=[
{
@@ -81,6 +81,7 @@ def test_run_transform(mocker: Any) -> None:
"title": "something",
"TODO_better_object": 3,
},
+ "refs_json": [],
}
],
)