diff options
author | Bryan Newbold <bnewbold@archive.org> | 2021-11-10 16:47:03 -0800 |
---|---|---|
committer | Bryan Newbold <bnewbold@archive.org> | 2021-11-10 16:47:03 -0800 |
commit | c164970449a392b5165d903d213c2bb51f2a187f (patch) | |
tree | 917de69bef051e211c38018e8d91950d7cae2f71 | |
parent | 36ddc22358614be5c38f230594f6f83e19f4ad96 (diff) | |
download | fatcat-scholar-c164970449a392b5165d903d213c2bb51f2a187f.tar.gz fatcat-scholar-c164970449a392b5165d903d213c2bb51f2a187f.zip |
pull GROBID refs along with crossref records into bundles
-rw-r--r-- | fatcat_scholar/sandcrawler.py | 4 | ||||
-rw-r--r-- | fatcat_scholar/work_pipeline.py | 1 | ||||
-rw-r--r-- | tests/test_work_pipeline.py | 3 |
3 files changed, 6 insertions, 2 deletions
```diff
diff --git a/fatcat_scholar/sandcrawler.py b/fatcat_scholar/sandcrawler.py
index 087cdc6..9b016f5 100644
--- a/fatcat_scholar/sandcrawler.py
+++ b/fatcat_scholar/sandcrawler.py
@@ -40,7 +40,9 @@ class SandcrawlerPostgrestClient:
             return None
 
     def get_crossref(self, doi: str) -> Optional[Dict[str, Any]]:
-        resp = requests.get(self.api_url + "/crossref", params=dict(doi="eq." + doi))
+        resp = requests.get(
+            self.api_url + "/crossref_with_refs", params=dict(doi="eq." + doi)
+        )
         resp.raise_for_status()
         resp_json = resp.json()
         if resp_json:
diff --git a/fatcat_scholar/work_pipeline.py b/fatcat_scholar/work_pipeline.py
index 5c32767..ea4b0a4 100644
--- a/fatcat_scholar/work_pipeline.py
+++ b/fatcat_scholar/work_pipeline.py
@@ -252,6 +252,7 @@ class WorkPipeline:
             release_ident=re.ident,
             doi=doi,
             record=crossref_meta["record"],
+            grobid_refs=crossref_meta["refs_json"],
         )
 
     def lookup_sim(self, release: ReleaseEntity) -> Optional[SimIssueRow]:
diff --git a/tests/test_work_pipeline.py b/tests/test_work_pipeline.py
index 55cc7d8..554cc07 100644
--- a/tests/test_work_pipeline.py
+++ b/tests/test_work_pipeline.py
@@ -71,7 +71,7 @@ def test_run_transform(mocker: Any) -> None:
 
     responses.add(
         responses.GET,
-        "http://disabled-during-tests-bogus.xyz:3333/crossref?doi=eq.10.7717%2Fpeerj.4375",
+        "http://disabled-during-tests-bogus.xyz:3333/crossref_with_refs?doi=eq.10.7717%2Fpeerj.4375",
         status=200,
         json=[
             {
@@ -81,6 +81,7 @@ def test_run_transform(mocker: Any) -> None:
                     "title": "something",
                     "TODO_better_object": 3,
                 },
+                "refs_json": [],
             }
         ],
     )
```