diff options
author | Bryan Newbold <bnewbold@robocracy.org> | 2021-01-11 20:30:39 -0800 |
---|---|---|
committer | Bryan Newbold <bnewbold@robocracy.org> | 2021-01-20 11:47:43 -0800 |
commit | 7940b4b02492eb8052c33252a7c77188181867e6 (patch) | |
tree | 6ed542e0e8e463027f570a61452b59cec500b75b | |
parent | 99e37fca2ad74cd3e48d09b12b0d8a005d0de59e (diff) | |
download | fatcat-7940b4b02492eb8052c33252a7c77188181867e6.tar.gz fatcat-7940b4b02492eb8052c33252a7c77188181867e6.zip |
elasticsearch: simple new dblp and doaj fields
-rw-r--r-- | extra/elasticsearch/release_schema.json | 3 | ||||
-rw-r--r-- | python/fatcat_tools/transforms/elasticsearch.py | 4 |
2 files changed, 7 insertions, 0 deletions
diff --git a/extra/elasticsearch/release_schema.json b/extra/elasticsearch/release_schema.json index 666a672f..e1f7a79a 100644 --- a/extra/elasticsearch/release_schema.json +++ b/extra/elasticsearch/release_schema.json @@ -72,6 +72,8 @@ "ark_id": { "type": "keyword", "normalizer": "default", "doc_values": false }, "mag_id": { "type": "keyword", "normalizer": "default", "doc_values": false }, "s2_id": { "type": "keyword", "normalizer": "default", "doc_values": false }, + "dblp_id": { "type": "keyword", "normalizer": "default", "doc_values": false }, + "doaj_id": { "type": "keyword", "normalizer": "default", "doc_values": false }, "license": { "type": "keyword", "normalizer": "default" }, "publisher": { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch" }, "publisher_type": { "type": "keyword", "normalizer": "default" }, @@ -103,6 +105,7 @@ "is_preserved": { "type": "boolean" }, "in_kbart": { "type": "boolean" }, "in_jstor": { "type": "boolean" }, + "in_doaj": { "type": "boolean" }, "in_dweb": { "type": "boolean" }, "in_web": { "type": "boolean" }, "in_ia": { "type": "boolean" }, diff --git a/python/fatcat_tools/transforms/elasticsearch.py b/python/fatcat_tools/transforms/elasticsearch.py index db860a09..f37aadba 100644 --- a/python/fatcat_tools/transforms/elasticsearch.py +++ b/python/fatcat_tools/transforms/elasticsearch.py @@ -72,6 +72,8 @@ def release_to_elasticsearch(entity: ReleaseEntity, force_bool: bool = True) -> jstor_id = release.ext_ids.jstor, ark_id = release.ext_ids.ark, mag_id = release.ext_ids.mag, + dblp_id = release.ext_ids.dblp, + doaj_id = release.ext_ids.doaj, ) t.update(dict( @@ -84,6 +86,7 @@ def release_to_elasticsearch(entity: ReleaseEntity, force_bool: bool = True) -> in_ia_sim = False, in_kbart = None, in_jstor = False, + in_doaj= bool(release.ext_ids.doaj), in_shadows = False, )) @@ -280,6 +283,7 @@ def _rte_container_helper(container: ContainerEntity, release_year: Optional[int if c_extra.get('doaj'): if c_extra['doaj'].get('as_of'): t['is_oa'] = True + t['in_doaj'] = True if c_extra.get('road'): if c_extra['road'].get('as_of'): t['is_oa'] = True |