aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorBryan Newbold <bnewbold@robocracy.org>2021-01-11 20:30:39 -0800
committerBryan Newbold <bnewbold@robocracy.org>2021-01-20 11:47:43 -0800
commit7940b4b02492eb8052c33252a7c77188181867e6 (patch)
tree6ed542e0e8e463027f570a61452b59cec500b75b
parent99e37fca2ad74cd3e48d09b12b0d8a005d0de59e (diff)
downloadfatcat-7940b4b02492eb8052c33252a7c77188181867e6.tar.gz
fatcat-7940b4b02492eb8052c33252a7c77188181867e6.zip
elasticsearch: simple new dblp and doaj fields
-rw-r--r--extra/elasticsearch/release_schema.json3
-rw-r--r--python/fatcat_tools/transforms/elasticsearch.py4
2 files changed, 7 insertions, 0 deletions
diff --git a/extra/elasticsearch/release_schema.json b/extra/elasticsearch/release_schema.json
index 666a672f..e1f7a79a 100644
--- a/extra/elasticsearch/release_schema.json
+++ b/extra/elasticsearch/release_schema.json
@@ -72,6 +72,8 @@
"ark_id": { "type": "keyword", "normalizer": "default", "doc_values": false },
"mag_id": { "type": "keyword", "normalizer": "default", "doc_values": false },
"s2_id": { "type": "keyword", "normalizer": "default", "doc_values": false },
+ "dblp_id": { "type": "keyword", "normalizer": "default", "doc_values": false },
+ "doaj_id": { "type": "keyword", "normalizer": "default", "doc_values": false },
"license": { "type": "keyword", "normalizer": "default" },
"publisher": { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch" },
"publisher_type": { "type": "keyword", "normalizer": "default" },
@@ -103,6 +105,7 @@
"is_preserved": { "type": "boolean" },
"in_kbart": { "type": "boolean" },
"in_jstor": { "type": "boolean" },
+ "in_doaj": { "type": "boolean" },
"in_dweb": { "type": "boolean" },
"in_web": { "type": "boolean" },
"in_ia": { "type": "boolean" },
diff --git a/python/fatcat_tools/transforms/elasticsearch.py b/python/fatcat_tools/transforms/elasticsearch.py
index db860a09..f37aadba 100644
--- a/python/fatcat_tools/transforms/elasticsearch.py
+++ b/python/fatcat_tools/transforms/elasticsearch.py
@@ -72,6 +72,8 @@ def release_to_elasticsearch(entity: ReleaseEntity, force_bool: bool = True) ->
jstor_id = release.ext_ids.jstor,
ark_id = release.ext_ids.ark,
mag_id = release.ext_ids.mag,
+ dblp_id = release.ext_ids.dblp,
+ doaj_id = release.ext_ids.doaj,
)
t.update(dict(
@@ -84,6 +86,7 @@ def release_to_elasticsearch(entity: ReleaseEntity, force_bool: bool = True) ->
in_ia_sim = False,
in_kbart = None,
in_jstor = False,
+ in_doaj= bool(release.ext_ids.doaj),
in_shadows = False,
))
@@ -280,6 +283,7 @@ def _rte_container_helper(container: ContainerEntity, release_year: Optional[int
if c_extra.get('doaj'):
if c_extra['doaj'].get('as_of'):
t['is_oa'] = True
+ t['in_doaj'] = True
if c_extra.get('road'):
if c_extra['road'].get('as_of'):
t['is_oa'] = True