From 9ad198b7a1e12504e3d4718e56edd0a7e8b5e61a Mon Sep 17 00:00:00 2001 From: Bryan Newbold Date: Fri, 3 Dec 2021 17:20:45 -0800 Subject: ES container schema: add 'sim_pubid' and `ia_sim_collection` fields --- extra/elasticsearch/container_schema.json | 2 ++ python/fatcat_tools/transforms/elasticsearch.py | 2 ++ 2 files changed, 4 insertions(+) diff --git a/extra/elasticsearch/container_schema.json b/extra/elasticsearch/container_schema.json index 05aa0b35..d3351aab 100644 --- a/extra/elasticsearch/container_schema.json +++ b/extra/elasticsearch/container_schema.json @@ -57,6 +57,8 @@ "issns": { "type": "keyword", "normalizer": "default" }, "wikidata_qid": { "type": "keyword", "normalizer": "default" }, "dblp_prefix": { "type": "keyword", "normalizer": "default" }, + "sim_pubid": { "type": "keyword", "normalizer": "default" }, + "ia_sim_collection": { "type": "keyword", "normalizer": "default" }, "country_code": { "type": "keyword", "normalizer": "default" }, "region": { "type": "keyword", "normalizer": "default" }, "discipline": { "type": "keyword", "normalizer": "default" }, diff --git a/python/fatcat_tools/transforms/elasticsearch.py b/python/fatcat_tools/transforms/elasticsearch.py index ce4308d3..1c7c2905 100644 --- a/python/fatcat_tools/transforms/elasticsearch.py +++ b/python/fatcat_tools/transforms/elasticsearch.py @@ -509,6 +509,8 @@ def container_to_elasticsearch( if extra.get("ia"): if extra["ia"].get("sim"): any_ia_sim = True + t["sim_pubid"] = extra["ia"]["sim"].get("sim_pubid") + t["ia_sim_collection"] = extra["ia"]["sim"].get("collection_item") if extra["ia"].get("longtail_oa"): is_longtail_oa = True t["is_superceded"] = bool(extra.get("superceded")) -- cgit v1.2.3