diff options
author | Bryan Newbold <bnewbold@robocracy.org> | 2019-05-20 16:07:02 -0700 |
---|---|---|
committer | Bryan Newbold <bnewbold@robocracy.org> | 2019-05-20 16:29:28 -0700 |
commit | 81c7293312f039f8ce3cac9a5023ab97b57e39ce (patch) | |
tree | a6caf1a95a7100cc4c691f47134b01c2669378f1 | |
parent | 5868714f4176c9cb70245d5164cc9196c2314a75 (diff) | |
download | fatcat-81c7293312f039f8ce3cac9a5023ab97b57e39ce.tar.gz fatcat-81c7293312f039f8ce3cac9a5023ab97b57e39ce.zip |
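elastic release schema update: add subtitle, withdrawn_status, ark_id, and mag_id fields; rename release_status to release_stage (release_status kept as an alias)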
-rw-r--r-- | extra/elasticsearch/release_schema.json | 7 | ||||
-rw-r--r-- | python/fatcat_tools/transforms/elasticsearch.py | 7 |
2 files changed, 11 insertions, 3 deletions
diff --git a/extra/elasticsearch/release_schema.json b/extra/elasticsearch/release_schema.json index c30a7b5b..ef195e1b 100644 --- a/extra/elasticsearch/release_schema.json +++ b/extra/elasticsearch/release_schema.json @@ -31,11 +31,13 @@ "state": { "type": "keyword" }, "revision": { "type": "keyword" }, "title": { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch" }, + "subtitle": { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch" }, "original_title": { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch" }, "release_date": { "type": "date" }, "release_year": { "type": "integer" }, "release_type": { "type": "keyword" }, - "release_status": { "type": "keyword" }, + "release_stage": { "type": "keyword" }, + "withdrawn_status": { "type": "keyword" }, "language": { "type": "keyword" }, "doi": { "type": "keyword" }, "pmid": { "type": "keyword" }, @@ -45,6 +47,8 @@ "core_id": { "type": "keyword" }, "axiv_id": { "type": "keyword" }, "jstor_id": { "type": "keyword" }, + "ark_id": { "type": "keyword" }, + "mag_id": { "type": "keyword" }, "license": { "type": "keyword" }, "publisher": { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch" }, "container_name": { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch" }, @@ -81,6 +85,7 @@ "longtail": { "type": "alias", "path": "is_longtail_oa" }, "lang": { "type": "alias", "path": "language" }, "file_pdf_url": { "type": "alias", "path": "best_pdf_url" }, + "release_status": { "type": "alias", "path": "release_stage" }, "is_kept": { "type": "alias", "path": "in_kbart" } } } diff --git a/python/fatcat_tools/transforms/elasticsearch.py b/python/fatcat_tools/transforms/elasticsearch.py index 645142de..a8e0227b 100644 --- a/python/fatcat_tools/transforms/elasticsearch.py +++ b/python/fatcat_tools/transforms/elasticsearch.py @@ -43,9 +43,11 @@ def 
release_to_elasticsearch(entity, force_bool=True): state = release.state, revision = release.revision, title = release.title, + subtitle = release.subtitle, original_title = release.original_title, release_type = release.release_type, - release_status = release.release_stage, + release_stage = release.release_stage, + withdrawn_status = release.withdrawn_status, language = release.language, license = release.license_slug, doi = release.ext_ids.doi, @@ -56,7 +58,8 @@ def release_to_elasticsearch(entity, force_bool=True): core_id = release.ext_ids.core, arxiv_id = release.ext_ids.arxiv, jstor_id = release.ext_ids.jstor, - # TODO: mag, ark + ark_id = release.ext_ids.ark, + mag_id = release.ext_ids.mag, ) is_oa = None |