diff options
author | Bryan Newbold <bnewbold@robocracy.org> | 2018-09-21 16:56:01 -0700 |
---|---|---|
committer | Bryan Newbold <bnewbold@robocracy.org> | 2018-09-21 16:56:01 -0700 |
commit | 86d15bda26280437ac7a853e73d460d0bf9dd418 (patch) | |
tree | cfd8347bb1f4e98cdab67cebb4637421458673a9 /extra/elasticsearch/release_schema.json | |
parent | d495df1f76c44b7e09db2fb8b93615ffcdf6b818 (diff) | |
download | fatcat-86d15bda26280437ac7a853e73d460d0bf9dd418.tar.gz fatcat-86d15bda26280437ac7a853e73d460d0bf9dd418.zip |
first pass at a release elastic schema
Diffstat (limited to 'extra/elasticsearch/release_schema.json')
-rw-r--r-- | extra/elasticsearch/release_schema.json | 60 |
1 files changed, 60 insertions, 0 deletions
diff --git a/extra/elasticsearch/release_schema.json b/extra/elasticsearch/release_schema.json
new file mode 100644
index 00000000..89359de4
--- /dev/null
+++ b/extra/elasticsearch/release_schema.json
@@ -0,0 +1,60 @@
+{
+"settings": {
+    "index": {
+        "analysis": {
+            "analyzer": {
+                "default": {
+                    "type": "custom",
+                    "tokenizer": "standard",
+                    "filter": [ "lowercase", "asciifolding" ]
+                },
+                "textIcu": {
+                    "type": "custom",
+                    "tokenizer": "icu_tokenizer",
+                    "char_filter": [ "icu_normalizer" ],
+                    "filter": [ "icu_folding" ]
+                },
+                "textIcuSearch": {
+                    "type": "custom",
+                    "tokenizer": "icu_tokenizer",
+                    "char_filter": [ "icu_normalizer" ],
+                    "filter": [ "icu_folding" ]
+                }
+            }
+        }
+    }
+},
+"mappings": {
+    "work": {
+        "_all": { "enabled": true },
+        "properties": {
+            "ident": { "type": "keyword", "include_in_all": false },
+            "revision": { "type": "keyword", "include_in_all": false },
+            "title": { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch" },
+            "author_names": { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch" },
+            "release_date": { "type": "date" },
+            "release_type": { "type": "keyword", "include_in_all": false },
+            "release_status": { "type": "keyword", "include_in_all": false },
+            "language": { "type": "keyword", "include_in_all": false },
+            "doi": { "type": "keyword" },
+            "pmid": { "type": "keyword" },
+            "pmcid": { "type": "keyword" },
+            "isbn13": { "type": "keyword" },
+            "core_id": { "type": "keyword", "include_in_all": false },
+            "wikidata_qid": { "type": "keyword", "include_in_all": false },
+            "publisher": { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "include_in_all": false },
+            "container_title": { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch" },
+            "container_issnl": { "type": "keyword", "include_in_all": false },
+            "container_is_oa": { "type": "boolean", "include_in_all": false },
+            "container_is_kept": { "type": "boolean", "include_in_all": false },
+            "container_is_longtail_oa": { "type": "boolean", "include_in_all": false },
+            "file_count": { "type": "integer", "include_in_all": false },
+            "file_pdf_url": { "type": "keyword", "include_in_all": false },
+            "file_in_webarchive": { "type": "boolean", "include_in_all": false },
+            "file_in_ia": { "type": "boolean", "include_in_all": false },
+            "any_abstract": { "type": "boolean", "include_in_all": false },
+            "in_shadow": { "type": "boolean", "include_in_all": false }
+        }
+    }
+}
+}