diff options
author | Bryan Newbold <bnewbold@robocracy.org> | 2019-01-23 21:07:23 -0800 |
---|---|---|
committer | Bryan Newbold <bnewbold@robocracy.org> | 2019-01-23 21:07:23 -0800 |
commit | c33e7827175a9ecff288aa095138ed5f79d1b125 (patch) | |
tree | cbced07ccb7e7f26ff21776f41218319269dadce /extra/elasticsearch/container_schema.json | |
parent | 642501efc92e31ac438fe0f70820415c825a3802 (diff) | |
download | fatcat-c33e7827175a9ecff288aa095138ed5f79d1b125.tar.gz fatcat-c33e7827175a9ecff288aa095138ed5f79d1b125.zip |
initial changelog and container ES schemas
Diffstat (limited to 'extra/elasticsearch/container_schema.json')
-rw-r--r-- | extra/elasticsearch/container_schema.json | 74 |
1 files changed, 74 insertions, 0 deletions
diff --git a/extra/elasticsearch/container_schema.json b/extra/elasticsearch/container_schema.json
new file mode 100644
index 00000000..83791ab8
--- /dev/null
+++ b/extra/elasticsearch/container_schema.json
@@ -0,0 +1,74 @@
+{
+"settings": {
+    "index": {
+        "analysis": {
+            "analyzer": {
+                "default": {
+                    "type": "custom",
+                    "tokenizer": "standard",
+                    "filter": [ "lowercase", "asciifolding" ]
+                },
+                "textIcu": {
+                    "type": "custom",
+                    "tokenizer": "icu_tokenizer",
+                    "char_filter": [ "icu_normalizer" ],
+                    "filter": [ "icu_folding" ]
+                },
+                "textIcuSearch": {
+                    "type": "custom",
+                    "tokenizer": "icu_tokenizer",
+                    "char_filter": [ "icu_normalizer" ],
+                    "filter": [ "icu_folding" ]
+                }
+            }
+        }
+    }
+},
+"mappings": {
+    "container": {
+        "properties": {
+            "ident": { "type": "keyword" },
+            "state": { "type": "keyword" },
+            "revision": { "type": "keyword" },
+            "name": { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch" },
+            "publisher": { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch" },
+            "container_type": { "type": "keyword" },
+            "wikidata_qid": { "type": "keyword" },
+            "issnl": { "type": "keyword" },
+            "region": { "type": "keyword" },
+            "nation": { "type": "keyword" },
+            "discipline": { "type": "keyword" },
+            "languages": { "type": "keyword" },
+            "mimetypes": { "type": "keyword" },
+            "first_year": { "type": "integer" },
+            "last_year": { "type": "integer" },
+
+            "in_doaj": { "type": "boolean" },
+            "in_road": { "type": "boolean" },
+            "in_doi": { "type": "boolean" },
+            "in_doaj_works": { "type": "boolean" },
+            "in_sherpa_romeo":{ "type": "boolean" },
+            "is_oa": { "type": "boolean" },
+            "is_longtail_oa": { "type": "boolean" },
+            "any_kbart": { "type": "boolean" },
+            "any_jstor": { "type": "boolean" },
+            "any_sim": { "type": "boolean" },
+            "ia_homepage_status": { "type": "boolean" },
+
+            "releases_total": { "type": "integer" },
+            "releases_kbart": { "type": "integer" },
+            "releases_ia": { "type": "integer" },
+            "releases_sim": { "type": "integer" },
+            "releases_shadow": { "type": "integer" },
+            "releases_any_file": { "type": "integer" },
+            "releases_any_fileset": { "type": "integer" },
+            "releases_any_webcapture": { "type": "integer" },
+
+            "year": { "type": "alias", "path": "first_year" },
+            "type": { "type": "alias", "path": "container_type" },
+            "oa": { "type": "alias", "path": "is_oa" },
+            "longtail": { "type": "alias", "path": "is_longtail_oa" }
+        }
+    }
+}
+}