diff options
author | Bryan Newbold <bnewbold@robocracy.org> | 2018-11-04 18:51:09 -0800 |
---|---|---|
committer | Bryan Newbold <bnewbold@robocracy.org> | 2018-11-04 18:51:09 -0800 |
commit | 66953b184d9b664e15cd7d7fddcb250c2b767df5 (patch) | |
tree | e9841cbc26d6a0d21e9b236dcffd474632c66673 /extra/elasticsearch | |
parent | 881b46e3b1682974f48fc196f483c3fa2648b998 (diff) | |
download | fatcat-66953b184d9b664e15cd7d7fddcb250c2b767df5.tar.gz fatcat-66953b184d9b664e15cd7d7fddcb250c2b767df5.zip |
note elastic plugin needed
Diffstat (limited to 'extra/elasticsearch')
-rw-r--r-- | extra/elasticsearch/README.md | 10 | ||||
-rw-r--r-- | extra/elasticsearch/release_schema.no-plugins.json | 42 |
2 files changed, 52 insertions, 0 deletions
diff --git a/extra/elasticsearch/README.md b/extra/elasticsearch/README.md index c94c3109..d5ac0c53 100644 --- a/extra/elasticsearch/README.md +++ b/extra/elasticsearch/README.md @@ -25,6 +25,16 @@ relation is *removed*. For example, if a file match against a given release is removed, the old release elastic object needs to be updated to remove the file from its `files`. +## Setting Up Elasticsearch + +We use Elasticsearch version 6.x, with the `analysis-icu` plugin installed: + + sudo /usr/share/elasticsearch/bin/elasticsearch-plugin install analysis-icu + sudo service elasticsearch restart + +If you can't install this plugin easily (e.g., in a Docker container), you can +use the `no-plugins` schema variant (though, warning, it might not be up to date). + ## Loading Data Drop and rebuild the schema: diff --git a/extra/elasticsearch/release_schema.no-plugins.json b/extra/elasticsearch/release_schema.no-plugins.json new file mode 100644 index 00000000..c879c176 --- /dev/null +++ b/extra/elasticsearch/release_schema.no-plugins.json @@ -0,0 +1,42 @@ +{ +"mappings": { + "release": { + "properties": { + "ident": { "type": "keyword" }, + "revision": { "type": "keyword" }, + "title": { "type": "text", "index": true }, + "author": { "type": "alias", "path": "contrib_names" }, + "journal": { "type": "alias", "path": "container_name" }, + "date": { "type": "alias", "path": "release_date" }, + "issn": { "type": "alias", "path": "container_issnl" }, + "oa": { "type": "alias", "path": "container_is_oa" }, + "longtail": { "type": "alias", "path": "container_is_longtail_oa" }, + "release_date": { "type": "date" }, + "release_type": { "type": "keyword" }, + "release_status": { "type": "keyword" }, + "language": { "type": "keyword" }, + "doi": { "type": "keyword" }, + "pmid": { "type": "keyword" }, + "pmcid": { "type": "keyword" }, + "isbn13": { "type": "keyword" }, + "core_id": { "type": "keyword" }, + "wikidata_qid": { "type": "keyword" }, + "publisher": { "type": "text", "index": true }, 
+ "container_name": { "type": "text", "index": true }, + "container_issnl": { "type": "keyword" }, + "container_is_oa": { "type": "boolean" }, + "container_is_longtail_oa": { "type": "boolean" }, + "contrib_count": { "type": "integer" }, + "contrib_names": { "type": "text", "index": true }, + "ref_count": { "type": "integer" }, + "file_count": { "type": "integer" }, + "file_pdf_url": { "type": "keyword" }, + "file_in_webarchive": { "type": "boolean" }, + "file_in_ia": { "type": "boolean" }, + "any_abstract": { "type": "boolean" }, + "is_kept": { "type": "boolean" }, + "in_shadow": { "type": "boolean" } + } + } +} +} |