summary | refs | log | tree | commit | diff | stats
path: root/schema/scholar_fulltext.v01.json
diff options
context:
space:
mode:
author: Bryan Newbold <bnewbold@archive.org> 2020-08-06 12:31:53 -0700
committer: Bryan Newbold <bnewbold@archive.org> 2020-08-06 12:32:09 -0700
commit: 8611d4cfd348b57120f936c064e9591c419a7ace (patch)
tree: e3a5ca33953aeb61202b8d4e850a05f253fcdf2d /schema/scholar_fulltext.v01.json
parent: 8b5a78cd13ebfe5843bb0f04839afde69e09bb59 (diff)
download: fatcat-scholar-8611d4cfd348b57120f936c064e9591c419a7ace.tar.gz
fatcat-scholar-8611d4cfd348b57120f936c064e9591c419a7ace.zip
ES schema: do not index fulltext.body or fulltext.annex separately from 'everything'
The goal here is to reduce term index size. This means that querying/matching only on these fields (distinct from "everything") will not work.
Diffstat (limited to 'schema/scholar_fulltext.v01.json')
-rw-r--r-- schema/scholar_fulltext.v01.json 5
1 files changed, 2 insertions, 3 deletions
diff --git a/schema/scholar_fulltext.v01.json b/schema/scholar_fulltext.v01.json
index b03412d..a759d8f 100644
--- a/schema/scholar_fulltext.v01.json
+++ b/schema/scholar_fulltext.v01.json
@@ -130,9 +130,9 @@
"dynamic": false,
"properties": {
"lang_code": { "type": "keyword", "normalizer": "default" },
- "body": { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "copy_to": "everything", "store": true },
+ "body": { "type": "text", "index": false, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "copy_to": "everything", "store": true },
"acknowledgement": { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "copy_to": "everything", "store": true },
- "annex": { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "copy_to": "everything", "store": true },
+ "annex": { "type": "text", "index": false, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "copy_to": "everything", "store": true },
"release_ident": { "type": "keyword", "normalizer": "default", "doc_values": false },
"file_ident": { "type": "keyword", "normalizer": "default", "doc_values": false },
"file_sha1": { "type": "keyword", "normalizer": "default", "doc_values": false },
@@ -219,7 +219,6 @@
"doctype": { "type": "alias", "path": "doc_type" },
"tag": { "type": "alias", "path": "tags" },
- "body": { "type": "alias", "path": "fulltext.body" },
"abstract": { "type": "alias", "path": "abstracts.body" },
"acknowledgement":{ "type": "alias", "path": "fulltext.acknowledgement" },
"access_type": { "type": "alias", "path": "fulltext.access_type" },