diff options
| author | Bryan Newbold <bnewbold@archive.org> | 2020-04-02 17:38:30 -0700 | 
|---|---|---|
| committer | Bryan Newbold <bnewbold@archive.org> | 2020-04-02 17:38:30 -0700 | 
| commit | f760c853eb3d878974d307d0468408dea5552e1d (patch) | |
| tree | a70395f7981bfd9121e6eca793db546e8342a59a | |
| parent | 87f40d0f8d15f16020964773e75d35ea22da049f (diff) | |
| download | fatcat-covid19-f760c853eb3d878974d307d0468408dea5552e1d.tar.gz fatcat-covid19-f760c853eb3d878974d307d0468408dea5552e1d.zip  | |
include container_original_name ES field
| -rwxr-xr-x | elastic_transform.py | 1 | ||||
| -rw-r--r-- | schema/fulltext_schema.v00.json | 1 | 
2 files changed, 2 insertions, 0 deletions
```diff
diff --git a/elastic_transform.py b/elastic_transform.py
index 587aabd..93b0310 100755
--- a/elastic_transform.py
+++ b/elastic_transform.py
@@ -132,6 +132,7 @@ def fulltext_to_elasticsearch(row, force_bool=True):
     if container:
         t['publisher'] = container.get('publisher')
         t['container_name'] = container.get('name')
+        t['container_original_name'] = container.get('original_name')
         # this is container.ident, not release.container_id, because there may
         # be a redirect involved
         t['container_id'] = container['ident']
diff --git a/schema/fulltext_schema.v00.json b/schema/fulltext_schema.v00.json
index 694048e..26bafe7 100644
--- a/schema/fulltext_schema.v00.json
+++ b/schema/fulltext_schema.v00.json
@@ -84,6 +84,7 @@
         "publisher":            { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch" },
         "publisher_type":       { "type": "keyword", "normalizer": "default" },
         "container_name":       { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "copy_to": ["biblio_all", "everything"] },
+        "container_original_name":       { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "copy_to": ["biblio_all", "everything"] },
         "container_id":         { "type": "keyword", "normalizer": "default" },
         "container_issnl":      { "type": "keyword", "normalizer": "default" },
         "container_type":       { "type": "keyword", "normalizer": "default" },
```
