summaryrefslogtreecommitdiffstats
path: root/extra/elasticsearch/release_schema.json
blob: fa466168f8e4bb7a99076bdb3402d8e453b344cd (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
{
"settings": {
    "index": {
        "number_of_shards": 6,
        "number_of_replicas": 0,
        "analysis": {
            "analyzer": {
                "default": {
                    "type": "custom",
                    "tokenizer": "standard",
                    "filter": [ "lowercase", "asciifolding" ]
                },
                "textIcu": {
                    "type": "custom",
                    "tokenizer": "icu_tokenizer",
                    "char_filter": [ "icu_normalizer" ],
                    "filter": [ "icu_folding" ]
                },
                "textIcuSearch": {
                    "type": "custom",
                    "tokenizer": "icu_tokenizer",
                    "char_filter": [ "icu_normalizer" ],
                    "filter": [ "icu_folding" ]
                }
            },
            "normalizer": {
                "default": {
                    "type": "custom",
                    "char_filter": [],
                    "filter": ["lowercase"]
                },
                "caseSensitive": {
                    "type": "custom",
                    "char_filter": [],
                    "filter": []
                }
            }
        }
    }
},
"mappings": {
    "_doc": {
        "properties": {
            "doc_index_ts":   { "type": "date" },
            "ident":          { "type": "keyword", "normalizer": "default", "doc_values": false },
            "state":          { "type": "keyword", "normalizer": "default" },
            "revision":       { "type": "keyword", "normalizer": "default", "doc_values": false },
            "work_id":        { "type": "keyword", "normalizer": "default" },
            "title":          { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "copy_to": "biblio" },
            "subtitle":       { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "copy_to": "biblio" },
            "original_title": { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "copy_to": "biblio" },
            "release_date":   { "type": "date" },
            "release_year":   { "type": "integer", "copy_to": "biblio" },
            "release_type":   { "type": "keyword", "normalizer": "default", "copy_to": "biblio" },
            "release_stage":  { "type": "keyword", "normalizer": "default" },
            "withdrawn_status": { "type": "keyword", "normalizer": "default", "copy_to": "biblio" },
            "language":       { "type": "keyword", "normalizer": "default" },
            "country_code":        { "type": "keyword", "normalizer": "default" },
            "country_code_upper":  { "type": "keyword", "normalizer": "caseSensitive" },
            "volume":         { "type": "keyword", "normalizer": "default", "copy_to": "biblio" },
            "issue":          { "type": "keyword", "normalizer": "default", "copy_to": "biblio" },
            "pages":          { "type": "keyword", "normalizer": "default", "copy_to": "biblio" },
            "first_page":     { "type": "keyword", "normalizer": "default" },
            "number":         { "type": "keyword", "normalizer": "default", "copy_to": "biblio" },
            "doi":            { "type": "keyword", "normalizer": "default" },
            "doi_prefix":     { "type": "keyword", "normalizer": "default" },
            "doi_registrar":  { "type": "keyword", "normalizer": "default" },
            "pmid":           { "type": "keyword", "normalizer": "default", "doc_values": false },
            "pmcid":          { "type": "keyword", "normalizer": "default", "doc_values": false },
            "isbn13":         { "type": "keyword", "normalizer": "default", "doc_values": false },
            "wikidata_qid":   { "type": "keyword", "normalizer": "default", "doc_values": false },
            "core_id":        { "type": "keyword", "normalizer": "default", "doc_values": false },
            "arxiv_id":       { "type": "keyword", "normalizer": "default", "doc_values": false },
            "jstor_id":       { "type": "keyword", "normalizer": "default", "doc_values": false },
            "ark_id":         { "type": "keyword", "normalizer": "default", "doc_values": false },
            "mag_id":         { "type": "keyword", "normalizer": "default", "doc_values": false },
            "s2_id":          { "type": "keyword", "normalizer": "default", "doc_values": false },
            "dblp_id":        { "type": "keyword", "normalizer": "default", "doc_values": false },
            "doaj_id":        { "type": "keyword", "normalizer": "default", "doc_values": false },
            "hdl":            { "type": "keyword", "normalizer": "default", "doc_values": false },
            "license":        { "type": "keyword", "normalizer": "default" },
            "version":        { "type": "keyword", "normalizer": "default", "copy_to": "biblio" },
            "publisher":            { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch" },
            "publisher_type":       { "type": "keyword", "normalizer": "default" },
            "container_name":       { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "copy_to": "biblio" },
            "container_id":         { "type": "keyword", "normalizer": "default" },
            "container_issns":      { "type": "keyword", "normalizer": "default" },
            "container_issnl":      { "type": "keyword", "normalizer": "default" },
            "container_type":       { "type": "keyword", "normalizer": "default" },
            "container_publication_status": { "type": "keyword", "normalizer": "default" },
            "discipline":           { "type": "keyword", "normalizer": "default" },
            "contrib_count":        { "type": "integer" },
            "contrib_names":        { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "copy_to": "biblio" },
            "affiliations":         { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch" },
            "affiliation_rors":     { "type": "keyword", "normalizer": "default" },
            "creator_ids":          { "type": "keyword", "normalizer": "default" },
            "ref_count":            { "type": "integer" },
            "ref_linked_count":     { "type": "integer" },
            "ref_release_ids":      { "type": "keyword", "normalizer": "default" },
            "file_count":           { "type": "integer" },
            "fileset_count":        { "type": "integer" },
            "webcapture_count":     { "type": "integer" },
            "any_abstract":         { "type": "boolean" },

            "biblio":               { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch" },

            "best_pdf_url":         { "type": "keyword", "normalizer": "caseSensitive", "doc_values": false },
            "ia_pdf_url":           { "type": "keyword", "normalizer": "caseSensitive", "doc_values": false },
            "ia_microfilm_url":     { "type": "keyword", "normalizer": "caseSensitive", "doc_values": false },
            "is_oa":                { "type": "boolean" },
            "oa_color":             { "type": "keyword", "normalizer": "default" },
            "is_longtail_oa":       { "type": "boolean" },
            "is_preserved":         { "type": "boolean" },
            "in_kbart":             { "type": "boolean" },
            "in_jstor":             { "type": "boolean" },
            "in_doaj":              { "type": "boolean" },
            "in_dweb":              { "type": "boolean" },
            "in_web":               { "type": "boolean" },
            "in_ia":                { "type": "boolean" },
            "in_ia_sim":            { "type": "boolean" },
            "in_shadows":           { "type": "boolean" },
            "is_superceded":        { "type": "boolean" },
            "is_retracted":         { "type": "boolean" },
            "is_work_alias":        { "type": "boolean" },
            "preservation":         { "type": "keyword", "normalizer": "default" },
            "tags":                 { "type": "keyword", "normalizer": "default" },

            "affiliation":    { "type": "alias", "path": "affiliations" },
            "ror":            { "type": "alias", "path": "affiliation_rors" },
            "creator_id":     { "type": "alias", "path": "creator_ids" },
            "ref_release_id": { "type": "alias", "path": "ref_release_ids" },
            "author":         { "type": "alias", "path": "contrib_names" },
            "journal":        { "type": "alias", "path": "container_name" },
            "date":           { "type": "alias", "path": "release_date" },
            "year":           { "type": "alias", "path": "release_year" },
            "issn":           { "type": "alias", "path": "container_issns" },
            "oa":             { "type": "alias", "path": "is_oa" },
            "longtail":       { "type": "alias", "path": "is_longtail_oa" },
            "lang":           { "type": "alias", "path": "language" },
            "file_pdf_url":   { "type": "alias", "path": "best_pdf_url" },
            "release_status": { "type": "alias", "path": "release_stage" },
            "stage":          { "type": "alias", "path": "release_stage" },
            "type":           { "type": "alias", "path": "release_type" },
            "retracted":      { "type": "alias", "path": "is_retracted" },
            "is_kept":        { "type": "alias", "path": "in_kbart" },
            "tag":            { "type": "alias", "path": "tags" }
        }
    }
}
}