summaryrefslogtreecommitdiffstats
path: root/extra/elasticsearch/container_schema.json
blob: d3351aabcf61907052d43cbe2c3a20ef12372ee7 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
{
"settings": {
    "index": {
        "number_of_shards": 1,
        "number_of_replicas": 0,
        "analysis": {
            "analyzer": {
                "default": {
                    "type": "custom",
                    "tokenizer": "standard",
                    "filter": [ "lowercase", "asciifolding" ]
                },
                "textIcu": {
                    "type": "custom",
                    "tokenizer": "icu_tokenizer",
                    "char_filter": [ "icu_normalizer" ],
                    "filter": [ "icu_folding" ]
                },
                "textIcuSearch": {
                    "type": "custom",
                    "tokenizer": "icu_tokenizer",
                    "char_filter": [ "icu_normalizer" ],
                    "filter": [ "icu_folding" ]
                }
            },
            "normalizer": {
                "default": {
                    "type": "custom",
                    "char_filter": [],
                    "filter": ["lowercase"]
                },
                "caseSensitive": {
                    "type": "custom",
                    "char_filter": [],
                    "filter": []
                }
            }
        }
    }
},
"mappings": {
    "_doc": {
        "properties": {
            "doc_index_ts":   { "type": "date" },
            "ident":          { "type": "keyword", "normalizer": "default", "doc_values": false },
            "state":          { "type": "keyword", "normalizer": "default" },
            "revision":       { "type": "keyword", "normalizer": "default", "doc_values": false },
            "name":           { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "copy_to": "biblio" },
            "original_name":  { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "copy_to": "biblio" },
            "publisher":      { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "copy_to": "biblio" },
            "abbrev":         { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "copy_to": "biblio" },
            "aliases":        { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch", "copy_to": "biblio" },
            "publisher_type": { "type": "keyword", "normalizer": "default" },
            "container_type": { "type": "keyword", "normalizer": "default" },
            "publication_status": { "type": "keyword", "normalizer": "default" },
            "issnl":          { "type": "keyword", "normalizer": "default" },
            "issns":          { "type": "keyword", "normalizer": "default" },
            "wikidata_qid":   { "type": "keyword", "normalizer": "default" },
            "dblp_prefix":    { "type": "keyword", "normalizer": "default" },
            "sim_pubid":      { "type": "keyword", "normalizer": "default" },
            "ia_sim_collection": { "type": "keyword", "normalizer": "default" },
            "country_code":   { "type": "keyword", "normalizer": "default" },
            "region":         { "type": "keyword", "normalizer": "default" },
            "discipline":     { "type": "keyword", "normalizer": "default" },
            "languages":      { "type": "keyword", "normalizer": "default" },
            "mimetypes":      { "type": "keyword", "normalizer": "default" },
            "first_year":     { "type": "integer" },
            "last_year":      { "type": "integer" },


            "biblio":         { "type": "text", "index": true, "analyzer": "textIcu", "search_analyzer":"textIcuSearch" },

            "in_doaj":              { "type": "boolean" },
            "in_road":              { "type": "boolean" },
            "is_oa":                { "type": "boolean" },
            "is_longtail_oa":       { "type": "boolean" },
            "any_kbart":            { "type": "boolean" },
            "any_jstor":            { "type": "boolean" },
            "any_ia_sim":           { "type": "boolean" },
            "sherpa_romeo_color":   { "type": "keyword", "normalizer": "default" },
            "keepers":              { "type": "keyword", "normalizer": "default" },

            "releases_total":           { "type": "integer" },
            "preservation_bright":      { "type": "integer" },
            "preservation_dark":        { "type": "integer" },
            "preservation_shadows_only":{ "type": "integer" },
            "preservation_none":        { "type": "integer" },
            "tags":                 { "type": "keyword", "normalizer": "default" },

            "year":           { "type": "alias", "path": "first_year" },
            "type":           { "type": "alias", "path": "container_type" },
            "issn":           { "type": "alias", "path": "issns" },
            "release_count":  { "type": "alias", "path": "releases_total" },
            "releases_count": { "type": "alias", "path": "releases_total" },
            "oa":             { "type": "alias", "path": "is_oa" },
            "longtail":       { "type": "alias", "path": "is_longtail_oa" },
            "tag":            { "type": "alias", "path": "tags" }
        }
    }
}
}