Newer
Older
# Index template body: index settings (including custom analysis components)
# and the dynamic mapping templates applied to the "_doc" mapping type.
#
# Regex patterns are written as raw strings so that sequences such as `\.`
# reach the consumer unchanged without relying on Python's handling of
# unknown escape sequences.
template = {
    # "index_patterns": ["geodata.v1"],
    "order": 0,
    "settings": {
        "index.mapping.total_fields.limit": 10000,
        # "index.mapping.ignore_malformed": True,
        # "number_of_shards": 48,
        # "number_of_replicas": 0,
        "refresh_interval": -1,
        "max_ngram_diff": 100,
        "analysis": {
            "filter": {
                # ASCII folding that drops the original (accented) token.
                "my_ascii_folding": {
                    "type": "asciifolding",
                    "preserve_original": False
                },
                # ASCII folding that keeps the original token next to the folded one.
                "my_original_preserving_ascii_folding": {
                    "type": "asciifolding",
                    "preserve_original": True
                },
                "french_elision": {
                    "type": "elision",
                    "articles_case": True,
                    "articles": [
                        "l", "m", "t", "qu", "n", "s",
                        "j", "d", "c", "jusqu", "quoiqu",
                        "lorsqu", "puisqu"
                    ]
                },
                "french_stop": {
                    "type": "stop",
                    "stopwords": "_french_"
                },
                "preserving_word_delimiter": {
                    "type": "word_delimiter",
                    "preserve_original": "true"
                },
                "keep_keywords": {
                    "type": "keep",
                    "keep_words": ["vélo'v", "Vélo'V", "Vélo'v", "metropole de lyon"]
                },
                # Each entry of "filters" is one comma-separated filter chain.
                # NOTE(review): neither multiplexer is referenced by the analyzers
                # below (the references are commented out) - confirm whether they
                # are still needed.
                "my_multiplexer": {
                    "type": "multiplexer",
                    "filters": [
                        "lowercase, my_original_preserving_ascii_folding, french_elision, french_stop",
                        "keep_keywords"
                    ],
                    # "filters": ["keep_keywords"]
                    "preserve_original": "false"
                },
                "my_other_multiplexer": {
                    "type": "multiplexer",
                    "filters": [
                        "lowercase, french_elision, french_stop",
                        "keep_keywords"
                    ],
                    # "filters": ["keep_keywords"]
                    "preserve_original": "false"
                }
            },
            "tokenizer": {
                "my_edge_ngram_tokenizer": {
                    "type": "edge_ngram",
                    "min_gram": 2,
                    "max_gram": 30,
                    "token_chars": [
                        "letter",
                        "digit"
                    ]
                }
            },
            "analyzer": {
                # Index-time analyzer referenced by the string templates below.
                "edge_ngram_analyzer_with_asciifolding": {
                    "type": "custom",
                    "tokenizer": "my_edge_ngram_tokenizer",
                    "filter": [
                        "lowercase",
                        "my_original_preserving_ascii_folding",
                        "french_elision",
                        "french_stop"
                        # "my_multiplexer"
                    ]
                },
                # Search-time analyzer referenced by the string templates below.
                "my_search_analyzer": {
                    "type": "custom",
                    "tokenizer": "standard",
                    "filter": [
                        "lowercase",
                        "french_elision",
                        "french_stop"
                        # "my_other_multiplexer"
                    ]
                },
                # Analyzer of the "suggest" sub-field in "string-template".
                "my_suggest_analyzer": {
                    "type": "custom",
                    "tokenizer": "standard",
                    "filter": [
                        "lowercase",
                        "french_elision",
                        "french_stop"
                        # "my_other_multiplexer"
                    ]
                },
            }
        }
    },
    "mappings": {
        "_doc": {
            "dynamic_templates": [  # priority is given by order!
                {
                    "geoshape-template": {
                        "match_pattern": "regex",
                        # NOTE(review): the dots are unescaped here, so they match
                        # any character - confirm whether `\.` was intended.
                        "path_match": "metadata-fr.bbox|data-fr.geometry",
                        "mapping": {
                            "type": "geo_shape",
                            "tree": "quadtree",
                            # "index": "false"
                            "ignore_malformed": True
                        }
                    }
                },
                # {
                #     "link-template": {
                #         "path_match": "metadata-fr.link",
                #         "mapping": {
                #             # "type": "nested",
                #             "index": "false"
                #             # "ignore_malformed": True
                #         }
                #     }
                # },
                {
                    "keyword-template": {
                        "match_pattern": "regex",
                        "path_match": r".*md5.*|metadata-fr\.link\.formats.*|metadata-fr\.link\.service.*|metadata-fr\.parentId.*",
                        "mapping": {
                            "type": "text",
                            "index": False,
                            "fields": {
                                "keyword": {
                                    "type": "keyword"
                                }
                            }
                            # "ignore_malformed": True
                        }
                    }
                },
                {
                    "date-template": {
                        "match_mapping_type": "date",
                        # "path_match": r"data-fr\.properties\.date.+|data-fr\.properties\.last_update.*|metadata-fr\.creationDate",
                        "mapping": {
                            "type": "date",
                            # Previously considered: "strict_date_optional_time||epoch_millis||yyyy-MM-dd HH:mm:ss"
                            "format": "strict_date_optional_time",
                            "fields": {
                                "sort": {
                                    "type": "date"
                                }
                            }
                        }
                    }
                },
                {
                    "nested-template": {
                        "path_match": "metadata-fr.responsibleParty",
                        "mapping": {
                            "type": "nested"
                            # "fields": {
                            #     "sort": {
                            #         "type": "boolean"
                            #     }
                            # }
                        }
                    }
                },
                {
                    "unindexed-path-template-1": {
                        "match_pattern": "regex",
                        "match_mapping_type": "*",
                        "path_match": r"metadata-fr\.href.*|metadata-fr\.idxMsg.*|data-fr\.geometry\..*|metadata-fr\.identifier.*|metadata-fr\.geonet\:info.*:geonet|metadata-fr\.responsibleParty\.logo|metadata-fr\.image\..*|.*url|metadata-fr\.link\.name",
                        # "match": r"(metadata-fr\.image.*|data-fr\.geometry.*|metadata-fr\.href.*|metadata-fr\.idxMsg.*)",
                        "mapping": {
                            "type": "text",
                            # "ignore_malformed": True
                            "index": False
                        }
                    }
                },
                {
                    "unindexed-path-template-2": {
                        "match_pattern": "regex",
                        "match_mapping_type": "*",
                        "path_match": r"metadata-fr\.link\.bbox_by_projection|metadata-fr\.link\.projections|metadata-fr\.link\.content-type|metadata-fr\.link\.content-length",
                        # "match": r"(metadata-fr\.image.*|data-fr\.geometry.*|metadata-fr\.href.*|metadata-fr\.idxMsg.*)",
                        "mapping": {
                            "type": "text",
                            # "ignore_malformed": True
                            "index": False
                        }
                    }
                },
                {
                    "long-template": {
                        "match_mapping_type": "long",
                        "mapping": {
                            "type": "long",
                            "fields": {
                                "sort": {
                                    "type": "long"
                                }
                            }
                        }
                    }
                },
                {
                    "double-template": {
                        "match_mapping_type": "double",
                        "mapping": {
                            "type": "double",
                            "fields": {
                                "sort": {
                                    "type": "double"
                                }
                            }
                        }
                    }
                },
                {
                    "boolean-template": {
                        "match_mapping_type": "boolean",
                        "mapping": {
                            "type": "boolean",
                            "fields": {
                                "sort": {
                                    "type": "boolean"
                                }
                            }
                        }
                    }
                },
                {
                    # String values under data-fr.properties: copied to both the
                    # "data" and "data_and_metadata" fields.
                    "data-template": {
                        "match_pattern": "regex",
                        "path_match": r"data-fr\.properties\..+",
                        "match_mapping_type": "string",
                        "mapping": {
                            "type": "text",
                            # "ignore_malformed": True,
                            "analyzer": "edge_ngram_analyzer_with_asciifolding",
                            # "search_analyzer": "standard",
                            "search_analyzer": "my_search_analyzer",
                            "term_vector": "with_positions_offsets",
                            "copy_to": ["data", "data_and_metadata"],
                            "index_options": "offsets",
                            "fields": {
                                "keyword": {
                                    "type": "keyword",
                                    "ignore_above": 256,
                                },
                                "sort": {
                                    "type": "keyword"
                                },
                                "suggest": {
                                    "type": "completion",
                                    "analyzer": "simple"
                                    # "preserve_position_increments":
                                }
                            }
                        }
                    }
                },
                {
                    # Remaining string values: copied to "data_and_metadata" only.
                    "string-template": {
                        "match_mapping_type": "string",
                        "mapping": {
                            "type": "text",
                            # "ignore_malformed": True,
                            "analyzer": "edge_ngram_analyzer_with_asciifolding",
                            # "search_analyzer": "standard",
                            "search_analyzer": "my_search_analyzer",
                            "term_vector": "with_positions_offsets",
                            "copy_to": "data_and_metadata",
                            "index_options": "offsets",
                            "fields": {
                                "keyword": {
                                    "type": "keyword",
                                    "ignore_above": 256,
                                },
                                "sort": {
                                    "type": "keyword"
                                },
                                "suggest": {
                                    "type": "text",
                                    "analyzer": "my_suggest_analyzer"
                                }
                            }
                        }
                    }
                }
            ]
        }
    }
}