-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathindexes.txt
98 lines (94 loc) · 2.59 KB
/
indexes.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
# List every index in the cluster; "v" adds a header row to the tabular output.
GET /_cat/indices?v

# Fetch the definition of the "kyf" index.
GET /kyf
# Full-text match query for "salami" against the "fr" field of the "kyf" index.
POST /kyf/_search
{
  "query": {
    "match": {
      "fr": "salami"
    }
  }
}
# Create the "kyf" index with a custom analysis chain applied to the "fr" field.
# Token filters run in the order listed under "custom_analyzer":
#   lowercase -> word delimiter -> ASCII folding (originals kept) -> digit stripping
#   -> French stopwords -> light French stemmer -> minimum length 2
#   -> shingles of 2-4 tokens (unigrams kept) -> collapse runs of spaces -> trim.
# The filter definitions below are listed in that same order for readability;
# their order inside "filter" has no effect, only the analyzer's array order does.
# NOTE(review): the space-collapsing and trim steps presumably clean up the gaps left
# by the empty "filler_token" in shingles - confirm against analyzed output.
# NOTE(review): "type": "string" and a named mapping type ("default") are only accepted
# by older Elasticsearch releases - confirm the target cluster version before reuse.
PUT /kyf
{
  "settings": {
    "analysis": {
      "analyzer": {
        "custom_analyzer": {
          "tokenizer": "standard",
          "filter": [
            "lowercase",
            "custom_word_delimiter",
            "custom_ascii",
            "custom_number_removal",
            "custom_stop",
            "custom_stemmer",
            "custom_length",
            "custom_bigram",
            "custom_spacing_removal",
            "trim"
          ]
        }
      },
      "filter": {
        "custom_word_delimiter": {
          "type": "word_delimiter",
          "generate_word_parts": false,
          "generate_number_parts": true,
          "catenate_words": true,
          "catenate_numbers": true,
          "catenate_all": false,
          "preserve_original": false,
          "split_on_case_change": false,
          "split_on_numerics": false,
          "stem_english_possessive": false
        },
        "custom_ascii": {
          "type": "asciifolding",
          "preserve_original": true
        },
        "custom_number_removal": {
          "type": "pattern_replace",
          "pattern": "([0-9]+)",
          "replacement": ""
        },
        "custom_stop": {
          "type": "stop",
          "stopwords": "_french_",
          "ignore_case": true,
          "remove_trailing": true
        },
        "custom_stemmer": {
          "type": "stemmer",
          "name": "light_french"
        },
        "custom_length": {
          "type": "length",
          "min": 2
        },
        "custom_bigram": {
          "type": "shingle",
          "min_shingle_size": 2,
          "max_shingle_size": 4,
          "output_unigrams": true,
          "filler_token": ""
        },
        "custom_spacing_removal": {
          "type": "pattern_replace",
          "pattern": "( +)",
          "replacement": " "
        }
      }
    }
  },
  "mappings": {
    "default": {
      "properties": {
        "fr": {
          "type": "string",
          "term_vector": "yes",
          "analyzer": "custom_analyzer"
        }
      }
    }
  }
}