|
@@ -11,6 +11,10 @@
|
|
"type": "mapping",
|
|
"type": "mapping",
|
|
"mappings_path": "${fess.dictionary.path}ja/mapping.txt"
|
|
"mappings_path": "${fess.dictionary.path}ja/mapping.txt"
|
|
},
|
|
},
|
|
|
|
+ "zero_width_spaces": {
|
|
|
|
+ "type": "mapping",
|
|
|
|
+ "mappings": [ "\\u200C=> "]
|
|
|
|
+ },
|
|
"removeall_filter": {
|
|
"removeall_filter": {
|
|
"type": "pattern_replace",
|
|
"type": "pattern_replace",
|
|
"pattern":"(.*)",
|
|
"pattern":"(.*)",
|
|
@@ -84,6 +88,317 @@
|
|
"連体詞"
|
|
"連体詞"
|
|
]
|
|
]
|
|
},
|
|
},
|
|
|
|
+ "german_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_german_"
|
|
|
|
+ },
|
|
|
|
+ "german_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}de/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "german_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "light_german"
|
|
|
|
+ },
|
|
|
|
+ "french_elision": {
|
|
|
|
+ "type": "elision",
|
|
|
|
+ "articles_case": true,
|
|
|
|
+ "articles": [
|
|
|
|
+ "l", "m", "t", "qu", "n", "s",
|
|
|
|
+ "j", "d", "c", "jusqu", "quoiqu",
|
|
|
|
+ "lorsqu", "puisqu"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "french_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_french_"
|
|
|
|
+ },
|
|
|
|
+ "french_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}fr/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "french_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "light_french"
|
|
|
|
+ },
|
|
|
|
+ "italian_elision": {
|
|
|
|
+ "type": "elision",
|
|
|
|
+ "articles": [
|
|
|
|
+ "c", "l", "all", "dall", "dell",
|
|
|
|
+ "nell", "sull", "coll", "pell",
|
|
|
|
+ "gl", "agl", "dagl", "degl", "negl",
|
|
|
|
+ "sugl", "un", "m", "t", "s", "v", "d"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "italian_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_italian_"
|
|
|
|
+ },
|
|
|
|
+ "italian_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}it/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "italian_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "light_italian"
|
|
|
|
+ },
|
|
|
|
+ "arabic_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_arabic_"
|
|
|
|
+ },
|
|
|
|
+ "arabic_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}ar/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "arabic_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "arabic"
|
|
|
|
+ },
|
|
|
|
+ "romanian_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_romanian_"
|
|
|
|
+ },
|
|
|
|
+ "romanian_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}ro/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "romanian_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "romanian"
|
|
|
|
+ },
|
|
|
|
+ "catalan_elision": {
|
|
|
|
+ "type": "elision",
|
|
|
|
+ "articles": [ "d", "l", "m", "n", "s", "t"]
|
|
|
|
+ },
|
|
|
|
+ "catalan_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_catalan_"
|
|
|
|
+ },
|
|
|
|
+ "catalan_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}ca/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "catalan_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "catalan"
|
|
|
|
+ },
|
|
|
|
+ "czech_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_czech_"
|
|
|
|
+ },
|
|
|
|
+ "czech_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}cs/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "czech_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "czech"
|
|
|
|
+ },
|
|
|
|
+ "danish_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_danish_"
|
|
|
|
+ },
|
|
|
|
+ "danish_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}da/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "danish_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "danish"
|
|
|
|
+ },
|
|
|
|
+ "spanish_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_spanish_"
|
|
|
|
+ },
|
|
|
|
+ "spanish_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}es/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "spanish_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "light_spanish"
|
|
|
|
+ },
|
|
|
|
+ "greek_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_greek_"
|
|
|
|
+ },
|
|
|
|
+ "greek_lowercase": {
|
|
|
|
+ "type": "lowercase",
|
|
|
|
+ "language": "greek"
|
|
|
|
+ },
|
|
|
|
+ "greek_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}el/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "greek_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "greek"
|
|
|
|
+ },
|
|
|
|
+ "persian_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_persian_"
|
|
|
|
+ },
|
|
|
|
+ "finnish_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_finnish_"
|
|
|
|
+ },
|
|
|
|
+ "finnish_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}fi/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "finnish_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "finnish"
|
|
|
|
+ },
|
|
|
|
+ "hindi_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_hindi_"
|
|
|
|
+ },
|
|
|
|
+ "hindi_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}hi/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "hindi_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "hindi"
|
|
|
|
+ },
|
|
|
|
+ "hungarian_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_hungarian_"
|
|
|
|
+ },
|
|
|
|
+ "hungarian_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}hu/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "hungarian_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "hungarian"
|
|
|
|
+ },
|
|
|
|
+ "indonesian_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_indonesian_"
|
|
|
|
+ },
|
|
|
|
+ "indonesian_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}id/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "indonesian_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "indonesian"
|
|
|
|
+ },
|
|
|
|
+ "lithuanian_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_lithuanian_"
|
|
|
|
+ },
|
|
|
|
+ "lithuanian_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}lt/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "lithuanian_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "lithuanian"
|
|
|
|
+ },
|
|
|
|
+ "latvian_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_latvian_"
|
|
|
|
+ },
|
|
|
|
+ "latvian_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}lv/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "latvian_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "latvian"
|
|
|
|
+ },
|
|
|
|
+ "dutch_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_dutch_"
|
|
|
|
+ },
|
|
|
|
+ "dutch_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}nl/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "dutch_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "dutch"
|
|
|
|
+ },
|
|
|
|
+ "dutch_override": {
|
|
|
|
+ "type": "stemmer_override",
|
|
|
|
+ "rules": [
|
|
|
|
+ "fiets=>fiets",
|
|
|
|
+ "bromfiets=>bromfiets",
|
|
|
|
+ "ei=>eier",
|
|
|
|
+ "kind=>kinder"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "norwegian_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_norwegian_"
|
|
|
|
+ },
|
|
|
|
+ "norwegian_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}no/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "norwegian_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "norwegian"
|
|
|
|
+ },
|
|
|
|
+ "portuguese_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_portuguese_"
|
|
|
|
+ },
|
|
|
|
+ "portuguese_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}pt/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "portuguese_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "light_portuguese"
|
|
|
|
+ },
|
|
|
|
+ "russian_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_russian_"
|
|
|
|
+ },
|
|
|
|
+ "russian_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}ru/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "russian_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "russian"
|
|
|
|
+ },
|
|
|
|
+ "swedish_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_swedish_"
|
|
|
|
+ },
|
|
|
|
+ "swedish_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}sv/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "swedish_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "swedish"
|
|
|
|
+ },
|
|
|
|
+ "thai_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_thai_"
|
|
|
|
+ },
|
|
|
|
+ "turkish_stop": {
|
|
|
|
+ "type": "stop",
|
|
|
|
+ "stopwords": "_turkish_"
|
|
|
|
+ },
|
|
|
|
+ "turkish_lowercase": {
|
|
|
|
+ "type": "lowercase",
|
|
|
|
+ "language": "turkish"
|
|
|
|
+ },
|
|
|
|
+ "turkish_keywords": {
|
|
|
|
+ "type": "keyword_marker",
|
|
|
|
+ "keywords_path": "${fess.dictionary.path}tr/protwords.txt"
|
|
|
|
+ },
|
|
|
|
+ "turkish_stemmer": {
|
|
|
|
+ "type": "stemmer",
|
|
|
|
+ "language": "turkish"
|
|
|
|
+ },
|
|
"truncate10_filter" : {
|
|
"truncate10_filter" : {
|
|
"type" : "truncate",
|
|
"type" : "truncate",
|
|
"length" : 10
|
|
"length" : 10
|
|
@@ -153,6 +468,276 @@
|
|
"type": "custom",
|
|
"type": "custom",
|
|
"tokenizer":"seunjeon_default_tokenizer"
|
|
"tokenizer":"seunjeon_default_tokenizer"
|
|
},
|
|
},
|
|
|
|
+ "german_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "german_stop",
|
|
|
|
+ "german_normalization",
|
|
|
|
+ "german_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "french_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "french_elision",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "french_stop",
|
|
|
|
+ "french_keywords",
|
|
|
|
+ "french_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "italian_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "italian_elision",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "italian_stop",
|
|
|
|
+ "italian_keywords",
|
|
|
|
+ "italian_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "arabic_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "arabic_stop",
|
|
|
|
+ "arabic_normalization",
|
|
|
|
+ "arabic_keywords",
|
|
|
|
+ "arabic_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "romanian_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "romanian_stop",
|
|
|
|
+ "romanian_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "catalan_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "catalan_elision",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "catalan_stop",
|
|
|
|
+ "catalan_keywords",
|
|
|
|
+ "catalan_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "czech_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "czech_stop",
|
|
|
|
+ "czech_keywords",
|
|
|
|
+ "czech_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "danish_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "danish_stop",
|
|
|
|
+ "danish_keywords",
|
|
|
|
+ "danish_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "spanish_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "spanish_stop",
|
|
|
|
+ "spanish_keywords",
|
|
|
|
+ "spanish_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "greek_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "greek_lowercase",
|
|
|
|
+ "greek_stop",
|
|
|
|
+ "greek_keywords",
|
|
|
|
+ "greek_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "persian_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "char_filter": [ "zero_width_spaces" ],
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "arabic_normalization",
|
|
|
|
+ "persian_normalization",
|
|
|
|
+ "persian_stop"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "finnish_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "finnish_stop",
|
|
|
|
+ "finnish_keywords",
|
|
|
|
+ "finnish_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "hindi_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "indic_normalization",
|
|
|
|
+ "hindi_normalization",
|
|
|
|
+ "hindi_stop",
|
|
|
|
+ "hindi_keywords",
|
|
|
|
+ "hindi_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "hungarian_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "hungarian_stop",
|
|
|
|
+ "hungarian_keywords",
|
|
|
|
+ "hungarian_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "indonesian_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "indonesian_stop",
|
|
|
|
+ "indonesian_keywords",
|
|
|
|
+ "indonesian_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "lithuanian_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "lithuanian_stop",
|
|
|
|
+ "lithuanian_keywords",
|
|
|
|
+ "lithuanian_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "latvian_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "latvian_stop",
|
|
|
|
+ "latvian_keywords",
|
|
|
|
+ "latvian_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "dutch_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "dutch_stop",
|
|
|
|
+ "dutch_keywords",
|
|
|
|
+ "dutch_override",
|
|
|
|
+ "dutch_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "norwegian_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "norwegian_stop",
|
|
|
|
+ "norwegian_keywords",
|
|
|
|
+ "norwegian_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "portuguese_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "portuguese_stop",
|
|
|
|
+ "portuguese_keywords",
|
|
|
|
+ "portuguese_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "russian_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "russian_stop",
|
|
|
|
+ "russian_keywords",
|
|
|
|
+ "russian_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "swedish_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "swedish_stop",
|
|
|
|
+ "swedish_keywords",
|
|
|
|
+ "swedish_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "thai_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "thai",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "lowercase",
|
|
|
|
+ "thai_stop"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
|
|
+ "turkish_analyzer": {
|
|
|
|
+ "type": "custom",
|
|
|
|
+ "tokenizer": "standard",
|
|
|
|
+ "filter": [
|
|
|
|
+ "truncate20_filter",
|
|
|
|
+ "apostrophe",
|
|
|
|
+ "turkish_lowercase",
|
|
|
|
+ "turkish_stop",
|
|
|
|
+ "turkish_keywords",
|
|
|
|
+ "turkish_stemmer"
|
|
|
|
+ ]
|
|
|
|
+ },
|
|
"empty_analyzer": {
|
|
"empty_analyzer": {
|
|
"type": "custom",
|
|
"type": "custom",
|
|
"tokenizer": "standard",
|
|
"tokenizer": "standard",
|