diff --git a/src/main/java/org/codelibs/fess/Constants.java b/src/main/java/org/codelibs/fess/Constants.java index 8f42c796c..0aa3462d0 100644 --- a/src/main/java/org/codelibs/fess/Constants.java +++ b/src/main/java/org/codelibs/fess/Constants.java @@ -449,4 +449,10 @@ public class Constants extends CoreLibConstants { public static final String XERCES_FEATURE_PREFIX = "http://apache.org/xml/features/"; public static final String LOAD_EXTERNAL_DTD_FEATURE = "nonvalidating/load-external-dtd"; + + public static final String FESEN_TYPE_CLOUD = "cloud"; + + public static final String FESEN_USERNAME = "fesen.username"; + + public static final String FESEN_PASSWORD = "fesen.password"; } diff --git a/src/main/java/org/codelibs/fess/app/web/base/FessAdminAction.java b/src/main/java/org/codelibs/fess/app/web/base/FessAdminAction.java index 67f6fb506..506187a2c 100644 --- a/src/main/java/org/codelibs/fess/app/web/base/FessAdminAction.java +++ b/src/main/java/org/codelibs/fess/app/web/base/FessAdminAction.java @@ -55,6 +55,7 @@ public abstract class FessAdminAction extends FessBaseAction { .map(user -> user.hasRoles(fessConfig.getAuthenticationAdminRolesAsArray()) || user.hasRole(getActionRole())).orElse(false); runtime.registerData("editable", editable); runtime.registerData("editableClass", editable ? StringUtil.EMPTY : "disabled"); + runtime.registerData("fesenType", fessConfig.getFesenType()); final String forumLink = systemHelper.getForumLink(); if (StringUtil.isNotBlank(forumLink)) { runtime.registerData("forumLink", forumLink); diff --git a/src/main/java/org/codelibs/fess/es/client/CrawlerEngineClient.java b/src/main/java/org/codelibs/fess/es/client/CrawlerEngineClient.java new file mode 100644 index 000000000..afa367842 --- /dev/null +++ b/src/main/java/org/codelibs/fess/es/client/CrawlerEngineClient.java @@ -0,0 +1,40 @@ +/* + * Copyright 2012-2021 CodeLibs Project and the Others. 
+ * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, + * either express or implied. See the License for the specific language + * governing permissions and limitations under the License. + */ +package org.codelibs.fess.es.client; + +import org.codelibs.core.lang.StringUtil; +import org.codelibs.fesen.client.Client; +import org.codelibs.fesen.client.HttpClient; +import org.codelibs.fesen.common.settings.Settings; +import org.codelibs.fesen.common.settings.Settings.Builder; +import org.codelibs.fess.Constants; +import org.codelibs.fess.crawler.client.FesenClient; +import org.codelibs.fess.mylasta.direction.FessConfig; +import org.codelibs.fess.util.ComponentUtil; + +/** FesenClient subclass whose created HTTP client carries the Fesen credentials from FessConfig when both are set. */ public class CrawlerEngineClient extends FesenClient { + /** Creates an HttpClient whose "http.hosts" setting is {@code address} (a name not declared in this class; presumably inherited from FesenClient - TODO confirm). The username and password read from FessConfig are put into the settings under Constants.FESEN_USERNAME and Constants.FESEN_PASSWORD only when both are non-blank. */ protected Client createClient() { + final Builder builder = Settings.builder().putList("http.hosts", address); + final FessConfig fessConfig = ComponentUtil.getFessConfig(); + final String username = fessConfig.getFesenUsername(); + final String password = fessConfig.getFesenPassword(); + if (StringUtil.isNotBlank(username) && StringUtil.isNotBlank(password)) { + builder.put(Constants.FESEN_USERNAME, username); + builder.put(Constants.FESEN_PASSWORD, password); + } + return new HttpClient(builder.build(), null); + } +} diff --git a/src/main/java/org/codelibs/fess/es/client/SearchEngineClient.java b/src/main/java/org/codelibs/fess/es/client/SearchEngineClient.java index ed292c84b..5d28276b0 100644 --- a/src/main/java/org/codelibs/fess/es/client/SearchEngineClient.java +++ b/src/main/java/org/codelibs/fess/es/client/SearchEngineClient.java @@ -52,6 +52,7 @@ import 
org.codelibs.core.lang.StringUtil; import org.codelibs.core.lang.ThreadUtil; import org.codelibs.curl.CurlResponse; import org.codelibs.fesen.FesenException; +import org.codelibs.fesen.FesenStatusException; import org.codelibs.fesen.action.ActionFuture; import org.codelibs.fesen.action.ActionListener; import org.codelibs.fesen.action.ActionRequest; @@ -127,6 +128,7 @@ import org.codelibs.fesen.common.xcontent.XContentType; import org.codelibs.fesen.index.query.InnerHitBuilder; import org.codelibs.fesen.index.query.QueryBuilder; import org.codelibs.fesen.index.query.QueryBuilders; +import org.codelibs.fesen.rest.RestStatus; import org.codelibs.fesen.runner.FesenRunner; import org.codelibs.fesen.runner.FesenRunner.Configs; import org.codelibs.fesen.search.SearchHit; @@ -244,29 +246,37 @@ public class SearchEngineClient implements Client { String httpAddress = System.getProperty(Constants.FESS_ES_HTTP_ADDRESS); if (StringUtil.isBlank(httpAddress)) { if (runner == null) { - runner = new FesenRunner(); - final Configs config = newConfigs().clusterName(clusterName).numOfNode(1).useLogger(); - final String esDir = System.getProperty("fess.es.dir"); - if (esDir != null) { - config.basePath(esDir); + switch (fessConfig.getFesenType()) { + case Constants.FESEN_TYPE_CLOUD: + httpAddress = org.codelibs.fess.util.ResourceUtil.getFesenHttpUrl(); + break; + default: + runner = new FesenRunner(); + final Configs config = newConfigs().clusterName(clusterName).numOfNode(1).useLogger(); + final String esDir = System.getProperty("fess.es.dir"); + if (esDir != null) { + config.basePath(esDir); + } + config.disableESLogger(); + runner.onBuild((number, settingsBuilder) -> { + final File pluginDir = new File(esDir, "plugins"); + if (pluginDir.isDirectory()) { + settingsBuilder.put("path.plugins", pluginDir.getAbsolutePath()); + } else { + settingsBuilder.put("path.plugins", new File(System.getProperty("user.dir"), "plugins").getAbsolutePath()); + } + if (settings != null) { + 
settingsBuilder.putProperties(settings, s -> s); + } + }); + runner.build(config); + + final int port = runner.node().settings().getAsInt("http.port", 9200); + httpAddress = "http://localhost:" + port; + logger.warn("Embedded Fesen is running. This configuration is not recommended for production use."); + break; } - config.disableESLogger(); - runner.onBuild((number, settingsBuilder) -> { - final File pluginDir = new File(esDir, "plugins"); - if (pluginDir.isDirectory()) { - settingsBuilder.put("path.plugins", pluginDir.getAbsolutePath()); - } else { - settingsBuilder.put("path.plugins", new File(System.getProperty("user.dir"), "plugins").getAbsolutePath()); - } - if (settings != null) { - settingsBuilder.putProperties(settings, s -> s); - } - }); - runner.build(config); } - final int port = runner.node().settings().getAsInt("http.port", 9200); - httpAddress = "http://localhost:" + port; - logger.warn("Embedded Fesen is running. This configuration is not recommended for production use."); } client = createHttpClient(fessConfig, httpAddress); @@ -332,6 +342,10 @@ public class SearchEngineClient implements Client { protected Client createHttpClient(final FessConfig fessConfig, final String host) { final Builder builder = Settings.builder().putList("http.hosts", host).put("processors", fessConfig.availableProcessors()); + if (StringUtil.isNotBlank(fessConfig.getFesenUsername()) && StringUtil.isNotBlank(fessConfig.getFesenPassword())) { + builder.put(Constants.FESEN_USERNAME, fessConfig.getFesenUsername()); + builder.put(Constants.FESEN_PASSWORD, fessConfig.getFesenPassword()); + } return new HttpClient(builder.build(), null); } @@ -382,12 +396,20 @@ public class SearchEngineClient implements Client { final boolean uploadConfig) { final FessConfig fessConfig = ComponentUtil.getFessConfig(); + final String fesenType = fessConfig.getFesenType(); if (uploadConfig) { - waitForConfigSyncStatus(); - sendConfigFiles(index); + switch (fesenType) { + case 
Constants.FESEN_TYPE_CLOUD: + // nothing + break; + default: + waitForConfigSyncStatus(); + sendConfigFiles(index); + break; + } } - final String indexConfigFile = indexConfigPath + "/" + index + ".json"; + final String indexConfigFile = getResourcePath(indexConfigPath, fesenType, "/" + index + ".json"); try { String source = FileUtil.readUTF8(indexConfigFile); String dictionaryPath = System.getProperty("fess.dictionary.path", StringUtil.EMPTY); @@ -413,6 +435,14 @@ public class SearchEngineClient implements Client { return false; } + /** Resolves a resource path, preferring a type-specific variant: returns {@code basePath + "/_" + type + path} when ResourceUtil.getResourceNoException finds that resource (non-null result), otherwise falls back to {@code basePath + path}. */ protected String getResourcePath(final String basePath, final String type, final String path) { + final String target = basePath + "/_" + type + path; + if (ResourceUtil.getResourceNoException(target) != null) { + return target; + } + return basePath + path; + } + public void addMapping(final String index, final String docType, final String indexName) { final FessConfig fessConfig = ComponentUtil.getFessConfig(); @@ -421,7 +451,7 @@ public class SearchEngineClient implements Client { final ImmutableOpenMap indexMappings = getMappingsResponse.mappings().get(indexName); if (indexMappings == null || !indexMappings.containsKey("properties")) { String source = null; - final String mappingFile = indexConfigPath + "/" + index + "/" + docType + ".json"; + final String mappingFile = getResourcePath(indexConfigPath, fessConfig.getFesenType(), "/" + index + "/" + docType + ".json"); try { source = FileUtil.readUTF8(mappingFile); } catch (final Exception e) { @@ -436,12 +466,13 @@ public class SearchEngineClient implements Client { logger.warn("Failed to create {}/{} mapping.", indexName, docType); } - final String dataPath = indexConfigPath + "/" + index + "/" + docType + ".bulk"; + final String dataPath = getResourcePath(indexConfigPath, fessConfig.getFesenType(), "/" + index + "/" + docType + ".bulk"); if (ResourceUtil.isExist(dataPath)) { insertBulkData(fessConfig, indexName, dataPath); } split(fessConfig.getAppExtensionNames(), 
",").of(stream -> stream.filter(StringUtil::isNotBlank).forEach(name -> { - final String bulkPath = indexConfigPath + "/" + index + "/" + docType + "_" + name + ".bulk"; + final String bulkPath = + getResourcePath(indexConfigPath, fessConfig.getFesenType(), "/" + index + "/" + docType + "_" + name + ".bulk"); if (ResourceUtil.isExist(bulkPath)) { insertBulkData(fessConfig, indexName, bulkPath); } @@ -480,7 +511,7 @@ public class SearchEngineClient implements Client { protected void createAlias(final String index, final String createdIndexName) { final FessConfig fessConfig = ComponentUtil.getFessConfig(); // alias - final String aliasConfigDirPath = indexConfigPath + "/" + index + "/alias"; + final String aliasConfigDirPath = getResourcePath(indexConfigPath, fessConfig.getFesenType(), "/" + index + "/alias"); try { final File aliasConfigDir = ResourceUtil.getResourceAsFile(aliasConfigDirPath); if (aliasConfigDir.isDirectory()) { @@ -594,8 +625,19 @@ public class SearchEngineClient implements Client { } catch (final Exception e) { cause = e; } - if (logger.isDebugEnabled()) { - logger.debug("Failed to access to Fesen:{}", i, cause); + if (cause instanceof FesenStatusException) { + final RestStatus status = ((FesenStatusException) cause).status(); + switch (status) { + case UNAUTHORIZED: + logger.warn("[{}] Unauthorized access: {}", i, System.getProperty(Constants.FESS_ES_HTTP_ADDRESS), cause); + break; + default: + logger.debug("[{}][{}] Failed to access to Fesen ({})", i, status, System.getProperty(Constants.FESS_ES_HTTP_ADDRESS), + cause); + break; + } + } else if (logger.isDebugEnabled()) { + logger.debug("[{}] Failed to access to Fesen ({})", i, System.getProperty(Constants.FESS_ES_HTTP_ADDRESS), cause); } ThreadUtil.sleep(1000L); } diff --git a/src/main/java/org/codelibs/fess/helper/CurlHelper.java b/src/main/java/org/codelibs/fess/helper/CurlHelper.java index a49513826..8bbccc4cc 100644 --- a/src/main/java/org/codelibs/fess/helper/CurlHelper.java +++ 
b/src/main/java/org/codelibs/fess/helper/CurlHelper.java @@ -15,8 +15,13 @@ */ package org.codelibs.fess.helper; +import java.nio.charset.StandardCharsets; + +import org.codelibs.core.lang.StringUtil; import org.codelibs.curl.Curl.Method; import org.codelibs.curl.CurlRequest; +import org.codelibs.fess.mylasta.direction.FessConfig; +import org.codelibs.fess.util.ComponentUtil; import org.codelibs.fess.util.ResourceUtil; public class CurlHelper { @@ -38,6 +43,15 @@ public class CurlHelper { } public CurlRequest request(final Method method, final String path) { - return new CurlRequest(method, ResourceUtil.getFesenHttpUrl() + path); + /* Build the request for the Fesen HTTP URL plus the given path; when both the configured username and password are non-blank, attach an "Authorization: Basic ..." header whose value is the Base64 of "username:password" encoded as UTF-8. */ final CurlRequest request = new CurlRequest(method, ResourceUtil.getFesenHttpUrl() + path); + final FessConfig fessConfig = ComponentUtil.getFessConfig(); + final String username = fessConfig.getFesenUsername(); + final String password = fessConfig.getFesenPassword(); + if (StringUtil.isNotBlank(username) && StringUtil.isNotBlank(password)) { + final String value = username + ":" + password; + final String basicAuth = "Basic " + java.util.Base64.getEncoder().encodeToString(value.getBytes(StandardCharsets.UTF_8)); + request.header("Authorization", basicAuth); + } + return request; } } diff --git a/src/main/java/org/codelibs/fess/helper/IndexingHelper.java b/src/main/java/org/codelibs/fess/helper/IndexingHelper.java index 0db51ac5d..57524512c 100644 --- a/src/main/java/org/codelibs/fess/helper/IndexingHelper.java +++ b/src/main/java/org/codelibs/fess/helper/IndexingHelper.java @@ -47,7 +47,7 @@ public class IndexingHelper { final FessConfig fessConfig = ComponentUtil.getFessConfig(); if (fessConfig.isResultCollapsed()) { docList.forEach(doc -> { - doc.put("content_minhash", doc.get(fessConfig.getIndexFieldContent())); + doc.put(fessConfig.getIndexFieldContentMinhash(), doc.get(fessConfig.getIndexFieldContent())); }); } final long execTime = System.currentTimeMillis(); diff --git a/src/main/java/org/codelibs/fess/helper/SuggestHelper.java 
b/src/main/java/org/codelibs/fess/helper/SuggestHelper.java index b6850eaa1..742d10830 100644 --- a/src/main/java/org/codelibs/fess/helper/SuggestHelper.java +++ b/src/main/java/org/codelibs/fess/helper/SuggestHelper.java @@ -102,6 +102,7 @@ public class SuggestHelper { .actionGet(fessConfig.getIndexHealthTimeout()); final SuggestSettingsBuilder settingsBuilder = SuggestSettings.builder(); + settingsBuilder.addInitialSettings("elasticsearch.type", fessConfig.getFesenType()); settingsBuilder.bulkTimeout(fessConfig.getIndexBulkTimeout()); settingsBuilder.clusterTimeout(fessConfig.getIndexHealthTimeout()); settingsBuilder.indexTimeout(fessConfig.getIndexIndexTimeout()); diff --git a/src/main/java/org/codelibs/fess/mylasta/direction/FessConfig.java b/src/main/java/org/codelibs/fess/mylasta/direction/FessConfig.java index edbe23a46..5ca2b2bc1 100644 --- a/src/main/java/org/codelibs/fess/mylasta/direction/FessConfig.java +++ b/src/main/java/org/codelibs/fess/mylasta/direction/FessConfig.java @@ -25,9 +25,18 @@ public interface FessConfig extends FessEnv, org.codelibs.fess.mylasta.direction /** The key of the configuration. e.g. Fess */ String DOMAIN_TITLE = "domain.title"; + /** The key of the configuration. e.g. default */ + String ELASTICSEARCH_TYPE = "elasticsearch.type"; + /** The key of the configuration. e.g. http://localhost:9201 */ String ELASTICSEARCH_HTTP_URL = "elasticsearch.http.url"; + /** The key of the configuration. e.g. */ + String ELASTICSEARCH_USERNAME = "elasticsearch.username"; + + /** The key of the configuration. e.g. */ + String ELASTICSEARCH_PASSWORD = "elasticsearch.password"; + /** The key of the configuration. e.g. aes */ String APP_CIPHER_ALGORISM = "app.cipher.algorism"; @@ -1695,13 +1704,50 @@ public interface FessConfig extends FessEnv, org.codelibs.fess.mylasta.direction String getDomainTitle(); /** - * Get the value for the key 'elasticsearch.http.url'.
- * The value is, e.g. http://localhost:9201
+ * Get the value for the key 'elasticsearch.type'.
+ * The value is, e.g. default
* comment: Fesen * @return The value of found property. (NotNull: if not found, exception but basically no way) */ + String getFesenType(); + + /** + * Get the value for the key 'elasticsearch.http.url'.
+ * The value is, e.g. http://localhost:9201
+ * @return The value of found property. (NotNull: if not found, exception but basically no way) + */ String getFesenHttpUrl(); + /** + * Get the value for the key 'elasticsearch.username'.
+ * The value is, e.g.
+ * @return The value of found property. (NotNull: if not found, exception but basically no way) + */ + String getFesenUsername(); + + /** + * Get the value for the key 'elasticsearch.username' as {@link Integer}.
+ * The value is, e.g.
+ * @return The value of found property. (NotNull: if not found, exception but basically no way) + * @throws NumberFormatException When the property is not integer. + */ + Integer getFesenUsernameAsInteger(); + + /** + * Get the value for the key 'elasticsearch.password'.
+ * The value is, e.g.
+ * @return The value of found property. (NotNull: if not found, exception but basically no way) + */ + String getFesenPassword(); + + /** + * Get the value for the key 'elasticsearch.password' as {@link Integer}.
+ * The value is, e.g.
+ * @return The value of found property. (NotNull: if not found, exception but basically no way) + * @throws NumberFormatException When the property is not integer. + */ + Integer getFesenPasswordAsInteger(); + /** * Get the value for the key 'app.cipher.algorism'.
* The value is, e.g. aes
@@ -6961,10 +7007,30 @@ public interface FessConfig extends FessEnv, org.codelibs.fess.mylasta.direction return get(FessConfig.DOMAIN_TITLE); } + public String getFesenType() { + return get(FessConfig.ELASTICSEARCH_TYPE); + } + public String getFesenHttpUrl() { return get(FessConfig.ELASTICSEARCH_HTTP_URL); } + public String getFesenUsername() { + return get(FessConfig.ELASTICSEARCH_USERNAME); + } + + public Integer getFesenUsernameAsInteger() { + return getAsInteger(FessConfig.ELASTICSEARCH_USERNAME); + } + + public String getFesenPassword() { + return get(FessConfig.ELASTICSEARCH_PASSWORD); + } + + public Integer getFesenPasswordAsInteger() { + return getAsInteger(FessConfig.ELASTICSEARCH_PASSWORD); + } + public String getAppCipherAlgorism() { return get(FessConfig.APP_CIPHER_ALGORISM); } @@ -9713,7 +9779,10 @@ public interface FessConfig extends FessEnv, org.codelibs.fess.mylasta.direction protected java.util.Map prepareGeneratedDefaultMap() { java.util.Map defaultMap = super.prepareGeneratedDefaultMap(); defaultMap.put(FessConfig.DOMAIN_TITLE, "Fess"); + defaultMap.put(FessConfig.ELASTICSEARCH_TYPE, "default"); defaultMap.put(FessConfig.ELASTICSEARCH_HTTP_URL, "http://localhost:9201"); + defaultMap.put(FessConfig.ELASTICSEARCH_USERNAME, ""); + defaultMap.put(FessConfig.ELASTICSEARCH_PASSWORD, ""); defaultMap.put(FessConfig.APP_CIPHER_ALGORISM, "aes"); defaultMap.put(FessConfig.APP_CIPHER_KEY, "___change__me___"); defaultMap.put(FessConfig.APP_DIGEST_ALGORISM, "sha256"); diff --git a/src/main/java/org/codelibs/fess/mylasta/direction/FessProp.java b/src/main/java/org/codelibs/fess/mylasta/direction/FessProp.java index a4b4953e4..8fa17a72f 100644 --- a/src/main/java/org/codelibs/fess/mylasta/direction/FessProp.java +++ b/src/main/java/org/codelibs/fess/mylasta/direction/FessProp.java @@ -338,7 +338,12 @@ public interface FessProp { } default boolean isResultCollapsed() { - return getSystemPropertyAsBoolean(Constants.RESULT_COLLAPSED_PROPERTY, false); + /* Result collapsing is always reported as off when the Fesen type is Constants.FESEN_TYPE_CLOUD; for any other type the Constants.RESULT_COLLAPSED_PROPERTY system property decides (default false). */ switch 
(getFesenType()) { + case Constants.FESEN_TYPE_CLOUD: + return false; + default: + return getSystemPropertyAsBoolean(Constants.RESULT_COLLAPSED_PROPERTY, false); + } } default void setLoginLinkEnabled(final boolean value) { @@ -2071,4 +2076,6 @@ public interface FessProp { return !split(getPasswordInvalidAdminPasswords(), "\n") .get(stream -> stream.map(String::trim).filter(StringUtil::isNotEmpty).anyMatch(s -> s.equals(password))); } + + String getFesenType(); } diff --git a/src/main/resources/crawler/es.xml b/src/main/resources/crawler/es.xml index ad2cfd0d7..bffb11d40 100644 --- a/src/main/resources/crawler/es.xml +++ b/src/main/resources/crawler/es.xml @@ -3,6 +3,6 @@ "http://dbflute.org/meta/lastadi10.dtd"> + class="org.codelibs.fess.es.client.CrawlerEngineClient"> diff --git a/src/main/resources/fess_config.properties b/src/main/resources/fess_config.properties index 5bb9b1d52..f1926321d 100644 --- a/src/main/resources/fess_config.properties +++ b/src/main/resources/fess_config.properties @@ -9,7 +9,10 @@ domain.title = Fess # Elasticsearch +elasticsearch.type=default elasticsearch.http.url=http://localhost:9201 +elasticsearch.username= +elasticsearch.password= # Cryptographer app.cipher.algorism=aes diff --git a/src/main/resources/fess_indices/_cloud/fess.json b/src/main/resources/fess_indices/_cloud/fess.json new file mode 100644 index 000000000..5125553ed --- /dev/null +++ b/src/main/resources/fess_indices/_cloud/fess.json @@ -0,0 +1,1276 @@ +{ + "settings": { + "index": { + "codec": "${fess.index.codec}", + "refresh_interval": "1s", + "number_of_shards": "${fess.index.number_of_shards}", + "number_of_replicas": 0, + "auto_expand_replicas": "${fess.index.auto_expand_replicas}" + }, + "analysis": { + "char_filter": { + "mapping_fa_filter": { + "type": "mapping", + "mappings": 
["\u0009,\u000A,\u000B,\u000C,\u000D,\u001C,\u001D,\u001E,\u001F,\u00A0,\u1680,\u180E,\u2000,\u2001,\u2002,\u2003,\u2004,\u2005,\u2006,\u2007,\u2008,\u2009,\u200A,\u200B,\u200C,\u202F,\u205F,\u3000,\uFEFF=>\u0020", "\u064A => \u06CC", "\u0643 => \u06A9", "\u0660 => 0", "\u06F0 => 0", "\u0661 => 1", "\u06F1 => 1", "\u0662 => 2", "\u06F2 => 2", "\u0663 => 3", "\u06F3 => 3", "\u0664 => 4", "\u06F4 => 4", "\u0665 => 5", "\u06F5 => 5", "\u0666 => 6", "\u06F6 => 6", "\u0667 => 7", "\u06F7 => 7", "\u0668 => 8", "\u06F8 => 8", "\u0669 => 9", "\u06F9 => 9"] + }, + "mapping_ja_filter": { + "type": "mapping", + "mappings": ["\u0009,\u000A,\u000B,\u000C,\u000D,\u001C,\u001D,\u001E,\u001F,\u00A0,\u1680,\u180E,\u2000,\u2001,\u2002,\u2003,\u2004,\u2005,\u2006,\u2007,\u2008,\u2009,\u200A,\u200B,\u202F,\u205F,\u3000,\uFEFF => \u0020", "~,˜,῀,⁓,∼,∿,~ => 〜", "A => A", "B => B", "C => C", "D => D", "E => E", "F => F", "G => G", "H => H", "I => I", "J => J", "K => K", "L => L", "M => M", "N => N", "O => O", "P => P", "Q => Q", "R => R", "S => S", "T => T", "U => U", "V => V", "W => W", "X => X", "Y => Y", "Z => Z", "a => a", "b => b", "c => c", "d => d", "e => e", "f => f", "g => g", "h => h", "i => i", "j => j", "k => k", "l => l", "m => m", "n => n", "o => o", "p => p", "q => q", "r => r", "s => s", "t => t", "u => u", "v => v", "w => w", "x => x", "y => y", "z => z", "が => が", "ぎ => ぎ", "ぐ => ぐ", "げ => げ", "ご => ご", "ざ => ざ", "じ => じ", "ず => ず", "ぜ => ぜ", "ぞ => ぞ", "だ => だ", "ぢ => ぢ", "づ => づ", "で => で", "ど => ど", "ば => ば", "び => び", "ぶ => ぶ", "べ => べ", "ぼ => ぼ", "ぱ => ぱ", "ぴ => ぴ", "ぷ => ぷ", "ぺ => ぺ", "ぽ => ぽ", "ガ => ガ", "ギ => ギ", "グ => グ", "ゲ => ゲ", "ゴ => ゴ", "ザ => ザ", "ジ => ジ", "ズ => ズ", "ゼ => ゼ", "ゾ => ゾ", "ダ => ダ", "ヂ => ヂ", "ヅ => ヅ", "デ => デ", "ド => ド", "バ => バ", "ビ => ビ", "ブ => ブ", "ベ => ベ", "ボ => ボ", "パ => パ", "ピ => ピ", "プ => プ", "ペ => ペ", "ポ => ポ", "ア => ア", "イ => イ", "ウ => ウ", "エ => エ", "オ => オ", "カ => カ", "キ => キ", "ク => ク", "ケ => ケ", "コ => コ", "ガ => ガ", "ギ => ギ", "グ => 
グ", "ゲ => ゲ", "ゴ => ゴ", "サ => サ", "シ => シ", "ス => ス", "セ => セ", "ソ => ソ", "ザ => ザ", "ジ => ジ", "ズ => ズ", "ゼ => ゼ", "ゾ => ゾ", "タ => タ", "チ => チ", "ツ => ツ", "テ => テ", "ト => ト", "ダ => ダ", "ヂ => ヂ", "ヅ => ヅ", "デ => デ", "ド => ド", "ナ => ナ", "ニ => ニ", "ヌ => ヌ", "ネ => ネ", "ノ => ノ", "ハ => ハ", "ヒ => ヒ", "フ => フ", "ヘ => ヘ", "ホ => ホ", "バ => バ", "ビ => ビ", "ブ => ブ", "ベ => ベ", "ボ => ボ", "パ => パ", "ピ => ピ", "プ => プ", "ペ => ペ", "ポ => ポ", "マ => マ", "ミ => ミ", "ム => ム", "メ => メ", "モ => モ", "ヤ => ヤ", "ユ => ユ", "ヨ => ヨ", "ラ => ラ", "リ => リ", "ル => ル", "レ => レ", "ロ => ロ", "ワ => ワ", "ヲ => ヲ", "ン => ン", "ヴ => ヴ", "ッ => ッ", "ァ => ァ", "ィ => ィ", "ゥ => ゥ", "ェ => ェ", "ォ => ォ", "ャ => ャ", "ュ => ュ", "ョ => ョ", "゙ => ゛", "゚ => ゜", "ー => ー", "・ => ・", "0 => 0", "1 => 1", "2 => 2", "3 => 3", "4 => 4", "5 => 5", "6 => 6", "7 => 7", "8 => 8", "9 => 9", "① => 1", "② => 2", "③ => 3", "④ => 4", "⑤ => 5", "⑥ => 6", "⑦ => 7", "⑧ => 8", "⑨ => 9", "! => !", "? => ?", "# => #", "% => %", "& => &", "@ => @", "+ => +", "- => -", "* => *", "/ => /", "= => =", "$ => $", "^ => ^", ": => :", "; => ;", "’ => '", "‘ => '", ", => ,", ". 
=> .", "¥ => ¥", "” => \"", "( => (", ") => )", "| => |", "[ => [", "` => `", "{ => {", "] => ]", "} => }", "_ => _", "< => <", "> => >", "Ⅰ => 1", "Ⅱ => 2", "Ⅲ => 3", "Ⅳ => 4", "Ⅴ => 5", "Ⅵ => 6", "Ⅶ => 7", "Ⅷ => 8", "Ⅸ => 9", "Ⅹ => 10", "ゐ => い", "ゑ => え", "ヰ => イ", "ヱ => エ", "ヴァ => バ", "ヴィ => ビ", "ヴゥ => ブ", "ヴェ => ベ", "ヴォ => ボ", "Ζ => Z", "亞 => 亜", "惡 => 悪", "蘆 => 芦", "鰺 => 鯵", "壓 => 圧", "菴 => 庵", "圍 => 囲", "爲 => 為", "醫 => 医", "毓 => 育", "弌 => 一", "壹 => 壱", "稻 => 稲", "飮 => 飲", "婬 => 淫", "隱 => 隠", "夘 => 卯", "欝 => 鬱", "廐 => 厩", "廏 => 厩", "睿 => 叡", "營 => 営", "暎 => 映", "曵 => 曳", "榮 => 栄", "頴 => 穎", "偀 => 英", "衞 => 衛", "咏 => 詠", "驛 => 駅", "圓 => 円", "烟 => 煙", "艷 => 艶", "鈆 => 鉛", "鹽 => 塩", "奧 => 奥", "徃 => 往", "應 => 応", "橫 => 横", "歐 => 欧", "毆 => 殴", "鶯 => 鴬", "堽 => 岡", "崗 => 岡", "冲 => 沖", "穩 => 穏", "假 => 仮", "價 => 価", "譁 => 嘩", "峩 => 峨", "畫 => 画", "會 => 会", "觧 => 解", "囘 => 回", "壞 => 壊", "迴 => 廻", "恠 => 怪", "懷 => 懐", "畍 => 界", "繪 => 絵", "蠏 => 蟹", "崕 => 崖", "礙 => 碍", "盖 => 蓋", "葢 => 蓋", "蠣 => 蛎", "鉤 => 鈎", "擴 => 拡", "攪 => 撹", "殼 => 殻", "覺 => 覚", "學 => 学", "斈 => 学", "嶽 => 岳", "樂 => 楽", "竈 => 竃", "釡 => 釜", "栢 => 柏", "鬻 => 粥", "勸 => 勧", "卷 => 巻", "寬 => 寛", "歡 => 歓", "灌 => 潅", "罐 => 缶", "觀 => 観", "諫 => 諌", "鑒 => 鑑", "閒 => 間", "關 => 関", "陷 => 陥", "舘 => 館", "巖 => 巌", "嵓 => 巌", "鴈 => 雁", "鳫 => 雁", "顏 => 顔", "憙 => 喜", "憘 => 喜", "噐 => 器", "竒 => 奇", "朞 => 期", "棊 => 棋", "弃 => 棄", "歸 => 帰", "皈 => 帰", "氣 => 気", "龜 => 亀", "僞 => 偽", "冝 => 宜", "戲 => 戯", "犧 => 犠", "卻 => 却", "糺 => 糾", "舊 => 旧", "據 => 拠", "擧 => 挙", "舉 => 挙", "亰 => 京", "恊 => 協", "峽 => 峡", "挾 => 挟", "敎 => 教", "况 => 況", "狹 => 狭", "鄕 => 郷", "曉 => 暁", "惞 => 欣", "區 => 区", "驅 => 駆", "駈 => 駆", "桒 => 桑", "勳 => 勲", "勛 => 勲", "薰 => 薫", "羣 => 群", "徑 => 径", "逕 => 径", "惠 => 恵", "憇 => 憩", "攜 => 携", "溪 => 渓", "谿 => 渓", "經 => 経", "繼 => 継", "莖 => 茎", "螢 => 蛍", "輕 => 軽", "頸 => 頚", "鷄 => 鶏", "藝 => 芸", "缺 => 欠", "决 => 決", "儉 => 倹", "劍 => 剣", "劔 => 剣", "劒 => 剣", "剱 => 剣", "釼 => 剣", "圈 => 圏", "檢 => 検", "權 => 権", "獻 => 献", "縣 => 県", "險 => 険", "顯 => 
顕", "驗 => 験", "鹹 => 鹸", "嚴 => 厳", "乕 => 虎", "皷 => 鼓", "效 => 効", "廣 => 広", "恆 => 恒", "晄 => 晃", "稾 => 稿", "畊 => 耕", "鑛 => 鉱", "礦 => 砿", "髙 => 高", "刧 => 劫", "號 => 号", "軣 => 轟", "國 => 国", "圀 => 国", "黑 => 黒", "嵳 => 嵯", "濟 => 済", "碎 => 砕", "劑 => 剤", "戝 => 財", "冱 => 冴", "沍 => 冴", "嵜 => 崎", "﨑 => 崎", "碕 => 埼", "櫻 => 桜", "册 => 冊", "雜 => 雑", "襍 => 雑", "皋 => 皐", "參 => 参", "慘 => 惨", "棧 => 桟", "蠶 => 蚕", "讚 => 讃", "贊 => 賛", "殘 => 残", "絲 => 糸", "帋 => 紙", "齒 => 歯", "亊 => 事", "兒 => 児", "尓 => 爾", "辭 => 辞", "濕 => 湿", "貭 => 質", "實 => 実", "筱 => 篠", "蘂 => 蕊", "蕋 => 蕊", "舍 => 舎", "冩 => 写", "寫 => 写", "釋 => 釈", "咒 => 呪", "壽 => 寿", "收 => 収", "穐 => 秋", "龝 => 秋", "讎 => 讐", "從 => 従", "澁 => 渋", "澀 => 渋", "獸 => 獣", "縱 => 縦", "肅 => 粛", "凖 => 準", "處 => 処", "敍 => 叙", "敘 => 叙", "甞 => 嘗", "奬 => 奨", "獎 => 奨", "將 => 将", "厰 => 廠", "曻 => 昇", "枩 => 松", "燒 => 焼", "稱 => 称", "證 => 証", "乘 => 乗", "剩 => 剰", "塲 => 場", "壤 => 壌", "孃 => 嬢", "條 => 条", "淨 => 浄", "疊 => 畳", "疉 => 畳", "疂 => 畳", "穰 => 穣", "讓 => 譲", "釀 => 醸", "囑 => 嘱", "餝 => 飾", "觸 => 触", "脣 => 唇", "訷 => 伸", "寢 => 寝", "愼 => 慎", "晉 => 晋", "眞 => 真", "刄 => 刃", "盡 => 尽", "靫 => 靭", "靱 => 靭", "醋 => 酢", "圖 => 図", "廚 => 厨", "埀 => 垂", "粹 => 粋", "翆 => 翠", "醉 => 酔", "隨 => 随", "膸 => 髄", "髓 => 髄", "數 => 数", "樞 => 枢", "椙 => 杉", "杦 => 杉", "澂 => 澄", "丗 => 世", "瀨 => 瀬", "畆 => 畝", "淒 => 凄", "栖 => 棲", "淸 => 清", "聲 => 声", "靑 => 青", "靜 => 静", "齊 => 斉", "攝 => 摂", "竊 => 窃", "專 => 専", "戰 => 戦", "淺 => 浅", "潛 => 潜", "濳 => 潜", "綫 => 線", "纖 => 繊", "纎 => 繊", "舩 => 船", "賤 => 賎", "踐 => 践", "錢 => 銭", "譱 => 善", "禪 => 禅", "曾 => 曽", "踈 => 疎", "蘓 => 蘇", "溯 => 遡", "鼡 => 鼠", "雙 => 双", "壯 => 壮", "搜 => 捜", "插 => 挿", "曺 => 曹", "爭 => 争", "窗 => 窓", "總 => 総", "聰 => 聡", "莊 => 荘", "裝 => 装", "赱 => 走", "騷 => 騒", "增 => 増", "臟 => 臓", "藏 => 蔵", "屬 => 属", "續 => 続", "卆 => 卒", "夛 => 多", "墮 => 堕", "柁 => 舵", "橢 => 楕", "躰 => 体", "軆 => 体", "體 => 体", "對 => 対", "帶 => 帯", "滯 => 滞", "臺 => 台", "瀧 => 滝", "擇 => 択", "澤 => 沢", "鈬 => 鐸", "逹 => 達", "豎 => 竪", "貍 => 狸", "單 => 単", "擔 => 担", "膽 => 胆", "團 => 団", "彈 => 弾", "斷 => 
断", "耻 => 恥", "癡 => 痴", "穉 => 稚", "遲 => 遅", "晝 => 昼", "蟲 => 虫", "鑄 => 鋳", "潴 => 瀦", "豬 => 猪", "廳 => 庁", "廰 => 庁", "甼 => 町", "聽 => 聴", "膓 => 腸", "敕 => 勅", "珎 => 珍", "鎭 => 鎮", "壺 => 壷", "寉 => 鶴", "靍 => 鶴", "靏 => 鶴", "遞 => 逓", "喆 => 哲", "悊 => 哲", "銕 => 鉄", "鐵 => 鉄", "鐡 => 鉄", "纒 => 纏", "轉 => 転", "點 => 点", "傳 => 伝", "兔 => 兎", "莵 => 兎", "礪 => 砺", "黨 => 党", "嶌 => 島", "嶋 => 島", "隝 => 島", "檮 => 梼", "盜 => 盗", "濤 => 涛", "燈 => 灯", "當 => 当", "迯 => 逃", "鬪 => 闘", "仂 => 働", "仝 => 同", "德 => 徳", "悳 => 徳", "獨 => 独", "讀 => 読", "杤 => 栃", "屆 => 届", "繩 => 縄", "貳,貮,弍 => 弐", "邇 => 迩", "韭 => 韮", "姙 => 妊", "禰 => 祢", "迺 => 廼", "墅 => 野", "埜 => 野", "惱 => 悩", "腦 => 脳", "霸 => 覇", "廢 => 廃", "拜 => 拝", "盃 => 杯", "楳 => 梅", "賣 => 売", "蠅 => 蝿", "麥 => 麦", "凾 => 函", "枦 => 櫨", "發 => 発", "髮 => 髪", "罸 => 罰", "拔 => 抜", "蠻 => 蛮", "祕 => 秘", "桧 => 檜", "冰 => 氷", "斌 => 彬", "濱,濵 => 浜", "甁 => 瓶", "冨 => 富", "凬 => 風", "淵,渊 => 渕", "拂 => 払", "佛 => 仏", "幤 => 幣", "竝 => 並", "閇 => 閉", "篦 => 箆", "變 => 変", "邊 => 辺", "邉 => 辺", "辨 => 弁", "辧 => 弁", "瓣 => 弁", "辯 => 弁", "舖 => 舗", "鋪 => 舗", "穗 => 穂", "寶 => 宝", "寳 => 宝", "峯 => 峰", "萠 => 萌", "襃 => 褒", "豐 => 豊", "冐 => 冒", "皃 => 貌", "沒 => 没", "夲 => 本", "飜 => 翻", "槇 => 槙", "枡 => 桝", "儘 => 侭", "萬 => 万", "滿 => 満", "簑 => 蓑", "簔 => 蓑", "脉 => 脈", "梦 => 夢", "无 => 無", "壻 => 婿", "聟 => 婿", "麪 => 麺", "默 => 黙", "餠 => 餅", "彌 => 弥", "笶 => 矢", "藥 => 薬", "譯 => 訳", "栁 => 柳", "籔 => 薮", "藪 => 薮", "瘉 => 癒", "豫 => 予", "餘 => 余", "與 => 与", "譽 => 誉", "搖 => 揺", "樣 => 様", "窰 => 窯", "燿 => 耀", "謠 => 謡", "踴 => 踊", "來 => 来", "賴 => 頼", "亂 => 乱", "覽 => 覧", "裡 => 裏", "畧 => 略", "澑 => 溜", "畄 => 留", "兩 => 両", "凉 => 涼", "獵 => 猟", "暸 => 瞭", "粮 => 糧", "綠 => 緑", "鄰 => 隣", "璢 => 瑠", "壘 => 塁", "泪 => 涙", "勵 => 励", "禮 => 礼", "隸 => 隷", "靈 => 霊", "齡 => 齢", "戀 => 恋", "聨 => 聯", "爐 => 炉", "勞 => 労", "朖 => 朗", "樓 => 楼", "籠 => 篭", "祿 => 禄", "咊 => 和", "亙 => 亘", "灣 => 湾", "仭 => 仞", "爼 => 俎", "伜 => 倅", "僣 => 僭", "寃 => 冤", "寇 => 冦", "羃 => 冪", "洌 => 冽", "涸 => 凅", "凜 => 凛", "刋 => 刊", "尅 => 剋", "箚 => 剳", "匇 => 匆", "奩 => 匳", "巵 => 卮", "廁 => 
厠", "廈 => 厦", "廝 => 厮", "咜 => 咤", "咯 => 喀", "譟 => 噪", "嚏 => 嚔", "齧 => 囓", "阯 => 址", "埓 => 埒", "罎 => 壜", "弉 => 奘", "侫 => 佞", "嫻 => 嫺", "嫐 => 嬲", "崘 => 崙", "篏 => 嵌", "迪 => 廸", "彜 => 彝", "弯 => 彎", "髴 => 彿", "忰 => 悴", "愠 => 慍", "慚 => 慙", "懴 => 懺", "戞 => 戛", "扨 => 扠", "抬 => 擡", "旙 => 旛", "昿 => 曠", "杰 => 傑", "椶 => 棕", "櫁 => 樒", "蘗 => 檗", "檪 => 櫟", "殱 => 殲", "烱 => 炯", "熈 => 煕", "熙 => 煕", "燻 => 薫", "暿 => 熹", "犁 => 犂", "豺 => 犲", "貉 => 狢", "貎 => 猊", "貘 => 獏", "瑯 => 琅", "碯 => 瑙", "瑤 => 瑶", "珱 => 瓔", "畴 => 疇", "肬 => 疣", "晥 => 皖", "皹 => 皸", "蘯 => 盪", "眦 => 眥", "禀 => 稟", "筺 => 筐", "笋 => 筍", "筝 => 箏", "籘 => 籐", "籖 => 籤", "絖 => 絋", "纊 => 絋", "緕 => 纃", "羇 => 羈", "覊 => 羈", "羮 => 羹", "腟 => 膣", "臈 => 臘", "舮 => 艫", "莓 => 苺", "蕚 => 萼", "薀 => 蘊", "蝨 => 虱", "蟆 => 蟇", "蟒 => 蠎", "蠧 => 蠹", "衂 => 衄", "袵 => 衽", "裵 => 裴", "褝 => 襌", "諡 => 謚", "譛 => 譖", "豼 => 貔", "賍 => 贓", "躪 => 躙", "輒 => 輙", "輛 => 輌", "逎 => 遒", "鈩 => 鑪", "鑚 => 鑽", "鬧 => 閙", "濶 => 闊", "隯 => 陦", "韲 => 齏", "韵 => 韻", "匀 => 韻", "飃 => 飄", "鰛 => 鰮", "魲 => 鱸", "鳬 => 鳧", "鵄 => 鴟", "鵞 => 鵝", "鶫 => 鶇", "鷏 => 鷆", "麸 => 麩", "兊 => 兌", "焏 => 亟", "犱 => 執", "緖 => 緒", "羡 => 羨", "閠 => 閏", "薗 => 園", "謌,哥 => 歌", "籏 => 旗", "竸 => 競", "堯 => 尭", "蹟 => 跡", "迹 => 跡", "涌 => 湧", "遙 => 遥", "縲 => 累", "牆 => 墻", "郞 => 郎", "悅 => 悦", "懼 => 惧", "蒭 => 芻", "韈 => 襪", "萱 => 茅", "倂 => 併", "凛 => 凜", "卽 => 即", "吳 => 呉", "姬 => 姫", "娛 => 娯", "尙 => 尚", "巢 => 巣", "强 => 強", "彅 => 薙", "徵 => 徴", "慾 => 欲", "懐 => 懐", "戶 => 戸", "戾 => 戻", "揭 => 掲", "擊 => 撃", "斎 => 斉", "旣 => 既", "晚 => 晩", "曆 => 暦", "槪 => 概", "步 => 歩", "歲 => 歳", "歷 => 歴", "每 => 毎", "涉 => 渉", "淚 => 涙", "渕 => 淵", "渴 => 渇", "溫 => 温", "濱 => 浜", "牀 => 床", "狀 => 状", "瘦 => 痩", "硏 => 研", "稅 => 税", "緣 => 縁", "脫 => 脱", "虛 => 虚", "說 => 説", "貳 => 弐", "銳 => 鋭", "錄 => 録", "鍊 => 錬", "閱 => 閲", "鬭 => 闘", "麵 => 麺", "黃 => 黄", "黏 => 粘", "齋 => 斉", "龍 => 竜", "契 => 契", "欄 => 欄", "廊 => 廊", "朗 => 朗", "虜 => 虜", "殺 => 殺", "旅 => 旅", "廉 => 廉", "類 => 類", "隆 => 隆", "塚 => 塚", "晴 => 晴", "猪 => 猪", "益 => 益", "神 => 神", "祥 => 祥", "福 => 福", "精 => 精", "羽 
=> 羽", "諸 => 諸", "都 => 都", "飯 => 飯", "飼 => 飼", "館 => 館", "侮 => 侮", "僧 => 僧", "免 => 免", "勉 => 勉", "勤 => 勤", "卑 => 卑", "喝 => 喝", "嘆 => 嘆", "器 => 器", "塀 => 塀", "墨 => 墨", "層 => 層", "悔 => 悔", "慨 => 慨", "憎 => 憎", "懲 => 懲", "敏 => 敏", "既 => 既", "暑 => 暑", "梅 => 梅", "海 => 海", "漢 => 漢", "煮 => 煮", "琢 => 琢", "碑 => 碑", "社 => 社", "祉 => 祉", "祈 => 祈", "祐 => 祐", "祖 => 祖", "祝 => 祝", "禍 => 禍", "穀 => 穀", "突 => 突", "節 => 節", "練 => 練", "繁 => 繁", "署 => 署", "者 => 者", "臭 => 臭", "著 => 着", "褐 => 褐", "視 => 視", "謁 => 謁", "謹 => 謹", "賓 => 賓", "贈 => 贈", "逸 => 逸", "難 => 難", "響 => 響", "頻 => 頻"] + }, + "mapping_filter": { + "type": "mapping", + "mappings": ["\u0009,\u000A,\u000B,\u000C,\u000D,\u001C,\u001D,\u001E,\u001F,\u00A0,\u1680,\u180E,\u2000,\u2001,\u2002,\u2003,\u2004,\u2005,\u2006,\u2007,\u2008,\u2009,\u200A,\u200B,\u202F,\u205F,\u3000,\uFEFF => \u0020", "~,˜,῀,⁓,∼,∿,~ => 〜", "A => A", "B => B", "C => C", "D => D", "E => E", "F => F", "G => G", "H => H", "I => I", "J => J", "K => K", "L => L", "M => M", "N => N", "O => O", "P => P", "Q => Q", "R => R", "S => S", "T => T", "U => U", "V => V", "W => W", "X => X", "Y => Y", "Z => Z", "a => a", "b => b", "c => c", "d => d", "e => e", "f => f", "g => g", "h => h", "i => i", "j => j", "k => k", "l => l", "m => m", "n => n", "o => o", "p => p", "q => q", "r => r", "s => s", "t => t", "u => u", "v => v", "w => w", "x => x", "y => y", "z => z", "あ => ア", "い => イ", "う => ウ", "え => エ", "お => オ", "か => カ", "き => キ", "く => ク", "け => ケ", "こ => コ", "が => ガ", "ぎ => ギ", "ぐ => グ", "げ => ゲ", "ご => ゴ", "さ => サ", "し => シ", "す => ス", "せ => セ", "そ => ソ", "ざ => ザ", "じ => ジ", "ず => ズ", "ぜ => ゼ", "ぞ => ゾ", "た => タ", "ち => チ", "つ => ツ", "て => テ", "と => ト", "だ => ダ", "ぢ => ヂ", "づ => ヅ", "で => デ", "ど => ド", "な => ナ", "に => ニ", "ぬ => ヌ", "ね => ネ", "の => ノ", "は => ハ", "ひ => ヒ", "ふ => フ", "へ => ヘ", "ほ => ホ", "ば => バ", "び => ビ", "ぶ => ブ", "べ => ベ", "ぼ => ボ", "ぱ => パ", "ぴ => ピ", "ぷ => プ", "ぺ => ペ", "ぽ => ポ", "ま => マ", "み => ミ", "む => ム", "め => メ", "も => モ", "や => ヤ", "ゆ => 
ユ", "よ => ヨ", "ら => ラ", "り => リ", "る => ル", "れ => レ", "ろ => ロ", "わ => ワ", "を => ヲ", "ん => ン", "っ => ツ", "ぁ => ア", "ぃ => イ", "ぅ => ウ", "ぇ => エ", "ぉ => オ", "ゃ => ヤ", "ゅ => ユ", "ょ => ヨ", "が => ガ", "ぎ => ギ", "ぐ => グ", "げ => ゲ", "ご => ゴ", "ざ => ザ", "じ => ジ", "ず => ズ", "ぜ => ゼ", "ぞ => ゾ", "だ => ダ", "ぢ => ヂ", "づ => ヅ", "で => デ", "ど => ド", "ば => バ", "び => ビ", "ぶ => ブ", "べ => ベ", "ぼ => ボ", "ぱ => パ", "ぴ => ピ", "ぷ => プ", "ぺ => ペ", "ぽ => ポ", "ガ => ガ", "ギ => ギ", "グ => グ", "ゲ => ゲ", "ゴ => ゴ", "ザ => ザ", "ジ => ジ", "ズ => ズ", "ゼ => ゼ", "ゾ => ゾ", "ダ => ダ", "ヂ => ヂ", "ヅ => ヅ", "デ => デ", "ド => ド", "バ => バ", "ビ => ビ", "ブ => ブ", "ベ => ベ", "ボ => ボ", "パ => パ", "ピ => ピ", "プ => プ", "ペ => ペ", "ポ => ポ", "ッ => ツ", "ァ => ア", "ィ => イ", "ゥ => ウ", "ェ => エ", "ォ => オ", "ャ => ヤ", "ュ => ユ", "ョ => ヨ", "ア => ア", "イ => イ", "ウ => ウ", "エ => エ", "オ => オ", "カ => カ", "キ => キ", "ク => ク", "ケ => ケ", "コ => コ", "ガ => ガ", "ギ => ギ", "グ => グ", "ゲ => ゲ", "ゴ => ゴ", "サ => サ", "シ => シ", "ス => ス", "セ => セ", "ソ => ソ", "ザ => ザ", "ジ => ジ", "ズ => ズ", "ゼ => ゼ", "ゾ => ゾ", "タ => タ", "チ => チ", "ツ => ツ", "テ => テ", "ト => ト", "ダ => ダ", "ヂ => ヂ", "ヅ => ヅ", "デ => デ", "ド => ド", "ナ => ナ", "ニ => ニ", "ヌ => ヌ", "ネ => ネ", "ノ => ノ", "ハ => ハ", "ヒ => ヒ", "フ => フ", "ヘ => ヘ", "ホ => ホ", "バ => バ", "ビ => ビ", "ブ => ブ", "ベ => ベ", "ボ => ボ", "パ => パ", "ピ => ピ", "プ => プ", "ペ => ペ", "ポ => ポ", "マ => マ", "ミ => ミ", "ム => ム", "メ => メ", "モ => モ", "ヤ => ヤ", "ユ => ユ", "ヨ => ヨ", "ラ => ラ", "リ => リ", "ル => ル", "レ => レ", "ロ => ロ", "ワ => ワ", "ヲ => ヲ", "ン => ン", "ヴ => ヴ", "ッ => ツ", "ァ => ア", "ィ => イ", "ゥ => ウ", "ェ => エ", "ォ => オ", "ャ => ヤ", "ュ => ユ", "ョ => ヨ", "゙ => ゛", "゚ => ゜", "ー => ー", "・ => ・", "0 => 0", "1 => 1", "2 => 2", "3 => 3", "4 => 4", "5 => 5", "6 => 6", "7 => 7", "8 => 8", "9 => 9", "① => 1", "② => 2", "③ => 3", "④ => 4", "⑤ => 5", "⑥ => 6", "⑦ => 7", "⑧ => 8", "⑨ => 9", "! => !", "? => ?", "# => #", "% => %", "& => &", "@ => @", "+ => +", "- => -", "* => *", "/ => /", "= => =", "$ => $", "^ => ^", ": => :", "; => ;", "’ => '", "‘ => '", ", => ,", ". 
=> .", "¥ => ¥", "” => \"", "( => (", ") => )", "| => |", "[ => [", "` => `", "{ => {", "] => ]", "} => }", "_ => _", "< => <", "> => >", "Ⅰ => 1", "Ⅱ => 2", "Ⅲ => 3", "Ⅳ => 4", "Ⅴ => 5", "Ⅵ => 6", "Ⅶ => 7", "Ⅷ => 8", "Ⅸ => 9", "Ⅹ => 10", "ゐ => い", "ゑ => え", "ヰ => イ", "ヱ => エ", "ヴァ => バ", "ヴィ => ビ", "ヴゥ => ブ", "ヴェ => ベ", "ヴォ => ボ", "Ζ => Z", "亞 => 亜", "惡 => 悪", "蘆 => 芦", "鰺 => 鯵", "壓 => 圧", "菴 => 庵", "圍 => 囲", "爲 => 為", "醫 => 医", "毓 => 育", "弌 => 一", "壹 => 壱", "稻 => 稲", "飮 => 飲", "婬 => 淫", "隱 => 隠", "夘 => 卯", "欝 => 鬱", "廐 => 厩", "廏 => 厩", "睿 => 叡", "營 => 営", "暎 => 映", "曵 => 曳", "榮 => 栄", "頴 => 穎", "偀 => 英", "衞 => 衛", "咏 => 詠", "驛 => 駅", "圓 => 円", "烟 => 煙", "艷 => 艶", "鈆 => 鉛", "鹽 => 塩", "奧 => 奥", "徃 => 往", "應 => 応", "橫 => 横", "歐 => 欧", "毆 => 殴", "鶯 => 鴬", "堽 => 岡", "崗 => 岡", "冲 => 沖", "穩 => 穏", "假 => 仮", "價 => 価", "譁 => 嘩", "峩 => 峨", "畫 => 画", "會 => 会", "觧 => 解", "囘 => 回", "壞 => 壊", "迴 => 廻", "恠 => 怪", "懷 => 懐", "畍 => 界", "繪 => 絵", "蠏 => 蟹", "崕 => 崖", "礙 => 碍", "盖 => 蓋", "葢 => 蓋", "蠣 => 蛎", "鉤 => 鈎", "擴 => 拡", "攪 => 撹", "殼 => 殻", "覺 => 覚", "學 => 学", "斈 => 学", "嶽 => 岳", "樂 => 楽", "竈 => 竃", "釡 => 釜", "栢 => 柏", "鬻 => 粥", "勸 => 勧", "卷 => 巻", "寬 => 寛", "歡 => 歓", "灌 => 潅", "罐 => 缶", "觀 => 観", "諫 => 諌", "鑒 => 鑑", "閒 => 間", "關 => 関", "陷 => 陥", "舘 => 館", "巖 => 巌", "嵓 => 巌", "鴈 => 雁", "鳫 => 雁", "顏 => 顔", "憙 => 喜", "憘 => 喜", "噐 => 器", "竒 => 奇", "朞 => 期", "棊 => 棋", "弃 => 棄", "歸 => 帰", "皈 => 帰", "氣 => 気", "龜 => 亀", "僞 => 偽", "冝 => 宜", "戲 => 戯", "犧 => 犠", "卻 => 却", "糺 => 糾", "舊 => 旧", "據 => 拠", "擧 => 挙", "舉 => 挙", "亰 => 京", "恊 => 協", "峽 => 峡", "挾 => 挟", "敎 => 教", "况 => 況", "狹 => 狭", "鄕 => 郷", "曉 => 暁", "惞 => 欣", "區 => 区", "驅 => 駆", "駈 => 駆", "桒 => 桑", "勳 => 勲", "勛 => 勲", "薰 => 薫", "羣 => 群", "徑 => 径", "逕 => 径", "惠 => 恵", "憇 => 憩", "攜 => 携", "溪 => 渓", "谿 => 渓", "經 => 経", "繼 => 継", "莖 => 茎", "螢 => 蛍", "輕 => 軽", "頸 => 頚", "鷄 => 鶏", "藝 => 芸", "缺 => 欠", "决 => 決", "儉 => 倹", "劍 => 剣", "劔 => 剣", "劒 => 剣", "剱 => 剣", "釼 => 剣", "圈 => 圏", "檢 => 検", "權 => 権", "獻 => 献", "縣 => 県", "險 => 険", "顯 => 
顕", "驗 => 験", "鹹 => 鹸", "嚴 => 厳", "乕 => 虎", "皷 => 鼓", "效 => 効", "廣 => 広", "恆 => 恒", "晄 => 晃", "稾 => 稿", "畊 => 耕", "鑛 => 鉱", "礦 => 砿", "髙 => 高", "刧 => 劫", "號 => 号", "軣 => 轟", "國 => 国", "圀 => 国", "黑 => 黒", "嵳 => 嵯", "濟 => 済", "碎 => 砕", "劑 => 剤", "戝 => 財", "冱 => 冴", "沍 => 冴", "嵜 => 崎", "﨑 => 崎", "碕 => 埼", "櫻 => 桜", "册 => 冊", "雜 => 雑", "襍 => 雑", "皋 => 皐", "參 => 参", "慘 => 惨", "棧 => 桟", "蠶 => 蚕", "讚 => 讃", "贊 => 賛", "殘 => 残", "絲 => 糸", "帋 => 紙", "齒 => 歯", "亊 => 事", "兒 => 児", "尓 => 爾", "辭 => 辞", "濕 => 湿", "貭 => 質", "實 => 実", "筱 => 篠", "蘂 => 蕊", "蕋 => 蕊", "舍 => 舎", "冩 => 写", "寫 => 写", "釋 => 釈", "咒 => 呪", "壽 => 寿", "收 => 収", "穐 => 秋", "龝 => 秋", "讎 => 讐", "從 => 従", "澁 => 渋", "澀 => 渋", "獸 => 獣", "縱 => 縦", "肅 => 粛", "凖 => 準", "處 => 処", "敍 => 叙", "敘 => 叙", "甞 => 嘗", "奬 => 奨", "獎 => 奨", "將 => 将", "厰 => 廠", "曻 => 昇", "枩 => 松", "燒 => 焼", "稱 => 称", "證 => 証", "乘 => 乗", "剩 => 剰", "塲 => 場", "壤 => 壌", "孃 => 嬢", "條 => 条", "淨 => 浄", "疊 => 畳", "疉 => 畳", "疂 => 畳", "穰 => 穣", "讓 => 譲", "釀 => 醸", "囑 => 嘱", "餝 => 飾", "觸 => 触", "脣 => 唇", "訷 => 伸", "寢 => 寝", "愼 => 慎", "晉 => 晋", "眞 => 真", "刄 => 刃", "盡 => 尽", "靫 => 靭", "靱 => 靭", "醋 => 酢", "圖 => 図", "廚 => 厨", "埀 => 垂", "粹 => 粋", "翆 => 翠", "醉 => 酔", "隨 => 随", "膸 => 髄", "髓 => 髄", "數 => 数", "樞 => 枢", "椙 => 杉", "杦 => 杉", "澂 => 澄", "丗 => 世", "瀨 => 瀬", "畆 => 畝", "淒 => 凄", "栖 => 棲", "淸 => 清", "聲 => 声", "靑 => 青", "靜 => 静", "齊 => 斉", "攝 => 摂", "竊 => 窃", "專 => 専", "戰 => 戦", "淺 => 浅", "潛 => 潜", "濳 => 潜", "綫 => 線", "纖 => 繊", "纎 => 繊", "舩 => 船", "賤 => 賎", "踐 => 践", "錢 => 銭", "譱 => 善", "禪 => 禅", "曾 => 曽", "踈 => 疎", "蘓 => 蘇", "溯 => 遡", "鼡 => 鼠", "雙 => 双", "壯 => 壮", "搜 => 捜", "插 => 挿", "曺 => 曹", "爭 => 争", "窗 => 窓", "總 => 総", "聰 => 聡", "莊 => 荘", "裝 => 装", "赱 => 走", "騷 => 騒", "增 => 増", "臟 => 臓", "藏 => 蔵", "屬 => 属", "續 => 続", "卆 => 卒", "夛 => 多", "墮 => 堕", "柁 => 舵", "橢 => 楕", "躰 => 体", "軆 => 体", "體 => 体", "對 => 対", "帶 => 帯", "滯 => 滞", "臺 => 台", "瀧 => 滝", "擇 => 択", "澤 => 沢", "鈬 => 鐸", "逹 => 達", "豎 => 竪", "貍 => 狸", "單 => 単", "擔 => 担", "膽 => 胆", "團 => 団", "彈 => 弾", "斷 => 
断", "耻 => 恥", "癡 => 痴", "穉 => 稚", "遲 => 遅", "晝 => 昼", "蟲 => 虫", "鑄 => 鋳", "潴 => 瀦", "豬 => 猪", "廳 => 庁", "廰 => 庁", "甼 => 町", "聽 => 聴", "膓 => 腸", "敕 => 勅", "珎 => 珍", "鎭 => 鎮", "壺 => 壷", "寉 => 鶴", "靍 => 鶴", "靏 => 鶴", "遞 => 逓", "喆 => 哲", "悊 => 哲", "銕 => 鉄", "鐵 => 鉄", "鐡 => 鉄", "纒 => 纏", "轉 => 転", "點 => 点", "傳 => 伝", "兔 => 兎", "莵 => 兎", "礪 => 砺", "黨 => 党", "嶌 => 島", "嶋 => 島", "隝 => 島", "檮 => 梼", "盜 => 盗", "濤 => 涛", "燈 => 灯", "當 => 当", "迯 => 逃", "鬪 => 闘", "仂 => 働", "仝 => 同", "德 => 徳", "悳 => 徳", "獨 => 独", "讀 => 読", "杤 => 栃", "屆 => 届", "繩 => 縄", "貳,貮,弍 => 弐", "邇 => 迩", "韭 => 韮", "姙 => 妊", "禰 => 祢", "迺 => 廼", "墅 => 野", "埜 => 野", "惱 => 悩", "腦 => 脳", "霸 => 覇", "廢 => 廃", "拜 => 拝", "盃 => 杯", "楳 => 梅", "賣 => 売", "蠅 => 蝿", "麥 => 麦", "凾 => 函", "枦 => 櫨", "發 => 発", "髮 => 髪", "罸 => 罰", "拔 => 抜", "蠻 => 蛮", "祕 => 秘", "桧 => 檜", "冰 => 氷", "斌 => 彬", "濱,濵 => 浜", "甁 => 瓶", "冨 => 富", "凬 => 風", "淵,渊 => 渕", "拂 => 払", "佛 => 仏", "幤 => 幣", "竝 => 並", "閇 => 閉", "篦 => 箆", "變 => 変", "邊 => 辺", "邉 => 辺", "辨 => 弁", "辧 => 弁", "瓣 => 弁", "辯 => 弁", "舖 => 舗", "鋪 => 舗", "穗 => 穂", "寶 => 宝", "寳 => 宝", "峯 => 峰", "萠 => 萌", "襃 => 褒", "豐 => 豊", "冐 => 冒", "皃 => 貌", "沒 => 没", "夲 => 本", "飜 => 翻", "槇 => 槙", "枡 => 桝", "儘 => 侭", "萬 => 万", "滿 => 満", "簑 => 蓑", "簔 => 蓑", "脉 => 脈", "梦 => 夢", "无 => 無", "壻 => 婿", "聟 => 婿", "麪 => 麺", "默 => 黙", "餠 => 餅", "彌 => 弥", "笶 => 矢", "藥 => 薬", "譯 => 訳", "栁 => 柳", "籔 => 薮", "藪 => 薮", "瘉 => 癒", "豫 => 予", "餘 => 余", "與 => 与", "譽 => 誉", "搖 => 揺", "樣 => 様", "窰 => 窯", "燿 => 耀", "謠 => 謡", "踴 => 踊", "來 => 来", "賴 => 頼", "亂 => 乱", "覽 => 覧", "裡 => 裏", "畧 => 略", "澑 => 溜", "畄 => 留", "兩 => 両", "凉 => 涼", "獵 => 猟", "暸 => 瞭", "粮 => 糧", "綠 => 緑", "鄰 => 隣", "璢 => 瑠", "壘 => 塁", "泪 => 涙", "勵 => 励", "禮 => 礼", "隸 => 隷", "靈 => 霊", "齡 => 齢", "戀 => 恋", "聨 => 聯", "爐 => 炉", "勞 => 労", "朖 => 朗", "樓 => 楼", "籠 => 篭", "祿 => 禄", "咊 => 和", "亙 => 亘", "灣 => 湾", "仭 => 仞", "爼 => 俎", "伜 => 倅", "僣 => 僭", "寃 => 冤", "寇 => 冦", "羃 => 冪", "洌 => 冽", "涸 => 凅", "凜 => 凛", "刋 => 刊", "尅 => 剋", "箚 => 剳", "匇 => 匆", "奩 => 匳", "巵 => 卮", "廁 => 
厠", "廈 => 厦", "廝 => 厮", "咜 => 咤", "咯 => 喀", "譟 => 噪", "嚏 => 嚔", "齧 => 囓", "阯 => 址", "埓 => 埒", "罎 => 壜", "弉 => 奘", "侫 => 佞", "嫻 => 嫺", "嫐 => 嬲", "崘 => 崙", "篏 => 嵌", "迪 => 廸", "彜 => 彝", "弯 => 彎", "髴 => 彿", "忰 => 悴", "愠 => 慍", "慚 => 慙", "懴 => 懺", "戞 => 戛", "扨 => 扠", "抬 => 擡", "旙 => 旛", "昿 => 曠", "杰 => 傑", "椶 => 棕", "櫁 => 樒", "蘗 => 檗", "檪 => 櫟", "殱 => 殲", "烱 => 炯", "熈 => 煕", "熙 => 煕", "燻 => 薫", "暿 => 熹", "犁 => 犂", "豺 => 犲", "貉 => 狢", "貎 => 猊", "貘 => 獏", "瑯 => 琅", "碯 => 瑙", "瑤 => 瑶", "珱 => 瓔", "畴 => 疇", "肬 => 疣", "晥 => 皖", "皹 => 皸", "蘯 => 盪", "眦 => 眥", "禀 => 稟", "筺 => 筐", "笋 => 筍", "筝 => 箏", "籘 => 籐", "籖 => 籤", "絖 => 絋", "纊 => 絋", "緕 => 纃", "羇 => 羈", "覊 => 羈", "羮 => 羹", "腟 => 膣", "臈 => 臘", "舮 => 艫", "莓 => 苺", "蕚 => 萼", "薀 => 蘊", "蝨 => 虱", "蟆 => 蟇", "蟒 => 蠎", "蠧 => 蠹", "衂 => 衄", "袵 => 衽", "裵 => 裴", "褝 => 襌", "諡 => 謚", "譛 => 譖", "豼 => 貔", "賍 => 贓", "躪 => 躙", "輒 => 輙", "輛 => 輌", "逎 => 遒", "鈩 => 鑪", "鑚 => 鑽", "鬧 => 閙", "濶 => 闊", "隯 => 陦", "韲 => 齏", "韵 => 韻", "匀 => 韻", "飃 => 飄", "鰛 => 鰮", "魲 => 鱸", "鳬 => 鳧", "鵄 => 鴟", "鵞 => 鵝", "鶫 => 鶇", "鷏 => 鷆", "麸 => 麩", "兊 => 兌", "焏 => 亟", "犱 => 執", "緖 => 緒", "羡 => 羨", "閠 => 閏", "薗 => 園", "謌,哥 => 歌", "籏 => 旗", "竸 => 競", "堯 => 尭", "蹟 => 跡", "迹 => 跡", "涌 => 湧", "遙 => 遥", "縲 => 累", "牆 => 墻", "郞 => 郎", "悅 => 悦", "懼 => 惧", "蒭 => 芻", "韈 => 襪", "萱 => 茅", "倂 => 併", "凛 => 凜", "卽 => 即", "吳 => 呉", "姬 => 姫", "娛 => 娯", "尙 => 尚", "巢 => 巣", "强 => 強", "彅 => 薙", "徵 => 徴", "慾 => 欲", "懐 => 懐", "戶 => 戸", "戾 => 戻", "揭 => 掲", "擊 => 撃", "斎 => 斉", "旣 => 既", "晚 => 晩", "曆 => 暦", "槪 => 概", "步 => 歩", "歲 => 歳", "歷 => 歴", "每 => 毎", "涉 => 渉", "淚 => 涙", "渕 => 淵", "渴 => 渇", "溫 => 温", "濱 => 浜", "牀 => 床", "狀 => 状", "瘦 => 痩", "硏 => 研", "稅 => 税", "緣 => 縁", "脫 => 脱", "虛 => 虚", "說 => 説", "貳 => 弐", "銳 => 鋭", "錄 => 録", "鍊 => 錬", "閱 => 閲", "鬭 => 闘", "麵 => 麺", "黃 => 黄", "黏 => 粘", "齋 => 斉", "龍 => 竜", "契 => 契", "欄 => 欄", "廊 => 廊", "朗 => 朗", "虜 => 虜", "殺 => 殺", "旅 => 旅", "廉 => 廉", "類 => 類", "隆 => 隆", "塚 => 塚", "晴 => 晴", "猪 => 猪", "益 => 益", "神 => 神", "祥 => 祥", "福 => 福", "精 => 精", "羽 
=> 羽", "諸 => 諸", "都 => 都", "飯 => 飯", "飼 => 飼", "館 => 館", "侮 => 侮", "僧 => 僧", "免 => 免", "勉 => 勉", "勤 => 勤", "卑 => 卑", "喝 => 喝", "嘆 => 嘆", "器 => 器", "塀 => 塀", "墨 => 墨", "層 => 層", "悔 => 悔", "慨 => 慨", "憎 => 憎", "懲 => 懲", "敏 => 敏", "既 => 既", "暑 => 暑", "梅 => 梅", "海 => 海", "漢 => 漢", "煮 => 煮", "琢 => 琢", "碑 => 碑", "社 => 社", "祉 => 祉", "祈 => 祈", "祐 => 祐", "祖 => 祖", "祝 => 祝", "禍 => 禍", "穀 => 穀", "突 => 突", "節 => 節", "練 => 練", "繁 => 繁", "署 => 署", "者 => 者", "臭 => 臭", "著 => 着", "褐 => 褐", "視 => 視", "謁 => 謁", "謹 => 謹", "賓 => 賓", "贈 => 贈", "逸 => 逸", "難 => 難", "響 => 響", "頻 => 頻"] + }, + "zero_width_spaces": { + "type": "mapping", + "mappings": [ "\\u200C=> "] + }, + "removeall_filter": { + "type": "pattern_replace", + "pattern":"(.*)", + "replacement":"" + } + }, + "filter": { + "stemmer_en_filter": { + "type": "stemmer", + "name": "english" + }, + "english_override": { + "type": "stemmer_override", + "rules": [] + }, + "possessive_stemmer_en_filter": { + "type": "stemmer", + "name": "possessive_english" + }, + "stopword_en_filter": { + "type": "stop", + "stopwords": ["a", "an", "and", "are", "as", "at", "be", "but", "by", "for", "if", "in", "into", "is", "it", "no", "not", "of", "on", "or", "such", "that", "the", "their", "then", "there", "these", "they", "this", "to", "was", "will", "with"] + }, + "arabic_stop": { + "type": "stop", + "stopwords": ["من", "ومن", "منها", "منه", "في", "وفي", "فيها", "فيه", "و", "ف", "ثم", "او", "أو", "ب", "بها", "به", "ا", "أ", "اى", "اي", "أي", "أى", "لا", "ولا", "الا", "ألا", "إلا", "لكن", "ما", "وما", "كما", "فما", "عن", "مع", "اذا", "إذا", "ان", "أن", "إن", "انها", "أنها", "إنها", "انه", "أنه", "إنه", "بان", "بأن", "فان", "فأن", "وان", "وأن", "وإن", "التى", "التي", "الذى", "الذي", "الذين", "الى", "الي", "إلى", "إلي", "على", "عليها", "عليه", "اما", "أما", "إما", "ايضا", "أيضا", "كل", "وكل", "لم", "ولم", "لن", "ولن", "هى", "هي", "هو", "وهى", "وهي", "وهو", "فهى", "فهي", "فهو", "انت", "أنت", "لك", "لها", "له", "هذه", "هذا", "تلك", "ذلك", "هناك", "كانت", 
"كان", "يكون", "تكون", "وكانت", "وكان", "غير", "بعض", "قد", "نحو", "بين", "بينما", "منذ", "ضمن", "حيث", "الان", "الآن", "خلال", "بعد", "قبل", "حتى", "عند", "عندما", "لدى", "جميع"] + }, + "arabic_keywords": { + "type": "keyword_marker", + "keywords": ["مرحباا", "عالم", "بحث"] + }, + "arabic_stemmer": { + "type": "stemmer", + "language": "arabic" + }, + "arabic_override": { + "type": "stemmer_override", + "rules": [] + }, + "armenian_stop": { + "type": "stop", + "stopwords": ["այդ", "այլ", "այն", "այս", "դու", "դուք", "եմ", "են", "ենք", "ես", "եք", "է", "էի", "էին", "էինք", "էիր", "էիք", "էր", "ըստ", "թ", "ի", "ին", "իսկ", "իր", "կամ", "համար", "հետ", "հետո", "մենք", "մեջ", "մի", "ն", "նա", "նաև", "նրա", "նրանք", "որ", "որը", "որոնք", "որպես", "ու", "ում", "պիտի", "վրա", "և"] + }, + "armenian_keywords": { + "type": "keyword_marker", + "keywords": ["օրինակ"] + }, + "armenian_stemmer": { + "type": "stemmer", + "language": "armenian" + }, + "armenian_override": { + "type": "stemmer_override", + "rules": [] + }, + "basque_stop": { + "type": "stop", + "stopwords": ["al", "anitz", "arabera", "asko", "baina", "bat", "batean", "batek", "bati", "batzuei", "batzuek", "batzuetan", "batzuk", "bera", "beraiek", "berau", "berauek", "bere", "berori", "beroriek", "beste", "bezala", "da", "dago", "dira", "ditu", "du", "dute", "edo", "egin", "ere", "eta", "eurak", "ez", "gainera", "gu", "gutxi", "guzti", "haiei", "haiek", "haietan", "hainbeste", "hala", "han", "handik", "hango", "hara", "hari", "hark", "hartan", "hau", "hauei", "hauek", "hauetan", "hemen", "hemendik", "hemengo", "hi", "hona", "honek", "honela", "honetan", "honi", "hor", "hori", "horiei", "horiek", "horietan", "horko", "horra", "horrek", "horrela", "horretan", "horri", "hortik", "hura", "izan", "ni", "noiz", "nola", "non", "nondik", "nongo", "nor", "nora", "ze", "zein", "zen", "zenbait", "zenbat", "zer", "zergatik", "ziren", "zituen", "zu", "zuek", "zuen", "zuten"] + }, + "basque_keywords": { + "type": 
"keyword_marker", + "keywords": ["Adibidez"] + }, + "basque_stemmer": { + "type": "stemmer", + "language": "basque" + }, + "basque_override": { + "type": "stemmer_override", + "rules": [] + }, + "brazilian_stop": { + "type": "stop", + "stopwords": ["a", "ainda", "alem", "ambas", "ambos", "antes", "ao", "aonde", "aos", "apos", "aquele", "aqueles", "as", "assim", "com", "como", "contra", "contudo", "cuja", "cujas", "cujo", "cujos", "da", "das", "de", "dela", "dele", "deles", "demais", "depois", "desde", "desta", "deste", "dispoe", "dispoem", "diversa", "diversas", "diversos", "do", "dos", "durante", "e", "ela", "elas", "ele", "eles", "em", "entao", "entre", "essa", "essas", "esse", "esses", "esta", "estas", "este", "estes", "ha", "isso", "isto", "logo", "mais", "mas", "mediante", "menos", "mesma", "mesmas", "mesmo", "mesmos", "na", "nas", "nao", "nas", "nem", "nesse", "neste", "nos", "o", "os", "ou", "outra", "outras", "outro", "outros", "pelas", "pelas", "pelo", "pelos", "perante", "pois", "por", "porque", "portanto", "proprio", "propios", "quais", "qual", "qualquer", "quando", "quanto", "que", "quem", "quer", "se", "seja", "sem", "sendo", "seu", "seus", "sob", "sobre", "sua", "suas", "tal", "tambem", "teu", "teus", "toda", "todas", "todo", "todos", "tua", "tuas", "tudo", "um", "uma", "umas", "uns"] + }, + "brazilian_keywords": { + "type": "keyword_marker", + "keywords": ["exemplo"] + }, + "brazilian_stemmer": { + "type": "stemmer", + "language": "brazilian" + }, + "brazilian_override": { + "type": "stemmer_override", + "rules": [] + }, + "bulgarian_stop": { + "type": "stop", + "stopwords": ["а", "аз", "ако", "ала", "бе", "без", "беше", "би", "бил", "била", "били", "било", "близо", "бъдат", "бъде", "бяха", "в", "вас", "ваш", "ваша", "вероятно", "вече", "взема", "ви", "вие", "винаги", "все", "всеки", "всички", "всичко", "всяка", "във", "въпреки", "върху", "г", "ги", "главно", "го", "д", "да", "дали", "до", "докато", "докога", "дори", "досега", "доста", "е", "едва", 
"един", "ето", "за", "зад", "заедно", "заради", "засега", "затова", "защо", "защото", "и", "из", "или", "им", "има", "имат", "иска", "й", "каза", "как", "каква", "какво", "както", "какъв", "като", "кога", "когато", "което", "които", "кой", "който", "колко", "която", "къде", "където", "към", "ли", "м", "ме", "между", "мен", "ми", "мнозина", "мога", "могат", "може", "моля", "момента", "му", "н", "на", "над", "назад", "най", "направи", "напред", "например", "нас", "не", "него", "нея", "ни", "ние", "никой", "нито", "но", "някои", "някой", "няма", "обаче", "около", "освен", "особено", "от", "отгоре", "отново", "още", "пак", "по", "повече", "повечето", "под", "поне", "поради", "после", "почти", "прави", "пред", "преди", "през", "при", "пък", "първо", "с", "са", "само", "се", "сега", "си", "скоро", "след", "сме", "според", "сред", "срещу", "сте", "съм", "със", "също", "т", "тази", "така", "такива", "такъв", "там", "твой", "те", "тези", "ти", "тн", "то", "това", "тогава", "този", "той", "толкова", "точно", "трябва", "тук", "тъй", "тя", "тях", "у", "харесва", "ч", "че", "често", "чрез", "ще", "щом", "я"] + }, + "bulgarian_keywords": { + "type": "keyword_marker", + "keywords": ["пример"] + }, + "bulgarian_stemmer": { + "type": "stemmer", + "language": "bulgarian" + }, + "bulgarian_override": { + "type": "stemmer_override", + "rules": [] + }, + "catalan_elision": { + "type": "elision", + "articles": [ "d", "l", "m", "n", "s", "t"] + }, + "catalan_stop": { + "type": "stop", + "stopwords": ["a", "abans", "ací", "ah", "així", "això", "al", "als", "aleshores", "algun", "alguna", "algunes", "alguns", "alhora", "allà", "allí", "allò", "altra", "altre", "altres", "amb", "ambdós", "ambdues", "apa", "aquell", "aquella", "aquelles", "aquells", "aquest", "aquesta", "aquestes", "aquests", "aquí", "baix", "cada", "cadascú", "cadascuna", "cadascunes", "cadascuns", "com", "contra", "d'un", "d'una", "d'unes", "d'uns", "dalt", "de", "del", "dels", "des", "després", "dins", "dintre", "donat", 
"doncs", "durant", "e", "eh", "el", "els", "em", "en", "encara", "ens", "entre", "érem", "eren", "éreu", "es", "és", "esta", "està", "estàvem", "estaven", "estàveu", "esteu", "et", "etc", "ets", "fins", "fora", "gairebé", "ha", "han", "has", "havia", "he", "hem", "heu", "hi ", "ho", "i", "igual", "iguals", "ja", "l'hi", "la", "les", "li", "li'n", "llavors", "m'he", "ma", "mal", "malgrat", "mateix", "mateixa", "mateixes", "mateixos", "me", "mentre", "més", "meu", "meus", "meva", "meves", "molt", "molta", "moltes", "molts", "mon", "mons", "n'he", "n'hi", "ne", "ni", "no", "nogensmenys", "només", "nosaltres", "nostra", "nostre", "nostres", "o", "oh", "oi", "on", "pas", "pel", "pels", "per", "però", "perquè", "poc ", "poca", "pocs", "poques", "potser", "propi", "qual", "quals", "quan", "quant ", "que", "què", "quelcom", "qui", "quin", "quina", "quines", "quins", "s'ha", "s'han", "sa", "semblant", "semblants", "ses", "seu ", "seus", "seva", "seva", "seves", "si", "sobre", "sobretot", "sóc", "solament", "sols", "son ", "són", "sons ", "sota", "sou", "t'ha", "t'han", "t'he", "ta", "tal", "també", "tampoc", "tan", "tant", "tanta", "tantes", "teu", "teus", "teva", "teves", "ton", "tons", "tot", "tota", "totes", "tots", "un", "una", "unes", "uns", "us", "va", "vaig", "vam", "van", "vas", "veu", "vosaltres", "vostra", "vostre", "vostres"] + }, + "catalan_keywords": { + "type": "keyword_marker", + "keywords": ["Hola", "món", "recerca"] + }, + "catalan_stemmer": { + "type": "stemmer", + "language": "catalan" + }, + "catalan_override": { + "type": "stemmer_override", + "rules": [] + }, + "czech_stop": { + "type": "stop", + "stopwords": ["a", "s", "k", "o", "i", "u", "v", "z", "dnes", "cz", "tímto", "budeš", "budem", "byli", "jseš", "můj", "svým", "ta", "tomto", "tohle", "tuto", "tyto", "jej", "zda", "proč", "máte", "tato", "kam", "tohoto", "kdo", "kteří", "mi", "nám", "tom", "tomuto", "mít", "nic", "proto", "kterou", "byla", "toho", "protože", "asi", "ho", "naši", "napište", 
"re", "což", "tím", "takže", "svých", "její", "svými", "jste", "aj", "tu", "tedy", "teto", "bylo", "kde", "ke", "pravé", "ji", "nad", "nejsou", "či", "pod", "téma", "mezi", "přes", "ty", "pak", "vám", "ani", "když", "však", "neg", "jsem", "tento", "článku", "články", "aby", "jsme", "před", "pta", "jejich", "byl", "ještě", "až", "bez", "také", "pouze", "první", "vaše", "která", "nás", "nový", "tipy", "pokud", "může", "strana", "jeho", "své", "jiné", "zprávy", "nové", "není", "vás", "jen", "podle", "zde", "už", "být", "více", "bude", "již", "než", "který", "by", "které", "co", "nebo", "ten", "tak", "má", "při", "od", "po", "jsou", "jak", "další", "ale", "si", "se", "ve", "to", "jako", "za", "zpět", "ze", "do", "pro", "je", "na", "atd", "atp", "jakmile", "přičemž", "já", "on", "ona", "ono", "oni", "ony", "my", "vy", "jí", "ji", "mě", "mne", "jemu", "tomu", "těm", "těmu", "němu", "němuž", "jehož", "jíž", "jelikož", "jež", "jakož", "načež"] + }, + "czech_keywords": { + "type": "keyword_marker", + "keywords": ["Haló", "svět", "vyhledávání"] + }, + "czech_stemmer": { + "type": "stemmer", + "language": "czech" + }, + "czech_override": { + "type": "stemmer_override", + "rules": [] + }, + "danish_stop": { + "type": "stop", + "stopwords": ["og", "i", "jeg", "det", "at", "en", "den", "til", "er", "som", "på", "de", "med", "han", "af", "for", "ikke", "der", "var", "mig", "sig", "men", "et", "har", "om", "vi", "min", "havde", "ham", "hun", "nu", "over", "da", "fra", "du", "ud", "sin", "dem", "os", "op", "man", "hans", "hvor", "eller", "hvad", "skal", "selv", "her", "alle", "vil", "blev", "kunne", "ind", "når", "være", "dog", "noget", "ville", "jo", "deres", "efter", "ned", "skulle", "denne", "end", "dette", "mit", "også", "under", "have", "dig", "anden", "hende", "mine", "alt", "meget", "sit", "sine", "vor", "mod", "disse", "hvis", "din", "nogle", "hos", "blive", "mange", "ad", "bliver", "hendes", "været", "thi", "jer", "sådan"] + }, + "danish_keywords": { + "type": 
"keyword_marker", + "keywords": ["Hej", "verden", "Søg"] + }, + "danish_stemmer": { + "type": "stemmer", + "language": "danish" + }, + "danish_override": { + "type": "stemmer_override", + "rules": [] + }, + "dutch_stop": { + "type": "stop", + "stopwords": ["de", "en", "van", "ik", "te", "dat", "die", "in", "een", "hij", "het", "niet", "zijn", "is", "was", "op", "aan", "met", "als", "voor", "had", "er", "maar", "om", "hem", "dan", "zou", "of", "wat", "mijn", "men", "dit", "zo", "door", "over", "ze", "zich", "bij", "ook", "tot", "je", "mij", "uit", "der", "daar", "haar", "naar", "heb", "hoe", "heeft", "hebben", "deze", "u", "want", "nog", "zal", "me", "zij", "nu", "ge", "geen", "omdat", "iets", "worden", "toch", "al", "waren", "veel", "meer", "doen", "toen", "moet", "ben", "zonder", "kan", "hun", "dus", "alles", "onder", "ja", "eens", "hier", "wie", "werd", "altijd", "doch", "wordt", "wezen", "kunnen", "ons", "zelf", "tegen", "na", "reeds", "wil", "kon", "niets", "uw", "iemand", "geweest", "andere"] + }, + "dutch_keywords": { + "type": "keyword_marker", + "keywords": ["hallo", "wereld", "zoeken"] + }, + "dutch_stemmer": { + "type": "stemmer", + "language": "dutch" + }, + "dutch_override": { + "type": "stemmer_override", + "rules": ["fiets=>fiets", "bromfiets=>bromfiets", "ei=>eier", "kind=>kinder"] + }, + "english_keywords": { + "type": "keyword_marker", + "keywords": ["sample"] + }, + "finnish_stop": { + "type": "stop", + "stopwords": ["olla", "olen", "olet", "on", "olemme", "olette", "ovat", "ole", "oli", "olisi", "olisit", "olisin", "olisimme", "olisitte", "olisivat", "olit", "olin", "olimme", "olitte", "olivat", "ollut", "olleet", "en", "et", "ei", "emme", "ette", "eivät", "minä", "minun", "minut", "minua", "minussa", "minusta", "minuun", "minulla", "minulta", "minulle", "sinä", "sinun", "sinut", "sinua", "sinussa", "sinusta", "sinuun", "sinulla", "sinulta", "sinulle", "hän", "hänen", "hänet", "häntä", "hänessä", "hänestä", "häneen", "hänellä", "häneltä", 
"hänelle", "me", "meidän", "meidät", "meitä", "meissä", "meistä", "meihin", "meillä", "meiltä", "meille", "te", "teidän", "teidät", "teitä", "teissä", "teistä", "teihin", "teillä", "teiltä", "teille", "he", "heidän", "heidät", "heitä", "heissä", "heistä", "heihin", "heillä", "heiltä", "heille", "tämä", "tämän", "tätä", "tässä", "tästä", "tähän", "tallä", "tältä", "tälle", "tänä", "täksi", "tuo", "tuon", "tuotä", "tuossa", "tuosta", "tuohon", "tuolla", "tuolta", "tuolle", "tuona", "tuoksi", "se", "sen", "sitä", "siinä", "siitä", "siihen", "sillä", "siltä", "sille", "sinä", "siksi", "nämä", "näiden", "näitä", "näissä", "näistä", "näihin", "näillä", "näiltä", "näille", "näinä", "näiksi", "nuo", "noiden", "noita", "noissa", "noista", "noihin", "noilla", "noilta", "noille", "noina", "noiksi", "ne", "niiden", "niitä", "niissä", "niistä", "niihin", "niillä", "niiltä", "niille", "niinä", "niiksi", "kuka", "kenen", "kenet", "ketä", "kenessä", "kenestä", "keneen", "kenellä", "keneltä", "kenelle", "kenenä", "keneksi", "ketkä", "keiden", "ketkä", "keitä", "keissä", "keistä", "keihin", "keillä", "keiltä", "keille", "keinä", "keiksi", "mikä", "minkä", "minkä", "mitä", "missä", "mistä", "mihin", "millä", "miltä", "mille", "minä", "miksi", "mitkä", "joka", "jonka", "jota", "jossa", "josta", "johon", "jolla", "jolta", "jolle", "jona", "joksi", "jotka", "joiden", "joita", "joissa", "joista", "joihin", "joilla", "joilta", "joille", "joina", "joiksi", "että", "ja", "jos", "koska", "kuin", "mutta", "niin", "sekä", "sillä", "tai", "vaan", "vai", "vaikka", "kanssa", "mukaan", "noin", "poikki", "yli", "kun", "niin", "nyt", "itse"] + }, + "finnish_keywords": { + "type": "keyword_marker", + "keywords": ["Hei", "maailma", "haku"] + }, + "finnish_stemmer": { + "type": "stemmer", + "language": "finnish" + }, + "finnish_override": { + "type": "stemmer_override", + "rules": [] + }, + "french_elision": { + "type": "elision", + "articles_case": true, + "articles": [ + "l", "m", "t", "qu", "n", 
"s", + "j", "d", "c", "jusqu", "quoiqu", + "lorsqu", "puisqu" + ] + }, + "french_stop": { + "type": "stop", + "stopwords": ["au", "aux", "avec", "ce", "ces", "dans", "de", "des", "du", "elle", "en", "et", "eux", "il", "je", "la", "le", "leur", "lui", "ma", "mais", "me", "même", "mes", "moi", "mon", "ne", "nos", "notre", "nous", "on", "ou", "par", "pas", "pour", "qu", "que", "qui", "sa", "se", "ses", "son", "sur", "ta", "te", "tes", "toi", "ton", "tu", "un", "une", "vos", "votre", "vous", "c", "d", "j", "l", "à", "m", "n", "s", "t", "y", "été", "étée", "étées", "étés", "étant", "suis", "es", "est", "sommes", "êtes", "sont", "serai", "seras", "sera", "serons", "serez", "seront", "serais", "serait", "serions", "seriez", "seraient", "étais", "était", "étions", "étiez", "étaient", "fus", "fut", "fûmes", "fûtes", "furent", "sois", "soit", "soyons", "soyez", "soient", "fusse", "fusses", "fût", "fussions", "fussiez", "fussent", "ayant", "eu", "eue", "eues", "eus", "ai", "as", "avons", "avez", "ont", "aurai", "auras", "aura", "aurons", "aurez", "auront", "aurais", "aurait", "aurions", "auriez", "auraient", "avais", "avait", "avions", "aviez", "avaient", "eut", "eûmes", "eûtes", "eurent", "aie", "aies", "ait", "ayons", "ayez", "aient", "eusse", "eusses", "eût", "eussions", "eussiez", "eussent", "ceci", "cela", "celà", "cet", "cette", "ici", "ils", "les", "leurs", "quel", "quels", "quelle", "quelles", "sans", "soi"] + }, + "french_keywords": { + "type": "keyword_marker", + "keywords": ["Bonjour", "monde", "recherche"] + }, + "french_stemmer": { + "type": "stemmer", + "language": "light_french" + }, + "french_override": { + "type": "stemmer_override", + "rules": [] + }, + "galician_stop": { + "type": "stop", + "stopwords": ["a", "aínda", "alí", "aquel", "aquela", "aquelas", "aqueles", "aquilo", "aquí", "ao", "aos", "as", "así", "á", "ben", "cando", "che", "co", "coa", "comigo", "con", "connosco", "contigo", "convosco", "coas", "cos", "cun", "cuns", "cunha", "cunhas", "da", 
"dalgunha", "dalgunhas", "dalgún", "dalgúns", "das", "de", "del", "dela", "delas", "deles", "desde", "deste", "do", "dos", "dun", "duns", "dunha", "dunhas", "e", "el", "ela", "elas", "eles", "en", "era", "eran", "esa", "esas", "ese", "eses", "esta", "estar", "estaba", "está", "están", "este", "estes", "estiven", "estou", "eu", "é", "facer", "foi", "foron", "fun", "había", "hai", "iso", "isto", "la", "las", "lle", "lles", "lo", "los", "mais", "me", "meu", "meus", "min", "miña", "miñas", "moi", "na", "nas", "neste", "nin", "no", "non", "nos", "nosa", "nosas", "noso", "nosos", "nós", "nun", "nunha", "nuns", "nunhas", "o", "os", "ou", "ó", "ós", "para", "pero", "pode", "pois", "pola", "polas", "polo", "polos", "por", "que", "se", "senón", "ser", "seu", "seus", "sexa", "sido", "sobre", "súa", "súas", "tamén", "tan", "te", "ten", "teñen", "teño", "ter", "teu", "teus", "ti", "tido", "tiña", "tiven", "túa", "túas", "un", "unha", "unhas", "uns", "vos", "vosa", "vosas", "voso", "vosos", "vós"] + }, + "galician_keywords": { + "type": "keyword_marker", + "keywords": ["exemplo"] + }, + "galician_stemmer": { + "type": "stemmer", + "language": "galician" + }, + "galician_override": { + "type": "stemmer_override", + "rules": [] + }, + "german_stop": { + "type": "stop", + "stopwords": ["aber", "alle", "allem", "allen", "aller", "alles", "als", "also", "am", "an", "ander", "andere", "anderem", "anderen", "anderer", "anderes", "anderm", "andern", "anderr", "anders", "auch", "auf", "aus", "bei", "bin", "bis", "bist", "da", "damit", "dann", "der", "den", "des", "dem", "die", "das", "daß", "derselbe", "derselben", "denselben", "desselben", "demselben", "dieselbe", "dieselben", "dasselbe", "dazu", "dein", "deine", "deinem", "deinen", "deiner", "deines", "denn", "derer", "dessen", "dich", "dir", "du", "dies", "diese", "diesem", "diesen", "dieser", "dieses", "doch", "dort", "durch", "ein", "eine", "einem", "einen", "einer", "eines", "einig", "einige", "einigem", "einigen", "einiger", 
"einiges", "einmal", "er", "ihn", "ihm", "es", "etwas", "euer", "eure", "eurem", "euren", "eurer", "eures", "für", "gegen", "gewesen", "hab", "habe", "haben", "hat", "hatte", "hatten", "hier", "hin", "hinter", "ich", "mich", "mir", "ihr", "ihre", "ihrem", "ihren", "ihrer", "ihres", "euch", "im", "in", "indem", "ins", "ist", "jede", "jedem", "jeden", "jeder", "jedes", "jene", "jenem", "jenen", "jener", "jenes", "jetzt", "kann", "kein", "keine", "keinem", "keinen", "keiner", "keines", "können", "könnte", "machen", "man", "manche", "manchem", "manchen", "mancher", "manches", "mein", "meine", "meinem", "meinen", "meiner", "meines", "mit", "muss", "musste", "nach", "nicht", "nichts", "noch", "nun", "nur", "ob", "oder", "ohne", "sehr", "sein", "seine", "seinem", "seinen", "seiner", "seines", "selbst", "sich", "sie", "ihnen", "sind", "so", "solche", "solchem", "solchen", "solcher", "solches", "soll", "sollte", "sondern", "sonst", "über", "um", "und", "uns", "unse", "unsem", "unsen", "unser", "unses", "unter", "viel", "vom", "von", "vor", "während", "war", "waren", "warst", "was", "weg", "weil", "weiter", "welche", "welchem", "welchen", "welcher", "welches", "wenn", "werde", "werden", "wie", "wieder", "will", "wir", "wird", "wirst", "wo", "wollen", "wollte", "würde", "würden", "zu", "zum", "zur", "zwar", "zwischen"] + }, + "german_keywords": { + "type": "keyword_marker", + "keywords": ["Hallo", "Welt", "Suche"] + }, + "german_stemmer": { + "type": "stemmer", + "language": "light_german" + }, + "german_override": { + "type": "stemmer_override", + "rules": [] + }, + "greek_stop": { + "type": "stop", + "stopwords": ["ο", "η", "το", "οι", "τα", "του", "τησ", "των", "τον", "την", "και ", "κι", "κ", "ειμαι", "εισαι", "ειναι", "ειμαστε", "ειστε", "στο", "στον", "στη", "στην", "μα", "αλλα", "απο", "για", "προσ", "με", "σε", "ωσ", "παρα", "αντι", "κατα", "μετα", "θα", "να", "δε", "δεν", "μη", "μην", "επι", "ενω", "εαν", "αν", "τοτε", "που", "πωσ", "ποιοσ", "ποια", "ποιο", "ποιοι", 
"ποιεσ", "ποιων", "ποιουσ", "αυτοσ", "αυτη", "αυτο", "αυτοι", "αυτων", "αυτουσ", "αυτεσ", "αυτα", "εκεινοσ", "εκεινη", "εκεινο", "εκεινοι", "εκεινεσ", "εκεινα", "εκεινων", "εκεινουσ", "οπωσ", "ομωσ", "ισωσ", "οσο", "οτι"] + }, + "greek_lowercase": { + "type": "lowercase", + "language": "greek" + }, + "greek_keywords": { + "type": "keyword_marker", + "keywords": ["Γεια σας", "κόσμος", "έρευνα"] + }, + "greek_stemmer": { + "type": "stemmer", + "language": "greek" + }, + "greek_override": { + "type": "stemmer_override", + "rules": [] + }, + "hindi_stop": { + "type": "stop", + "stopwords": ["अंदर", "अत", "अपना", "अपनी", "अपने", "अभी", "आदि", "आप", "इत्यादि", "इन ", "इनका", "इन्हीं", "इन्हें", "इन्हों", "इस", "इसका", "इसकी", "इसके", "इसमें", "इसी", "इसे", "उन", "उनका", "उनकी", "उनके", "उनको", "उन्हीं", "उन्हें", "उन्हों", "उस", "उसके", "उसी", "उसे", "एक", "एवं", "एस", "ऐसे", "और", "कई", "कर", "करता", "करते", "करना", "करने", "करें", "कहते", "कहा", "का", "काफ़ी", "कि", "कितना", "किन्हें", "किन्हों", "किया", "किर", "किस", "किसी", "किसे", "की", "कुछ", "कुल", "के", "को", "कोई", "कौन", "कौनसा", "गया", "घर", "जब", "जहाँ", "जा", "जितना", "जिन", "जिन्हें", "जिन्हों", "जिस", "जिसे", "जीधर", "जैसा", "जैसे", "जो", "तक", "तब", "तरह", "तिन", "तिन्हें", "तिन्हों", "तिस", "तिसे", "तो", "था", "थी", "थे", "दबारा", "दिया", "दुसरा", "दूसरे", "दो", "द्वारा", "न", "नहीं", "ना", "निहायत", "नीचे", "ने", "पर", "पर ", "पहले", "पूरा", "पे", "फिर", "बनी", "बही", "बहुत", "बाद", "बाला", "बिलकुल", "भी", "भीतर", "मगर", "मानो", "मे", "में", "यदि", "यह", "यहाँ", "यही", "या", "यिह ", "ये", "रखें", "रहा", "रहे", "ऱ्वासा", "लिए", "लिये", "लेकिन", "व", "वर्ग", "वह", "वह ", "वहाँ", "वहीं", "वाले", "वुह ", "वे", "वग़ैरह", "संग", "सकता", "सकते", "सबसे", "सभी", "साथ", "साबुत", "साभ", "सारा", "से", "सो", "ही", "हुआ", "हुई", "हुए", "है", "हैं", "हो", "होता", "होती", "होते", "होना", "होने", "अपनि", "जेसे", "होति", "सभि", "तिंहों", "इंहों", "दवारा", "इसि", "किंहें", "थि", "उंहों", "ओर", "जिंहें", "वहिं", "अभि", 
"बनि", "हि", "उंहिं", "उंहें", "हें", "वगेरह", "एसे", "रवासा", "कोन", "निचे", "काफि", "उसि", "पुरा", "भितर", "हे", "बहि", "वहां", "कोइ", "यहां", "जिंहों", "तिंहें", "किसि", "कइ", "यहि", "इंहिं", "जिधर", "इंहें", "अदि", "इतयादि", "हुइ", "कोनसा", "इसकि", "दुसरे", "जहां", "अप", "किंहों", "उनकि", "भि", "वरग", "हुअ", "जेसा", "नहिं"] + }, + "hindi_keywords": { + "type": "keyword_marker", + "keywords": [ "नमस्ते", "दुनिया", "खोज" ] + }, + "hindi_stemmer": { + "type": "stemmer", + "language": "hindi" + }, + "hindi_override": { + "type": "stemmer_override", + "rules": [] + }, + "hungarian_stop": { + "type": "stop", + "stopwords": ["a", "ahogy", "ahol", "aki", "akik", "akkor", "alatt", "által", "általában", "amely", "amelyek", "amelyekben", "amelyeket", "amelyet", "amelynek", "ami", "amit", "amolyan", "amíg", "amikor", "át", "abban", "ahhoz", "annak", "arra", "arról", "az", "azok", "azon", "azt", "azzal", "azért", "aztán", "azután", "azonban", "bár", "be", "belül", "benne", "cikk", "cikkek", "cikkeket", "csak", "de", "e", "eddig", "egész", "egy", "egyes", "egyetlen", "egyéb", "egyik", "egyre", "ekkor", "el", "elég", "ellen", "elő", "először", "előtt", "első", "én", "éppen", "ebben", "ehhez", "emilyen", "ennek", "erre", "ez", "ezt", "ezek", "ezen", "ezzel", "ezért", "és", "fel", "felé", "hanem", "hiszen", "hogy", "hogyan", "igen", "így", "illetve", "ill.", "ill", "ilyen", "ilyenkor", "ison", "ismét", "itt", "jó", "jól", "jobban", "kell", "kellett", "keresztül", "keressünk", "ki", "kívül", "között", "közül", "legalább", "lehet", "lehetett", "legyen", "lenne", "lenni", "lesz", "lett", "maga", "magát", "majd", "majd", "már", "más", "másik", "meg", "még", "mellett", "mert", "mely", "melyek", "mi", "mit", "míg", "miért", "milyen", "mikor", "minden", "mindent", "mindenki", "mindig", "mint", "mintha", "mivel", "most", "nagy", "nagyobb", "nagyon", "ne", "néha", "nekem", "neki", "nem", "néhány", "nélkül", "nincs", "olyan", "ott", "össze", "ő", "ők", "őket", "pedig", "persze", "rá", 
"s", "saját", "sem", "semmi", "sok", "sokat", "sokkal", "számára", "szemben", "szerint", "szinte", "talán", "tehát", "teljes", "tovább", "továbbá", "több", "úgy", "ugyanis", "új", "újabb", "újra", "után", "utána", "utolsó", "vagy", "vagyis", "valaki", "valami", "valamint", "való", "vagyok", "van", "vannak", "volt", "voltam", "voltak", "voltunk", "vissza", "vele", "viszont", "volna"] + }, + "hungarian_keywords": { + "type": "keyword_marker", + "keywords": ["Helló", "világ", "keresés"] + }, + "hungarian_stemmer": { + "type": "stemmer", + "language": "hungarian" + }, + "hungarian_override": { + "type": "stemmer_override", + "rules": [] + }, + "indonesian_stop": { + "type": "stop", + "stopwords": ["ada", "adanya", "adalah", "adapun", "agak", "agaknya", "agar", "akan", "akankah", "akhirnya", "aku", "akulah", "amat", "amatlah", "anda", "andalah", "antar", "diantaranya", "antara", "antaranya", "diantara", "apa", "apaan", "mengapa", "apabila", "apakah", "apalagi", "apatah", "atau", "ataukah", "ataupun", "bagai", "bagaikan", "sebagai", "sebagainya", "bagaimana", "bagaimanapun", "sebagaimana", "bagaimanakah", "bagi", "bahkan", "bahwa", "bahwasanya", "sebaliknya", "banyak", "sebanyak", "beberapa", "seberapa", "begini", "beginian", "beginikah", "beginilah", "sebegini", "begitu", "begitukah", "begitulah", "begitupun", "sebegitu", "belum", "belumlah", "sebelum", "sebelumnya", "sebenarnya", "berapa", "berapakah", "berapalah", "berapapun", "betulkah", "sebetulnya", "biasa", "biasanya", "bila", "bilakah", "bisa", "bisakah", "sebisanya", "boleh", "bolehkah", "bolehlah", "buat", "bukan", "bukankah", "bukanlah", "bukannya", "cuma", "percuma", "dahulu", "dalam", "dan", "dapat", "dari", "daripada", "dekat", "demi", "demikian", "demikianlah", "sedemikian", "dengan", "depan", "di", "dia", "dialah", "dini", "diri", "dirinya", "terdiri", "dong", "dulu", "enggak", "enggaknya", "entah", "entahlah", "terhadap", "terhadapnya", "hal", "hampir", "hanya", "hanyalah", "harus", "haruslah", 
"harusnya", "seharusnya", "hendak", "hendaklah", "hendaknya", "hingga", "sehingga", "ia", "ialah", "ibarat", "ingin", "inginkah", "inginkan", "ini", "inikah", "inilah", "itu", "itukah", "itulah", "jangan", "jangankan", "janganlah", "jika", "jikalau", "juga", "justru", "kala", "kalau", "kalaulah", "kalaupun", "kalian", "kami", "kamilah", "kamu", "kamulah", "kan", "kapan", "kapankah", "kapanpun", "dikarenakan", "karena", "karenanya", "ke", "kecil", "kemudian", "kenapa", "kepada", "kepadanya", "ketika", "seketika", "khususnya", "kini", "kinilah", "kiranya", "sekiranya", "kita", "kitalah", "kok", "lagi", "lagian", "selagi", "lah", "lain", "lainnya", "melainkan", "selaku", "lalu", "melalui", "terlalu", "lama", "lamanya", "selama", "selama", "selamanya", "lebih", "terlebih", "bermacam", "macam", "semacam", "maka", "makanya", "makin", "malah", "malahan", "mampu", "mampukah", "mana", "manakala", "manalagi", "masih", "masihkah", "semasih", "masing", "mau", "maupun", "semaunya", "memang", "mereka", "merekalah", "meski", "meskipun", "semula", "mungkin", "mungkinkah", "nah", "namun", "nanti", "nantinya", "nyaris", "oleh", "olehnya", "seorang", "seseorang", "pada", "padanya", "padahal", "paling", "sepanjang", "pantas", "sepantasnya", "sepantasnyalah", "para", "pasti", "pastilah", "per", "pernah", "pula", "pun", "merupakan", "rupanya", "serupa", "saat", "saatnya", "sesaat", "saja", "sajalah", "saling", "bersama", "sama", "sesama", "sambil", "sampai", "sana", "sangat", "sangatlah", "saya", "sayalah", "se", "sebab", "sebabnya", "sebuah", "tersebut", "tersebutlah", "sedang", "sedangkan", "sedikit", "sedikitnya", "segala", "segalanya", "segera", "sesegera", "sejak", "sejenak", "sekali", "sekalian", "sekalipun", "sesekali", "sekaligus", "sekarang", "sekarang", "sekitar", "sekitarnya", "sela", "selain", "selalu", "seluruh", "seluruhnya", "semakin", "sementara", "sempat", "semua", "semuanya", "sendiri", "sendirinya", "seolah", "seperti", "sepertinya", "sering", "seringnya", "serta", 
"siapa", "siapakah", "siapapun", "disini", "disinilah", "sini", "sinilah", "sesuatu", "sesuatunya", "suatu", "sesudah", "sesudahnya", "sudah", "sudahkah", "sudahlah", "supaya", "tadi", "tadinya", "tak", "tanpa", "setelah", "telah", "tentang", "tentu", "tentulah", "tentunya", "tertentu", "seterusnya", "tapi", "tetapi", "setiap", "tiap", "setidaknya", "tidak", "tidakkah", "tidaklah", "toh", "waduh", "wah", "wahai", "sewaktu", "walau", "walaupun", "wong", "yaitu", "yakni", "yang"] + }, + "indonesian_keywords": { + "type": "keyword_marker", + "keywords": ["halo", "dunia", "pencarian"] + }, + "indonesian_stemmer": { + "type": "stemmer", + "language": "indonesian" + }, + "indonesian_override": { + "type": "stemmer_override", + "rules": [] + }, + "irish_elision": { + "type": "elision", + "articles": [ "h", "n", "t" ] + }, + "irish_stop": { + "type": "stop", + "stopwords": ["a", "ach", "ag", "agus", "an", "aon", "ar", "arna", "as", "b'", "ba", "beirt", "bhúr", "caoga", "ceathair", "ceathrar", "chomh", "chtó", "chuig", "chun", "cois", "céad", "cúig", "cúigear", "d'", "daichead", "dar", "de", "deich", "deichniúr", "den", "dhá", "do", "don", "dtí", "dá", "dár", "dó", "faoi", "faoin", "faoina", "faoinár", "fara", "fiche", "gach", "gan", "go", "gur", "haon", "hocht", "i", "iad", "idir", "in", "ina", "ins", "inár", "is", "le", "leis", "lena", "lenár", "m'", "mar", "mo", "mé", "na", "nach", "naoi", "naonúr", "ná", "ní", "níor", "nó", "nócha", "ocht", "ochtar", "os", "roimh", "sa", "seacht", "seachtar", "seachtó", "seasca", "seisear", "siad", "sibh", "sinn", "sna", "sé", "sí", "tar", "thar", "thú", "triúr", "trí", "trína", "trínár", "tríocha", "tú", "um", "ár", "é", "éis", "í", "ó", "ón", "óna", "ónár"] + }, + "irish_lowercase": { + "type": "lowercase", + "language": "irish" + }, + "irish_keywords": { + "type": "keyword_marker", + "keywords": ["sampla"] + }, + "irish_stemmer": { + "type": "stemmer", + "language": "irish" + }, + "irish_override": { + "type": "stemmer_override", + 
"rules": [] + }, + "italian_elision": { + "type": "elision", + "articles": [ + "c", "l", "all", "dall", "dell", + "nell", "sull", "coll", "pell", + "gl", "agl", "dagl", "degl", "negl", + "sugl", "un", "m", "t", "s", "v", "d" + ] + }, + "italian_stop": { + "type": "stop", + "stopwords": ["ad", "al", "allo", "ai", "agli", "all", "agl", "alla", "alle", "con", "col", "coi", "da", "dal", "dallo", "dai", "dagli", "dall", "dagl", "dalla", "dalle", "di", "del", "dello", "dei", "degli", "dell", "degl", "della", "delle", "in", "nel", "nello", "nei", "negli", "nell", "negl", "nella", "nelle", "su", "sul", "sullo", "sui", "sugli", "sull", "sugl", "sulla", "sulle", "per", "tra", "contro", "io", "tu", "lui", "lei", "noi", "voi", "loro", "mio", "mia", "miei", "mie", "tuo", "tua", "tuoi", "tue", "suo", "sua", "suoi", "sue", "nostro", "nostra", "nostri", "nostre", "vostro", "vostra", "vostri", "vostre", "mi", "ti", "ci", "vi", "lo", "la", "li", "le", "gli", "ne", "il", "un", "uno", "una", "ma", "ed", "se", "perché", "anche", "come", "dov", "dove", "che", "chi", "cui", "non", "più", "quale", "quanto", "quanti", "quanta", "quante", "quello", "quelli", "quella", "quelle", "questo", "questi", "questa", "queste", "si", "tutto", "tutti", "a", "c", "e", "i", "l", "o", "ho", "hai", "ha", "abbiamo", "avete", "hanno", "abbia", "abbiate", "abbiano", "avrò", "avrai", "avrà", "avremo", "avrete", "avranno", "avrei", "avresti", "avrebbe", "avremmo", "avreste", "avrebbero", "avevo", "avevi", "aveva", "avevamo", "avevate", "avevano", "ebbi", "avesti", "ebbe", "avemmo", "aveste", "ebbero", "avessi", "avesse", "avessimo", "avessero", "avendo", "avuto", "avuta", "avuti", "avute", "sono", "sei", "è", "siamo", "siete", "sia", "siate", "siano", "sarò", "sarai", "sarà", "saremo", "sarete", "saranno", "sarei", "saresti", "sarebbe", "saremmo", "sareste", "sarebbero", "ero", "eri", "era", "eravamo", "eravate", "erano", "fui", "fosti", "fu", "fummo", "foste", "furono", "fossi", "fosse", "fossimo", "fossero", 
"essendo", "faccio", "fai", "facciamo", "fanno", "faccia", "facciate", "facciano", "farò", "farai", "farà", "faremo", "farete", "faranno", "farei", "faresti", "farebbe", "faremmo", "fareste", "farebbero", "facevo", "facevi", "faceva", "facevamo", "facevate", "facevano", "feci", "facesti", "fece", "facemmo", "faceste", "fecero", "facessi", "facesse", "facessimo", "facessero", "facendo", "sto", "stai", "sta", "stiamo", "stanno", "stia", "stiate", "stiano", "starò", "starai", "starà", "staremo", "starete", "staranno", "starei", "staresti", "starebbe", "staremmo", "stareste", "starebbero", "stavo", "stavi", "stava", "stavamo", "stavate", "stavano", "stetti", "stesti", "stette", "stemmo", "steste", "stettero", "stessi", "stesse", "stessimo", "stessero", "stando"] + }, + "italian_keywords": { + "type": "keyword_marker", + "keywords": ["Ciao", "mondo", "ricerca"] + }, + "italian_stemmer": { + "type": "stemmer", + "language": "light_italian" + }, + "italian_override": { + "type": "stemmer_override", + "rules": [] + }, + "japanese_pos_filter" : { + "type" : "kuromoji_part_of_speech", + "stoptags" : [ + "その他", + "その他-間投", + "フィラー", + "感動詞", + "記号", + "記号-アルファベット", + "記号-一般", + "記号-括弧開", + "記号-括弧閉", + "記号-句点", + "記号-空白", + "記号-読点", + "語断片", + "助詞", + "助詞-格助詞", + "助詞-格助詞-一般", + "助詞-格助詞-引用", + "助詞-格助詞-連語", + "助詞-間投助詞", + "助詞-係助詞", + "助詞-終助詞", + "助詞-接続助詞", + "助詞-特殊", + "助詞-副詞化", + "助詞-副助詞", + "助詞-副助詞/並立助詞/終助詞", + "助詞-並立助詞", + "助詞-連体化", + "助動詞", + "接続詞", + "動詞-接尾", + "非言語音", + "連体詞" + ] + }, + "japanese_stop": { + "type": "stop", + "stopwords": [] + }, + "korean_stop": { + "type": "stop", + "stopwords": [] + }, + "latvian_stop": { + "type": "stop", + "stopwords": ["aiz", "ap", "ar", "apakš", "ārpus", "augšpus", "bez", "caur", "dēļ", "gar", "iekš", "iz", "kopš", "labad", "lejpus", "līdz", "no", "otrpus", "pa", "par", "pār", "pēc", "pie", "pirms", "pret", "priekš", "starp", "šaipus", "uz", "viņpus", "virs", "virspus", "zem", "apakšpus", "# Conjunctions", "un", "bet", "jo", "ja", 
"ka", "lai", "tomēr", "tikko", "turpretī", "arī", "kaut", "gan", "tādēļ", "tā", "ne", "tikvien", "vien", "kā", "ir", "te", "vai", "kamēr", "# Particles", "ar", "diezin", "droši", "diemžēl", "nebūt", "ik", "it", "taču", "nu", "pat", "tiklab", "iekšpus", "nedz", "tik", "nevis", "turpretim", "jeb", "iekam", "iekām", "iekāms", "kolīdz", "līdzko", "tiklīdz", "jebšu", "tālab", "tāpēc", "nekā", "itin", "jā", "jau", "jel", "nē", "nezin", "tad", "tikai", "vis", "tak", "iekams", "vien", "# modal verbs", "būt ", "biju ", "biji", "bija", "bijām", "bijāt", "esmu", "esi", "esam", "esat ", "būšu ", "būsi", "būs", "būsim", "būsiet", "tikt", "tiku", "tiki", "tika", "tikām", "tikāt", "tieku", "tiec", "tiek", "tiekam", "tiekat", "tikšu", "tiks", "tiksim", "tiksiet", "tapt", "tapi", "tapāt", "topat", "tapšu", "tapsi", "taps", "tapsim", "tapsiet", "kļūt", "kļuvu", "kļuvi", "kļuva", "kļuvām", "kļuvāt", "kļūstu", "kļūsti", "kļūst", "kļūstam", "kļūstat", "kļūšu", "kļūsi", "kļūs", "kļūsim", "kļūsiet", "# verbs", "varēt", "varēju", "varējām", "varēšu", "varēsim", "var", "varēji", "varējāt", "varēsi", "varēsiet", "varat", "varēja", "varēs"] + }, + "latvian_keywords": { + "type": "keyword_marker", + "keywords": ["sveiki", "pasaule", "meklēšana"] + }, + "latvian_stemmer": { + "type": "stemmer", + "language": "latvian" + }, + "latvian_override": { + "type": "stemmer_override", + "rules": [] + }, + "lithuanian_stop": { + "type": "stop", + "stopwords": ["ant", "apie", "ar", "arba", "aš", "be", "bei", "bet", "bus", "būti", "būtų", "buvo", "dėl", "gali", "į", "iki", "ir", "iš", "ja", "ją", "jai", "jais", "jam", "jame", "jas", "jei", "ji", "jį", "jie", "jiedu", "jiedvi", "jiedviem", "jiedviese", "jiems", "jis", "jo", "jodviem", "jog", "joje", "jomis", "joms", "jos", "jose", "jų", "judu", "judvi", "judviejų", "jųdviejų", "judviem", "judviese", "jumis", "jums", "jumyse", "juo", "juodu", "juodviese", "juos", "juose", "jus", "jūs", "jūsų", "ką", "kad", "kai", "kaip", "kas", "kiek", "kol", "kur", 
"kurie", "kuris", "man", "mane", "manęs", "manimi", "mano", "manyje", "mes", "metu", "mudu", "mudvi", "mudviejų", "mudviem", "mudviese", "mumis", "mums", "mumyse", "mus", "mūsų", "nei", "nes", "net", "nors", "nuo", "o", "pat", "per", "po", "prie", "prieš", "sau", "save", "savęs", "savimi", "savo", "savyje", "su", "tačiau", "tada", "tai", "taip", "tas", "tau", "tave", "tavęs", "tavimi", "tavyje", "ten", "to", "todėl", "tu", "tuo", "už", "visi", "yra"] + }, + "lithuanian_keywords": { + "type": "keyword_marker", + "keywords": ["Sveiki", "pasaulis", "paieška"] + }, + "lithuanian_stemmer": { + "type": "stemmer", + "language": "lithuanian" + }, + "lithuanian_override": { + "type": "stemmer_override", + "rules": [] + }, + "norwegian_stop": { + "type": "stop", + "stopwords": ["og", "i", "jeg", "det", "at", "en", "et", "den", "til", "er", "som", "på", "de", "med", "han", "av", "ikke", "ikkje", "der", "så", "var", "meg", "seg", "men", "ett", "har", "om", "vi", "min", "mitt", "ha", "hadde", "hun", "nå", "over", "da", "ved", "fra", "du", "ut", "sin", "dem", "oss", "opp", "man", "kan", "hans", "hvor", "eller", "hva", "skal", "selv", "sjøl", "her", "alle", "vil", "bli", "ble", "blei", "blitt", "kunne", "inn", "når", "være", "kom", "noen", "noe", "ville", "dere", "som", "deres", "kun", "ja", "etter", "ned", "skulle", "denne", "for", "deg", "si", "sine", "sitt", "mot", "å", "meget", "hvorfor", "dette", "disse", "uten", "hvordan", "ingen", "din", "ditt", "blir", "samme", "hvilken", "hvilke", "sånn", "inni", "mellom", "vår", "hver", "hvem", "vors", "hvis", "både", "bare", "enn", "fordi", "før", "mange", "også", "slik", "vært", "være", "båe", "begge", "siden", "dykk", "dykkar", "dei", "deira", "deires", "deim", "di", "då", "eg", "ein", "eit", "eitt", "elles", "honom", "hjå", "ho", "hoe", "henne", "hennar", "hennes", "hoss", "hossen", "ikkje", "ingi", "inkje", "korleis", "korso", "kva", "kvar", "kvarhelst", "kven", "kvi", "kvifor", "me", "medan", "mi", "mine", "mykje", "no", "nokon", 
"noka", "nokor", "noko", "nokre", "si", "sia", "sidan", "so", "somt", "somme", "um", "upp", "vere", "vore", "verte", "vort", "varte", "vart"] + }, + "norwegian_keywords": { + "type": "keyword_marker", + "keywords": ["Hallo", "verden", "Søk"] + }, + "norwegian_stemmer": { + "type": "stemmer", + "language": "norwegian" + }, + "norwegian_override": { + "type": "stemmer_override", + "rules": [] + }, + "persian_stop": { + "type": "stop", + "stopwords": ["انان", "نداشته", "سراسر", "خياه", "ايشان", "وي", "تاكنون", "بيشتري", "دوم", "پس", "ناشي", "وگو", "يا", "داشتند", "سپس", "هنگام", "هرگز", "پنج", "نشان", "امسال", "ديگر", "گروهي", "شدند", "چطور", "ده", "و", "دو", "نخستين", "ولي", "چرا", "چه", "وسط", "ه", "كدام", "قابل", "يك", "رفت", "هفت", "همچنين", "در", "هزار", "بله", "بلي", "شايد", "اما", "شناسي", "گرفته", "دهد", "داشته", "دانست", "داشتن", "خواهيم", "ميليارد", "وقتيكه", "امد", "خواهد", "جز", "اورده", "شده", "بلكه", "خدمات", "شدن", "برخي", "نبود", "بسياري", "جلوگيري", "حق", "كردند", "نوعي", "بعري", "نكرده", "نظير", "نبايد", "بوده", "بودن", "داد", "اورد", "هست", "جايي", "شود", "دنبال", "داده", "بايد", "سابق", "هيچ", "همان", "انجا", "كمتر", "كجاست", "گردد", "كسي", "تر", "مردم", "تان", "دادن", "بودند", "سري", "جدا", "ندارند", "مگر", "يكديگر", "دارد", "دهند", "بنابراين", "هنگامي", "سمت", "جا", "انچه", "خود", "دادند", "زياد", "دارند", "اثر", "بدون", "بهترين", "بيشتر", "البته", "به", "براساس", "بيرون", "كرد", "بعضي", "گرفت", "توي", "اي", "ميليون", "او", "جريان", "تول", "بر", "مانند", "برابر", "باشيم", "مدتي", "گويند", "اكنون", "تا", "تنها", "جديد", "چند", "بي", "نشده", "كردن", "كردم", "گويد", "كرده", "كنيم", "نمي", "نزد", "روي", "قصد", "فقط", "بالاي", "ديگران", "اين", "ديروز", "توسط", "سوم", "ايم", "دانند", "سوي", "استفاده", "شما", "كنار", "داريم", "ساخته", "طور", "امده", "رفته", "نخست", "بيست", "نزديك", "طي", "كنيد", "از", "انها", "تمامي", "داشت", "يكي", "طريق", "اش", "چيست", "روب", "نمايد", "گفت", "چندين", "چيزي", "تواند", "ام", "ايا", "با", "ان", "ايد", "ترين", "اينكه", 
"ديگري", "راه", "هايي", "بروز", "همچنان", "پاعين", "كس", "حدود", "مختلف", "مقابل", "چيز", "گيرد", "ندارد", "ضد", "همچون", "سازي", "شان", "مورد", "باره", "مرسي", "خويش", "برخوردار", "چون", "خارج", "شش", "هنوز", "تحت", "ضمن", "هستيم", "گفته", "فكر", "بسيار", "پيش", "براي", "روزهاي", "انكه", "نخواهد", "بالا", "كل", "وقتي", "كي", "چنين", "كه", "گيري", "نيست", "است", "كجا", "كند", "نيز", "يابد", "بندي", "حتي", "توانند", "عقب", "خواست", "كنند", "بين", "تمام", "همه", "ما", "باشند", "مثل", "شد", "اري", "باشد", "اره", "طبق", "بعد", "اگر", "صورت", "غير", "جاي", "بيش", "ريزي", "اند", "زيرا", "چگونه", "بار", "لطفا", "مي", "درباره", "من", "ديده", "همين", "گذاري", "برداري", "علت", "گذاشته", "هم", "فوق", "نه", "ها", "شوند", "اباد", "همواره", "هر", "اول", "خواهند", "چهار", "نام", "امروز", "مان", "هاي", "قبل", "كنم", "سعي", "تازه", "را", "هستند", "زير", "جلوي", "عنوان", "بود" ] + }, + "persian_keywords": { + "type": "keyword_marker", + "keywords": ["سلام", "جهان", "جستجو"] + }, + "portuguese_stop": { + "type": "stop", + "stopwords": ["de", "a", "o", "que", "e", "do", "da", "em", "um", "para", "com", "não", "uma", "os", "no", "se", "na", "por", "mais", "as", "dos", "como", "mas", "ao", "ele", "das", "à", "seu", "sua", "ou", "quando", "muito", "nos", "já", "eu", "também", "só", "pelo", "pela", "até", "isso", "ela", "entre", "depois", "sem", "mesmo", "aos", "seus", "quem", "nas", "me", "esse", "eles", "você", "essa", "num", "nem", "suas", "meu", "às", "minha", "numa", "pelos", "elas", "qual", "nós", "lhe", "deles", "essas", "esses", "pelas", "este", "dele", "tu", "te", "vocês", "vos", "lhes", "meus", "minhas", "teu", "tua", "teus", "tuas", "nosso", "nossa", "nossos", "nossas", "dela", "delas", "esta", "estes", "estas", "aquele", "aquela", "aqueles", "aquelas", "isto", "aquilo", "estou", "está", "estamos", "estão", "estive", "esteve", "estivemos", "estiveram", "estava", "estávamos", "estavam", "estivera", "estivéramos", "esteja", "estejamos", "estejam", "estivesse", "estivéssemos", 
"estivessem", "estiver", "estivermos", "estiverem", "hei", "há", "havemos", "hão", "houve", "houvemos", "houveram", "houvera", "houvéramos", "haja", "hajamos", "hajam", "houvesse", "houvéssemos", "houvessem", "houver", "houvermos", "houverem", "houverei", "houverá", "houveremos", "houverão", "houveria", "houveríamos", "houveriam", "sou", "somos", "são", "era", "éramos", "eram", "fui", "foi", "fomos", "foram", "fora", "fôramos", "seja", "sejamos", "sejam", "fosse", "fôssemos", "fossem", "for", "formos", "forem", "serei", "será", "seremos", "serão", "seria", "seríamos", "seriam", "tenho", "tem", "temos", "tém", "tinha", "tínhamos", "tinham", "tive", "teve", "tivemos", "tiveram", "tivera", "tivéramos", "tenha", "tenhamos", "tenham", "tivesse", "tivéssemos", "tivessem", "tiver", "tivermos", "tiverem", "terei", "terá", "teremos", "terão", "teria", "teríamos", "teriam"] + }, + "portuguese_keywords": { + "type": "keyword_marker", + "keywords": ["Olá", "mundo", "pesquisa"] + }, + "portuguese_stemmer": { + "type": "stemmer", + "language": "light_portuguese" + }, + "portuguese_override": { + "type": "stemmer_override", + "rules": [] + }, + "romanian_stop": { + "type": "stop", + "stopwords": ["acea", "aceasta", "această", "aceea", "acei", "aceia", "acel", "acela", "acele", "acelea", "acest", "acesta", "aceste", "acestea", "aceşti", "aceştia", "acolo", "acum", "ai", "aia", "aibă", "aici", "al", "ăla", "ale", "alea", "ălea", "altceva", "altcineva", "am", "ar", "are", "aş", "aşadar", "asemenea", "asta", "ăsta", "astăzi", "astea", "ăstea", "ăştia", "asupra", "aţi", "au", "avea", "avem", "aveţi", "azi", "bine", "bucur", "bună", "ca", "că", "căci", "când", "care", "cărei", "căror", "cărui", "cât", "câte", "câţi", "către", "câtva", "ce", "cel", "ceva", "chiar", "cînd", "cine", "cineva", "cît", "cîte", "cîţi", "cîtva", "contra", "cu", "cum", "cumva", "curând", "curînd", "da", "dă", "dacă", "dar", "datorită", "de", "deci", "deja", "deoarece", "departe", "deşi", "din", "dinaintea", 
"dintr", "dintre", "drept", "după", "ea", "ei", "el", "ele", "eram", "este", "eşti", "eu", "face", "fără", "fi", "fie", "fiecare", "fii", "fim", "fiţi", "iar", "ieri", "îi", "îl", "îmi", "împotriva", "în ", "înainte", "înaintea", "încât", "încît", "încotro", "între", "întrucât", "întrucît", "îţi", "la", "lângă", "le", "li", "lîngă", "lor", "lui", "mă", "mâine", "mea", "mei", "mele", "mereu", "meu", "mi", "mine", "mult", "multă", "mulţi", "ne", "nicăieri", "nici", "nimeni", "nişte", "noastră", "noastre", "noi", "noştri", "nostru", "nu", "ori", "oricând", "oricare", "oricât", "orice", "oricînd", "oricine", "oricît", "oricum", "oriunde", "până", "pe", "pentru", "peste", "pînă", "poate", "pot", "prea", "prima", "primul", "prin", "printr", "sa", "să", "săi", "sale", "sau", "său", "se", "şi", "sînt", "sîntem", "sînteţi", "spre", "sub", "sunt", "suntem", "sunteţi", "ta", "tăi", "tale", "tău", "te", "ţi", "ţie", "tine", "toată", "toate", "tot", "toţi", "totuşi", "tu", "un", "una", "unde", "undeva", "unei", "unele", "uneori", "unor", "vă", "vi", "voastră", "voastre", "voi", "voştri", "vostru", "vouă", "vreo", "vreun"] + }, + "romanian_keywords": { + "type": "keyword_marker", + "keywords": ["Alo", "lume", "căutare"] + }, + "romanian_stemmer": { + "type": "stemmer", + "language": "romanian" + }, + "romanian_override": { + "type": "stemmer_override", + "rules": [] + }, + "russian_stop": { + "type": "stop", + "stopwords": ["и", "в", "во", "не", "что", "он", "на", "я", "с", "со", "как", "а", "то", "все", "она", "так", "его", "но", "да", "ты", "к", "у", "же", "вы", "за", "бы", "по", "только", "ее", "мне", "было", "вот", "от", "меня", "еще", "нет", "о", "из", "ему", "теперь", "когда", "даже", "ну", "вдруг", "ли", "если", "уже", "или", "ни", "быть", "был", "него", "до", "вас", "нибудь", "опять", "уж", "вам", "сказал", "ведь", "там", "потом", "себя", "ничего", "ей", "может", "они", "тут", "где", "есть", "надо", "ней", "для", "мы", "тебя", "их", "чем", "была", "сам", "чтоб", "без", 
"будто", "человек", "чего", "раз", "тоже", "себе", "под", "жизнь", "будет", "ж", "тогда", "кто", "этот", "говорил", "того", "потому", "этого", "какой", "совсем", "ним", "здесь", "этом", "один", "почти", "мой", "тем", "чтобы", "нее", "кажется", "сейчас", "были", "куда", "зачем", "сказать", "всех", "никогда", "сегодня", "можно", "при", "наконец", "два", "об", "другой", "хоть", "после", "над", "больше", "тот", "через", "эти", "нас", "про", "всего", "них", "какая", "много", "разве", "сказала", "три", "эту", "моя", "впрочем", "хорошо", "свою", "этой", "перед", "иногда", "лучше", "чуть", "том", "нельзя", "такой", "им", "более", "всегда", "конечно", "всю", "между"] + }, + "russian_keywords": { + "type": "keyword_marker", + "keywords": ["привет", "мир", "поиск"] + }, + "russian_stemmer": { + "type": "stemmer", + "language": "russian" + }, + "russian_override": { + "type": "stemmer_override", + "rules": [] + }, + "simplified_chinese_stop": { + "type": "smartcn_stop", + "stopwords": ["_smartcn_"] + }, + "sorani_stop": { + "type": "stop", + "stopwords": ["و", "کە", "ی", "کرد", "ئەوەی", "سەر", "دوو", "هەروەها", "لەو", "دەکات", "چەند", "هەر", "ئەو", "ئەم", "من", "ئێمە", "تۆ", "ئێوە", "ئەو", "ئەوان", "بە", "پێ", "بەبێ", "بەدەم", "بەلای", "بەپێی", "بەرلە", "بەرەوی", "بەرەوە", "بەردەم", "بێ", "بێجگە", "بۆ", "دە", "تێ", "دەگەڵ", "دوای", "جگە", "لە", "لێ", "لەبەر", "لەبەینی", "لەبابەت", "لەبارەی", "لەباتی", "لەبن", "لەبرێتی", "لەدەم", "لەگەڵ", "لەلایەن", "لەناو", "لەنێو", "لەپێناوی", "لەرەوی", "لەرێ", "لەرێگا", "لەسەر", "لەژێر", "ناو", "نێوان", "پاش", "پێش", "وەک"] + }, + "sorani_keywords": { + "type": "keyword_marker", + "keywords": ["mînak"] + }, + "sorani_stemmer": { + "type": "stemmer", + "language": "sorani" + }, + "sorani_override": { + "type": "stemmer_override", + "rules": [] + }, + "spanish_stop": { + "type": "stop", + "stopwords": ["de", "la", "que", "el", "en", "y", "a", "los", "del", "se", "las", "por", "un", "para", "con", "no", "una", "su", "al", "lo", "como", "más", 
"pero", "sus", "le", "ya", "o", "este", "sí", "porque", "esta", "entre", "cuando", "muy", "sin", "sobre", "también", "me", "hasta", "hay", "donde", "quien", "desde", "todo", "nos", "durante", "todos", "uno", "les", "ni", "contra", "otros", "ese", "eso", "ante", "ellos", "e", "esto", "mí", "antes", "algunos", "qué", "unos", "yo", "otro", "otras", "otra", "él", "tanto", "esa", "estos", "mucho", "quienes", "nada", "muchos", "cual", "poco", "ella", "estar", "estas", "algunas", "algo", "nosotros", "mi", "mis", "tú", "te", "ti", "tu", "tus", "ellas", "nosotras", "vosotros", "vosotras", "os", "mío", "mía", "míos", "mías", "tuyo", "tuya", "tuyos", "tuyas", "suyo", "suya", "suyos", "suyas", "nuestro", "nuestra", "nuestros", "nuestras", "vuestro", "vuestra", "vuestros", "vuestras", "esos", "esas", "estoy", "estás", "está", "estamos", "estáis", "están", "esté", "estés", "estemos", "estéis", "estén", "estaré", "estarás", "estará", "estaremos", "estaréis", "estarán", "estaría", "estarías", "estaríamos", "estaríais", "estarían", "estaba", "estabas", "estábamos", "estabais", "estaban", "estuve", "estuviste", "estuvo", "estuvimos", "estuvisteis", "estuvieron", "estuviera", "estuvieras", "estuviéramos", "estuvierais", "estuvieran", "estuviese", "estuvieses", "estuviésemos", "estuvieseis", "estuviesen", "estando", "estado", "estada", "estados", "estadas", "estad", "he", "has", "ha", "hemos", "habéis", "han", "haya", "hayas", "hayamos", "hayáis", "hayan", "habré", "habrás", "habrá", "habremos", "habréis", "habrán", "habría", "habrías", "habríamos", "habríais", "habrían", "había", "habías", "habíamos", "habíais", "habían", "hube", "hubiste", "hubo", "hubimos", "hubisteis", "hubieron", "hubiera", "hubieras", "hubiéramos", "hubierais", "hubieran", "hubiese", "hubieses", "hubiésemos", "hubieseis", "hubiesen", "habiendo", "habido", "habida", "habidos", "habidas", "soy", "eres", "es", "somos", "sois", "son", "sea", "seas", "seamos", "seáis", "sean", "seré", "serás", "será", "seremos", 
"seréis", "serán", "sería", "serías", "seríamos", "seríais", "serían", "era", "eras", "éramos", "erais", "eran", "fui", "fuiste", "fue", "fuimos", "fuisteis", "fueron", "fuera", "fueras", "fuéramos", "fuerais", "fueran", "fuese", "fueses", "fuésemos", "fueseis", "fuesen", "siendo", "sido", "tengo", "tienes", "tiene", "tenemos", "tenéis", "tienen", "tenga", "tengas", "tengamos", "tengáis", "tengan", "tendré", "tendrás", "tendrá", "tendremos", "tendréis", "tendrán", "tendría", "tendrías", "tendríamos", "tendríais", "tendrían", "tenía", "tenías", "teníamos", "teníais", "tenían", "tuve", "tuviste", "tuvo", "tuvimos", "tuvisteis", "tuvieron", "tuviera", "tuvieras", "tuviéramos", "tuvierais", "tuvieran", "tuviese", "tuvieses", "tuviésemos", "tuvieseis", "tuviesen", "teniendo", "tenido", "tenida", "tenidos", "tenidas", "tened"] + }, + "spanish_keywords": { + "type": "keyword_marker", + "keywords": ["¡Hola", "mundo", "búsqueda"] + }, + "spanish_stemmer": { + "type": "stemmer", + "language": "light_spanish" + }, + "spanish_override": { + "type": "stemmer_override", + "rules": [] + }, + "swedish_stop": { + "type": "stop", + "stopwords": ["och", "det", "att", "i", "en", "jag", "hon", "som", "han", "på", "den", "med", "var", "sig", "för", "så", "till", "är", "men", "ett", "om", "hade", "de", "av", "icke", "mig", "du", "henne", "då", "sin", "nu", "har", "inte", "hans", "honom", "skulle", "hennes", "där", "min", "man", "ej", "vid", "kunde", "något", "från", "ut", "när", "efter", "upp", "vi", "dem", "vara", "vad", "över", "än", "dig", "kan", "sina", "här", "ha", "mot", "alla", "under", "någon", "eller", "allt", "mycket", "sedan", "ju", "denna", "själv", "detta", "åt", "utan", "varit", "hur", "ingen", "mitt", "ni", "bli", "blev", "oss", "din", "dessa", "några", "deras", "blir", "mina", "samma", "vilken", "er", "sådan", "vår", "blivit", "dess", "inom", "mellan", "sådant", "varför", "varje", "vilka", "ditt", "vem", "vilket", "sitta", "sådana", "vart", "dina", "vars", "vårt", "våra", 
"ert", "era", "vilkas"] + }, + "swedish_keywords": { + "type": "keyword_marker", + "keywords": ["Hallå", "material", "sök"] + }, + "swedish_stemmer": { + "type": "stemmer", + "language": "swedish" + }, + "swedish_override": { + "type": "stemmer_override", + "rules": [] + }, + "thai_stop": { + "type": "stop", + "stopwords": ["ไว้", "ไม่", "ไป", "ได้", "ให้", "ใน", "โดย", "แห่ง", "แล้ว", "และ", "แรก", "แบบ", "แต่", "เอง", "เห็น", "เลย", "เริ่ม", "เรา", "เมื่อ", "เพื่อ", "เพราะ", "เป็นการ", "เป็น", "เปิดเผย", "เปิด", "เนื่องจาก", "เดียวกัน", "เดียว", "เช่น", "เฉพาะ", "เคย", "เข้า", "เขา", "อีก", "อาจ", "อะไร", "ออก", "อย่าง", "อยู่", "อยาก", "หาก", "หลาย", "หลังจาก", "หลัง", "หรือ", "หนึ่ง", "ส่วน", "ส่ง", "สุด", "สําหรับ", "ว่า", "วัน", "ลง", "ร่วม", "ราย", "รับ", "ระหว่าง", "รวม", "ยัง", "มี", "มาก", "มา", "พร้อม", "พบ", "ผ่าน", "ผล", "บาง", "น่า", "นี้", "นํา", "นั้น", "นัก", "นอกจาก", "ทุก", "ที่สุด", "ที่", "ทําให้", "ทํา", "ทาง", "ทั้งนี้", "ทั้ง", "ถ้า", "ถูก", "ถึง", "ต้อง", "ต่างๆ", "ต่าง", "ต่อ", "ตาม", "ตั้งแต่", "ตั้ง", "ด้าน", "ด้วย", "ดัง", "ซึ่ง", "ช่วง", "จึง", "จาก", "จัด", "จะ", "คือ", "ความ", "ครั้ง", "คง", "ขึ้น", "ของ", "ขอ", "ขณะ", "ก่อน", "ก็", "การ", "กับ", "กัน", "กว่า", "กล่าว"] + }, + "thai_keywords": { + "type": "keyword_marker", + "keywords": ["สวัสดี", "โลก", "ค้นหา"] + }, + "turkish_stop": { + "type": "stop", + "stopwords": ["acaba", "altmış", "altı", "ama", "ancak", "arada", "aslında", "ayrıca", "bana", "bazı", "belki", "ben", "benden", "beni", "benim", "beri", "beş", "bile", "bin", "bir", "birçok", "biri", "birkaç", "birkez", "birşey", "birşeyi", "biz", "bize", "bizden", "bizi", "bizim", "böyle", "böylece", "bu", "buna", "bunda", "bundan", "bunlar", "bunları", "bunların", "bunu", "bunun", "burada", "çok", "çünkü", "da", "daha", "dahi", "de", "defa", "değil", "diğer", "diye", "doksan", "dokuz", "dolayı", "dolayısıyla", "dört", "edecek", "eden", "ederek", "edilecek", "ediliyor", "edilmesi", "ediyor", "eğer", "elli", "en", "etmesi", 
"etti", "ettiği", "ettiğini", "gibi", "göre", "halen", "hangi", "hatta", "hem", "henüz", "hep", "hepsi", "her", "herhangi", "herkesin", "hiç", "hiçbir", "için", "iki", "ile", "ilgili", "ise", "işte", "itibaren", "itibariyle", "kadar", "karşın", "katrilyon", "kendi", "kendilerine", "kendini", "kendisi", "kendisine", "kendisini", "kez", "ki", "kim", "kimden", "kime", "kimi", "kimse", "kırk", "milyar", "milyon", "mu", "mü", "mı", "nasıl", "ne", "neden", "nedenle", "nerde", "nerede", "nereye", "niye", "niçin", "o", "olan", "olarak", "oldu", "olduğu", "olduğunu", "olduklarını", "olmadı", "olmadığı", "olmak", "olması", "olmayan", "olmaz", "olsa", "olsun", "olup", "olur", "olursa", "oluyor", "on", "ona", "ondan", "onlar", "onlardan", "onları", "onların", "onu", "onun", "otuz", "oysa", "öyle", "pek", "rağmen", "sadece", "sanki", "sekiz", "seksen", "sen", "senden", "seni", "senin", "siz", "sizden", "sizi", "sizin", "şey", "şeyden", "şeyi", "şeyler", "şöyle", "şu", "şuna", "şunda", "şundan", "şunları", "şunu", "tarafından", "trilyon", "tüm", "üç", "üzere", "var", "vardı", "ve", "veya", "ya", "yani", "yapacak", "yapılan", "yapılması", "yapıyor", "yapmak", "yaptı", "yaptığı", "yaptığını", "yaptıkları", "yedi", "yerine", "yetmiş", "yine", "yirmi", "yoksa", "yüz", "zaten"] + }, + "turkish_lowercase": { + "type": "lowercase", + "language": "turkish" + }, + "turkish_keywords": { + "type": "keyword_marker", + "keywords": ["Merhaba", "Dünya", "arama"] + }, + "turkish_stemmer": { + "type": "stemmer", + "language": "turkish" + }, + "turkish_override": { + "type": "stemmer_override", + "rules": [] + }, + "truncate10_filter" : { + "type" : "truncate", + "length" : 10 + }, + "truncate20_filter" : { + "type" : "truncate", + "length" : 20 + }, + "synonym_filter" : { + "type" : "synonym_graph", + "synonyms": ["fess,フエス"] + } + }, + "tokenizer": { + "japanese_tokenizer": { + "type": "kuromoji_tokenizer", + "mode": "normal", + "discard_punctuation": false, + "user_dictionary_rules": 
["令和,令和,レイワ,名詞-固有名詞-一般", "日本経済新聞,日本 経済 新聞,ニホン ケイザイ シンブン,カスタム名詞", "関西国際空港,関西 国際 空港,カンサイ コクサイ クウコウ,テスト名詞", "朝青龍,朝青龍,アサショウリュウ,カスタム名詞"] + }, + "korean_tokenizer": { + "type": "nori_tokenizer", + "decompound_mode": "mixed", + "user_dictionary_rules": ["덕후", "버카충", "낄끼빠빠" ] + }, + "simplified_chinese_tokenizer": { + "type": "smartcn_tokenizer" + } + }, + "analyzer": { + "arabic_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "arabic_stop", + "arabic_normalization", + "arabic_keywords", + "arabic_override", + "arabic_stemmer" + ] + }, + "armenian_analyzer": { + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "armenian_stop", + "armenian_keywords", + "armenian_override", + "armenian_stemmer" + ] + }, + "basque_analyzer": { + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "basque_stop", + "basque_keywords", + "basque_override", + "basque_stemmer" + ] + }, + "brazilian_analyzer": { + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "brazilian_stop", + "brazilian_keywords", + "brazilian_override", + "brazilian_stemmer" + ] + }, + "bulgarian_analyzer": { + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "bulgarian_stop", + "bulgarian_keywords", + "bulgarian_override", + "bulgarian_stemmer" + ] + }, + "catalan_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "catalan_elision", + "lowercase", + "catalan_stop", + "catalan_keywords", + "catalan_override", + "catalan_stemmer" + ] + }, + "czech_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "czech_stop", + "czech_keywords", + "czech_override", + "czech_stemmer" + ] + }, + "danish_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "danish_stop", + "danish_keywords", + 
"danish_override", + "danish_stemmer" + ] + }, + "dutch_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "dutch_stop", + "dutch_keywords", + "dutch_override", + "dutch_stemmer" + ] + }, + "english_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "english_keywords", + "english_override", + "possessive_stemmer_en_filter" + ] + }, + "finnish_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "finnish_stop", + "finnish_keywords", + "finnish_override", + "finnish_stemmer" + ] + }, + "french_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "french_elision", + "lowercase", + "french_stop", + "french_keywords", + "french_override", + "french_stemmer" + ] + }, + "galician_analyzer": { + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "galician_stop", + "galician_keywords", + "galician_override", + "galician_stemmer" + ] + }, + "german_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "german_stop", + "german_normalization", + "german_override", + "german_stemmer" + ] + }, + "greek_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "greek_lowercase", + "greek_stop", + "greek_keywords", + "greek_override", + "greek_stemmer" + ] + }, + "hindi_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "indic_normalization", + "hindi_normalization", + "hindi_stop", + "hindi_keywords", + "hindi_override", + "hindi_stemmer" + ] + }, + "hungarian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "hungarian_stop", + "hungarian_keywords", + "hungarian_override", + "hungarian_stemmer" + ] 
+ }, + "indonesian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "indonesian_stop", + "indonesian_keywords", + "indonesian_override", + "indonesian_stemmer" + ] + }, + "irish_analyzer": { + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "irish_stop", + "irish_elision", + "irish_lowercase", + "irish_keywords", + "irish_override", + "irish_stemmer" + ] + }, + "italian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "italian_elision", + "lowercase", + "italian_stop", + "italian_keywords", + "italian_override", + "italian_stemmer" + ] + }, + "japanese_analyzer": { + "type": "custom", + "char_filter": [ + "mapping_ja_filter", + "kuromoji_iteration_mark" + ], + "tokenizer": "japanese_tokenizer", + "filter": [ + "truncate10_filter", + "kuromoji_baseform", + "kuromoji_stemmer", + "japanese_pos_filter", + "lowercase", + "japanese_stop" + ] + }, + "korean_analyzer": { + "type": "custom", + "tokenizer":"korean_tokenizer", + "filter": [ + "truncate10_filter", + "lowercase", + "korean_stop" + ] + }, + "latvian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "latvian_stop", + "latvian_keywords", + "latvian_override", + "latvian_stemmer" + ] + }, + "lithuanian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "lithuanian_stop", + "lithuanian_keywords", + "lithuanian_override", + "lithuanian_stemmer" + ] + }, + "norwegian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "norwegian_stop", + "norwegian_keywords", + "norwegian_override", + "norwegian_stemmer" + ] + }, + "persian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "char_filter": [ "mapping_fa_filter" ], + "filter": [ + "truncate20_filter", + "lowercase", + "arabic_normalization", + 
"persian_normalization", + "persian_stop" + ] + }, + "portuguese_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "portuguese_stop", + "portuguese_keywords", + "portuguese_override", + "portuguese_stemmer" + ] + }, + "romanian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "romanian_stop", + "romanian_override", + "romanian_stemmer" + ] + }, + "russian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "russian_stop", + "russian_keywords", + "russian_override", + "russian_stemmer" + ] + }, + "simplified_chinese_analyzer": { + "tokenizer": "smartcn_tokenizer", + "filter": [ + "truncate10_filter", + "lowercase", + "simplified_chinese_stop" + ] + }, + "sorani_analyzer": { + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "sorani_normalization", + "lowercase", + "sorani_stop", + "sorani_keywords", + "sorani_override", + "sorani_stemmer" + ] + }, + "spanish_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "spanish_stop", + "spanish_keywords", + "spanish_override", + "spanish_stemmer" + ] + }, + "swedish_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "lowercase", + "swedish_stop", + "swedish_keywords", + "swedish_override", + "swedish_stemmer" + ] + }, + "thai_analyzer": { + "type": "custom", + "tokenizer": "thai", + "filter": [ + "truncate20_filter", + "lowercase", + "thai_stop" + ] + }, + "turkish_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "apostrophe", + "turkish_lowercase", + "turkish_stop", + "turkish_keywords", + "turkish_override", + "turkish_stemmer" + ] + }, + "standard_analyzer": { + "type": "custom", + "char_filter": [ + "mapping_filter" + ], + "tokenizer": "standard", + "filter": [ 
+ "truncate20_filter", + "cjk_bigram", + "lowercase", + "asciifolding", + "stopword_en_filter", + "english_keywords", + "english_override", + "stemmer_en_filter" + ] + }, + "standard_search_analyzer": { + "type": "custom", + "char_filter": [ + "mapping_filter" + ], + "tokenizer": "standard", + "filter": [ + "truncate20_filter", + "cjk_bigram", + "lowercase", + "stopword_en_filter", + "synonym_filter", + "english_keywords", + "english_override", + "stemmer_en_filter" + ] + }, + "empty_analyzer": { + "type": "custom", + "tokenizer": "standard", + "char_filter": [ + "removeall_filter" + ] + } + } + } + }, + "mappings": { + "_source": { + "excludes": [ + "content_ar", + "content_bg", + "content_bn", + "content_ca", + "content_ckb-iq", + "content_cs", + "content_da", + "content_de", + "content_el", + "content_en", + "content_en-ie", + "content_es", + "content_et", + "content_eu", + "content_fa", + "content_fi", + "content_fr", + "content_gl", + "content_gu", + "content_he", + "content_hi", + "content_hr", + "content_hu", + "content_hy", + "content_id", + "content_it", + "content_ja", + "content_ko", + "content_lt", + "content_lv", + "content_mk", + "content_ml", + "content_nl", + "content_no", + "content_pa", + "content_pl", + "content_pt", + "content_pt-br", + "content_ro", + "content_ru", + "content_si", + "content_sq", + "content_sv", + "content_ta", + "content_te", + "content_th", + "content_tl", + "content_tr", + "content_uk", + "content_ur", + "content_vi", + "content_zh-cn", + "content_zh-tw", + "important_content_ar", + "important_content_bg", + "important_content_bn", + "important_content_ca", + "important_content_ckb-iq", + "important_content_cs", + "important_content_da", + "important_content_de", + "important_content_el", + "important_content_en", + "important_content_en-ie", + "important_content_es", + "important_content_et", + "important_content_eu", + "important_content_fa", + "important_content_fi", + "important_content_fr", + "important_content_gl", + 
"important_content_gu", + "important_content_he", + "important_content_hi", + "important_content_hr", + "important_content_hu", + "important_content_hy", + "important_content_id", + "important_content_it", + "important_content_ja", + "important_content_ko", + "important_content_lt", + "important_content_lv", + "important_content_mk", + "important_content_ml", + "important_content_nl", + "important_content_no", + "important_content_pa", + "important_content_pl", + "important_content_pt", + "important_content_pt-br", + "important_content_ro", + "important_content_ru", + "important_content_si", + "important_content_sq", + "important_content_sv", + "important_content_ta", + "important_content_te", + "important_content_th", + "important_content_tl", + "important_content_tr", + "important_content_uk", + "important_content_ur", + "important_content_vi", + "important_content_zh-cn", + "important_content_zh-tw", + "title_ar", + "title_bg", + "title_bn", + "title_ca", + "title_ckb-iq", + "title_cs", + "title_da", + "title_de", + "title_el", + "title_en", + "title_en-ie", + "title_es", + "title_et", + "title_eu", + "title_fa", + "title_fi", + "title_fr", + "title_gl", + "title_gu", + "title_he", + "title_hi", + "title_hr", + "title_hu", + "title_hy", + "title_id", + "title_it", + "title_ja", + "title_ko", + "title_lt", + "title_lv", + "title_mk", + "title_ml", + "title_nl", + "title_no", + "title_pa", + "title_pl", + "title_pt", + "title_pt-br", + "title_ro", + "title_ru", + "title_si", + "title_sq", + "title_sv", + "title_ta", + "title_te", + "title_th", + "title_tl", + "title_tr", + "title_uk", + "title_ur", + "title_vi", + "title_zh-cn", + "title_zh-tw" + ] + } + } +} diff --git a/src/main/resources/fess_indices/_cloud/fess/doc.json b/src/main/resources/fess_indices/_cloud/fess/doc.json new file mode 100644 index 000000000..9e49f15f8 --- /dev/null +++ b/src/main/resources/fess_indices/_cloud/fess/doc.json @@ -0,0 +1,592 @@ +{ + "dynamic_templates": [ + { + "lang_ar": { + 
"match": "*_ar", + "mapping": { + "type": "text", + "analyzer": "arabic_analyzer" + } + } + }, + { + "lang_bg": { + "match": "*_bg", + "mapping": { + "type": "text", + "analyzer": "bulgarian_analyzer" + } + } + }, + { + "lang_bn": { + "match": "*_bn", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_ca": { + "match": "*_ca", + "mapping": { + "type": "text", + "analyzer": "catalan_analyzer" + } + } + }, + { + "lang_ca": { + "match": "*_ckb-iq", + "mapping": { + "type": "text", + "analyzer": "sorani_analyzer" + } + } + }, + { + "lang_cs": { + "match": "*_cs", + "mapping": { + "type": "text", + "analyzer": "czech_analyzer" + } + } + }, + { + "lang_da": { + "match": "*_da", + "mapping": { + "type": "text", + "analyzer": "danish_analyzer" + } + } + }, + { + "lang_de": { + "match": "*_de", + "mapping": { + "type": "text", + "analyzer": "german_analyzer" + } + } + }, + { + "lang_el": { + "match": "*_el", + "mapping": { + "type": "text", + "analyzer": "greek_analyzer" + } + } + }, + { + "lang_en": { + "match": "*_en", + "mapping": { + "type": "text", + "analyzer": "english_analyzer" + } + } + }, + { + "lang_en": { + "match": "*_en-ie", + "mapping": { + "type": "text", + "analyzer": "irish_analyzer" + } + } + }, + { + "lang_es": { + "match": "*_es", + "mapping": { + "type": "text", + "analyzer": "spanish_analyzer" + } + } + }, + { + "lang_et": { + "match": "*_et", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_et": { + "match": "*_eu", + "mapping": { + "type": "text", + "analyzer": "basque_analyzer" + } + } + }, + { + "lang_fa": { + "match": "*_fa", + "mapping": { + "type": "text", + "analyzer": "persian_analyzer" + } + } + }, + { + "lang_fi": { + "match": "*_fi", + "mapping": { + "type": "text", + "analyzer": "finnish_analyzer" + } + } + }, + { + "lang_fr": { + "match": "*_fr", + "mapping": { + "type": "text", + "analyzer": "french_analyzer" + } + } + }, + { + "lang_gl": { + "match": "*_gl", 
+ "mapping": { + "type": "text", + "analyzer": "galician_analyzer" + } + } + }, + { + "lang_gu": { + "match": "*_gu", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_he": { + "match": "*_he", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_hi": { + "match": "*_hi", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_hr": { + "match": "*_hr", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_hu": { + "match": "*_hu", + "mapping": { + "type": "text", + "analyzer": "hungarian_analyzer" + } + } + }, + { + "lang_hu": { + "match": "*_hy", + "mapping": { + "type": "text", + "analyzer": "armenian_analyzer" + } + } + }, + { + "lang_id": { + "match": "*_id", + "mapping": { + "type": "text", + "analyzer": "indonesian_analyzer" + } + } + }, + { + "lang_it": { + "match": "*_it", + "mapping": { + "type": "text", + "analyzer": "italian_analyzer" + } + } + }, + { + "lang_ja": { + "match": "*_ja", + "mapping": { + "type": "text", + "analyzer": "japanese_analyzer" + } + } + }, + { + "lang_ko": { + "match": "*_ko", + "mapping": { + "type": "text", + "analyzer": "korean_analyzer" + } + } + }, + { + "lang_lt": { + "match": "*_lt", + "mapping": { + "type": "text", + "analyzer": "lithuanian_analyzer" + } + } + }, + { + "lang_lv": { + "match": "*_lv", + "mapping": { + "type": "text", + "analyzer": "latvian_analyzer" + } + } + }, + { + "lang_mk": { + "match": "*_mk", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_ml": { + "match": "*_ml", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_nl": { + "match": "*_nl", + "mapping": { + "type": "text", + "analyzer": "dutch_analyzer" + } + } + }, + { + "lang_no": { + "match": "*_no", + "mapping": { + "type": "text", + "analyzer": "norwegian_analyzer" + } + } + }, + { + "lang_pa": { + "match": "*_pa", + "mapping": 
{ + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_pl": { + "match": "*_pl", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_pt": { + "match": "*_pt", + "mapping": { + "type": "text", + "analyzer": "portuguese_analyzer" + } + } + }, + { + "lang_pt-br": { + "match": "*_pt-br", + "mapping": { + "type": "text", + "analyzer": "brazilian_analyzer" + } + } + }, + { + "lang_ro": { + "match": "*_ro", + "mapping": { + "type": "text", + "analyzer": "romanian_analyzer" + } + } + }, + { + "lang_ru": { + "match": "*_ru", + "mapping": { + "type": "text", + "analyzer": "russian_analyzer" + } + } + }, + { + "lang_si": { + "match": "*_si", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_sq": { + "match": "*_sq", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_sv": { + "match": "*_sv", + "mapping": { + "type": "text", + "analyzer": "swedish_analyzer" + } + } + }, + { + "lang_ta": { + "match": "*_ta", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_te": { + "match": "*_te", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_th": { + "match": "*_th", + "mapping": { + "type": "text", + "analyzer": "thai_analyzer" + } + } + }, + { + "lang_tl": { + "match": "*_tl", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_tr": { + "match": "*_tr", + "mapping": { + "type": "text", + "analyzer": "turkish_analyzer" + } + } + }, + { + "lang_uk": { + "match": "*_uk", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_ur": { + "match": "*_ur", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_vi": { + "match": "*_vi", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + }, + { + "lang_zh-cn": { + "match": "*_zh-cn", + "mapping": { + "type": 
"text", + "analyzer": "simplified_chinese_analyzer" + } + } + }, + { + "lang_zh-tw": { + "match": "*_zh-tw", + "mapping": { + "type": "text", + "analyzer": "empty_analyzer" + } + } + } + ], + "properties": { + "anchor": { + "type": "keyword" + }, + "boost": { + "type": "float" + }, + "click_count": { + "type": "long" + }, + "config_id": { + "type": "keyword" + }, + "important_content": { + "type": "text", + "analyzer": "standard_analyzer", + "search_analyzer": "standard_search_analyzer", + "term_vector": "with_positions_offsets" + }, + "content": { + "type": "text", + "analyzer": "standard_analyzer", + "search_analyzer": "standard_search_analyzer", + "term_vector": "with_positions_offsets" + }, + "content_minhash": { + "type": "keyword", + "index": false + }, + "content_minhash_bits": { + "type": "keyword", + "index": false + }, + "content_length": { + "type": "long" + }, + "created": { + "type": "date", + "format": "date_optional_time" + }, + "timestamp": { + "type": "date", + "format": "date_optional_time" + }, + "expires": { + "type": "date", + "format": "date_optional_time" + }, + "digest": { + "type": "text", + "index": false + }, + "doc_id": { + "type": "keyword" + }, + "favorite_count": { + "type": "long" + }, + "filename": { + "type": "keyword" + }, + "filetype": { + "type": "keyword" + }, + "host": { + "type": "keyword" + }, + "lang": { + "type": "keyword" + }, + "last_modified": { + "type": "date", + "format": "date_optional_time" + }, + "location": { + "type": "geo_point" + }, + "mimetype": { + "type": "keyword" + }, + "parent_id": { + "type": "keyword" + }, + "role": { + "type": "keyword" + }, + "label": { + "type": "keyword" + }, + "virtual_host": { + "type": "keyword" + }, + "segment": { + "type": "keyword" + }, + "site": { + "type": "keyword" + }, + "title": { + "type": "text", + "analyzer": "standard_analyzer", + "search_analyzer": "standard_search_analyzer", + "term_vector": "with_positions_offsets" + }, + "thumbnail": { + "type": "keyword" + }, + 
"url": { + "type": "keyword" + } + } +} diff --git a/src/main/resources/suggest_indices/_cloud/suggest_analyzer.json b/src/main/resources/suggest_indices/_cloud/suggest_analyzer.json new file mode 100644 index 000000000..6ae494199 --- /dev/null +++ b/src/main/resources/suggest_indices/_cloud/suggest_analyzer.json @@ -0,0 +1,1707 @@ +{ + "index": { + "refresh_interval": "1s", + "number_of_shards": 1, + "number_of_replicas": 0, + "auto_expand_replicas": "0-1" + }, + "analysis" : { + "tokenizer" : { + "fess_japanese_normal" : { + "type" : "kuromoji_tokenizer", + "mode" : "normal", + "discard_punctuation" : "false" + }, + "fess_korean_normal": { + "type": "nori_tokenizer", + "decompound_mode": "mixed", + "user_dictionary_rules": ["덕후", "버카충", "낄끼빠빠" ] + } + }, + "analyzer" : { + "reading_analyzer" : { + "type" : "custom", + "tokenizer" : "fess_japanese_normal", + "filter" : ["reading_form"] + }, + "reading_term_analyzer" : { + "type" : "custom", + "tokenizer" : "fess_japanese_normal" + }, + "normalize_analyzer" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer" : { + "type" : "custom", + "tokenizer" : "fess_japanese_normal", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "pos_filter", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer" : { + "type" : "custom", + "tokenizer" : "fess_japanese_normal", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "pos_filter", "content_length_filter", "limit_token_count_filter", "reading_form"] + }, + "reading_analyzer_ja" : { + "type" : "custom", + "tokenizer" : "fess_japanese_normal", + "filter" : ["reading_form"] + }, + "reading_term_analyzer_ja" : { + "type" : "custom", + "tokenizer" : "fess_japanese_normal" + }, + "normalize_analyzer_ja" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + 
"filter" : ["lowercase"] + }, + "contents_analyzer_ja" : { + "type" : "custom", + "tokenizer" : "fess_japanese_normal", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "pos_filter", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_ja" : { + "type" : "custom", + "tokenizer" : "fess_japanese_normal", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "pos_filter", "content_length_filter", "limit_token_count_filter", "reading_form"] + }, + "reading_analyzer_en" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_en" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_en" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_en" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "english_keywords"] + }, + "contents_reading_analyzer_en" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "english_keywords"] + }, + "reading_analyzer_ko" : { + "type" : "custom", + "tokenizer" : "fess_korean_normal" + }, + "reading_term_analyzer_ko" : { + "type" : "custom", + "tokenizer" : "fess_korean_normal" + }, + "normalize_analyzer_ko" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_ko" : { + "type" : "custom", + "tokenizer" : "fess_korean_normal", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "english_keywords"] + }, + "contents_reading_analyzer_ko" : { + "type" : "custom", + 
"tokenizer" : "fess_korean_normal", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "english_keywords"] + }, + "reading_analyzer_ar" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_ar" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_ar" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_ar" : { + "type" : "custom", + "tokenizer" : "standard", + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "arabic_stop", "arabic_keywords"] + }, + "contents_reading_analyzer_ar" : { + "type" : "custom", + "tokenizer" : "standard", + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "arabic_stop", "arabic_normalization", "arabic_keywords"] + }, + "reading_analyzer_bg" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_bg" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_bg" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_bg" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter", "bulgarian_stop", "bulgarian_keywords", "bulgarian_stemmer"] + }, + "contents_reading_analyzer_bg" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter", "bulgarian_stop", "bulgarian_keywords", "bulgarian_stemmer"] + }, + "reading_analyzer_ca" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_ca" : { + "type" : "custom", + "tokenizer" : "standard" + }, + 
"normalize_analyzer_ca" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "catalan_elision"] + }, + "contents_analyzer_ca" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "catalan_elision", "catalan_stop", "catalan_keywords"] + }, + "contents_reading_analyzer_ca" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "catalan_elision", "catalan_stop", "catalan_keywords"] + }, + "reading_analyzer_cs" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_cs" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_cs" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_cs" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "czech_stop", "czech_keywords"] + }, + "contents_reading_analyzer_cs" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "czech_stop", "czech_keywords"] + }, + "reading_analyzer_da" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_da" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_da" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_da" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : 
["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "danish_stop", "danish_keywords"] + }, + "contents_reading_analyzer_da" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "danish_stop", "danish_keywords"] + }, + "reading_analyzer_nl" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_nl" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_nl" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "dutch_override"] + }, + "contents_analyzer_nl" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "dutch_stop", "dutch_keywords", "dutch_override"] + }, + "contents_reading_analyzer_nl" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "dutch_stop", "dutch_keywords", "dutch_override"] + }, + "reading_analyzer_fi" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_fi" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_fi" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_fi" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "finnish_stop", "finnish_keywords"] + }, + "contents_reading_analyzer_fi" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", 
"stopword_en_filter", "content_length_filter", "limit_token_count_filter", "finnish_stop", "finnish_keywords"] + }, + "reading_analyzer_fr" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_fr" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_fr" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "french_elision"] + }, + "contents_analyzer_fr" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "french_elision", "french_stop", "french_keywords"] + }, + "contents_reading_analyzer_fr" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "french_elision", "french_stop", "french_keywords"] + }, + "reading_analyzer_de" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_de" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_de" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_de" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "german_stop", "german_keywords"] + }, + "contents_reading_analyzer_de" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "german_stop", "german_keywords", "german_normalization"] + }, + "reading_analyzer_el" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_el" : { + "type" : "custom", + 
"tokenizer" : "standard" + }, + "normalize_analyzer_el" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["greek_lowercase", "lowercase"] + }, + "contents_analyzer_el" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["greek_lowercase", "lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "greek_stop", "greek_keywords"] + }, + "contents_reading_analyzer_el" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["greek_lowercase", "lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "greek_stop", "greek_keywords"] + }, + + "reading_analyzer_hu" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_hu" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_hu" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_hu" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "hungarian_stop", "hungarian_keywords"] + }, + "contents_reading_analyzer_hu" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "hungarian_stop", "hungarian_keywords"] + }, + "reading_analyzer_id" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_id" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_id" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_id" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" 
: ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "indonesian_stop", "indonesian_keywords"] + }, + "contents_reading_analyzer_id" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "indonesian_stop", "indonesian_keywords"] + }, + "reading_analyzer_it" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_it" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_it" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "italian_elision"] + }, + "contents_analyzer_it" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "italian_elision", "italian_stop", "italian_keywords"] + }, + "contents_reading_analyzer_it" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "italian_elision", "italian_stop", "italian_keywords"] + }, + "reading_analyzer_lv" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_lv" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_lv" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_lv" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "latvian_stop", "latvian_keywords"] + }, + "contents_reading_analyzer_lv" : { + "type" : "custom", + "tokenizer" : "standard", + 
"char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "latvian_stop", "latvian_keywords"] + }, + "reading_analyzer_lt" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_lt" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_lt" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_lt" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "lithuanian_stop", "lithuanian_keywords"] + }, + "contents_reading_analyzer_lt" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "lithuanian_stop", "lithuanian_keywords"] + }, + "reading_analyzer_no" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_no" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_no" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_no" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "norwegian_stop", "norwegian_keywords"] + }, + "contents_reading_analyzer_no" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "norwegian_stop", "norwegian_keywords"] + }, + "reading_analyzer_fa" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_fa" : { + "type" : 
"custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_fa" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_fa" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "persian_stop"] + }, + "contents_reading_analyzer_fa" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "arabic_normalization", "persian_normalization", "persian_stop"] + }, + "reading_analyzer_pt" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_pt" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_pt" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_pt" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "portuguese_stop", "portuguese_keywords"] + }, + "contents_reading_analyzer_pt" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "portuguese_stop", "portuguese_keywords"] + }, + "reading_analyzer_ro" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_ro" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_ro" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_ro" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + 
"filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "romanian_stop", "romanian_keywords"] + }, + "contents_reading_analyzer_ro" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "romanian_stop", "romanian_keywords"] + }, + "reading_analyzer_ru" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_ru" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_ru" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_ru" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "russian_stop", "russian_keywords"] + }, + "contents_reading_analyzer_ru" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "russian_stop", "russian_keywords"] + }, + "reading_analyzer_es" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_es" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_es" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_es" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "spanish_stop", "spanish_keywords"] + }, + "contents_reading_analyzer_es" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", 
"content_length_filter", "limit_token_count_filter", "spanish_stop", "spanish_keywords"] + }, + "reading_analyzer_sv" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_sv" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_sv" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_sv" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "swedish_stop", "swedish_keywords"] + }, + "contents_reading_analyzer_sv" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "swedish_stop", "swedish_keywords"] + }, + "reading_analyzer_tr" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_tr" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_tr" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "apostrophe", "turkish_lowercase", "turkish_stemmer"] + }, + "contents_analyzer_tr" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "apostrophe", "turkish_lowercase", "turkish_stop", "turkish_keywords"] + }, + "contents_reading_analyzer_tr" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "apostrophe", "turkish_lowercase", "turkish_stop", "turkish_keywords"] + }, + "reading_analyzer_th" : { + "type" : "custom", + "tokenizer" : "thai" + }, + "reading_term_analyzer_th" : { + 
"type" : "custom", + "tokenizer" : "thai" + }, + "normalize_analyzer_th" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_th" : { + "type" : "custom", + "tokenizer" : "thai", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "thai_stop"] + }, + "contents_reading_analyzer_th" : { + "type" : "custom", + "tokenizer" : "thai", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "stopword_en_filter", "content_length_filter", "limit_token_count_filter", "thai_stop"] + }, + "reading_analyzer_bn" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_bn" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_bn" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_bn" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_bn" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_et" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_et" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_et" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_et" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_et" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : 
["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_gu" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_gu" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_gu" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_gu" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_gu" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_he" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_he" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_he" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_he" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_he" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_hi" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_hi" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_hi" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_hi" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", 
"content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_hi" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_hr" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_hr" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_hr" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_hr" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_hr" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_mk" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_mk" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_mk" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_mk" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_mk" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_ml" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_ml" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_ml" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : 
["lowercase"] + }, + "contents_analyzer_ml" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_ml" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_pa" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_pa" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_pa" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_pa" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_pa" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_pl" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_pl" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_pl" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_pl" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_pl" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_si" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_si" : { + "type" : "custom", + 
"tokenizer" : "standard" + }, + "normalize_analyzer_si" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_si" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_si" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_sq" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_sq" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_sq" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_sq" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_sq" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_ta" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_ta" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_ta" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_ta" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_ta" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", 
"limit_token_count_filter"] + }, + "reading_analyzer_te" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_te" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_te" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_te" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_te" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_tl" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_tl" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_tl" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_tl" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_tl" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_uk" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_uk" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_uk" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_uk" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + 
"contents_reading_analyzer_uk" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_ur" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_ur" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_ur" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_ur" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_ur" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_vi" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_vi" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_vi" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_vi" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_vi" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_zh-cn" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_zh-cn" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_zh-cn" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_zh-cn" : { + 
"type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_zh-cn" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "reading_analyzer_zh-tw" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "reading_term_analyzer_zh-tw" : { + "type" : "custom", + "tokenizer" : "standard" + }, + "normalize_analyzer_zh-tw" : { + "type" : "custom", + "tokenizer" : "keyword", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase"] + }, + "contents_analyzer_zh-tw" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + }, + "contents_reading_analyzer_zh-tw" : { + "type" : "custom", + "tokenizer" : "standard", + "char_filter" : ["mapping_char"], + "filter" : ["lowercase", "content_length_filter", "limit_token_count_filter"] + } + }, + "char_filter" : { + "mapping_char" : { + "type" : "mapping", + "mappings" : ["ガ=>ガ", "ギ=>ギ", "グ=>グ", "ゲ=>ゲ", "ゴ=>ゴ", "ザ=>ザ", "ジ=>ジ", "ズ=>ズ", "ゼ=>ゼ", "ゾ=>ゾ", "ダ=>ダ", "ヂ=>ヂ", "ヅ=>ヅ", + "デ=>デ", "ド=>ド", "バ=>バ", "ビ=>ビ", "ブ=>ブ", "ベ=>ベ", "ボ=>ボ", "。=>。", "「=>「", "」=>」", "、=>、", "・=>・", "ヲ=>ヲ", "ァ=>ァ", "ィ=>ィ", "ゥ=>ゥ", "ェ=>ェ", "ォ=>ォ", "ャ=>ャ", "ュ=>ュ", "ョ=>ョ", "ッ=>ッ", "ア=>ア", + "イ=>イ", "ウ=>ウ", "エ=>エ", "オ=>オ", "カ=>カ", "キ=>キ", "ク=>ク", "ケ=>ケ", "コ=>コ", "サ=>サ", "シ=>シ", "ス=>ス", "セ=>セ", "ソ=>ソ", "タ=>タ", "チ=>チ", "ツ=>ツ", "テ=>テ", "ト=>ト", "ナ=>ナ", "ニ=>ニ", "ヌ=>ヌ", "ネ=>ネ", "ノ=>ノ", "ハ=>ハ", + "ヒ=>ヒ", "フ=>フ", "ヘ=>ヘ", "ホ=>ホ", "マ=>マ", "ミ=>ミ", "ム=>ム", "メ=>メ", "モ=>モ", "ヤ=>ヤ", "ユ=>ユ", "ヨ=>ヨ", "ラ=>ラ", "リ=>リ", "ル=>ル", "レ=>レ", "ロ=>ロ", "ワ=>ワ", "ン=>ン", + "a=>a", "b=>b","c=>c","d=>d","e=>e","f=>f","g=>g","h=>h","i=>i","j=>j","k=>k","l=>l","m=>m","n=>n","o=>o","p=>p","q=>q","r=>r","s=>s", + 
"t=>t","u=>u","v=>v","w=>w","x=>x", "y=>y", "z=>z", + "A=>A", "B=>B","C=>C","D=>D","E=>E","F=>F","G=>g","H=>H","I=>I","J=>j","K=>k","L=>L","M=>M","N=>N","O=>O","P=>P","Q=>Q","R=>R","S=>S", + "T=>T","U=>U","V=>V","W=>W","X=>X", "Y=>Y", "Z=>Z", + "1=>1", "2=>2", "3=>3", "4=>4", "5=>5", "6=>6", "7=>7", "8=>8", "9=>9", "0=>0" + ] + } + }, + "filter" : { + "reading_form" : { + "type" : "kuromoji_readingform" + }, + "pos_filter" : { + "type" : "kuromoji_part_of_speech", + "stoptags" : [ + "その他", + "その他-間投", + "フィラー", + "感動詞", + "記号", + "記号-アルファベット", + "記号-一般", + "記号-括弧開", + "記号-括弧閉", + "記号-句点", + "記号-空白", + "記号-読点", + "形容詞", + "形容詞-接尾", + "形容詞-非自立", + "語断片", + "助詞", + "助詞-格助詞", + "助詞-格助詞-一般", + "助詞-格助詞-引用", + "助詞-格助詞-連語", + "助詞-間投助詞", + "助詞-係助詞", + "助詞-終助詞", + "助詞-接続助詞", + "助詞-特殊", + "助詞-副詞化", + "助詞-副助詞", + "助詞-副助詞/並立助詞/終助詞", + "助詞-並立助詞", + "助詞-連体化", + "助動詞", + "接続詞", + "接頭詞", + "接頭詞-形容詞接続", + "接頭詞-数接続", + "接頭詞-動詞接続", + "接頭詞-名詞接続", + "動詞", + "動詞-自立", + "動詞-接尾", + "動詞-非自立", + "非言語音", + "副詞", + "副詞-一般", + "副詞-助詞類接続", + "名詞-ナイ形容詞語幹", + "名詞-引用文字列", + "名詞-形容動詞語幹", + "名詞-数", + "名詞-接続詞的", + "名詞-接尾", + "名詞-接尾-サ変接続", + "名詞-接尾-一般", + "名詞-接尾-形容動詞語幹", + "名詞-接尾-助数詞", + "名詞-接尾-助動詞語幹", + "名詞-接尾-人名", + "名詞-接尾-地域", + "名詞-接尾-特殊", + "名詞-接尾-副詞可能", + "名詞-代名詞", + "名詞-代名詞-一般", + "名詞-代名詞-縮約", + "名詞-動詞非自立的", + "名詞-特殊", + "名詞-特殊-助動詞語幹", + "名詞-非自立", + "名詞-非自立-一般", + "名詞-非自立-形容動詞語幹", + "名詞-非自立-助動詞語幹", + "名詞-非自立-副詞可能", + "名詞-副詞可能", + "連体詞" + ] + }, + "stopword_en_filter": { + "type": "stop", + "stopwords": "_english_" + }, + "content_length_filter": { + "type": "length", + "max": 30 + }, + "limit_token_count_filter": { + "type": "limit", + "max_token_count": 2147483647 + }, + "stemmer_en_filter": { + "type": "stemmer", + "name": "english" + }, + "arabic_stop": { + "type": "stop", + "stopwords": "_arabic_" + }, + "arabic_keywords": { + "type": "keyword_marker", + "keywords": ["ﻡﺮﺤﺑﺍﺍ", "ﻉﺎﻠﻣ", "ﺐﺤﺛ"] + }, + "arabic_stemmer": { + "type": "stemmer", + "language": "arabic" + }, + "bulgarian_stop": { + 
"type": "stop", + "stopwords": "_bulgarian_" + }, + "bulgarian_keywords": { + "type": "keyword_marker", + "keywords": ["Добър ден"] + }, + "bulgarian_stemmer": { + "type": "stemmer", + "language": "bulgarian" + }, + "catalan_elision": { + "type": "elision", + "articles": [ "d", "l", "m", "n", "s", "t"] + }, + "catalan_stop": { + "type": "stop", + "stopwords": "_catalan_" + }, + "catalan_keywords": { + "type": "keyword_marker", + "keywords": ["Hola", "món", "recerca"] + }, + "catalan_stemmer": { + "type": "stemmer", + "language": "catalan" + }, + "czech_stop": { + "type": "stop", + "stopwords": "_czech_" + }, + "czech_keywords": { + "type": "keyword_marker", + "keywords": ["Haló", "svět", "vyhledávání"] + }, + "czech_stemmer": { + "type": "stemmer", + "language": "czech" + }, + "danish_stop": { + "type": "stop", + "stopwords": "_danish_" + }, + "danish_keywords": { + "type": "keyword_marker", + "keywords": ["Hej", "verden", "Søg"] + }, + "danish_stemmer": { + "type": "stemmer", + "language": "danish" + }, + "dutch_stop": { + "type": "stop", + "stopwords": "_dutch_" + }, + "dutch_keywords": { + "type": "keyword_marker", + "keywords": ["hallo", "wereld", "zoeken"] + }, + "dutch_stemmer": { + "type": "stemmer", + "language": "dutch" + }, + "dutch_override": { + "type": "stemmer_override", + "rules": [ + "fiets=>fiets", + "bromfiets=>bromfiets", + "ei=>eier", + "kind=>kinder" + ] + }, + "english_keywords": { + "type": "keyword_marker", + "keywords": ["hello"] + }, + "finnish_stop": { + "type": "stop", + "stopwords": "_finnish_" + }, + "finnish_keywords": { + "type": "keyword_marker", + "keywords": ["Hei"] + }, + "finnish_stemmer": { + "type": "stemmer", + "language": "finnish" + }, + "french_elision": { + "type": "elision", + "articles_case": true, + "articles": [ + "l", "m", "t", "qu", "n", "s", + "j", "d", "c", "jusqu", "quoiqu", + "lorsqu", "puisqu" + ] + }, + "french_stop": { + "type": "stop", + "stopwords": "_french_" + }, + "french_keywords": { + "type": 
"keyword_marker", + "keywords": ["Bonjour", "monde", "recherche"] + }, + "french_stemmer": { + "type": "stemmer", + "language": "light_french" + }, + "german_stop": { + "type": "stop", + "stopwords": "_german_" + }, + "german_keywords": { + "type": "keyword_marker", + "keywords": ["Hallo", "Welt", "Suche"] + }, + "german_stemmer": { + "type": "stemmer", + "language": "light_german" + }, + "greek_stop": { + "type": "stop", + "stopwords": "_greek_" + }, + "greek_lowercase": { + "type": "lowercase", + "language": "greek" + }, + "greek_keywords": { + "type": "keyword_marker", + "keywords": ["Γεια σας", "κόσμος", "έρευνα"] + }, + "greek_stemmer": { + "type": "stemmer", + "language": "greek" + }, + "hindi_stop": { + "type": "stop", + "stopwords": "_hindi_" + }, + "hungarian_stop": { + "type": "stop", + "stopwords": "_hungarian_" + }, + "hungarian_keywords": { + "type": "keyword_marker", + "keywords": ["Helló", "világ", "keresés"] + }, + "hungarian_stemmer": { + "type": "stemmer", + "language": "hungarian" + }, + "indonesian_stop": { + "type": "stop", + "stopwords": "_indonesian_" + }, + "indonesian_keywords": { + "type": "keyword_marker", + "keywords": ["halo", "dunia", "pencarian"] + }, + "indonesian_stemmer": { + "type": "stemmer", + "language": "indonesian" + }, + "italian_elision": { + "type": "elision", + "articles": [ + "c", "l", "all", "dall", "dell", + "nell", "sull", "coll", "pell", + "gl", "agl", "dagl", "degl", "negl", + "sugl", "un", "m", "t", "s", "v", "d" + ] + }, + "italian_stop": { + "type": "stop", + "stopwords": "_italian_" + }, + "italian_keywords": { + "type": "keyword_marker", + "keywords": ["Ciao", "mondo", "ricerca"] + }, + "italian_stemmer": { + "type": "stemmer", + "language": "light_italian" + }, + "latvian_stop": { + "type": "stop", + "stopwords": "_latvian_" + }, + "latvian_keywords": { + "type": "keyword_marker", + "keywords": ["sveiki", "pasaule", "meklēšana"] + }, + "latvian_stemmer": { + "type": "stemmer", + "language": "latvian" + }, + 
"lithuanian_stop": { + "type": "stop", + "stopwords": "_lithuanian_" + }, + "lithuanian_keywords": { + "type": "keyword_marker", + "keywords": ["Sveiki", "pasaulis", "paieška"] + }, + "lithuanian_stemmer": { + "type": "stemmer", + "language": "lithuanian" + }, + "norwegian_stop": { + "type": "stop", + "stopwords": "_norwegian_" + }, + "norwegian_keywords": { + "type": "keyword_marker", + "keywords": ["Hallo", "verden", "Søk"] + }, + "norwegian_stemmer": { + "type": "stemmer", + "language": "norwegian" + }, + "persian_stop": { + "type": "stop", + "stopwords": "_persian_" + }, + "portuguese_stop": { + "type": "stop", + "stopwords": "_portuguese_" + }, + "portuguese_keywords": { + "type": "keyword_marker", + "keywords": ["Olá", "mundo", "pesquisa"] + }, + "portuguese_stemmer": { + "type": "stemmer", + "language": "light_portuguese" + }, + "romanian_stop": { + "type": "stop", + "stopwords": "_romanian_" + }, + "romanian_keywords": { + "type": "keyword_marker", + "keywords": ["Alo", "lume", "căutare"] + }, + "romanian_stemmer": { + "type": "stemmer", + "language": "romanian" + }, + "russian_stop": { + "type": "stop", + "stopwords": "_russian_" + }, + "russian_keywords": { + "type": "keyword_marker", + "keywords": ["привет", "мир", "поиск"] + }, + "russian_stemmer": { + "type": "stemmer", + "language": "russian" + }, + "spanish_stop": { + "type": "stop", + "stopwords": "_spanish_" + }, + "spanish_keywords": { + "type": "keyword_marker", + "keywords": ["¡Hola", "mundo", "búsqueda"] + }, + "spanish_stemmer": { + "type": "stemmer", + "language": "light_spanish" + }, + "swedish_stop": { + "type": "stop", + "stopwords": "_swedish_" + }, + "swedish_keywords": { + "type": "keyword_marker", + "keywords": ["Hallå", "material", "sök"] + }, + "swedish_stemmer": { + "type": "stemmer", + "language": "swedish" + }, + "turkish_stop": { + "type": "stop", + "stopwords": "_turkish_" + }, + "turkish_lowercase": { + "type": "lowercase", + "language": "turkish" + }, + "turkish_keywords": { + 
"type": "keyword_marker", + "keywords": ["Merhaba", "Dünya", "arama"] + }, + "turkish_stemmer": { + "type": "stemmer", + "language": "turkish" + }, + "thai_stop": { + "type": "stop", + "stopwords": "_thai_" + } + } + } +} diff --git a/src/main/webapp/WEB-INF/view/admin/general/admin_general.jsp b/src/main/webapp/WEB-INF/view/admin/general/admin_general.jsp index 158be401a..f021f12db 100644 --- a/src/main/webapp/WEB-INF/view/admin/general/admin_general.jsp +++ b/src/main/webapp/WEB-INF/view/admin/general/admin_general.jsp @@ -84,7 +84,7 @@
- + diff --git a/src/main/webapp/WEB-INF/view/admin/maintenance/admin_maintenance.jsp b/src/main/webapp/WEB-INF/view/admin/maintenance/admin_maintenance.jsp index 1d6b37ce6..9ce346822 100644 --- a/src/main/webapp/WEB-INF/view/admin/maintenance/admin_maintenance.jsp +++ b/src/main/webapp/WEB-INF/view/admin/maintenance/admin_maintenance.jsp @@ -63,7 +63,7 @@
- + diff --git a/src/main/webapp/WEB-INF/view/common/admin/sidebar.jsp b/src/main/webapp/WEB-INF/view/common/admin/sidebar.jsp index b64bd6377..57239ec42 100644 --- a/src/main/webapp/WEB-INF/view/common/admin/sidebar.jsp +++ b/src/main/webapp/WEB-INF/view/common/admin/sidebar.jsp @@ -75,7 +75,7 @@

- +