Jelajahi Sumber

#1742 replace with ngram_synonym

Shinsuke Sugaya 7 tahun lalu
induk
komit
cbfc0b8281
2 file diubah dengan 15 penambahan dan 13 penghapusan
  1. + 3 - 3
      plugin.xml
  2. + 12 - 10
      src/main/resources/fess_indices/fess.json

+ 3 - 3
plugin.xml

@@ -22,12 +22,12 @@
 		</antcall>
 		<!-- analysis-extension -->
 		<antcall target="install.plugin">
-			<param name="repo.url" value="${maven.release.repo.url}" />
+			<param name="repo.url" value="${maven.snapshot.repo.url}" />
 			<param name="plugin.groupId" value="org/codelibs" />
 			<param name="plugin.name.prefix" value="elasticsearch-" />
 			<param name="plugin.name" value="analysis-extension" />
-			<param name="plugin.version" value="6.3.1" />
-			<param name="plugin.zip.version" value="6.3.1" />
+			<param name="plugin.version" value="6.3.2-SNAPSHOT" />
+			<param name="plugin.zip.version" value="6.3.2-20180805.010401-1" />
 		</antcall>
 		<!-- configsync -->
 		<antcall target="install.plugin">

+ 12 - 10
src/main/resources/fess_indices/fess.json

@@ -686,14 +686,18 @@
             "ambiguities_resolved": false
         },
         "unigram_tokenizer": {
-          "type": "ngram",
-          "min_gram": "1",
-          "max_gram": "1"
+          "type": "ngram_synonym",
+          "n": "1",
+          "synonyms_path": "${fess.dictionary.path}synonym.txt",
+          "dynamic_reload": true,
+          "reload_interval": "1m"
         },
         "bigram_tokenizer": {
-          "type": "ngram",
-          "min_gram": "2",
-          "max_gram": "2"
+          "type": "ngram_synonym",
+          "n": "2",
+          "synonyms_path": "${fess.dictionary.path}synonym.txt",
+          "dynamic_reload": true,
+          "reload_interval": "1m"
         }
       },
       "analyzer": {
@@ -1137,10 +1141,9 @@
           "tokenizer": "unigram_tokenizer",
           "filter": [
             "alphanum_word_filter",
+            "cjk_bigram",
             "lowercase",
             "stopword_en_filter",
-            "synonym_filter",
-            "cjk_bigram",
             "english_keywords",
             "english_override",
             "stemmer_en_filter"
@@ -1161,10 +1164,9 @@
           "tokenizer": "unigram_tokenizer",
           "filter": [
             "alphanum_word_filter",
+            "cjk_bigram",
             "lowercase",
             "stopword_en_filter",
-            "synonym_filter",
-            "cjk_bigram",
             "english_keywords",
             "english_override",
             "stemmer_en_filter",