fix #564 : remove style tag from indexed doc

This commit is contained in:
Shinsuke Sugaya 2016-06-30 12:43:04 +09:00
parent 3249527dfc
commit 1402c84baa
2 changed files with 3 additions and 3 deletions

View file

@@ -169,7 +169,7 @@ public interface FessConfig extends FessEnv, org.codelibs.fess.mylasta.direction
/** The key of the configuration. e.g. //LINK[@rel='canonical']/@href */
String CRAWLER_DOCUMENT_HTML_CANNONICAL_XPATH = "crawler.document.html.cannonical.xpath";
-/** The key of the configuration. e.g. noscript,script */
+/** The key of the configuration. e.g. noscript,script,style */
String CRAWLER_DOCUMENT_HTML_PRUNED_TAGS = "crawler.document.html.pruned.tags";
/** The key of the configuration. e.g. 200 */
@@ -1317,7 +1317,7 @@ public interface FessConfig extends FessEnv, org.codelibs.fess.mylasta.direction
/**
* Get the value for the key 'crawler.document.html.pruned.tags'. <br>
-* The value is, e.g. noscript,script <br>
+* The value is, e.g. noscript,script,style <br>
* @return The value of found property. (NotNull: if not found, exception but basically no way)
*/
String getCrawlerDocumentHtmlPrunedTags();

View file

@@ -98,7 +98,7 @@ crawler.document.html.content.xpath=//BODY
crawler.document.html.lang.xpath=//HTML/@lang
crawler.document.html.digest.xpath=//META[@name='description']/@content
crawler.document.html.cannonical.xpath=//LINK[@rel='canonical']/@href
-crawler.document.html.pruned.tags=noscript,script
+crawler.document.html.pruned.tags=noscript,script,style
crawler.document.html.max.digest.length=200
# file