fix #1059 remove header/footer/nav tags from index
This commit is contained in:
parent
53fe2aeda2
commit
a5ccb5010a
2 changed files with 3 additions and 3 deletions
|
@ -204,7 +204,7 @@ public interface FessConfig extends FessEnv, org.codelibs.fess.mylasta.direction
|
|||
/** The key of the configuration. e.g. //LINK[@rel='canonical']/@href */
|
||||
String CRAWLER_DOCUMENT_HTML_CANONICAL_XPATH = "crawler.document.html.canonical.xpath";
|
||||
|
||||
/** The key of the configuration. e.g. noscript,script,style */
|
||||
/** The key of the configuration. e.g. noscript,script,style,header,footer,nav */
|
||||
String CRAWLER_DOCUMENT_HTML_PRUNED_TAGS = "crawler.document.html.pruned.tags";
|
||||
|
||||
/** The key of the configuration. e.g. 200 */
|
||||
|
@ -1683,7 +1683,7 @@ public interface FessConfig extends FessEnv, org.codelibs.fess.mylasta.direction
|
|||
|
||||
/**
|
||||
* Get the value for the key 'crawler.document.html.pruned.tags'. <br>
|
||||
* The value is, e.g. noscript,script,style <br>
|
||||
* The value is, e.g. noscript,script,style,header,footer,nav <br>
|
||||
* @return The value of the found property. (NotNull: if not found, an exception is thrown, but that basically cannot happen)
|
||||
*/
|
||||
String getCrawlerDocumentHtmlPrunedTags();
|
||||
|
|
|
@ -113,7 +113,7 @@ crawler.document.html.content.xpath=//BODY
|
|||
crawler.document.html.lang.xpath=//HTML/@lang
|
||||
crawler.document.html.digest.xpath=//META[@name='description']/@content
|
||||
crawler.document.html.canonical.xpath=//LINK[@rel='canonical']/@href
|
||||
crawler.document.html.pruned.tags=noscript,script,style
|
||||
crawler.document.html.pruned.tags=noscript,script,style,header,footer,nav
|
||||
crawler.document.html.max.digest.length=200
|
||||
|
||||
# file
|
||||
|
|
Loading…
Add table
Reference in a new issue