Browse Source

fix #799: exclude comment nodes from extracted text content

Shinsuke Sugaya 8 years ago
parent
commit
c8fa12c650

+ 1 - 1
src/main/java/org/codelibs/fess/crawler/transformer/FessXpathTransformer.java

@@ -476,7 +476,7 @@ public class FessXpathTransformer extends XpathTransformer implements FessTransf
                 final Node childNode = nodeList.item(i);
                 paseTextContent(childNode, buf);
             }
-        } else {
+        } else if (node.getNodeType() == Node.TEXT_NODE) {
             final String value = node.getTextContent();
             if (value != null) {
                 final String content = value.trim();

+ 10 - 0
src/test/java/org/codelibs/fess/crawler/transformer/FessXpathTransformerTest.java

@@ -549,6 +549,16 @@ public class FessXpathTransformerTest extends UnitFessTestCase {
         document = getDocument(data);
         value = transformer.getSingleNodeValue(document, "//BODY", false);
         assertEquals("aaa bbb ccc", value);
+
+        data = "<html><body> aaa <p> bbb <aaa>ccc</bbb> </p> </body></html>";
+        document = getDocument(data);
+        value = transformer.getSingleNodeValue(document, "//BODY", false);
+        assertEquals("aaa bbb ccc", value);
+
+        data = "<html><body> aaa <p> bbb <!-- test -->ccc<!-- test --> </p> </body></html>";
+        document = getDocument(data);
+        value = transformer.getSingleNodeValue(document, "//BODY", false);
+        assertEquals("aaa bbb ccc", value);
     }
 
     public void test_contentXpath() throws Exception {