// HTMLParser Library $Name: v1_6 $ - A java-based parser for HTML
// http://sourceforge.org/projects/htmlparser
// Copyright (C) 2004 Somik Raha
//
// Revision Control Information
//
// $Source: /cvsroot/htmlparser/htmlparser/src/org/htmlparser/tests/visitorsTests/TextExtractingVisitorTest.java,v $
// $Author: derrickoswald $
// $Date: 2004/01/02 16:24:57 $
// $Revision: 1.15 $
//
// This library is free software; you can redistribute it and/or
// modify it under the terms of the GNU Lesser General Public
// License as published by the Free Software Foundation; either
// version 2.1 of the License, or (at your option) any later version.
//
// This library is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
// Lesser General Public License for more details.
//
// You should have received a copy of the GNU Lesser General Public
// License along with this library; if not, write to the Free Software
// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
//
package org.htmlparser.tests.visitorsTests;
import org.htmlparser.tests.ParserTestCase;
import org.htmlparser.visitors.TextExtractingVisitor;
public class TextExtractingVisitorTest extends ParserTestCase {
static
{
System.setProperty ("org.htmlparser.tests.visitorsTests.TextExtractingVisitorTest", "TextExtractingVisitorTest");
}
public TextExtractingVisitorTest(String name) {
super(name);
}
public void testSimpleVisit() throws Exception {
createParser("<HTML><HEAD><TITLE>Hello World</TITLE></HEAD></HTML>");
TextExtractingVisitor visitor = new TextExtractingVisitor();
parser.visitAllNodesWith(visitor);
assertStringEquals(
"extracted text",
"Hello World",
visitor.getExtractedText()
);
}
public void testSimpleVisitWithRegisteredScanners() throws Exception {
createParser("<HTML><HEAD><TITLE>Hello World</TITLE></HEAD></HTML>");
TextExtractingVisitor visitor = new TextExtractingVisitor();
parser.visitAllNodesWith(visitor);
assertStringEquals(
"extracted text",
"Hello World",
visitor.getExtractedText()
);
}
public void testVisitHtmlWithSpecialChars() throws Exception {
createParser("<BODY>Hello World </BODY>");
TextExtractingVisitor visitor = new TextExtractingVisitor();
parser.visitAllNodesWith(visitor);
assertStringEquals(
"extracted text",
"Hello World ",
visitor.getExtractedText()
);
}
public void testVisitHtmlWithPreTags() throws Exception {
createParser(
"Some text with <pre>this should be preserved</pre>"
);
TextExtractingVisitor visitor = new TextExtractingVisitor();
parser.visitAllNodesWith(visitor);
assertStringEquals(
"extracted text",
"Some text with this should be preserved",
visitor.getExtractedText()
);
}
}