// HTMLParser Library $Name: v1_6 $ - A java-based parser for HTML
// http://sourceforge.org/projects/htmlparser
// Copyright (C) 2004 Derrick Oswald
//
// Revision Control Information
//
// $Source: /cvsroot/htmlparser/htmlparser/src/org/htmlparser/tests/lexerTests/SourceTests.java,v $
// $Author: derrickoswald $
// $Date: 2004/07/31 16:42:31 $
// $Revision: 1.18 $
//
// This library is free software; you can redistribute it and/or
// modify it under the terms of the GNU Lesser General Public
// License as published by the Free Software Foundation; either
// version 2.1 of the License, or (at your option) any later version.
//
// This library is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
// Lesser General Public License for more details.
//
// You should have received a copy of the GNU Lesser General Public
// License along with this library; if not, write to the Free Software
// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
//
package org.htmlparser.tests.lexerTests;
import java.io.BufferedInputStream;
import java.io.ByteArrayInputStream;
import java.io.IOException;
import java.io.InputStreamReader;
import java.net.MalformedURLException;
import java.net.URL;
import java.net.URLConnection;
import org.htmlparser.lexer.InputStreamSource;
import org.htmlparser.lexer.Stream;
import org.htmlparser.lexer.Source;
import org.htmlparser.lexer.StringSource;
import org.htmlparser.tests.ParserTestCase;
public class SourceTests extends ParserTestCase
{
static
{
System.setProperty ("org.htmlparser.tests.lexerTests.SourceTests", "SourceTests");
}
/**
* The default charset.
* This should be <code>ISO-8859-1</code>,
* see RFC 2616 (http://www.ietf.org/rfc/rfc2616.txt?number=2616) section 3.7.1
* Another alias is "8859_1".
*/
public static final String DEFAULT_CHARSET = "ISO-8859-1";
/**
* Test the first level stream class.
*/
public SourceTests (String name)
{
super (name);
}
/**
* Test initialization with a null value.
*/
public void testInputStreamSourceNull () throws IOException
{
Source source;
source = new InputStreamSource (null);
assertTrue ("erroneous character", -1 == source.read ());
}
/**
* Test initialization of a InputStreamSource with a zero length byte array.
*/
public void testInputStreamSourceEmpty () throws IOException
{
Source source;
source = new InputStreamSource (new Stream (new ByteArrayInputStream (new byte[0])), null);
assertTrue ("erroneous character", -1 == source.read ());
}
/**
* Test initialization of a InputStreamSource with an input stream having only one byte.
*/
public void testInputStreamSourceOneByte () throws IOException
{
Source source;
source = new InputStreamSource (new Stream (new ByteArrayInputStream (new byte[] { (byte)0x42 })), null);
assertTrue ("erroneous character", 'B' == source.read ());
assertTrue ("extra character", -1 == source.read ());
}
/**
* Test closing a InputStreamSource.
*/
public void testInputStreamSourceClose () throws IOException
{
Source source;
source = new InputStreamSource (new Stream (new ByteArrayInputStream ("hello word".getBytes ())), null);
assertTrue ("no character", -1 != source.read ());
source.destroy ();
try
{
source.read ();
fail ("not closed");
}
catch (IOException ioe)
{
// expected outcome
}
}
/**
* Test resetting a InputStreamSource.
*/
public void testInputStreamSourceReset () throws IOException
{
String reference;
Source source;
StringBuffer buffer;
int c;
reference = "Now is the time for all good men to come to the aid of the party";
source = new InputStreamSource (new Stream (new ByteArrayInputStream (reference.getBytes (DEFAULT_CHARSET))), null);
buffer = new StringBuffer (reference.length ());
while (-1 != (c = source.read ()))
buffer.append ((char)c);
assertTrue ("string incorrect", reference.equals (buffer.toString ()));
source.reset ();
buffer.setLength (0);
while (-1 != (c = source.read ()))
buffer.append ((char)c);
assertTrue ("string incorrect", reference.equals (buffer.toString ()));
source.close ();
}
/**
* Test resetting a InputStreamSource in the middle of reading.
*/
public void testInputStreamSourceMidReset () throws IOException
{
String reference;
Source source;
StringBuffer buffer;
int c;
reference = "Now is the time for all good men to come to the aid of the party";
source = new InputStreamSource (new Stream (new ByteArrayInputStream (reference.getBytes (DEFAULT_CHARSET))), null);
buffer = new StringBuffer (reference.length ());
for (int i = 0; i < 25; i++)
buffer.append ((char)source.read ());
source.reset ();
for (int i = 0; i < 25; i++)
source.read ();
while (-1 != (c = source.read ()))
buffer.append ((char)c);
assertTrue ("string incorrect", reference.equals (buffer.toString ()));
source.close ();
}
/**
* Test mark/reset of a InputStreamSource in the middle of reading.
*/
public void testInputStreamSourceMarkReset () throws IOException
{
String reference;
Source source;
StringBuffer buffer;
int c;
reference = "Now is the time for all good men to come to the aid of the party";
source = new InputStreamSource (new Stream (new ByteArrayInputStream (reference.getBytes (DEFAULT_CHARSET))), null);
assertTrue ("not markable", source.markSupported ());
buffer = new StringBuffer (reference.length ());
for (int i = 0; i < 25; i++)
buffer.append ((char)source.read ());
source.mark (88);
for (int i = 0; i < 25; i++)
source.read ();
source.reset ();
while (-1 != (c = source.read ()))
buffer.append ((char)c);
assertTrue ("string incorrect", reference.equals (buffer.toString ()));
source.close ();
}
/**
* Test skipping a InputStreamSource.
*/
public void testInputStreamSourceSkip () throws IOException
{
String part1;
String part2;
String part3;
String reference;
Source source;
StringBuffer buffer;
int c;
part1 = "Now is the time ";
part2 = "for all good men ";
part3 = "to come to the aid of the party";
reference = part1 + part2 + part3;
source = new InputStreamSource (new Stream (new ByteArrayInputStream (reference.getBytes (DEFAULT_CHARSET))), null);
buffer = new StringBuffer (reference.length ());
for (int i = 0; i < part1.length (); i++)
buffer.append ((char)source.read ());
source.skip (part2.length ());
while (-1 != (c = source.read ()))
buffer.append ((char)c);
assertTrue ("string incorrect", (part1 + part3).equals (buffer.toString ()));
source.close ();
}
/**
* Test multi-byte read with a InputStreamSource.
*/
public void testInputStreamSourceMultByte () throws IOException
{
String reference;
Source source;
char[] buffer;
reference = "Now is the time for all good men to come to the aid of the party";
source = new InputStreamSource (new Stream (new ByteArrayInputStream (reference.getBytes (DEFAULT_CHARSET))), null);
buffer = new char[reference.length ()];
source.read (buffer, 0, buffer.length);
assertTrue ("string incorrect", reference.equals (new String (buffer)));
assertTrue ("extra character", -1 == source.read ());
source.close ();
}
/**
* Test positioned multi-byte read with a InputStreamSource.
*/
public void testInputStreamSourcePositionedMultByte () throws IOException
{
String part1;
String part2;
String part3;
String reference;
Source source;
char[] buffer;
int length;
part1 = "Now is the time ";
part2 = "for all good men ";
part3 = "to come to the aid of the party";
reference = part1 + part2 + part3;
source = new InputStreamSource (new Stream (new ByteArrayInputStream (reference.getBytes (DEFAULT_CHARSET))), null);
buffer = new char[reference.length ()];
for (int i = 0; i < part1.length (); i++)
buffer[i] = (char)source.read ();
length = source.read (buffer, part1.length (), part2.length ());
assertTrue ("incorrect length", part2.length () == length);
length += part1.length ();
for (int i = 0; i < part3.length (); i++)
buffer[i + length] = (char)source.read ();
assertTrue ("string incorrect", reference.equals (new String (buffer)));
assertTrue ("extra character", -1 == source.read ());
source.close ();
}
/**
* Test ready of a InputStreamSource.
*/
public void testInputStreamSourceReady () throws IOException
{
Source source;
source = new InputStreamSource (new Stream (new ByteArrayInputStream (new byte[] { (byte)0x42, (byte)0x62 })), null);
assertTrue ("ready?", !source.ready ());
assertTrue ("erroneous character", 'B' == source.read ());
assertTrue ("not ready", source.ready ());
assertTrue ("erroneous character", 'b' == source.read ());
assertTrue ("ready?", !source.ready ());
assertTrue ("extra character", -1 == source.read ());
}
/**
* Test that the same characters are returned as with another reader.
*/
public void testSameChars () throws IOException
{
String link;
URL url;
URLConnection connection1;
URLConnection connection2;
InputStreamReader in;
int c1;
int c2;
Source source;
int index;
link = "http://htmlparser.sourceforge.net";
try
{
url = new URL (link);
connection1 = url.openConnection ();
connection1.connect ();
in = new InputStreamReader (new BufferedInputStream (connection1.getInputStream ()), "UTF-8");
connection2 = url.openConnection ();
connection2.connect ();
source = new InputStreamSource (new Stream (connection2.getInputStream ()), "UTF-8");
index = 0;
while (-1 != (c1 = in.read ()))
{
c2 = source.read ();
if (c1 != c2)
fail ("characters differ at position " + index + ", expected " + c1 + ", actual " + c2);
index++;
}
c2 = source.read ();
assertTrue ("extra characters", -1 == c2);
source.close ();
in.close ();
}
catch (MalformedURLException murle)
{
fail ("bad url " + link);
}
}
/**
* Test initialization of a StringSource with a null value.
*/
public void testStringSourceNull () throws IOException
{
Source source;
source = new StringSource (null);
assertTrue ("erroneous character", -1 == source.read ());
}
/**
* Test initialization of a StringSource with a zero length string.
*/
public void testStringSourceEmpty () throws IOException
{
Source source;
source = new StringSource ("");
assertTrue ("erroneous character", -1 == source.read ());
}
/**
* Test initialization of a StringSource with a one character string.
*/
public void testStringSourceOneCharacter () throws IOException
{
Source source;
source = new StringSource (new String ("B"));
assertTrue ("erroneous character", 'B' == source.read ());
assertTrue ("extra character", -1 == source.read ());
}
/**
* Test closing a StringSource.
*/
public void testStringSourceClose () throws IOException
{
Source source;
source = new StringSource ("hello word");
assertTrue ("no character", -1 != source.read ());
source.destroy ();
try
{
source.read ();
fail ("not closed");
}
catch (IOException ioe)
{
// expected outcome
}
}
/**
* Test resetting a StringSource.
*/
public void testStringSourceReset () throws IOException
{
String reference;
Source source;
StringBuffer buffer;
int c;
reference = "Now is the time for all good men to come to the aid of the party";
source = new StringSource (reference);
buffer = new StringBuffer (reference.length ());
while (-1 != (c = source.read ()))
buffer.append ((char)c);
assertTrue ("string incorrect", reference.equals (buffer.toString ()));
source.reset ();
buffer.setLength (0);
while (-1 != (c = source.read ()))
buffer.append ((char)c);
assertTrue ("string incorrect", reference.equals (buffer.toString ()));
source.close ();
}
/**
* Test resetting a StringSource in the middle of reading.
*/
public void testStringSourceMidReset () throws IOException
{
String reference;
Source source;
StringBuffer buffer;
int c;
reference = "Now is the time for all good men to come to the aid of the party";
source = new StringSource (reference);
buffer = new StringBuffer (reference.length ());
for (int i = 0; i < 25; i++)
buffer.append ((char)source.read ());
source.reset ();
for (int i = 0; i < 25; i++)
source.read ();
while (-1 != (c = source.read ()))
buffer.append ((char)c);
assertTrue ("string incorrect", reference.equals (buffer.toString ()));
source.close ();
}
/**
* Test mark/reset of a StringSource in the middle of reading.
*/
public void testStringSourceMarkReset () throws IOException
{
String reference;
Source source;
StringBuffer buffer;
int c;
reference = "Now is the time for all good men to come to the aid of the party";
source = new StringSource (reference);
assertTrue ("not markable", source.markSupported ());
buffer = new StringBuffer (reference.length ());
for (int i = 0; i < 25; i++)
buffer.append ((char)source.read ());
source.mark (88);
for (int i = 0; i < 25; i++)
source.read ();
source.reset ();
while (-1 != (c = source.read ()))
buffer.append ((char)c);
assertTrue ("string incorrect", reference.equals (buffer.toString ()));
source.close ();
}
/**
* Test skipping a StringSource.
*/
public void testStringSourceSkip () throws IOException
{
String part1;
String part2;
String part3;
String reference;
Source source;
StringBuffer buffer;
int c;
part1 = "Now is the time ";
part2 = "for all good men ";
part3 = "to come to the aid of the party";
reference = part1 + part2 + part3;
source = new StringSource (reference);
buffer = new StringBuffer (reference.length ());
for (int i = 0; i < part1.length (); i++)
buffer.append ((char)source.read ());
source.skip (part2.length ());
while (-1 != (c = source.read ()))
buffer.append ((char)c);
assertTrue ("string incorrect", (part1 + part3).equals (buffer.toString ()));
source.close ();
}
/**
* Test multi-byte read with a StringSource.
*/
public void testStringSourceMultByte () throws IOException
{
String reference;
Source source;
char[] buffer;
reference = "Now is the time for all good men to come to the aid of the party";
source = new StringSource (reference);
buffer = new char[reference.length ()];
source.read (buffer, 0, buffer.length);
assertTrue ("string incorrect", reference.equals (new String (buffer)));
assertTrue ("extra character", -1 == source.read ());
source.close ();
}
/**
* Test positioned multi-byte read with a StringSource.
*/
public void testStringSourcePositionedMultByte () throws IOException
{
String part1;
String part2;
String part3;
String reference;
Source source;
char[] buffer;
int length;
part1 = "Now is the time ";
part2 = "for all good men ";
part3 = "to come to the aid of the party";
reference = part1 + part2 + part3;
source = new StringSource (reference);
buffer = new char[reference.length ()];
for (int i = 0; i < part1.length (); i++)
buffer[i] = (char)source.read ();
length = source.read (buffer, part1.length (), part2.length ());
assertTrue ("incorrect length", part2.length () == length);
length += part1.length ();
for (int i = 0; i < part3.length (); i++)
buffer[i + length] = (char)source.read ();
assertTrue ("string incorrect", reference.equals (new String (buffer)));
assertTrue ("extra character", -1 == source.read ());
source.close ();
}
/**
* Test ready of a StringSource.
*/
public void testStringSourceReady () throws IOException
{
Source source;
source = new StringSource ("Bb");
assertTrue ("ready?", source.ready ());
assertTrue ("erroneous character", 'B' == source.read ());
assertTrue ("not ready", source.ready ());
assertTrue ("erroneous character", 'b' == source.read ());
assertTrue ("ready?", !source.ready ());
assertTrue ("extra character", -1 == source.read ());
}
}