/**
*
*/
package com.maalaang.omtwitter.text;
import junit.framework.TestCase;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
/**
* @author Sangwon Park
*
*/
public class OMTweetTokenizerTest extends TestCase {
private Logger logger = null;
private OMTweetTokenizer tweetTokenizer = null;
/* (non-Javadoc)
* @see junit.framework.TestCase#setUp()
*/
protected void setUp() throws Exception {
super.setUp();
logger = LoggerFactory.getLogger(getClass());
tweetTokenizer = new OMTweetTokenizer();
}
/**
* Test method for {@link com.maalaang.omtwitter.text.OMTweetTokenizer#tokenize(java.lang.String)}.
*/
public void testTokenize() {
String tweet = "@redhat I looooooove my #iphone4s 100$ http://exampleurl.com/pic.jpg";
logger.info("tweet - " + tweet);
OMTweetToken[] list = tweetTokenizer.tokenize(tweet);
int idx = 0;
OMTweetToken tok = list[idx++];
assertEquals(OMTweetToken.TOKEN_TYPE_USER, tok.getType());
assertEquals("@redhat", tok.getText());
assertEquals(0, tok.getBegin());
assertEquals(7, tok.getEnd());
assertEquals(OMTweetToken.NORMALIZED_TEXT_USER, tok.getNormalizedText());
logger.info(tok.toString());
tok = list[idx++];
assertEquals(OMTweetToken.TOKEN_TYPE_NORMAL, tok.getType());
assertEquals("I", tok.getText());
assertEquals(8, tok.getBegin());
assertEquals(9, tok.getEnd());
assertEquals("i", tok.getNormalizedText());
logger.info(tok.toString());
tok = list[idx++];
assertEquals(OMTweetToken.TOKEN_TYPE_NORMAL, tok.getType());
assertEquals("looooooove", tok.getText());
assertEquals(10, tok.getBegin());
assertEquals(20, tok.getEnd());
assertEquals("loove", tok.getNormalizedText());
logger.info(tok.toString());
tok = list[idx++];
assertEquals(OMTweetToken.TOKEN_TYPE_NORMAL, tok.getType());
assertEquals("my", tok.getText());
assertEquals(21, tok.getBegin());
assertEquals(23, tok.getEnd());
assertEquals("my", tok.getNormalizedText());
logger.info(tok.toString());
tok = list[idx++];
assertEquals(OMTweetToken.TOKEN_TYPE_HASHTAG, tok.getType());
assertEquals("#iphone4s", tok.getText());
assertEquals(24, tok.getBegin());
assertEquals(33, tok.getEnd());
assertEquals("#iphone4s", tok.getNormalizedText());
logger.info(tok.toString());
tok = list[idx++];
assertEquals(OMTweetToken.TOKEN_TYPE_NORMAL, tok.getType());
assertEquals("100$", tok.getText());
assertEquals(34, tok.getBegin());
assertEquals(38, tok.getEnd());
assertEquals("100$", tok.getNormalizedText());
logger.info(tok.toString());
tok = list[idx++];
assertEquals(OMTweetToken.TOKEN_TYPE_URL, tok.getType());
assertEquals("http://exampleurl.com/pic.jpg", tok.getText());
assertEquals(39, tok.getBegin());
assertEquals(68, tok.getEnd());
assertEquals(OMTweetToken.NORMALIZED_TEXT_URL, tok.getNormalizedText());
logger.info(tok.toString());
}
}