/*
* CDDL HEADER START
*
* The contents of this file are subject to the terms of the
* Common Development and Distribution License (the "License").
* You may not use this file except in compliance with the License.
*
* See LICENSE.txt included in this distribution for the specific
* language governing permissions and limitations under the License.
*
* When distributing Covered Code, include this CDDL HEADER in each
* file and include the License file at LICENSE.txt.
* If applicable, add the following below this CDDL HEADER, with the
* fields enclosed by brackets "[]" replaced with your own identifying
* information: Portions Copyright [yyyy] [name of copyright owner]
*
* CDDL HEADER END
*/
/*
* Copyright (c) 2012, 2017, Oracle and/or its affiliates. All rights reserved.
*/
package org.opensolaris.opengrok.analysis.php;
import static org.junit.Assert.assertArrayEquals;
import java.io.IOException;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.io.Reader;
import java.io.StringReader;
import java.io.UnsupportedEncodingException;
import java.util.LinkedList;
import java.util.List;
import org.apache.lucene.analysis.tokenattributes.CharTermAttribute;
import org.junit.Test;
import org.opensolaris.opengrok.analysis.FileAnalyzer;
import org.opensolaris.opengrok.analysis.JFlexTokenizer;
/**
* Tests the {@link PhpSymbolTokenizer} class.
*
* @author Gustavo Lopes
*/
public class PhpSymbolTokenizerTest {
private final FileAnalyzer analyzer;
public PhpSymbolTokenizerTest() {
PhpAnalyzerFactory analFact = new PhpAnalyzerFactory();
this.analyzer = analFact.getAnalyzer();
}
private String[] getTermsFor(Reader r) {
List<String> l = new LinkedList<>();
JFlexTokenizer ts = (JFlexTokenizer) this.analyzer.tokenStream("refs", r);
ts.setReader(r);
ts.yyreset(r);
CharTermAttribute term = ts.addAttribute(CharTermAttribute.class);
try {
while (ts.yylex()) {
l.add(term.toString());
}
} catch (IOException ex) {
throw new RuntimeException(ex);
}
return l.toArray(new String[l.size()]);
}
@Test
public void basicTest() {
String s = "<?php foobar eval $eval 0sdf _ds˙d";
String[] termsFor = getTermsFor(new StringReader(s));
assertArrayEquals(
new String[]{"foobar", "eval", "sdf", "_ds˙d"},
termsFor);
}
@Test
public void sampleTest() throws UnsupportedEncodingException {
InputStream res = getClass().getClassLoader().getResourceAsStream(
"org/opensolaris/opengrok/analysis/php/sample.php");
InputStreamReader r = new InputStreamReader(res, "UTF-8");
String[] termsFor = getTermsFor(r);
assertArrayEquals(
new String[]{
"a", //line 3
"foo", "bar", //line 5
"g", "a", "c", //line 6
"b", "c", "a", "a", //line 7
"doo", //line 9
"a", //line 10
"foo", "bar", //line 12
"name", //line 13
"foo", "bar", //line 14
"foo", //line 15
"ff", //line 20
"foo", //line 21
"FooException", //line 28
"used",
"Foo", "Bar", //line 30
"Foo", "Foo", "param", //line 31
"gata", //line 37
"gata", //line 38
"foo", "_SERVER", "_SERVER", "_SERVER", //line 39
"foo", "bar", "foo", "bar", "foo", "a", //line 40
},
termsFor);
}
}