1440N/Apackage org.opensolaris.opengrok.analysis.php;
1440N/A
1461N/Aimport static org.junit.Assert.assertArrayEquals;
1461N/A
1461N/Aimport java.io.IOException;
1450N/Aimport java.io.InputStream;
1450N/Aimport java.io.InputStreamReader;
1461N/Aimport java.io.Reader;
1440N/Aimport java.io.StringReader;
1440N/Aimport java.util.LinkedList;
1440N/Aimport java.util.List;
1461N/A
1440N/Aimport org.apache.lucene.analysis.tokenattributes.CharTermAttribute;
1440N/Aimport org.junit.Test;
1440N/Aimport org.opensolaris.opengrok.analysis.FileAnalyzer;
1461N/Aimport org.opensolaris.opengrok.analysis.JFlexTokenizer;
1461N/Aimport org.opensolaris.opengrok.util.IOUtils;
1440N/A
1440N/A/**
1440N/A * Tests the {@link PhpSymbolTokenizer} class.
1440N/A * @author Gustavo Lopes
1440N/A */
1440N/Apublic class PhpSymbolTokenizerTest {
1440N/A private FileAnalyzer analyzer;
1440N/A
1461N/A /**
1461N/A * Create new test.
1461N/A */
1440N/A public PhpSymbolTokenizerTest() {
1440N/A PhpAnalyzerFactory analFact = new PhpAnalyzerFactory();
1440N/A this.analyzer = analFact.getAnalyzer();
1440N/A }
1440N/A
1440N/A private String[] getTermsFor(String s) {
1450N/A return getTermsFor(new StringReader(s));
1450N/A }
1450N/A
1461N/A @SuppressWarnings("resource")
1450N/A private String[] getTermsFor(Reader r) {
1440N/A List<String> l = new LinkedList<String>();
1440N/A JFlexTokenizer ts = (JFlexTokenizer)
1461N/A this.analyzer.overridableTokenStream("refs", null);
1450N/A ts.yyreset(r);
1440N/A CharTermAttribute term = ts.addAttribute(CharTermAttribute.class);
1440N/A try {
1440N/A while (ts.yylex()) {
1440N/A l.add(term.toString());
1440N/A }
1440N/A } catch (IOException ex) {
1440N/A throw new RuntimeException(ex);
1461N/A } finally {
1461N/A IOUtils.close(ts);
1440N/A }
1440N/A return l.toArray(new String[l.size()]);
1440N/A }
1440N/A
1461N/A /**
1461N/A * Simple tokenizer test.
1461N/A */
1440N/A @Test
1440N/A public void basicTest() {
1450N/A String s = "<?php foobar eval $eval 0sdf _ds˙d";
1440N/A String[] termsFor = getTermsFor(s);
1461N/A assertArrayEquals(new String[]{"foobar", "eval", "sdf", "_ds˙d"},
1461N/A termsFor);
1450N/A }
1450N/A
1461N/A /**
1461N/A * More complex tokenizer test using {@code sample.php}.
1461N/A * @throws IOException
1461N/A */
1450N/A @Test
1461N/A public void sampleTest() throws IOException {
1461N/A InputStream res = getClass().getResourceAsStream("sample.php");
1450N/A InputStreamReader r = new InputStreamReader(res, "UTF-8");
1450N/A String[] termsFor = getTermsFor(r);
1461N/A assertArrayEquals(new String[]
1461N/A {
1461N/A "a", //line 3
1461N/A "foo", "bar", //line 5
1461N/A "g", "a", "c", //line 6
1461N/A "b", "c", "a", "a", //line 7
1461N/A "doo", //line 9
1461N/A "a", //line 10
1461N/A "foo", "bar", //line 12
1461N/A "name", //line 13
1461N/A "foo", "bar", //line 14
1461N/A "foo", //line 15
1461N/A "ff", //line 20
1461N/A "foo", //line 21
1461N/A "FooException", //line 28
1461N/A "used",
1461N/A "Foo", "Bar", //line 30
1461N/A "Foo", "Foo", "param", //line 31
1461N/A "gata", //line 37
1461N/A "gata", //line 38
1461N/A "foo", "_SERVER", "_SERVER", "_SERVER", //line 39
1461N/A "foo", "bar", "foo", "bar", "foo", "a", //line 40
1461N/A }, termsFor);
1461N/A r.close();
1440N/A }
1440N/A}