PlainAnalyzer.java revision 6d7c6f82e644c205bc679ee5b1fa2929ec949963
/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * See LICENSE.txt included in this distribution for the specific
 * language governing permissions and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at LICENSE.txt.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */

/*
 * Copyright (c) 2005, 2011, Oracle and/or its affiliates. All rights reserved.
 */
1117N/Apackage org.opensolaris.opengrok.analysis.plain;
1117N/A
1117N/Aimport java.io.IOException;
1117N/Aimport java.io.Reader;
1117N/Aimport java.io.StringReader;
1117N/Aimport java.io.Writer;
1117N/Aimport java.util.Arrays;
1117N/Aimport org.apache.lucene.analysis.TokenStream;
1117N/Aimport org.apache.lucene.document.Document;
1117N/Aimport org.apache.lucene.document.Field;
1247N/Aimport org.opensolaris.opengrok.analysis.Definitions;
1117N/Aimport org.opensolaris.opengrok.analysis.ExpandTabsReader;
1117N/Aimport org.opensolaris.opengrok.analysis.FileAnalyzerFactory;
1117N/Aimport org.opensolaris.opengrok.analysis.Hash2TokenStream;
1117N/Aimport org.opensolaris.opengrok.analysis.TextAnalyzer;
1466N/Aimport org.opensolaris.opengrok.configuration.Project;
1117N/Aimport org.opensolaris.opengrok.history.Annotation;
1117N/A
/**
 * Analyzer for plain text files.
 * Created on September 21, 2005
 *
 * @author Chandan
 */
public class PlainAnalyzer extends TextAnalyzer {

    /** Initial capacity, in chars, of the {@link #content} buffer. */
    private static final int INITIAL_BUFFER_SIZE = 64 * 1024;

    /**
     * Placeholder reader handed to the tokenizers and to the Lucene fields.
     * The text that is actually tokenized comes from {@link #content}, which
     * is pushed into the tokenizers via {@code reInit} in
     * {@link #tokenStream(String, Reader)}.
     */
    private static final Reader dummy = new StringReader(" ");

    /** Characters of the file read by the last {@link #analyze} call. */
    protected char[] content;

    /** Number of valid chars in {@link #content}. */
    protected int len;

    /**
     * Definitions obtained from ctags during the last {@link #analyze} call,
     * or {@code null} if none were obtained for that file.
     */
    protected Definitions defs;

    private final PlainFullTokenizer plainfull;
    private final PlainSymbolTokenizer plainref;
    private final PlainXref xref;

    /**
     * Creates a new instance of PlainAnalyzer.
     *
     * @param factory the factory passed on to the superclass constructor
     */
    protected PlainAnalyzer(FileAnalyzerFactory factory) {
        super(factory);
        content = new char[INITIAL_BUFFER_SIZE];
        len = 0;
        plainfull = new PlainFullTokenizer(dummy);
        plainref = new PlainSymbolTokenizer(dummy);
        xref = new PlainXref((Reader) null);
    }

    /**
     * Reads the whole input into {@link #content} and registers the fields
     * to index on the document.
     * <p>
     * A {@code "full"} field is always added. If the document carries a
     * {@code "fullpath"} value and ctags is available, ctags is run on that
     * path; when it yields at least one symbol, {@code "defs"},
     * {@code "refs"} and the serialized {@code "tags"} fields are added too.
     *
     * @param doc the document to add the fields to
     * @param in the source to read the file content from
     * @throws IOException if reading the input or running ctags fails
     */
    @Override
    public void analyze(Document doc, Reader in) throws IOException {
        // The analyzer instance is reused for several files. Drop the
        // definitions of the previous file up front so that stale symbols
        // are never visible when this file yields no definitions.
        defs = null;

        Reader inReader = ExpandTabsReader.wrap(in, project);
        len = 0;
        int rbytes;
        while ((rbytes = inReader.read(content, len, content.length - len)) >= 0) {
            len += rbytes;
            if (len == content.length) {
                // Buffer is full: double it so that the next read always has
                // room (a zero-length read request would never report EOF).
                content = Arrays.copyOf(content, content.length * 2);
            }
        }

        doc.add(new Field("full", dummy));

        String fullpath = doc.get("fullpath");
        if (fullpath != null && ctags != null) {
            defs = ctags.doCtags(fullpath + "\n");
            if (defs != null && defs.numberOfSymbols() > 0) {
                doc.add(new Field("defs", dummy));
                doc.add(new Field("refs", dummy)); //@FIXME adding a refs field only if it has defs?
                byte[] tags = defs.serialize();
                doc.add(new Field("tags", tags));
            }
        }
    }

    /**
     * Returns the token stream for the given field, backed by the content
     * buffered by the last {@link #analyze} call.
     *
     * @param fieldName name of the field being indexed
     * @param reader reader supplied by the caller; only used when the request
     *               is delegated to the superclass
     * @return the tokenizer for {@code "full"} or {@code "refs"}, a stream
     *         over the definition symbols for {@code "defs"}, otherwise
     *         whatever the superclass returns
     */
    @Override
    public TokenStream tokenStream(String fieldName, Reader reader) {
        if ("full".equals(fieldName)) {
            plainfull.reInit(content, len);
            return plainfull;
        }
        if ("refs".equals(fieldName)) {
            plainref.reInit(content, len);
            return plainref;
        }
        // Guard against a missing Definitions object instead of failing with
        // a NullPointerException; the superclass handles the field then.
        if ("defs".equals(fieldName) && defs != null) {
            return new Hash2TokenStream(defs.getSymbols());
        }
        return super.tokenStream(fieldName, reader);
    }

    /**
     * Write a cross referenced HTML file from the content buffered by the
     * last {@link #analyze} call.
     *
     * @param out Writer to write HTML cross-reference
     * @throws IOException if writing the cross-reference fails
     */
    @Override
    public void writeXref(Writer out) throws IOException {
        // NOTE(review): unlike the static writeXref below, the definitions
        // are not handed to the xref here - confirm whether that is intended.
        xref.reInit(content, len);
        xref.project = project;
        xref.write(out);
    }

    /**
     * Write a cross referenced HTML file, reading the source from
     * {@code in}.
     *
     * @param in Input source
     * @param out Output xref writer
     * @param defs definitions for the file (could be null)
     * @param annotation annotation for the file (could be null)
     * @param project project assigned to the xref writer
     * @throws IOException if writing the cross-reference fails
     */
    static void writeXref(Reader in, Writer out, Definitions defs, Annotation annotation, Project project) throws IOException {
        PlainXref xref = new PlainXref(in);
        xref.annotation = annotation;
        xref.project = project;
        xref.setDefs(defs);
        xref.write(out);
    }
}