// PlainAnalyzer.java revision c23e82b612acd5e947c164114377578116f6d298
/*
* CDDL HEADER START
*
* The contents of this file are subject to the terms of the
* Common Development and Distribution License (the "License").
* You may not use this file except in compliance with the License.
*
* See LICENSE.txt included in this distribution for the specific
* language governing permissions and limitations under the License.
*
* When distributing Covered Code, include this CDDL HEADER in each
* file and include the License file at LICENSE.txt.
* If applicable, add the following below this CDDL HEADER, with the
* fields enclosed by brackets "[]" replaced with your own identifying
* information: Portions Copyright [yyyy] [name of copyright owner]
*
* CDDL HEADER END
*/
/*
* Copyright 2005 Sun Microsystems, Inc. All rights reserved.
* Use is subject to license terms.
*/
/*
* ident "%Z%%M% %I% %E% SMI"
*/
package org.opensolaris.opengrok.analysis.plain;
import org.apache.lucene.document.*;
import org.apache.lucene.analysis.*;
import java.io.*;
import org.opensolaris.opengrok.analysis.*;
import java.util.*;
import java.util.prefs.*;
/**
 * Analyzer for plain text files.
 *
 * <p>{@link #analyze(Document, InputStream)} reads the whole input into the
 * shared {@link #content} buffer and registers placeholder fields on the
 * document; the real token streams for those fields are produced later by
 * {@link #tokenStream(String, Reader)} from the buffered characters.
 *
 * <p>Note that {@link #content} is a static buffer that is re-allocated by
 * every constructor call and replaced whenever it has to grow, so it is shared
 * by all instances of this class.
 *
 * Created on September 21, 2005
 *
 * @author Chandan
 */
public class PlainAnalyzer extends FileAnalyzer {
    /** Character buffer holding the most recently analyzed file; only the first {@link #len} chars are valid. */
    public static char[] content;
    /** Number of valid characters in {@link #content}. */
    public int len;
    /** Not used within this class. */
    int flen;
    /** Tokenizer returned for the "full" field. */
    PlainFullTokenizer plainfull;
    /** Tokenizer returned for the "refs" field. */
    PlainSymbolTokenizer plainref;
    /** Cross-reference writer used by {@link #writeXref(Writer)}. */
    PlainXref xref;
    /**
     * Placeholder reader handed to the tokenizers and to the reader-valued
     * document fields; {@link #tokenStream(String, Reader)} does not read from
     * it for the "full", "refs" and "defs" fields.
     */
    private static final Reader dummy = new StringReader(" ");
    /** Ctags runner, or {@code null} when ctags is not configured or could not be started. */
    Ctags ctags;
    /** Result of the ctags run for the most recently analyzed file, or {@code null} if there is none. */
    public HashMap<String, HashMap<Integer, String>> defs;
    public static String contentType = "text/plain";

    /**
     * @return the content type of files handled by this analyzer, always {@code "text/plain"}
     */
    public static String getContentType() {
        return "text/plain";
    }

    /**
     * Decides from a sample of bytes whether the data looks like plain text.
     *
     * @param content bytes to inspect
     * @return {@code PlainAnalyzer.class} if every byte is a tab (9), line
     *         feed (10), carriage return (13) or in the range 32..126
     *         (this includes an empty array); {@code null} otherwise
     */
    public static Class isMagic(byte[] content) {
        for (byte b : content) {
            boolean plainTextByte = b == 9 || b == 10 || b == 13 || (b >= 32 && b < 127);
            if (!plainTextByte) {
                return null;
            }
        }
        return PlainAnalyzer.class;
    }

    public static Genre g = Genre.PLAIN;

    /**
     * @return the genre of this analyzer, i.e. the current value of {@link #g}
     */
    public Genre getGenre() {
        return g;
    }

    /**
     * Creates a new instance of PlainAnalyzer.
     *
     * <p>Allocates a fresh 64K-char shared {@link #content} buffer and, if the
     * system property {@code ctags} is set, tries to start ctags from that
     * path. A warning is printed to standard error when ctags is unavailable.
     */
    public PlainAnalyzer() {
        super();
        content = new char[64 * 1024];
        len = 0;
        plainfull = new PlainFullTokenizer(dummy);
        plainref = new PlainSymbolTokenizer(dummy);
        xref = new PlainXref((Reader) null);
        // The path to the ctags binary is passed in through a system property.
        String ctagsPath = System.getProperty("ctags");
        if (ctagsPath != null) {
            try {
                ctags = new Ctags(ctagsPath);
            } catch (IOException e) {
                // Keep going without ctags, but say why it could not be started.
                System.err.println("WARNING: could not start ctags (" + ctagsPath + "): " + e);
            }
        }
        if (ctags == null) {
            System.err.println("WARNING: unable to run ctags! searching definitions will not work!");
        }
    }

    /**
     * Reads the whole input into {@link #content} and adds the index fields
     * for it to the document.
     *
     * <p>A "full" field is always added once the input has been read. If the
     * document has a "fullpath" value and ctags is available, ctags is run on
     * that path; when it yields definitions, "defs", "refs" and "tags" fields
     * are added as well. I/O failures are reported on standard error and
     * leave the document without the corresponding fields.
     *
     * @param doc document to add the fields to
     * @param in  stream to read the file content from (decoded with the platform default charset)
     */
    public void analyze(Document doc, InputStream in) {
        // Forget the definitions of the previously analyzed file so that a
        // failure below cannot leave stale data visible through this field.
        defs = null;
        len = 0;
        try {
            InputStreamReader inReader = new InputStreamReader(in);
            while (true) {
                int rchars = inReader.read(content, len, content.length - len);
                if (rchars <= 0) {
                    break;
                }
                if (rchars == content.length - len) {
                    // The buffer is now completely full: double it before the next read.
                    char[] grown = new char[content.length * 2];
                    System.arraycopy(content, 0, grown, 0, content.length);
                    content = grown;
                }
                len += rchars;
            }
        } catch (IOException e) {
            System.err.println("ERROR: reading plain text content failed: " + e);
            return;
        }
        doc.add(Field.Text("full", dummy));
        try {
            String fullpath;
            if ((fullpath = doc.get("fullpath")) != null && ctags != null) {
                defs = ctags.doCtags(fullpath + "\n");
                if (defs != null && !defs.isEmpty()) {
                    doc.add(Field.Text("defs", dummy));
                    doc.add(Field.Text("refs", dummy)); //XXX adding a refs field only if it has defs?
                    doc.add(new Field("tags", ctags.tagString(), true, false, false));
                }
            }
        } catch (IOException e) {
            System.err.println("ERROR: running ctags failed, definitions will be missing: " + e);
        }
    }

    /**
     * Returns the token stream for a field of the most recently analyzed file.
     *
     * @param fieldName name of the field being tokenized
     * @param reader    reader supplied by the caller; only used when the
     *                  field is delegated to the superclass
     * @return a tokenizer over the buffered content for "full" and "refs", a
     *         stream over {@link #defs} for "defs", otherwise whatever the
     *         superclass returns
     */
    public TokenStream tokenStream(String fieldName, Reader reader) {
        if ("full".equals(fieldName)) {
            plainfull.reInit(content, len);
            return plainfull;
        }
        if ("refs".equals(fieldName)) {
            plainref.reInit(content, len);
            return plainref;
        }
        if ("defs".equals(fieldName)) {
            return new Hash2TokenStream(defs);
        }
        return super.tokenStream(fieldName, reader);
    }

    /**
     * Write a cross referenced HTML file from the buffered content.
     *
     * @param out Writer to write HTML cross-reference
     * @throws IOException if thrown while writing the cross-reference
     */
    public void writeXref(Writer out) throws IOException {
        xref.reInit(content, len);
        xref.write(out);
    }

    /**
     * Write a cross referenced HTML file, reading the source from {@code in}.
     *
     * @param in  Input source
     * @param out Output xref writer
     * @throws IOException if thrown while reading the source or writing the cross-reference
     */
    public static void writeXref(InputStream in, Writer out) throws IOException {
        PlainXref streamXref = new PlainXref(in);
        streamXref.write(out);
    }
}