/*
* CDDL HEADER START
*
* The contents of this file are subject to the terms of the
* Common Development and Distribution License (the "License").
* You may not use this file except in compliance with the License.
*
* See LICENSE.txt included in this distribution for the specific
* language governing permissions and limitations under the License.
*
* When distributing Covered Code, include this CDDL HEADER in each
* file and include the License file at LICENSE.txt.
* If applicable, add the following below this CDDL HEADER, with the
* fields enclosed by brackets "[]" replaced with your own identifying
* information: Portions Copyright [yyyy] [name of copyright owner]
*
* CDDL HEADER END
*/
/*
* Copyright (c) 2005, 2012, Oracle and/or its affiliates. All rights reserved.
*/
package org.opensolaris.opengrok.analysis.archive;
import java.io.IOException;
import java.io.InputStream;
import java.io.Reader;
import java.io.Writer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import org.apache.lucene.document.TextField;
import org.apache.tools.tar.TarEntry;
import org.apache.tools.tar.TarInputStream;
import org.opensolaris.opengrok.analysis.AnalyzerGuru;
import org.opensolaris.opengrok.analysis.FileAnalyzer;
import org.opensolaris.opengrok.analysis.FileAnalyzerFactory;
import org.opensolaris.opengrok.analysis.plain.PlainFullTokenizer;
import org.opensolaris.opengrok.web.Util;
/**
* Analyzes TAR files Created on September 22, 2005
*
* @author Chandan
*/
public class TarAnalyzer extends FileAnalyzer {
private final StringBuilder content;
private PlainFullTokenizer plainfull;
TokenStreamComponents tsc_pf;
protected TarAnalyzer(FileAnalyzerFactory factory) {
super(factory);
content = new StringBuilder(64 * 1024);
}
@Override
public void analyze(Document doc, InputStream in) throws IOException {
content.setLength(0);
TarInputStream zis = new TarInputStream(in);
TarEntry entry;
while ((entry = zis.getNextEntry()) != null) {
content.append(entry.getName()).append('\n');
}
content.trimToSize();
doc.add(new Field("full", AnalyzerGuru.dummyS, TextField.TYPE_STORED));
}
@Override
public TokenStreamComponents createComponents(String fieldName, Reader reader) {
if ("full".equals(fieldName)) {
plainfull = new PlainFullTokenizer(reader);
plainfull.reInit(content.toString());
tsc_pf = new TokenStreamComponents(plainfull) {
@Override
protected void setReader(final Reader reader) throws IOException {
plainfull.reInit(content.toString());
super.setReader(reader);
}
};
return tsc_pf;
}
return super.createComponents(fieldName, reader);
}
/**
* Write a cross referenced HTML file.
*
* @param out Writer to store HTML cross-reference
*/
@Override
public void writeXref(Writer out) throws IOException {
out.write(Util.htmlize(content));
}
}