Hash2TokenStream.java revision 0
/*
* CDDL HEADER START
*
* The contents of this file are subject to the terms of the
* Common Development and Distribution License (the "License").
* You may not use this file except in compliance with the License.
*
* See LICENSE.txt included in this distribution for the specific
* language governing permissions and limitations under the License.
*
* When distributing Covered Code, include this CDDL HEADER in each
* file and include the License file at LICENSE.txt.
* If applicable, add the following below this CDDL HEADER, with the
* fields enclosed by brackets "[]" replaced with your own identifying
* information: Portions Copyright [yyyy] [name of copyright owner]
*
* CDDL HEADER END
*/
/*
* Copyright 2005 Sun Microsystems, Inc. All rights reserved.
* Use is subject to license terms.
*/
/*
* ident "%Z%%M% %I% %E% SMI"
*/
package org.opensolaris.opengrok.analysis;
import java.util.*;
import java.util.regex.Pattern;
import org.apache.lucene.analysis.Token;
import org.apache.lucene.analysis.TokenStream;
public final class Hash2TokenStream extends TokenStream {
int i=0;
String term;
String terms[];
Iterator<String> keys;
public Hash2TokenStream(HashMap<String, HashMap<Integer, String>> h){
keys = h.keySet().iterator();
}
public Token next() {
while(true) {
if (i <= 0) {
if (keys.hasNext()) {
term = keys.next();
terms = term.split("[^a-zA-Z_0-9]+");
i = terms.length;
if (i > 0) {
//repeat = h.get(term).size();
//System.out.println("Returning " + term + h.get(term));
return new Token(terms[--i], 0, 0);
} else {
//System.err.println(" ERRROR term " + term);
//return null;
}
} else {
return null;
}
} else {
//System.out.println("Returning " + term + h.get(term));
return new Token(terms[--i], 0, 0);
}
}
}
public void close() {
}
}