/* * CDDL HEADER START * * The contents of this file are subject to the terms of the * Common Development and Distribution License (the "License"). * You may not use this file except in compliance with the License. * * See LICENSE.txt included in this distribution for the specific * language governing permissions and limitations under the License. * * When distributing Covered Code, include this CDDL HEADER in each * file and include the License file at LICENSE.txt. * If applicable, add the following below this CDDL HEADER, with the * fields enclosed by brackets "[]" replaced with your own identifying * information: Portions Copyright [yyyy] [name of copyright owner] * * CDDL HEADER END */ /* * Copyright (c) 2005, 2012, Oracle and/or its affiliates. All rights reserved. */ package org.opensolaris.opengrok.analysis; import java.util.Iterator; import java.util.List; import org.apache.lucene.analysis.TokenStream; import org.apache.lucene.analysis.tokenattributes.CharTermAttribute; public final class List2TokenStream extends TokenStream { private Iterator it; private String[] subTokens; private int si; private final CharTermAttribute termAtt = addAttribute(CharTermAttribute.class); public List2TokenStream(List l) { it = l.iterator(); } @Override public final boolean incrementToken() { if (!it.hasNext()) { // reached end of stream return false; } if (subTokens == null || subTokens.length == si) { String tok = it.next(); if (tok == null) { return false; } if (tok.indexOf('.') > 0) { subTokens = tok.split("[^a-z0-9A-Z_]+"); } else { subTokens = null; termAtt.setEmpty(); termAtt.append(tok); return true; } si = 0; } if (si < subTokens.length) { termAtt.setEmpty(); termAtt.append(subTokens[si++]); return true; } return false; } @Override public void close() { it = null; } }