/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.lucene.search.spans;


import java.io.IOException;
import java.util.Objects;

import org.apache.lucene.search.TwoPhaseIterator;

A Spans implementation wrapping another spans instance, allowing to filter spans matches easily by implementing accept
/** * A {@link Spans} implementation wrapping another spans instance, * allowing to filter spans matches easily by implementing {@link #accept} */
public abstract class FilterSpans extends Spans {
The wrapped spans instance.
/** The wrapped spans instance. */
protected final Spans in; private boolean atFirstInCurrentDoc = false; private int startPos = -1;
Wrap the given Spans.
/** Wrap the given {@link Spans}. */
protected FilterSpans(Spans in) { this.in = Objects.requireNonNull(in); }
Returns YES if the candidate should be an accepted match, NO if it should not, and NO_MORE_IN_CURRENT_DOC if iteration should move on to the next document.
/** * Returns YES if the candidate should be an accepted match, * NO if it should not, and NO_MORE_IN_CURRENT_DOC if iteration * should move on to the next document. */
protected abstract AcceptStatus accept(Spans candidate) throws IOException; @Override public final int nextDoc() throws IOException { while (true) { int doc = in.nextDoc(); if (doc == NO_MORE_DOCS) { return NO_MORE_DOCS; } else if (twoPhaseCurrentDocMatches()) { return doc; } } } @Override public final int advance(int target) throws IOException { int doc = in.advance(target); while (doc != NO_MORE_DOCS) { if (twoPhaseCurrentDocMatches()) { break; } doc = in.nextDoc(); } return doc; } @Override public final int docID() { return in.docID(); } @Override public final int nextStartPosition() throws IOException { if (atFirstInCurrentDoc) { atFirstInCurrentDoc = false; return startPos; } for (;;) { startPos = in.nextStartPosition(); if (startPos == NO_MORE_POSITIONS) { return NO_MORE_POSITIONS; } switch(accept(in)) { case YES: return startPos; case NO: break; case NO_MORE_IN_CURRENT_DOC: return startPos = NO_MORE_POSITIONS; // startPos ahead for the current doc. } } } @Override public final int startPosition() { return atFirstInCurrentDoc ? -1 : startPos; } @Override public final int endPosition() { return atFirstInCurrentDoc ? -1 : (startPos != NO_MORE_POSITIONS) ? in.endPosition() : NO_MORE_POSITIONS; } @Override public int width() { return in.width(); } @Override public void collect(SpanCollector collector) throws IOException { in.collect(collector); } @Override public final long cost() { return in.cost(); } @Override public String toString() { return "Filter(" + in.toString() + ")"; } @Override public final TwoPhaseIterator asTwoPhaseIterator() { TwoPhaseIterator inner = in.asTwoPhaseIterator(); if (inner != null) { // wrapped instance has an approximation return new TwoPhaseIterator(inner.approximation()) { @Override public boolean matches() throws IOException { return inner.matches() && twoPhaseCurrentDocMatches(); } @Override public float matchCost() { return inner.matchCost(); // underestimate } @Override public String toString() { return "FilterSpans@asTwoPhaseIterator(inner=" + inner + ", in=" + in + ")"; } }; } else { // wrapped instance has no approximation, but // we can still defer matching until absolutely needed. return new TwoPhaseIterator(in) { @Override public boolean matches() throws IOException { return twoPhaseCurrentDocMatches(); } @Override public float matchCost() { return in.positionsCost(); // overestimate } @Override public String toString() { return "FilterSpans@asTwoPhaseIterator(in=" + in + ")"; } }; } } @Override public float positionsCost() { throw new UnsupportedOperationException(); // asTwoPhaseIterator never returns null }
Returns true if the current document matches.

This is called during two-phase processing.

/** * Returns true if the current document matches. * <p> * This is called during two-phase processing. */
// return true if the current document matches @SuppressWarnings("fallthrough") private final boolean twoPhaseCurrentDocMatches() throws IOException { atFirstInCurrentDoc = false; startPos = in.nextStartPosition(); assert startPos != NO_MORE_POSITIONS; for (;;) { switch(accept(in)) { case YES: atFirstInCurrentDoc = true; return true; case NO: startPos = in.nextStartPosition(); if (startPos != NO_MORE_POSITIONS) { break; } // else fallthrough case NO_MORE_IN_CURRENT_DOC: startPos = -1; return false; } } }
Status returned from FilterSpans.accept(Spans) that indicates whether a candidate match should be accepted, rejected, or rejected and move on to the next document.
/** * Status returned from {@link FilterSpans#accept(Spans)} that indicates * whether a candidate match should be accepted, rejected, or rejected * and move on to the next document. */
public static enum AcceptStatus {
Indicates the match should be accepted
/** Indicates the match should be accepted */
YES,
Indicates the match should be rejected
/** Indicates the match should be rejected */
NO,
Indicates the match should be rejected, and the enumeration may continue with the next document.
/** * Indicates the match should be rejected, and the enumeration may continue * with the next document. */
NO_MORE_IN_CURRENT_DOC }; }