MtasSpanFullyAlignedWithSpans.java.html 15.6 KB
<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml" lang="en"><head><meta http-equiv="Content-Type" content="text/html;charset=UTF-8"/><link rel="stylesheet" href="../jacoco-resources/report.css" type="text/css"/><link rel="shortcut icon" href="../jacoco-resources/report.gif" type="image/gif"/><title>MtasSpanFullyAlignedWithSpans.java</title><link rel="stylesheet" href="../jacoco-resources/prettify.css" type="text/css"/><script type="text/javascript" src="../jacoco-resources/prettify.js"></script></head><body onload="window['PR_TAB_WIDTH']=4;prettyPrint()"><div class="breadcrumb" id="breadcrumb"><span class="info"><a href="../jacoco-sessions.html" class="el_session">Sessions</a></span><a href="../index.html" class="el_report">MTAS</a> &gt; <a href="index.source.html" class="el_package">mtas.search.spans</a> &gt; <span class="el_source">MtasSpanFullyAlignedWithSpans.java</span></div><h1>MtasSpanFullyAlignedWithSpans.java</h1><pre class="source lang-java linenums">package mtas.search.spans;

import java.io.IOException;
import java.util.HashSet;
import org.apache.lucene.search.spans.SpanCollector;
import org.apache.lucene.search.spans.Spans;

import mtas.search.spans.MtasSpanFullyAlignedWithQuery.MtasSpanFullyAlignedWithQuerySpans;
import mtas.search.spans.util.MtasSpans;

/**
 * The Class MtasSpanFullyAlignedWithSpans.
 */
public class MtasSpanFullyAlignedWithSpans extends Spans implements MtasSpans {

  /** The spans 1. */
  private MtasSpanFullyAlignedWithQuerySpans spans1;

  /** The spans 2. */
  private MtasSpanFullyAlignedWithQuerySpans spans2;

  /** The last spans 2 start position. */
  private int lastSpans2StartPosition;

  /** The last spans 2 end position. */
  private int lastSpans2EndPosition;

  /** The previous spans 2 start position. */
  private int previousSpans2StartPosition;

  /** The previous spans 2 end positions. */
  private HashSet&lt;Integer&gt; previousSpans2EndPositions;

  /** The called next start position. */
  private boolean calledNextStartPosition;

  /** The no more positions. */
  private boolean noMorePositions;
  private boolean noMorePositionsSpan2;

  /** The doc id. */
  private int docId;

  /**
   * Instantiates a new mtas span fully aligned with spans.
   *
   * @param mtasSpanFullyAlignedWithQuery
   *          the mtas span fully aligned with query
   * @param spans1
   *          the spans 1
   * @param spans2
   *          the spans 2
   */
  public MtasSpanFullyAlignedWithSpans(
      MtasSpanFullyAlignedWithQuerySpans spans1,
      MtasSpanFullyAlignedWithQuerySpans spans2) {
<span class="fc" id="L57">    super();</span>
<span class="fc" id="L58">    docId = -1;</span>
<span class="fc" id="L59">    this.spans1 = spans1;</span>
<span class="fc" id="L60">    this.spans2 = spans2;</span>
<span class="fc" id="L61">    previousSpans2EndPositions = new HashSet&lt;&gt;();</span>
<span class="fc" id="L62">  }</span>

  /*
   * (non-Javadoc)
   * 
   * @see org.apache.lucene.search.spans.Spans#nextStartPosition()
   */
  @Override
  public int nextStartPosition() throws IOException {
    // no document
<span class="pc bpc" id="L72" title="2 of 4 branches missed.">    if (docId == -1 || docId == NO_MORE_DOCS) {</span>
<span class="nc" id="L73">      throw new IOException(&quot;no document&quot;);</span>
      // finished
<span class="pc bpc" id="L75" title="1 of 2 branches missed.">    } else if (noMorePositions) {</span>
<span class="nc" id="L76">      return NO_MORE_POSITIONS;</span>
      // littleSpans already at start match, because of check for matching
      // document
<span class="fc bfc" id="L79" title="All 2 branches covered.">    } else if (!calledNextStartPosition) {</span>
<span class="fc" id="L80">      calledNextStartPosition = true;</span>
<span class="fc" id="L81">      return spans1.spans.startPosition();</span>
      // compute next match
    } else {
<span class="fc bfc" id="L84" title="All 2 branches covered.">      if (goToNextStartPosition()) {</span>
        // match found
<span class="fc" id="L86">        return spans1.spans.startPosition();</span>
      } else {
        // no more matches: document finished
<span class="fc" id="L89">        return NO_MORE_POSITIONS;</span>
      }
    }
  }

  /*
   * (non-Javadoc)
   * 
   * @see org.apache.lucene.search.spans.Spans#startPosition()
   */
  @Override
  public int startPosition() {
<span class="pc bpc" id="L101" title="1 of 2 branches missed.">    if(calledNextStartPosition) {</span>
<span class="pc bpc" id="L102" title="1 of 2 branches missed.">      if(noMorePositions) {</span>
<span class="nc" id="L103">        return NO_MORE_POSITIONS;</span>
      } else {
<span class="fc" id="L105">        return spans1.spans.startPosition();</span>
      }
    } else {
<span class="nc" id="L108">      return -1;</span>
    }
  }

  /*
   * (non-Javadoc)
   * 
   * @see org.apache.lucene.search.spans.Spans#endPosition()
   */
  @Override
  public int endPosition() {
<span class="pc bpc" id="L119" title="1 of 2 branches missed.">    if(calledNextStartPosition) {</span>
<span class="pc bpc" id="L120" title="1 of 2 branches missed.">      if(noMorePositions) {</span>
<span class="nc" id="L121">        return NO_MORE_POSITIONS;</span>
      } else { 
<span class="fc" id="L123">        return spans1.spans.endPosition();</span>
      }
    } else {
<span class="nc" id="L126">      return -1;</span>
    }    
  }

  /*
   * (non-Javadoc)
   * 
   * @see org.apache.lucene.search.spans.Spans#width()
   */
  @Override
  public int width() {
<span class="nc bnc" id="L137" title="All 2 branches missed.">    if(calledNextStartPosition) {</span>
<span class="nc bnc" id="L138" title="All 2 branches missed.">      if(noMorePositions) {</span>
<span class="nc" id="L139">        return 0;</span>
      } else {
<span class="nc" id="L141">        return spans1.spans.endPosition() - spans1.spans.startPosition();</span>
      }
    } else {
<span class="nc" id="L144">      return 0;</span>
    }    
  }

  /*
   * (non-Javadoc)
   * 
   * @see
   * org.apache.lucene.search.spans.Spans#collect(org.apache.lucene.search.spans
   * .SpanCollector)
   */
  @Override
  public void collect(SpanCollector collector) throws IOException {
<span class="nc" id="L157">    spans1.spans.collect(collector);</span>
<span class="nc" id="L158">    spans2.spans.collect(collector);</span>
<span class="nc" id="L159">  }</span>

  /*
   * (non-Javadoc)
   * 
   * @see org.apache.lucene.search.spans.Spans#positionsCost()
   */
  @Override
  public float positionsCost() {
<span class="nc" id="L168">    return 0;</span>
  }

  /*
   * (non-Javadoc)
   * 
   * @see org.apache.lucene.search.DocIdSetIterator#docID()
   */
  @Override
  public int docID() {
<span class="fc" id="L178">    return docId;</span>
  }

  /*
   * (non-Javadoc)
   * 
   * @see org.apache.lucene.search.DocIdSetIterator#nextDoc()
   */
  @Override
  public int nextDoc() throws IOException {
<span class="fc" id="L188">    reset();</span>
<span class="pc bpc" id="L189" title="1 of 2 branches missed.">    while (!goToNextDoc())</span>
<span class="nc" id="L190">      ;</span>
<span class="fc" id="L191">    return docId;</span>
  }

  /*
   * (non-Javadoc)
   * 
   * @see org.apache.lucene.search.DocIdSetIterator#advance(int)
   */
  @Override
  public int advance(int target) throws IOException {
<span class="nc" id="L201">    reset();</span>
<span class="nc bnc" id="L202" title="All 2 branches missed.">    if (docId == NO_MORE_DOCS) {</span>
<span class="nc" id="L203">      return docId;</span>
<span class="nc bnc" id="L204" title="All 2 branches missed.">    } else if (target &lt; docId) {</span>
      // should not happen
<span class="nc" id="L206">      docId = NO_MORE_DOCS;</span>
<span class="nc" id="L207">      return docId;</span>
    } else {
      // advance 1
<span class="nc" id="L210">      int spans1DocId = spans1.spans.docID();</span>
<span class="nc" id="L211">      int newTarget = target;</span>
<span class="nc bnc" id="L212" title="All 2 branches missed.">      if (spans1DocId &lt; newTarget) {</span>
<span class="nc" id="L213">        spans1DocId = spans1.spans.advance(target);</span>
<span class="nc bnc" id="L214" title="All 2 branches missed.">        if (spans1DocId == NO_MORE_DOCS) {</span>
<span class="nc" id="L215">          docId = NO_MORE_DOCS;</span>
<span class="nc" id="L216">          return docId;</span>
        }
<span class="nc" id="L218">        newTarget = Math.max(newTarget, spans1DocId);</span>
      }
<span class="nc" id="L220">      int spans2DocId = spans2.spans.docID();</span>
      // advance 2
<span class="nc bnc" id="L222" title="All 2 branches missed.">      if (spans2DocId &lt; newTarget) {</span>
<span class="nc" id="L223">        spans2DocId = spans2.spans.advance(newTarget);</span>
<span class="nc bnc" id="L224" title="All 2 branches missed.">        if (spans2DocId == NO_MORE_DOCS) {</span>
<span class="nc" id="L225">          docId = NO_MORE_DOCS;</span>
<span class="nc" id="L226">          return docId;</span>
        }
      }
      // check equal docId, otherwise next
<span class="nc bnc" id="L230" title="All 2 branches missed.">      if (spans1DocId == spans2DocId) {</span>
<span class="nc" id="L231">        docId = spans1DocId;</span>
        // check match
<span class="nc bnc" id="L233" title="All 2 branches missed.">        if (goToNextStartPosition()) {</span>
<span class="nc" id="L234">          return docId;</span>
        } else {
<span class="nc" id="L236">          return nextDoc();</span>
        }
      } else {
<span class="nc" id="L239">        return nextDoc();</span>
      }
    }
  }

  /**
   * Go to next doc.
   *
   * @return true, if successful
   * @throws IOException
   *           Signals that an I/O exception has occurred.
   */
  private boolean goToNextDoc() throws IOException {
<span class="pc bpc" id="L252" title="1 of 2 branches missed.">    if (docId == NO_MORE_DOCS) {</span>
<span class="nc" id="L253">      return true;</span>
    } else {
<span class="fc" id="L255">      int spans1DocId = spans1.spans.nextDoc();</span>
<span class="fc" id="L256">      int spans2DocId = spans2.spans.docID();</span>
<span class="fc" id="L257">      docId = Math.max(spans1DocId, spans2DocId);</span>
<span class="fc bfc" id="L258" title="All 4 branches covered.">      while (spans1DocId != spans2DocId &amp;&amp; docId != NO_MORE_DOCS) {</span>
<span class="pc bpc" id="L259" title="1 of 2 branches missed.">        if (spans1DocId &lt; spans2DocId) {</span>
<span class="nc" id="L260">          spans1DocId = spans1.spans.advance(spans2DocId);</span>
<span class="nc" id="L261">          docId = spans1DocId;</span>
        } else {
<span class="fc" id="L263">          spans2DocId = spans2.spans.advance(spans1DocId);</span>
<span class="fc" id="L264">          docId = spans2DocId;</span>
        }
      }
<span class="pc bpc" id="L267" title="1 of 4 branches missed.">      if (docId != NO_MORE_DOCS &amp;&amp; !goToNextStartPosition()) {</span>
<span class="nc" id="L268">        reset();</span>
<span class="nc" id="L269">        return false;</span>
      }
<span class="fc" id="L271">      return true;</span>
    }
  }

  /**
   * Go to next start position.
   *
   * @return true, if successful
   * @throws IOException
   *           Signals that an I/O exception has occurred.
   */
  private boolean goToNextStartPosition() throws IOException {
    int nextSpans1StartPosition;
    int nextSpans1EndPosition;
    int nextSpans2StartPosition;
    int nextSpans2EndPosition;
    // loop over span1
<span class="fc" id="L288">    while ((nextSpans1StartPosition = spans1.spans</span>
<span class="fc bfc" id="L289" title="All 2 branches covered.">        .nextStartPosition()) != NO_MORE_POSITIONS) {</span>
<span class="fc" id="L290">      nextSpans1EndPosition = spans1.spans.endPosition();</span>
<span class="fc bfc" id="L291" title="All 4 branches covered.">      if (noMorePositionsSpan2</span>
          &amp;&amp; nextSpans1StartPosition &gt; lastSpans2StartPosition) {
<span class="fc" id="L293">        noMorePositions = true;</span>
<span class="fc" id="L294">        return false;</span>
        // check if start/en span1 matches start/end span2 from last or previous
<span class="fc bfc" id="L296" title="All 6 branches covered.">      } else if ((nextSpans1StartPosition == lastSpans2StartPosition</span>
          &amp;&amp; nextSpans1EndPosition == lastSpans2EndPosition)
          || (nextSpans1StartPosition == previousSpans2StartPosition
<span class="fc bfc" id="L299" title="All 2 branches covered.">              &amp;&amp; previousSpans2EndPositions.contains(nextSpans1EndPosition))) {</span>
<span class="fc" id="L300">        return true;</span>
      } else {
        // try to find matching span2
<span class="fc bfc" id="L303" title="All 4 branches covered.">        while (!noMorePositionsSpan2</span>
            &amp;&amp; nextSpans1StartPosition &gt;= lastSpans2StartPosition) {
          // get new span2
<span class="fc" id="L306">          nextSpans2StartPosition = spans2.spans.nextStartPosition();</span>
          // check for finished span2
<span class="fc bfc" id="L308" title="All 2 branches covered.">          if (nextSpans2StartPosition == NO_MORE_POSITIONS) {</span>
<span class="fc" id="L309">            noMorePositionsSpan2 = true;</span>
          } else {
            // get end for new span2
<span class="fc" id="L312">            nextSpans2EndPosition = spans2.spans.endPosition();</span>
            // check for registering last span2 as previous
<span class="fc bfc" id="L314" title="All 2 branches covered.">            if (nextSpans1StartPosition &lt;= lastSpans2StartPosition) {</span>
<span class="pc bpc" id="L315" title="1 of 2 branches missed.">              if (previousSpans2StartPosition != lastSpans2StartPosition) {</span>
<span class="fc" id="L316">                previousSpans2StartPosition = lastSpans2StartPosition;</span>
<span class="fc" id="L317">                previousSpans2EndPositions.clear();</span>
              }
<span class="fc" id="L319">              previousSpans2EndPositions.add(lastSpans2EndPosition);</span>
            }
            // register span2 as last
<span class="fc" id="L322">            lastSpans2StartPosition = nextSpans2StartPosition;</span>
<span class="fc" id="L323">            lastSpans2EndPosition = nextSpans2EndPosition;</span>
            // check for match
<span class="fc bfc" id="L325" title="All 4 branches covered.">            if (nextSpans1StartPosition == nextSpans2StartPosition</span>
                &amp;&amp; nextSpans1EndPosition == nextSpans2EndPosition) {
<span class="fc" id="L327">              return true;</span>
            }
          }
        }

      }
    }
<span class="fc" id="L334">    noMorePositions = true;</span>
<span class="fc" id="L335">    return false;</span>
  }

  /**
   * Reset.
   */
  private void reset() {
<span class="fc" id="L342">    calledNextStartPosition = false;</span>
<span class="fc" id="L343">    noMorePositions = false;</span>
<span class="fc" id="L344">    noMorePositionsSpan2 = false;</span>
<span class="fc" id="L345">    lastSpans2StartPosition = -1;</span>
<span class="fc" id="L346">    lastSpans2EndPosition = -1;</span>
<span class="fc" id="L347">    previousSpans2StartPosition = -1;</span>
<span class="fc" id="L348">    previousSpans2EndPositions.clear();</span>
<span class="fc" id="L349">  }</span>

  /*
   * (non-Javadoc)
   * 
   * @see org.apache.lucene.search.DocIdSetIterator#cost()
   */
  @Override
  public long cost() {
<span class="nc" id="L358">    return 0;</span>
  }

}
</pre><div class="footer"><span class="right">Created with <a href="http://www.jacoco.org/jacoco">JaCoCo</a> 0.7.9.201702052155</span></div></body></html>