All downloads are free. Search and download functionality uses the official Maven repository.

org.apache.lucene.facet.range.LongRangeFacetCounts Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.lucene.facet.range;

import java.io.IOException;
import java.util.List;
import org.apache.lucene.facet.Facets;
import org.apache.lucene.facet.FacetsCollector;
import org.apache.lucene.facet.FacetsCollector.MatchingDocs;
import org.apache.lucene.facet.MultiLongValues;
import org.apache.lucene.facet.MultiLongValuesSource;
import org.apache.lucene.index.NumericDocValues;
import org.apache.lucene.index.SortedNumericDocValues;
import org.apache.lucene.search.DocIdSetIterator;
import org.apache.lucene.search.LongValues;
import org.apache.lucene.search.LongValuesSource;
import org.apache.lucene.search.Query;

/**
 * {@link Facets} implementation that computes counts for dynamic long ranges. Use this for
 * dimensions that change in real-time (e.g. a relative time based dimension like "Past day", "Past
 * 2 days", etc.) or that change for each request (e.g. distance from the user's location, "< 1
 * km", "< 2 km", etc.).
 *
 * @lucene.experimental
 */
public class LongRangeFacetCounts extends RangeFacetCounts {

  /**
   * Create {@code LongRangeFacetCounts} using long values from the specified field. The field may
   * be single-valued ({@link NumericDocValues}) or multi-valued ({@link SortedNumericDocValues}),
   * and will be interpreted as containing long values.
   */
  public LongRangeFacetCounts(String field, FacetsCollector hits, LongRange... ranges)
      throws IOException {
    this(field, (LongValuesSource) null, hits, ranges);
  }

  /**
   * Create {@code LongRangeFacetCounts}, using the provided {@link LongValuesSource} if non-null.
   * If {@code valueSource} is null, doc values from the provided {@code field} will be used.
   */
  public LongRangeFacetCounts(
      String field, LongValuesSource valueSource, FacetsCollector hits, LongRange... ranges)
      throws IOException {
    this(field, valueSource, hits, null, ranges);
  }

  /**
   * Create {@code LongRangeFacetCounts}, using the provided {@link MultiLongValuesSource} if
   * non-null. If {@code valuesSource} is null, doc values from the provided {@code field} will be
   * used.
   */
  public LongRangeFacetCounts(
      String field, MultiLongValuesSource valuesSource, FacetsCollector hits, LongRange... ranges)
      throws IOException {
    this(field, valuesSource, hits, null, ranges);
  }

  /**
   * Create {@code LongRangeFacetCounts}, using the provided {@link LongValuesSource} if non-null.
   * If {@code valueSource} is null, doc values from the provided {@code field} will be used. Use
   * the provided {@code Query} as a fastmatch: only documents passing the filter are checked for
   * the matching ranges, which is helpful when the provided {@link LongValuesSource} is costly
   * per-document, such as a geo distance.
   */
  public LongRangeFacetCounts(
      String field,
      LongValuesSource valueSource,
      FacetsCollector hits,
      Query fastMatchQuery,
      LongRange... ranges)
      throws IOException {
    super(field, ranges, fastMatchQuery);
    // use the provided valueSource if non-null, otherwise use the doc values associated with the
    // field
    if (valueSource != null) {
      count(valueSource, hits.getMatchingDocs());
    } else {
      count(field, hits.getMatchingDocs());
    }
  }

  /**
   * Create {@code LongRangeFacetCounts}, using the provided {@link MultiLongValuesSource} if
   * non-null. If {@code valuesSource} is null, doc values from the provided {@code field} will be
   * used. Use the provided {@code Query} as a fastmatch: only documents passing the filter are
   * checked for the matching ranges, which is helpful when the provided {@link LongValuesSource} is
   * costly per-document, such as a geo distance.
   */
  public LongRangeFacetCounts(
      String field,
      MultiLongValuesSource valuesSource,
      FacetsCollector hits,
      Query fastMatchQuery,
      LongRange... ranges)
      throws IOException {
    super(field, ranges, fastMatchQuery);
    // use the provided valueSource if non-null, otherwise use the doc values associated with the
    // field
    if (valuesSource != null) {
      LongValuesSource singleValues = MultiLongValuesSource.unwrapSingleton(valuesSource);
      if (singleValues != null) {
        count(singleValues, hits.getMatchingDocs());
      } else {
        count(valuesSource, hits.getMatchingDocs());
      }
    } else {
      count(field, hits.getMatchingDocs());
    }
  }

  /** Counts from the provided valueSource. */
  private void count(LongValuesSource valueSource, List matchingDocs)
      throws IOException {

    LongRangeCounter counter = null;

    int missingCount = 0;

    for (MatchingDocs hits : matchingDocs) {
      if (hits.totalHits() == 0) {
        continue;
      }

      final DocIdSetIterator it = createIterator(hits);
      if (it == null) {
        continue;
      }

      if (counter == null) {
        counter = setupCounter();
      }

      LongValues fv = valueSource.getValues(hits.context(), null);
      totCount += hits.totalHits();

      for (int doc = it.nextDoc(); doc != DocIdSetIterator.NO_MORE_DOCS; ) {
        // Skip missing docs:
        if (fv.advanceExact(doc)) {
          counter.addSingleValued(fv.longValue());
        } else {
          missingCount++;
        }

        doc = it.nextDoc();
      }
    }

    if (counter != null) {
      missingCount += counter.finish();
      totCount -= missingCount;
    }
  }

  /** Counts from the provided valueSource. */
  private void count(MultiLongValuesSource valueSource, List matchingDocs)
      throws IOException {

    LongRangeCounter counter = null;

    for (MatchingDocs hits : matchingDocs) {
      if (hits.totalHits() == 0) {
        continue;
      }

      final DocIdSetIterator it = createIterator(hits);
      if (it == null) {
        continue;
      }

      if (counter == null) {
        counter = setupCounter();
      }

      MultiLongValues multiValues = valueSource.getValues(hits.context());

      for (int doc = it.nextDoc(); doc != DocIdSetIterator.NO_MORE_DOCS; ) {
        // Skip missing docs:
        if (multiValues.advanceExact(doc)) {
          long limit = multiValues.getValueCount();
          // optimize single-valued case:
          if (limit == 1) {
            counter.addSingleValued(multiValues.nextValue());
            totCount++;
          } else {
            counter.startMultiValuedDoc();
            long previous = 0;
            for (int i = 0; i < limit; i++) {
              long val = multiValues.nextValue();
              if (i == 0 || val != previous) {
                counter.addMultiValued(val);
                previous = val;
              }
            }
            if (counter.endMultiValuedDoc()) {
              totCount++;
            }
          }
        }

        doc = it.nextDoc();
      }
    }

    if (counter != null) {
      int missingCount = counter.finish();
      totCount -= missingCount;
    }
  }

  @Override
  protected LongRange[] getLongRanges() {
    return (LongRange[]) this.ranges;
  }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy