All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.browseengine.bobo.facets.impl.BucketFacetCountCollector Maven / Gradle / Ivy

Go to download

Bobo is a Faceted Search implementation written purely in Java, an extension of Apache Lucene

The newest version!
package com.browseengine.bobo.facets.impl;

import java.util.Arrays;
import java.util.List;
import java.util.Map;

import org.apache.lucene.util.FixedBitSet;

import com.browseengine.bobo.api.BrowseFacet;
import com.browseengine.bobo.api.FacetIterator;
import com.browseengine.bobo.api.FacetSpec;
import com.browseengine.bobo.facets.FacetCountCollector;
import com.browseengine.bobo.facets.data.FacetDataCache;
import com.browseengine.bobo.facets.data.TermStringList;
import com.browseengine.bobo.facets.data.TermValueList;
import com.browseengine.bobo.util.BigSegmentedArray;
import com.browseengine.bobo.util.LazyBigIntArray;

public class BucketFacetCountCollector implements FacetCountCollector {
  private final String _name;
  private final DefaultFacetCountCollector _subCollector;
  private final FacetSpec _ospec;
  private final Map _predefinedBuckets;
  private BigSegmentedArray _collapsedCounts;
  private final TermStringList _bucketValues;
  private final int _numdocs;

  protected BucketFacetCountCollector(String name, DefaultFacetCountCollector subCollector,
      FacetSpec ospec, Map predefinedBuckets, int numdocs) {
    _name = name;
    _subCollector = subCollector;
    _ospec = ospec;
    _numdocs = numdocs;

    _predefinedBuckets = predefinedBuckets;
    _collapsedCounts = null;

    _bucketValues = new TermStringList();
    _bucketValues.add("");

    String[] bucketArray = _predefinedBuckets.keySet().toArray(new String[0]);
    Arrays.sort(bucketArray);
    for (String bucket : bucketArray) {
      _bucketValues.add(bucket);
    }
    _bucketValues.seal();
  }

  private BigSegmentedArray getCollapsedCounts() {
    if (_collapsedCounts == null) {
      _collapsedCounts = new LazyBigIntArray(_bucketValues.size());
      FacetDataCache dataCache = _subCollector._dataCache;
      TermValueList subList = dataCache.valArray;
      BigSegmentedArray subcounts = _subCollector._count;
      FixedBitSet indexSet = new FixedBitSet(subcounts.size());
      int c = 0;
      int i = 0;
      for (String val : _bucketValues) {
        if (val.length() > 0) {
          String[] subVals = _predefinedBuckets.get(val);
          int count = 0;
          for (String subVal : subVals) {
            int index = subList.indexOf(subVal);
            if (index > 0) {
              int subcount = subcounts.get(index);
              count += subcount;
              if (!indexSet.get(index)) {
                indexSet.set(index);
                c += dataCache.freqs[index];
              }
            }
          }
          _collapsedCounts.add(i, count);
        }
        i++;
      }
      _collapsedCounts.add(0, (_numdocs - c));
    }
    return _collapsedCounts;
  }

  // get the total count of all possible elements
  @Override
  public BigSegmentedArray getCountDistribution() {
    return getCollapsedCounts();
  }

  @Override
  public String getName() {
    return _name;
  }

  // get the facet of one particular bucket
  @Override
  public BrowseFacet getFacet(String bucketValue) {
    int index = _bucketValues.indexOf(bucketValue);
    if (index < 0) {
      return new BrowseFacet(bucketValue, 0);
    }

    BigSegmentedArray counts = getCollapsedCounts();

    return new BrowseFacet(bucketValue, counts.get(index));
  }

  @Override
  public int getFacetHitsCount(Object value) {
    int index = _bucketValues.indexOf(value);
    if (index < 0) {
      return 0;
    }

    BigSegmentedArray counts = getCollapsedCounts();

    return counts.get(index);
  }

  @Override
  public final void collect(int docid) {
    _subCollector.collect(docid);
  }

  @Override
  public final void collectAll() {
    _subCollector.collectAll();
  }

  // get facets for all predefined buckets
  @Override
  public List getFacets() {

    BigSegmentedArray counts = getCollapsedCounts();
    return DefaultFacetCountCollector.getFacets(_ospec, counts, counts.size(), _bucketValues);

  }

  @Override
  public void close() {
    _subCollector.close();
  }

  @Override
  public FacetIterator iterator() {
    BigSegmentedArray counts = getCollapsedCounts();
    return new DefaultFacetIterator(_bucketValues, counts, counts.size(), true);
  }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy