com.yelp.nrtsearch.server.luceneserver.SearchHandler

/*
 * Copyright 2020 Yelp Inc.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package com.yelp.nrtsearch.server.luceneserver;

import com.google.common.collect.Lists;
import com.google.common.util.concurrent.MoreExecutors;
import com.yelp.nrtsearch.server.grpc.DeadlineUtils;
import com.yelp.nrtsearch.server.grpc.FacetResult;
import com.yelp.nrtsearch.server.grpc.ProfileResult;
import com.yelp.nrtsearch.server.grpc.SearchRequest;
import com.yelp.nrtsearch.server.grpc.SearchResponse;
import com.yelp.nrtsearch.server.grpc.SearchResponse.Hit;
import com.yelp.nrtsearch.server.grpc.SearchResponse.Hit.CompositeFieldValue;
import com.yelp.nrtsearch.server.grpc.SearchResponse.Hit.FieldValue;
import com.yelp.nrtsearch.server.grpc.SearchResponse.SearchState;
import com.yelp.nrtsearch.server.grpc.TotalHits;
import com.yelp.nrtsearch.server.luceneserver.doc.LoadedDocValues;
import com.yelp.nrtsearch.server.luceneserver.facet.DrillSidewaysImpl;
import com.yelp.nrtsearch.server.luceneserver.facet.FacetTopDocs;
import com.yelp.nrtsearch.server.luceneserver.field.BooleanFieldDef;
import com.yelp.nrtsearch.server.luceneserver.field.DateTimeFieldDef;
import com.yelp.nrtsearch.server.luceneserver.field.FieldDef;
import com.yelp.nrtsearch.server.luceneserver.field.IndexableFieldDef;
import com.yelp.nrtsearch.server.luceneserver.field.RuntimeFieldDef;
import com.yelp.nrtsearch.server.luceneserver.field.VirtualFieldDef;
import com.yelp.nrtsearch.server.luceneserver.innerhit.InnerHitFetchTask;
import com.yelp.nrtsearch.server.luceneserver.rescore.RescoreTask;
import com.yelp.nrtsearch.server.luceneserver.script.RuntimeScript;
import com.yelp.nrtsearch.server.luceneserver.search.FieldFetchContext;
import com.yelp.nrtsearch.server.luceneserver.search.SearchContext;
import com.yelp.nrtsearch.server.luceneserver.search.SearchCutoffWrapper.CollectionTimeoutException;
import com.yelp.nrtsearch.server.luceneserver.search.SearchRequestProcessor;
import com.yelp.nrtsearch.server.luceneserver.search.SearcherResult;
import com.yelp.nrtsearch.server.monitoring.SearchResponseCollector;
import com.yelp.nrtsearch.server.utils.ObjectToCompositeFieldTransformer;
import java.io.IOException;
import java.util.ArrayList;
import java.util.Comparator;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.concurrent.*;
import java.util.concurrent.locks.Condition;
import java.util.concurrent.locks.Lock;
import java.util.concurrent.locks.ReentrantLock;
import java.util.stream.Collectors;
import org.apache.lucene.facet.DrillDownQuery;
import org.apache.lucene.facet.DrillSideways;
import org.apache.lucene.facet.taxonomy.SearcherTaxonomyManager;
import org.apache.lucene.index.*;
import org.apache.lucene.search.*;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

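/**
 * Handler implementation that executes a {@link SearchRequest} against an index and builds the
 * {@link SearchResponse}, including facets, rescoring, hit field values and diagnostics.
 */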
public class SearchHandler implements Handler {
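  // Executes tasks on the calling thread; used for drill sideways so facet subtasks do not
  // deadlock the search thread pool (see the facet path in handle() below)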
  private static final ExecutorService DIRECT_EXECUTOR = MoreExecutors.newDirectExecutorService();

  private static final Logger logger = LoggerFactory.getLogger(SearchHandler.class);
  private final ThreadPoolExecutor threadPoolExecutor;
  private final boolean warming;

  public SearchHandler(ThreadPoolExecutor threadPoolExecutor) {
    this(threadPoolExecutor, false);
  }

  /**
   * @param threadPoolExecutor Threadpool to execute a parallel search
   * @param warming set to true if we are warming the index right now
   */
  public SearchHandler(ThreadPoolExecutor threadPoolExecutor, boolean warming) {
    this.threadPoolExecutor = threadPoolExecutor;
    this.warming = warming;
  }

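  /**
   * Execute a search request against the index, optionally running facets, rescorers and profile
   * collection, and fill the response hits with the requested fields.
   *
   * @param indexState index to search
   * @param searchRequest grpc search request
   * @return grpc search response
   * @throws SearchHandlerException if there is an error executing the search
   */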
  @Override
  public SearchResponse handle(IndexState indexState, SearchRequest searchRequest)
      throws SearchHandlerException {
    // this request may have been waiting in the grpc queue too long
    DeadlineUtils.checkDeadline("SearchHandler: start", "SEARCH");

    ShardState shardState = indexState.getShard(0);

    // Index won't be started if we are currently warming
    if (!warming) {
      indexState.verifyStarted();
    }

    var diagnostics = SearchResponse.Diagnostics.newBuilder();

    SearcherTaxonomyManager.SearcherAndTaxonomy s = null;
    SearchContext searchContext;
    try {
      s =
          getSearcherAndTaxonomy(
              searchRequest, indexState, shardState, diagnostics, threadPoolExecutor);

      ProfileResult.Builder profileResultBuilder = null;
      if (searchRequest.getProfile()) {
        profileResultBuilder = ProfileResult.newBuilder();
      }

      searchContext =
          SearchRequestProcessor.buildContextForRequest(
              searchRequest, indexState, shardState, s, diagnostics, profileResultBuilder);

      long searchStartTime = System.nanoTime();

      SearcherResult searcherResult;
      if (!searchRequest.getFacetsList().isEmpty()) {
        DrillDownQuery ddq = (DrillDownQuery) searchContext.getQuery();

        List<FacetResult> grpcFacetResults = new ArrayList<>();
        // Run the drill sideways search on the direct executor to run subtasks in the
        // current (grpc) thread. If we use the search thread pool for this, it can cause a
        // deadlock trying to execute the dependent parallel search tasks. Since we do not
        // currently add additional drill down definitions, there will only be one drill
        // sideways task per query.
        DrillSideways drillS =
            new DrillSidewaysImpl(
                s.searcher,
                indexState.getFacetsConfig(),
                s.taxonomyReader,
                searchRequest.getFacetsList(),
                s,
                indexState,
                shardState,
                searchContext.getQueryFields(),
                grpcFacetResults,
                DIRECT_EXECUTOR,
                diagnostics);
        DrillSideways.ConcurrentDrillSidewaysResult<SearcherResult> concurrentDrillSidewaysResult;
        try {
          concurrentDrillSidewaysResult =
              drillS.search(ddq, searchContext.getCollector().getWrappedManager());
        } catch (RuntimeException e) {
          // Searching with DrillSideways wraps exceptions in a few layers.
          // Try to find if this was caused by a timeout, if so, re-wrap
          // so that the top level exception is the same as when not using facets.
          CollectionTimeoutException timeoutException = findTimeoutException(e);
          if (timeoutException != null) {
            throw new CollectionTimeoutException(timeoutException.getMessage(), e);
          }
          throw e;
        }
        searcherResult = concurrentDrillSidewaysResult.collectorResult;
        searchContext.getResponseBuilder().addAllFacetResult(grpcFacetResults);
        searchContext
            .getResponseBuilder()
            .addAllFacetResult(
                FacetTopDocs.facetTopDocsSample(
                    searcherResult.getTopDocs(),
                    searchRequest.getFacetsList(),
                    indexState,
                    s.searcher,
                    diagnostics));
      } else {
        try {
          searcherResult =
              s.searcher.search(
                  searchContext.getQuery(), searchContext.getCollector().getWrappedManager());
        } catch (RuntimeException e) {
          CollectionTimeoutException timeoutException = findTimeoutException(e);
          if (timeoutException != null) {
            throw new CollectionTimeoutException(timeoutException.getMessage(), e);
          }
          throw e;
        }
      }
      TopDocs hits = searcherResult.getTopDocs();

      // add results from any extra collectors
      searchContext
          .getResponseBuilder()
          .putAllCollectorResults(searcherResult.getCollectorResults());

      searchContext.getResponseBuilder().setHitTimeout(searchContext.getCollector().hadTimeout());
      searchContext
          .getResponseBuilder()
          .setTerminatedEarly(searchContext.getCollector().terminatedEarly());

      diagnostics.setFirstPassSearchTimeMs(((System.nanoTime() - searchStartTime) / 1000000.0));

      DeadlineUtils.checkDeadline("SearchHandler: post recall", diagnostics, "SEARCH");

      // add detailed timing metrics for query execution
      if (profileResultBuilder != null) {
        searchContext.getCollector().maybeAddProfiling(profileResultBuilder);
      }

      long rescoreStartTime = System.nanoTime();

      if (!searchContext.getRescorers().isEmpty()) {
        for (RescoreTask rescorer : searchContext.getRescorers()) {
          long startNS = System.nanoTime();
          hits = rescorer.rescore(hits, searchContext);
          long endNS = System.nanoTime();
          diagnostics.putRescorersTimeMs(rescorer.getName(), (endNS - startNS) / 1000000.0);
          DeadlineUtils.checkDeadline(
              "SearchHandler: post " + rescorer.getName(), diagnostics, "SEARCH");
        }
        diagnostics.setRescoreTimeMs(((System.nanoTime() - rescoreStartTime) / 1000000.0));
      }

      long t0 = System.nanoTime();

      hits = getHitsFromOffset(hits, searchContext.getStartHit(), searchContext.getTopHits());

      // create Hit.Builder for each hit, and populate with lucene doc id and ranking info
      setResponseHits(searchContext, hits);

      // fill Hit.Builder with requested fields
      fetchFields(searchContext);

      SearchState.Builder searchState = SearchState.newBuilder();
      searchContext.getResponseBuilder().setSearchState(searchState);
      searchState.setTimestamp(searchContext.getTimestampSec());

      // Record searcher version that handled this request:
      searchState.setSearcherVersion(((DirectoryReader) s.searcher.getIndexReader()).getVersion());

      // Fill in lastDoc for searchAfter:
      if (hits.scoreDocs.length != 0) {
        ScoreDoc lastHit = hits.scoreDocs[hits.scoreDocs.length - 1];
        searchState.setLastDocId(lastHit.doc);
        searchContext.getCollector().fillLastHit(searchState, lastHit);
      }
      searchContext.getResponseBuilder().setSearchState(searchState);

      diagnostics.setGetFieldsTimeMs(((System.nanoTime() - t0) / 1000000.0));

      if (searchContext.getFetchTasks().getHighlightFetchTask() != null) {
        diagnostics.setHighlightTimeMs(
            searchContext.getFetchTasks().getHighlightFetchTask().getTimeTakenMs());
      }
      if (searchContext.getFetchTasks().getInnerHitFetchTaskList() != null) {
        diagnostics.putAllInnerHitsDiagnostics(
            searchContext.getFetchTasks().getInnerHitFetchTaskList().stream()
                .collect(
                    Collectors.toMap(
                        task -> task.getInnerHitContext().getInnerHitName(),
                        InnerHitFetchTask::getDiagnostic)));
      }
      searchContext.getResponseBuilder().setDiagnostics(diagnostics);

      if (profileResultBuilder != null) {
        searchContext.getResponseBuilder().setProfileResult(profileResultBuilder);
      }
    } catch (IOException | InterruptedException | ExecutionException e) {
      logger.warn(e.getMessage(), e);
      throw new SearchHandlerException(e);
    } finally {
      // NOTE: this is a little iffy, because we may not
      // have obtained this searcher from the NRTManager
      // (i.e. sometimes we pulled from
      // SearcherLifetimeManager, other times (if
      // snapshot was specified) we opened ourselves,
      // but under-the-hood all these methods just call
      // s.getIndexReader().decRef(), which is what release
      // does:
      try {
        if (s != null) {
          shardState.release(s);
        }
      } catch (IOException e) {
        logger.warn("Failed to release searcher reference previously acquired by acquire()", e);
        throw new SearchHandlerException(e);
      }
    }

    // Add searchRequest to warmer if needed
    try {
      if (!warming && indexState.getWarmer() != null) {
        indexState.getWarmer().addSearchRequest(searchRequest);
      }
    } catch (Exception e) {
      logger.error("Unable to add warming query", e);
    }

    // if we are out of time, don't bother with serialization
    DeadlineUtils.checkDeadline("SearchHandler: end", diagnostics, "SEARCH");
    SearchResponse searchResponse = searchContext.getResponseBuilder().build();
    if (!warming) {
      SearchResponseCollector.updateSearchResponseMetrics(
          searchResponse,
          searchContext.getIndexState().getName(),
          searchContext.getIndexState().getVerboseMetrics());
    }
    return searchResponse;
  }

  /**
   * Fetch/compute field values for the top hits. This operation may be done in parallel, based on
   * the setting for the fetch thread pool. In addition to filling hit fields, any query {@link
   * com.yelp.nrtsearch.server.luceneserver.search.FetchTasks.FetchTask}s are executed.
   *
   * @param searchContext search parameters
   * @throws IOException on error reading index data
   * @throws ExecutionException on error when performing parallel fetch
   * @throws InterruptedException if parallel fetch is interrupted
   */
  private void fetchFields(SearchContext searchContext)
      throws IOException, ExecutionException, InterruptedException {
    if (searchContext.getResponseBuilder().getHitsBuilderList().isEmpty()) {
      return;
    }

    // sort hits by lucene doc id
    List<Hit.Builder> hitBuilders =
        new ArrayList<>(searchContext.getResponseBuilder().getHitsBuilderList());
    hitBuilders.sort(Comparator.comparing(Hit.Builder::getLuceneDocId));

    IndexState indexState = searchContext.getIndexState();
    int fetch_thread_pool_size = indexState.getThreadPoolConfiguration().getMaxFetchThreads();
    int min_parallel_fetch_num_fields =
        indexState.getThreadPoolConfiguration().getMinParallelFetchNumFields();
    int min_parallel_fetch_num_hits =
        indexState.getThreadPoolConfiguration().getMinParallelFetchNumHits();
    boolean parallelFetchByField =
        indexState.getThreadPoolConfiguration().getParallelFetchByField();

    if (parallelFetchByField
        && fetch_thread_pool_size > 1
        && searchContext.getRetrieveFields().keySet().size() > min_parallel_fetch_num_fields
        && hitBuilders.size() > min_parallel_fetch_num_hits) {
      // Fetch fields in parallel

      List<LeafReaderContext> leaves =
          searchContext.getSearcherAndTaxonomy().searcher.getIndexReader().leaves();
      List<LeafReaderContext> hitIdToLeaves = new ArrayList<>();
      for (int hitIndex = 0; hitIndex < hitBuilders.size(); ++hitIndex) {
        var hitResponse = hitBuilders.get(hitIndex);
        LeafReaderContext leaf =
            leaves.get(ReaderUtil.subIndex(hitResponse.getLuceneDocId(), leaves));
        hitIdToLeaves.add(hitIndex, leaf);
      }
      List<String> fields = new ArrayList<>(searchContext.getRetrieveFields().keySet());

      // parallelism is the min of the fetch thread pool size and
      // fields.size() / minParallelFetchNumFields, rounded up
      int parallelism =
          Math.min(
              fetch_thread_pool_size,
              (fields.size() + min_parallel_fetch_num_fields - 1) / min_parallel_fetch_num_fields);
      List<List<String>> fieldsChunks =
          Lists.partition(fields, (fields.size() + parallelism - 1) / parallelism);
      List<Future<List<Map<String, CompositeFieldValue>>>> futures = new ArrayList<>();

      // Only parallelize by field here, which works well for doc values and virtual fields.
      // For row-based stored fields, we should parallelize by hit id instead.
      // Stored fields are not widely used in nrtsearch (not recommended due to memory usage)
      for (List<String> fieldsChunk : fieldsChunks) {
        futures.add(
            indexState
                .getFetchThreadPoolExecutor()
                .submit(
                    new FillFieldsTask(
                        indexState,
                        searchContext.getSearcherAndTaxonomy().searcher,
                        hitIdToLeaves,
                        hitBuilders,
                        fieldsChunk,
                        searchContext)));
      }
      for (Future<List<Map<String, CompositeFieldValue>>> future : futures) {
        List<Map<String, CompositeFieldValue>> values = future.get();
        for (int hitIndex = 0; hitIndex < hitBuilders.size(); ++hitIndex) {
          var hitResponse = hitBuilders.get(hitIndex);
          hitResponse.putAllFields(values.get(hitIndex));
        }
      }

      // execute per hit fetch tasks
      for (int hitIndex = 0; hitIndex < hitBuilders.size(); ++hitIndex) {
        var hitResponse = hitBuilders.get(hitIndex);
        LeafReaderContext leaf = hitIdToLeaves.get(hitIndex);
        if (searchContext.isExplain()) {
          hitResponse.setExplain(
              searchContext
                  .getSearcherAndTaxonomy()
                  .searcher
                  .explain(searchContext.getQuery(), hitResponse.getLuceneDocId())
                  .toString());
        }
        searchContext.getFetchTasks().processHit(searchContext, leaf, hitResponse);
      }
    } else if (!parallelFetchByField
        && fetch_thread_pool_size > 1
        && hitBuilders.size() > min_parallel_fetch_num_hits) {
      // Fetch docs in parallel

      // parallelism is the min of the fetch thread pool size and
      // hitBuilders.size() / minParallelFetchNumHits, rounded up
      int parallelism =
          Math.min(
              fetch_thread_pool_size,
              (hitBuilders.size() + min_parallel_fetch_num_hits - 1) / min_parallel_fetch_num_hits);
      List<List<Hit.Builder>> docChunks =
          Lists.partition(hitBuilders, (hitBuilders.size() + parallelism - 1) / parallelism);

      // process each document chunk in parallel
      List<Future<?>> futures = new ArrayList<>();
      for (List<Hit.Builder> docChunk : docChunks) {
        futures.add(
            indexState
                .getFetchThreadPoolExecutor()
                .submit(new FillDocsTask(searchContext, docChunk, searchContext.getQuery())));
      }
      for (Future<?> future : futures) {
        future.get();
      }
      // no need to run the per hit fetch tasks here, since they were done in the FillDocsTask
    } else {
      // single threaded fetch
      FillDocsTask fillDocsTask =
          new FillDocsTask(searchContext, hitBuilders, searchContext.getQuery());
      fillDocsTask.run();
    }

    // execute all hits fetch tasks
    searchContext
        .getFetchTasks()
        .processAllHits(searchContext, searchContext.getResponseBuilder().getHitsBuilderList());
  }

  /**
   * Given all the top documents, produce a slice of the documents starting from a start offset and
   * going up to the maximum number of hits needed by the query. There may be more top docs than
   * the topHits limit, if top docs sampling facets are used.
   *
   * @param hits all hits
   * @param startHit offset into top docs
   * @param topHits maximum number of hits needed for search response
   * @return slice of hits starting at the given offset, or an empty slice if there are fewer than
   *     startHit docs
   */
  public static TopDocs getHitsFromOffset(TopDocs hits, int startHit, int topHits) {
    int retrieveHits = Math.min(topHits, hits.scoreDocs.length);
    if (startHit != 0 || retrieveHits != hits.scoreDocs.length) {
      // Slice:
      int count = Math.max(0, retrieveHits - startHit);
      ScoreDoc[] newScoreDocs = new ScoreDoc[count];
      if (count > 0) {
        System.arraycopy(hits.scoreDocs, startHit, newScoreDocs, 0, count);
      }
      return new TopDocs(hits.totalHits, newScoreDocs);
    }
    return hits;
  }

  /**
   * Add {@link com.yelp.nrtsearch.server.grpc.SearchResponse.Hit.Builder}s to the context {@link
   * SearchResponse.Builder} for each of the query hits. Populate the builders with the lucene doc
   * id and ranking info.
   *
   * @param context search context
   * @param hits hits from query
   */
  private static void setResponseHits(SearchContext context, TopDocs hits) {
    TotalHits totalHits =
        TotalHits.newBuilder()
            .setRelation(TotalHits.Relation.valueOf(hits.totalHits.relation.name()))
            .setValue(hits.totalHits.value)
            .build();
    context.getResponseBuilder().setTotalHits(totalHits);
    for (int hitIndex = 0; hitIndex < hits.scoreDocs.length; hitIndex++) {
      var hitResponse = context.getResponseBuilder().addHitsBuilder();
      ScoreDoc hit = hits.scoreDocs[hitIndex];
      hitResponse.setLuceneDocId(hit.doc);
      context.getCollector().fillHitRanking(hitResponse, hit);
    }
  }

  /**
   * Returns the requested searcher + taxoReader, either by indexGen, snapshot, version or just the
   * current (latest) one.
   */
  public static SearcherTaxonomyManager.SearcherAndTaxonomy getSearcherAndTaxonomy(
      SearchRequest searchRequest,
      IndexState indexState,
      ShardState state,
      SearchResponse.Diagnostics.Builder diagnostics,
      ThreadPoolExecutor threadPoolExecutor)
      throws InterruptedException, IOException {
    // TODO: Figure out which searcher to use:
    // final long searcherVersion; e.g. searcher.getLong("version")
    // final IndexState.Gens searcherSnapshot; e.g. searcher.getLong("indexGen")
    // Currently we only use the current(latest) searcher
    SearcherTaxonomyManager.SearcherAndTaxonomy s;

    SearchRequest.SearcherCase searchCase = searchRequest.getSearcherCase();
    long version;
    IndexState.Gens snapshot;

    if (searchCase.equals(SearchRequest.SearcherCase.VERSION)) {
      // Searcher is identified by a version, returned by
      // a prior search or by a refresh.  Apps use this when
      // the user does a follow-on search (next page, drill
      // down, etc.), or to ensure changes from a refresh
      // or NRT replication point are reflected:
      version = searchRequest.getVersion();
      snapshot = null;
      // nocommit need to generify this so we can pull
      // TaxoReader too:
      IndexSearcher priorSearcher = state.slm.acquire(version);
      if (priorSearcher == null) {
        if (snapshot != null) {
          // First time this snapshot is being searched
          // against since this server started, or the call
          // to createSnapshot didn't specify
          // openSearcher=true; now open the reader:
          s = openSnapshotReader(indexState, state, snapshot, diagnostics, threadPoolExecutor);
        } else {
          SearcherTaxonomyManager.SearcherAndTaxonomy current = state.acquire();
          long currentVersion = ((DirectoryReader) current.searcher.getIndexReader()).getVersion();
          if (currentVersion == version) {
            s = current;
          } else if (version > currentVersion) {
            logger.info(
                "SearchHandler: now await version="
                    + version
                    + " vs currentVersion="
                    + currentVersion);

            // TODO: should we have some timeout here? if user passes bogus future version, we hang
            // forever:

            // user is asking for search version beyond what we are currently searching ... wait for
            // us to refresh to it:

            state.release(current);

            // TODO: Use FutureTask here?

            // nocommit: do this in an async way instead!  this task should be parked somewhere and
            // resumed once refresh runs and exposes
            // the requested version, instead of blocking the current search thread
            Lock lock = new ReentrantLock();
            Condition cond = lock.newCondition();
            ReferenceManager.RefreshListener listener =
                new ReferenceManager.RefreshListener() {
                  @Override
                  public void beforeRefresh() {}

                  @Override
                  public void afterRefresh(boolean didRefresh) throws IOException {
                    SearcherTaxonomyManager.SearcherAndTaxonomy current = state.acquire();
                    logger.info(
                        "SearchHandler: refresh completed newVersion="
                            + ((DirectoryReader) current.searcher.getIndexReader()).getVersion());
                    try {
                      if (((DirectoryReader) current.searcher.getIndexReader()).getVersion()
                          >= version) {
                        lock.lock();
                        try {
                          logger.info("SearchHandler: now signal new version");
                          cond.signal();
                        } finally {
                          lock.unlock();
                        }
                      }
                    } finally {
                      state.release(current);
                    }
                  }
                };
            state.addRefreshListener(listener);
            lock.lock();
            try {
              current = state.acquire();
              if (((DirectoryReader) current.searcher.getIndexReader()).getVersion() < version) {
                // still not there yet
                state.release(current);
                cond.await();
                current = state.acquire();
                logger.info(
                    "SearchHandler: await released,  current version "
                        + ((DirectoryReader) current.searcher.getIndexReader()).getVersion()
                        + " required minimum version "
                        + version);
                assert ((DirectoryReader) current.searcher.getIndexReader()).getVersion()
                    >= version;
              }
              s = current;
            } finally {
              lock.unlock();
              state.removeRefreshListener(listener);
            }
          } else {
            // Specific searcher version was requested,
            // but this searcher has timed out.  App
            // should present a "your session expired" to
            // user:
            throw new RuntimeException(
                "searcher: This searcher has expired version="
                    + version
                    + " vs currentVersion="
                    + currentVersion);
          }
        }
      } else {
        // nocommit messy ... we pull an old searcher
        // but the latest taxoReader ... necessary
        // because SLM can't take taxo reader yet:
        SearcherTaxonomyManager.SearcherAndTaxonomy s2 = state.acquire();
        s = new SearcherTaxonomyManager.SearcherAndTaxonomy(priorSearcher, s2.taxonomyReader);
        s2.searcher.getIndexReader().decRef();
      }
    } else if (searchCase.equals((SearchRequest.SearcherCase.INDEXGEN))) {
      // Searcher is identified by an indexGen, returned
      // from a previous indexing operation,
      // e.g. addDocument.  Apps use this when they want
      // to ensure a specific indexing change is visible:
      long t0 = System.nanoTime();
      long gen = searchRequest.getIndexGen();
      if (gen > state.writer.getMaxCompletedSequenceNumber()) {
        throw new RuntimeException(
            "indexGen: requested indexGen ("
                + gen
                + ") is beyond the current maximum generation ("
                + state.writer.getMaxCompletedSequenceNumber()
                + ")");
      }
      state.waitForGeneration(gen);
      if (diagnostics != null) {
        diagnostics.setNrtWaitTimeMs((System.nanoTime() - t0) / 1000000.0);
      }
      s = state.acquire();
      state.slm.record(s.searcher);
    } else if (searchCase.equals(SearchRequest.SearcherCase.SEARCHER_NOT_SET)) {
      // Request didn't specify any specific searcher;
      // just use the current (latest) searcher:
      s = state.acquire();
      state.slm.record(s.searcher);
    } else {
      throw new UnsupportedOperationException(searchCase.name() + " is not yet supported ");
    }

    return s;
  }

  /** Returns a ref. */
  private static SearcherTaxonomyManager.SearcherAndTaxonomy openSnapshotReader(
      IndexState indexState,
      ShardState state,
      IndexState.Gens snapshot,
      SearchResponse.Diagnostics.Builder diagnostics,
      ThreadPoolExecutor threadPoolExecutor)
      throws IOException {
    // TODO: this "reverse-NRT" is ridiculous: we acquire
    // the latest reader, and from that do a reopen to an
    // older snapshot ... this is inefficient if multiple
    // snapshots share older segments that the latest reader
    // does not share ... Lucene needs a reader pool
    // somehow:
    SearcherTaxonomyManager.SearcherAndTaxonomy s = state.acquire();
    try {
      // This returns a new reference to us, which
      // is decRef'd in the finally clause after
      // search is done:
      long t0 = System.nanoTime();

      // Returns a ref, which we return to caller:
      IndexReader r =
          DirectoryReader.openIfChanged(
              (DirectoryReader) s.searcher.getIndexReader(),
              state.snapshots.getIndexCommit(snapshot.indexGen));

      // Ref that we return to caller
      s.taxonomyReader.incRef();

      SearcherTaxonomyManager.SearcherAndTaxonomy result =
          new SearcherTaxonomyManager.SearcherAndTaxonomy(
              new MyIndexSearcher(
                  r,
                  new MyIndexSearcher.ExecutorWithParams(
                      threadPoolExecutor,
                      indexState.getSliceMaxDocs(),
                      indexState.getSliceMaxSegments(),
                      indexState.getVirtualShards())),
              s.taxonomyReader);
      state.slm.record(result.searcher);
      long t1 = System.nanoTime();
      if (diagnostics != null) {
        diagnostics.setNewSnapshotSearcherOpenMs(((t1 - t0) / 1000000.0));
      }
      return result;
    } finally {
      state.release(s);
    }
  }

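  /**
   * Task to fetch a chunk of the requested fields for all hits. Produces a per-hit map from field
   * name to its {@link CompositeFieldValue}, in the same order as the provided hit builders.
   */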
  public static class FillFieldsTask implements Callable<List<Map<String, CompositeFieldValue>>> {

    private IndexState state;
    private IndexSearcher s;
    private List<LeafReaderContext> hitIdToleaves;
    private List<Hit.Builder> hitBuilders;
    private List<String> fields;
    private SearchContext searchContext;

    public FillFieldsTask(
        IndexState indexState,
        IndexSearcher indexSearcher,
        List<LeafReaderContext> hitIdToleaves,
        List<Hit.Builder> hitBuilders,
        List<String> fields,
        SearchContext searchContext) {
      this.state = indexState;
      this.s = indexSearcher;
      this.fields = fields;
      this.searchContext = searchContext;
      this.hitBuilders = hitBuilders;
      this.hitIdToleaves = hitIdToleaves;
    }

    private List<Map<String, CompositeFieldValue>> fillFields(
        IndexSearcher s,
        List<Hit.Builder> hitBuilders,
        List<String> fields,
        SearchContext searchContext)
        throws IOException {
      List<Map<String, CompositeFieldValue>> values = new ArrayList<>();
      for (int hitIndex = 0; hitIndex < hitBuilders.size(); ++hitIndex) {
        values.add(new HashMap<>());
      }
      for (String field : fields) {
        for (int hitIndex = 0; hitIndex < hitBuilders.size(); ++hitIndex) {
          var hitResponse = hitBuilders.get(hitIndex);
          LeafReaderContext leaf = hitIdToleaves.get(hitIndex);
          CompositeFieldValue v =
              getFieldForHit(s, hitResponse, leaf, field, searchContext.getRetrieveFields());
          values.get(hitIndex).put(field, v);
        }
      }
      return values;
    }

    /**
     * Retrieve one field (possibly highlighted) for one hit.
     *
     * @return composite field value containing all values for this field
     */
    private CompositeFieldValue getFieldForHit(
        IndexSearcher s,
        Hit.Builder hit,
        LeafReaderContext leaf,
        String field,
        Map<String, FieldDef> dynamicFields)
        throws IOException {
      assert field != null;
      CompositeFieldValue.Builder compositeFieldValue = CompositeFieldValue.newBuilder();
      FieldDef fd = dynamicFields.get(field);

      // We detect invalid field above:
      assert fd != null;
      if (fd instanceof VirtualFieldDef) {
        VirtualFieldDef virtualFieldDef = (VirtualFieldDef) fd;

        int docID = hit.getLuceneDocId() - leaf.docBase;

        assert !Double.isNaN(hit.getScore()) || !virtualFieldDef.getValuesSource().needsScores();
        DoubleValues scoreValue =
            new DoubleValues() {
              @Override
              public double doubleValue() throws IOException {
                return hit.getScore();
              }

              @Override
              public boolean advanceExact(int doc) throws IOException {
                return !Double.isNaN(hit.getScore());
              }
            };
        DoubleValues doubleValues = virtualFieldDef.getValuesSource().getValues(leaf, scoreValue);
        doubleValues.advanceExact(docID);
        compositeFieldValue.addFieldValue(
            FieldValue.newBuilder().setDoubleValue(doubleValues.doubleValue()));
      } else if (fd instanceof RuntimeFieldDef) {
        RuntimeFieldDef runtimeFieldDef = (RuntimeFieldDef) fd;
        RuntimeScript.SegmentFactory segmentFactory = runtimeFieldDef.getSegmentFactory();
        RuntimeScript values = segmentFactory.newInstance(leaf);
        int docID = hit.getLuceneDocId() - leaf.docBase;
        // Check if the value is available for the current document
        if (values != null) {
          values.setDocId(docID);
          Object obj = values.execute();
          ObjectToCompositeFieldTransformer.enrichCompositeField(obj, compositeFieldValue);
        }

      } else if (fd instanceof IndexableFieldDef && ((IndexableFieldDef) fd).hasDocValues()) {
        int docID = hit.getLuceneDocId() - leaf.docBase;
        // it may be possible to cache this if there are multiple hits in the same segment
        LoadedDocValues<?> docValues = ((IndexableFieldDef) fd).getDocValues(leaf);
        docValues.setDocId(docID);
        for (int i = 0; i < docValues.size(); ++i) {
          compositeFieldValue.addFieldValue(docValues.toFieldValue(i));
        }

      }
      // retrieve stored fields
      else if (fd instanceof IndexableFieldDef indexableFieldDef && indexableFieldDef.isStored()) {
        IndexableField[] values = s.doc(hit.getLuceneDocId()).getFields(field);
        for (IndexableField fieldValue : values) {
          compositeFieldValue.addFieldValue(
              indexableFieldDef.getStoredFieldValue(fieldValue.storedValue()));
        }
      } else {
        // TODO: throw exception here after confirming that legitimate requests do not enter this
        logger.error("Unable to fill hit for field: {}", field);
      }

      return compositeFieldValue.build();
    }

    @Override
    public List<Map<String, CompositeFieldValue>> call() throws IOException {
      return fillFields(s, hitBuilders, fields, searchContext);
    }
  }

  /** Task to fetch all the fields for a chunk of hits. Also executes any per hit fetch tasks. */
  public static class FillDocsTask implements Runnable {
    private final FieldFetchContext fieldFetchContext;
    private final List<Hit.Builder> docChunk;
    private final Query explainQuery;

    /**
     * Constructor.
     *
     * @param fieldFetchContext context info needed to retrieve field data
     * @param docChunk list of hit builders for query response, must be in lucene doc id order
     */
    public FillDocsTask(FieldFetchContext fieldFetchContext, List<Hit.Builder> docChunk) {
      this(fieldFetchContext, docChunk, null);
    }

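    /**
     * Constructor.
     *
     * @param fieldFetchContext context info needed to retrieve field data
     * @param docChunk list of hit builders for query response, must be in lucene doc id order
     * @param explainQuery query to use for explain, or null to use the search context query
     */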
    public FillDocsTask(
        FieldFetchContext fieldFetchContext, List<Hit.Builder> docChunk, Query explainQuery) {
      this.fieldFetchContext = fieldFetchContext;
      this.docChunk = docChunk;
      this.explainQuery = explainQuery;
    }

    @Override
    public void run() {
      List<LeafReaderContext> leaves =
          fieldFetchContext.getSearcherAndTaxonomy().searcher.getIndexReader().leaves();
      int hitIndex = 0;
      // process documents, grouped by lucene segment
      while (hitIndex < docChunk.size()) {
        int leafIndex = ReaderUtil.subIndex(docChunk.get(hitIndex).getLuceneDocId(), leaves);
        LeafReaderContext sliceSegment = leaves.get(leafIndex);

        // get all hits in the same segment and process them together for better resource reuse
        List<Hit.Builder> sliceHits = getSliceHits(docChunk, hitIndex, sliceSegment);
        try {
          fetchSlice(fieldFetchContext, explainQuery, sliceHits, sliceSegment);
        } catch (IOException e) {
          throw new RuntimeException("Error fetching field data", e);
        }

        hitIndex += sliceHits.size();
      }
    }

    /** Get all hits belonging to the same lucene segment */
    private static List<Hit.Builder> getSliceHits(
        List<Hit.Builder> sortedHits,
        int startIndex,
        LeafReaderContext sliceSegment) {
      int endDoc = sliceSegment.docBase + sliceSegment.reader().maxDoc();
      int endIndex = startIndex + 1;
      while (endIndex < sortedHits.size()) {
        if (sortedHits.get(endIndex).getLuceneDocId() >= endDoc) {
          break;
        }
        endIndex++;
      }
      return sortedHits.subList(startIndex, endIndex);
    }

    /**
     * Fetch all the required field data for a slice of hits. All these hits reside in the same
     * lucene segment.
     *
     * @param context field fetch context
     * @param explainQuery query to use for explain, or null to use the search context query
     * @param sliceHits hits in this slice
     * @param sliceSegment lucene segment context for slice
     * @throws IOException on issue reading document data
     */
    private static void fetchSlice(
        FieldFetchContext context,
        Query explainQuery,
        List<Hit.Builder> sliceHits,
        LeafReaderContext sliceSegment)
        throws IOException {
      for (Map.Entry<String, FieldDef> fieldDefEntry : context.getRetrieveFields().entrySet()) {
        if (fieldDefEntry.getValue() instanceof VirtualFieldDef) {
          fetchFromValueSource(
              sliceHits,
              sliceSegment,
              fieldDefEntry.getKey(),
              (VirtualFieldDef) fieldDefEntry.getValue());
        } else if (fieldDefEntry.getValue() instanceof RuntimeFieldDef) {
          fetchRuntimeFromSegmentFactory(
              sliceHits,
              sliceSegment,
              fieldDefEntry.getKey(),
              (RuntimeFieldDef) fieldDefEntry.getValue());
        } else if (fieldDefEntry.getValue() instanceof IndexableFieldDef) {
          IndexableFieldDef indexableFieldDef = (IndexableFieldDef) fieldDefEntry.getValue();
          if (indexableFieldDef.hasDocValues()) {
            fetchFromDocValues(sliceHits, sliceSegment, fieldDefEntry.getKey(), indexableFieldDef);
          } else if (indexableFieldDef.isStored()) {
            fetchFromStored(context, sliceHits, fieldDefEntry.getKey(), indexableFieldDef);
          } else {
            throw new IllegalStateException(
                "No valid method to retrieve indexable field: " + fieldDefEntry.getKey());
          }
        } else {
          throw new IllegalStateException(
              "No valid method to retrieve field: " + fieldDefEntry.getKey());
        }
      }

      // execute any per hit fetch tasks
      Query resolvedExplainQuery = null;
      if (context.isExplain()) {
        resolvedExplainQuery =
            explainQuery != null ? explainQuery : context.getSearchContext().getQuery();
      }
      for (Hit.Builder hit : sliceHits) {
        if (context.isExplain()) {
          hit.setExplain(
              context
                  .getSearcherAndTaxonomy()
                  .searcher
                  .explain(resolvedExplainQuery, hit.getLuceneDocId())
                  .toString());
        }
        context.getFetchTasks().processHit(context.getSearchContext(), sliceSegment, hit);
      }
    }

    /**
     * Fetch field value from virtual field's {@link org.apache.lucene.search.DoubleValuesSource}
     */
    private static void fetchFromValueSource(
        List<SearchResponse.Hit.Builder> sliceHits,
        LeafReaderContext sliceSegment,
        String name,
        VirtualFieldDef virtualFieldDef)
        throws IOException {
      SettableScoreDoubleValues scoreValue = new SettableScoreDoubleValues();
      DoubleValues doubleValues =
          virtualFieldDef.getValuesSource().getValues(sliceSegment, scoreValue);
      for (SearchResponse.Hit.Builder hit : sliceHits) {
        int docID = hit.getLuceneDocId() - sliceSegment.docBase;
        scoreValue.setScore(hit.getScore());
        doubleValues.advanceExact(docID);

        SearchResponse.Hit.CompositeFieldValue.Builder compositeFieldValue =
            SearchResponse.Hit.CompositeFieldValue.newBuilder();
        compositeFieldValue.addFieldValue(
            SearchResponse.Hit.FieldValue.newBuilder().setDoubleValue(doubleValues.doubleValue()));
        hit.putFields(name, compositeFieldValue.build());
      }
    }

    /** Fetch field value from runtime field's Object. */
    private static void fetchRuntimeFromSegmentFactory(
        List<SearchResponse.Hit.Builder> sliceHits,
        LeafReaderContext sliceSegment,
        String name,
        RuntimeFieldDef runtimeFieldDef)
        throws IOException {
      RuntimeScript.SegmentFactory segmentFactory = runtimeFieldDef.getSegmentFactory();
      RuntimeScript values = segmentFactory.newInstance(sliceSegment);

      for (SearchResponse.Hit.Builder hit : sliceHits) {
        int docID = hit.getLuceneDocId() - sliceSegment.docBase;
        // Check if the value is available for the current document
        if (values != null) {
          values.setDocId(docID);
          Object obj = values.execute();
          SearchResponse.Hit.CompositeFieldValue.Builder compositeFieldValue =
              SearchResponse.Hit.CompositeFieldValue.newBuilder();
          ObjectToCompositeFieldTransformer.enrichCompositeField(obj, compositeFieldValue);
          hit.putFields(name, compositeFieldValue.build());
        }
      }
    }

    /** Fetch field value from its doc values */
    private static void fetchFromDocValues(
        List<SearchResponse.Hit.Builder> sliceHits,
        LeafReaderContext sliceSegment,
        String name,
        IndexableFieldDef indexableFieldDef)
        throws IOException {
      LoadedDocValues<?> docValues = indexableFieldDef.getDocValues(sliceSegment);
      for (SearchResponse.Hit.Builder hit : sliceHits) {
        int docID = hit.getLuceneDocId() - sliceSegment.docBase;
        docValues.setDocId(docID);

        SearchResponse.Hit.CompositeFieldValue.Builder compositeFieldValue =
            SearchResponse.Hit.CompositeFieldValue.newBuilder();
        for (int i = 0; i < docValues.size(); ++i) {
          compositeFieldValue.addFieldValue(docValues.toFieldValue(i));
        }
        hit.putFields(name, compositeFieldValue.build());
      }
    }

    /** Fetch field value stored in the index */
    private static void fetchFromStored(
        FieldFetchContext context,
        List<SearchResponse.Hit.Builder> sliceHits,
        String name,
        IndexableFieldDef indexableFieldDef)
        throws IOException {
      for (SearchResponse.Hit.Builder hit : sliceHits) {
        SearchResponse.Hit.CompositeFieldValue.Builder compositeFieldValue =
            SearchResponse.Hit.CompositeFieldValue.newBuilder();
        IndexableField[] values =
            context.getSearcherAndTaxonomy().searcher.doc(hit.getLuceneDocId()).getFields(name);
        for (IndexableField fieldValue : values) {
          compositeFieldValue.addFieldValue(
              indexableFieldDef.getStoredFieldValue(fieldValue.storedValue()));
        }
        hit.putFields(name, compositeFieldValue.build());
      }
    }

    /**
     * {@link DoubleValues} implementation used to inject the document score into the execution of
     * scripts to populate virtual fields.
     */
    private static class SettableScoreDoubleValues extends DoubleValues {
      private double score = Double.NaN;

      @Override
      public double doubleValue() {
        return score;
      }

      @Override
      public boolean advanceExact(int doc) {
        return !Double.isNaN(score);
      }

      public void setScore(double score) {
        this.score = score;
      }
    }
  }

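  /**
   * Convert a raw field value object into a {@link FieldValue}, handling boolean and date-time
   * fields.
   */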
  private static FieldValue convertType(FieldDef fd, Object o) {
    var fieldValue = FieldValue.newBuilder();
    if (fd instanceof BooleanFieldDef) {
      if ((Integer) o == 1) {
        fieldValue.setBooleanValue(Boolean.TRUE);
      } else {
        assert (Integer) o == 0;
        fieldValue.setBooleanValue(Boolean.FALSE);
      }
    } else if (fd instanceof DateTimeFieldDef) {
      fieldValue.setTextValue(msecToDateString(((DateTimeFieldDef) fd), ((Number) o).longValue()));
    } else {
      throw new IllegalArgumentException("Unable to convert object: " + o);
    }

    return fieldValue.build();
  }

  private static String msecToDateString(DateTimeFieldDef fd, long value) {
    // nocommit use CTL to reuse these?
    return fd.formatEpochMillis(value);
  }

  public static class SearchHandlerException extends HandlerException {

    public SearchHandlerException(Throwable err) {
      super(err);
    }

    public SearchHandlerException(String message) {
      super(message);
    }

    public SearchHandlerException(String message, Throwable err) {
      super(message, err);
    }
  }

  /**
   * Find an instance of {@link CollectionTimeoutException} in the cause path of an exception.
   *
   * @return found exception instance or null
   */
  private static CollectionTimeoutException findTimeoutException(Throwable e) {
    if (e instanceof CollectionTimeoutException) {
      return (CollectionTimeoutException) e;
    }
    if (e.getCause() != null) {
      return findTimeoutException(e.getCause());
    }
    return null;
  }
}