All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.elasticsearch.index.field.data.support.FieldDataLoader Maven / Gradle / Ivy

There is a newer version: 8.15.1
Show newest version
/*
 * Licensed to Elastic Search and Shay Banon under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership. Elastic Search licenses this
 * file to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

package org.elasticsearch.index.field.data.support;

import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.Term;
import org.apache.lucene.index.TermDocs;
import org.apache.lucene.index.TermEnum;
import org.apache.lucene.util.StringHelper;
import org.elasticsearch.index.field.data.FieldData;

import java.io.IOException;
import java.util.Arrays;

/**
 * Walks every term of a single field in an {@link IndexReader} and records, per document,
 * the ordinal(s) of the terms that document contains. The collected ordinals are then handed
 * to a {@link TypeLoader}, which builds the concrete field data instance.
 *
 * <p>Term ordinals start at {@code 1}; ordinal {@code 0} is left to mean "no term for this
 * document" in the single valued representation.
 *
 * @author kimchy (shay.banon)
 */
public class FieldDataLoader {

    /**
     * Loads the field data for {@code field} by enumerating its terms in the given reader.
     *
     * <p>For each term the loader's {@link TypeLoader#collectTerm(String)} is invoked (in
     * enumeration order) and the term's ordinal is appended to every document that contains it.
     * If any document ends up with more than one ordinal the multi valued builder is used,
     * otherwise the per document arrays are flattened and the single valued builder is used.
     *
     * @param reader the index reader to enumerate terms and postings from
     * @param field  the field name; it is interned before use so it can be compared by identity
     * @param loader receives the terms and builds the resulting field data
     * @param <T>    the concrete field data type built by {@code loader}
     * @return the value returned by {@code loader.buildSingleValue} or {@code loader.buildMultiValue}
     * @throws IOException if reading from the index fails
     */
    @SuppressWarnings({"StringEquality"})
    public static <T extends FieldData> T load(IndexReader reader, String field, TypeLoader<T> loader) throws IOException {

        loader.init();

        field = StringHelper.intern(field);
        // orders[doc] holds the ordinals of all terms seen for that doc, or null if none.
        int[][] orders = new int[reader.maxDoc()][];

        int t = 1;  // current term number (0 is reserved for "no value")

        boolean multiValued = false;
        TermDocs termDocs = reader.termDocs();
        try {
            // Acquired inside the outer try so termDocs is still closed if this call fails.
            TermEnum termEnum = reader.terms(new Term(field));
            try {
                do {
                    Term term = termEnum.term();
                    // Identity comparison is intentional: field was interned above.
                    if (term == null || term.field() != field) break;
                    loader.collectTerm(term.text());
                    termDocs.seek(termEnum);
                    while (termDocs.next()) {
                        int doc = termDocs.doc();
                        int[] orderPerDoc = orders[doc];
                        if (orderPerDoc == null) {
                            orders[doc] = new int[]{t};
                        } else {
                            // A second term for the same doc: grow its ordinal array by one.
                            multiValued = true;
                            orderPerDoc = Arrays.copyOf(orderPerDoc, orderPerDoc.length + 1);
                            orderPerDoc[orderPerDoc.length - 1] = t;
                            orders[doc] = orderPerDoc;
                        }
                    }

                    t++;
                } while (termEnum.next());
            } catch (RuntimeException e) {
                // A StopFillCacheException (matched by class name) just ends the enumeration
                // early; this is expected when numeric parsers are used. Anything else is
                // a real failure and is propagated.
                if (!e.getClass().getName().endsWith("StopFillCacheException")) {
                    throw e;
                }
            } finally {
                termEnum.close();
            }
        } finally {
            termDocs.close();
        }

        if (multiValued) {
            return loader.buildMultiValue(field, orders);
        }
        // optimize for a single valued
        return loader.buildSingleValue(field, flattenSingleValued(orders));
    }

    /**
     * Flattens per document ordinal arrays into one ordinal per document, taking the first
     * ordinal of each document and leaving {@code 0} for documents without any.
     */
    private static int[] flattenSingleValued(int[][] orders) {
        int[] sOrders = new int[orders.length];
        for (int i = 0; i < orders.length; i++) {
            if (orders[i] != null) {
                sOrders[i] = orders[i][0];
            }
        }
        return sOrders;
    }

    /**
     * Callback used by {@link FieldDataLoader#load} to collect terms and build the result.
     *
     * @param <T> the field data type this loader builds
     */
    public static interface TypeLoader<T extends FieldData> {

        /**
         * Called once by {@code load} before any term is enumerated.
         */
        void init();

        /**
         * Called once for each term of the field, in enumeration order. The n-th call
         * (counting from 1) corresponds to ordinal n in the arrays passed to the build methods.
         *
         * @param term the text of the term
         */
        void collectTerm(String term);

        /**
         * Builds the field data when no document has more than one term.
         *
         * @param fieldName the (interned) field name
         * @param order     indexed by document id; the term ordinal of that document,
         *                  or {@code 0} if the document has no term for the field
         */
        T buildSingleValue(String fieldName, int[] order);

        /**
         * Builds the field data when at least one document has more than one term.
         *
         * @param fieldName the (interned) field name
         * @param order     indexed by document id; the term ordinals of that document,
         *                  or {@code null} if the document has no term for the field
         */
        T buildMultiValue(String fieldName, int[][] order);
    }

    /**
     * Base class for {@link TypeLoader} implementations that provides a no-op {@link #init()}.
     *
     * @param <T> the field data type this loader builds
     */
    public static abstract class FreqsTypeLoader<T extends FieldData> implements TypeLoader<T> {

        protected FreqsTypeLoader() {
        }

        @Override public void init() {
        }
    }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy