All downloads are free. Search and download functionality uses the official Maven repository.

org.elasticsearch.index.mapper.core.NumberFieldMapper Maven / Gradle / Ivy

/*
 * Licensed to Elasticsearch under one or more contributor
 * license agreements. See the NOTICE file distributed with
 * this work for additional information regarding copyright
 * ownership. Elasticsearch licenses this file to you under
 * the Apache License, Version 2.0 (the "License"); you may
 * not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

package org.elasticsearch.index.mapper.core;

import com.carrotsearch.hppc.DoubleOpenHashSet;
import com.carrotsearch.hppc.LongArrayList;
import com.carrotsearch.hppc.LongOpenHashSet;
import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.NumericTokenStream;
import org.apache.lucene.analysis.TokenStream;
import org.apache.lucene.document.Field;
import org.apache.lucene.document.FieldType;
import org.apache.lucene.index.FieldInfo;
import org.apache.lucene.index.FieldInfo.IndexOptions;
import org.apache.lucene.index.IndexableField;
import org.apache.lucene.index.IndexableFieldType;
import org.apache.lucene.util.BytesRef;
import org.apache.lucene.util.NumericUtils;
import org.elasticsearch.common.Explicit;
import org.elasticsearch.common.Nullable;
import org.elasticsearch.common.settings.Settings;
import org.elasticsearch.common.unit.Fuzziness;
import org.elasticsearch.common.util.ByteUtils;
import org.elasticsearch.common.util.CollectionUtils;
import org.elasticsearch.common.xcontent.XContentBuilder;
import org.elasticsearch.index.analysis.NamedAnalyzer;
import org.elasticsearch.index.codec.docvaluesformat.DocValuesFormatProvider;
import org.elasticsearch.index.codec.postingsformat.PostingsFormatProvider;
import org.elasticsearch.index.fielddata.IndexFieldDataService;
import org.elasticsearch.index.fielddata.IndexNumericFieldData;
import org.elasticsearch.index.mapper.*;
import org.elasticsearch.index.mapper.internal.AllFieldMapper;
import org.elasticsearch.index.query.QueryParseContext;
import org.elasticsearch.index.similarity.SimilarityProvider;

import java.util.List;

public abstract class NumberFieldMapper extends AbstractFieldMapper implements AllFieldMapper.IncludeInAll {

    /**
     * Default settings shared by numeric field mappers.
     *
     * NOTE(review): this copy of the file appears to have been damaged by extraction: the
     * static initializer below has no visible body and the closing braces of this class are
     * absent. Restore both from the upstream source before relying on this block.
     */
    public static class Defaults extends AbstractFieldMapper.Defaults {
        // Default precision step, taken from Lucene's NumericUtils.
        public static final int PRECISION_STEP = NumericUtils.PRECISION_STEP_DEFAULT;

        // Starts out as a copy of the parent defaults' field type.
        public static final FieldType FIELD_TYPE = new FieldType(AbstractFieldMapper.Defaults.FIELD_TYPE);

        // NOTE(review): initializer body is not visible here; presumably it configures FIELD_TYPE -- verify.
        static {

        // Defaults used when neither the mapping nor the index settings provide a value.
        // The second constructor argument is presumably the "explicitly set" flag (see explicit()) -- confirm.
        public static final Explicit IGNORE_MALFORMED = new Explicit(false, false);
        public static final Explicit COERCE = new Explicit(true, false);

    public abstract static class Builder extends AbstractFieldMapper.Builder {

        protected int precisionStep = Defaults.PRECISION_STEP;

        private Boolean ignoreMalformed;

        private Boolean coerce;
        public Builder(String name, FieldType fieldType) {
            super(name, fieldType);

        public T precisionStep(int precisionStep) {
            this.precisionStep = precisionStep;
            return builder;

        public T ignoreMalformed(boolean ignoreMalformed) {
            this.ignoreMalformed = ignoreMalformed;
            return builder;

        protected Explicit ignoreMalformed(BuilderContext context) {
            if (ignoreMalformed != null) {
                return new Explicit(ignoreMalformed, true);
            if (context.indexSettings() != null) {
                return new Explicit(context.indexSettings().getAsBoolean("index.mapping.ignore_malformed", Defaults.IGNORE_MALFORMED.value()), false);
            return Defaults.IGNORE_MALFORMED;
        public T coerce(boolean coerce) {
            this.coerce = coerce;
            return builder;

        protected Explicit coerce(BuilderContext context) {
            if (coerce != null) {
                return new Explicit(coerce, true);
            if (context.indexSettings() != null) {
                return new Explicit(context.indexSettings().getAsBoolean("index.mapping.coerce", Defaults.COERCE.value()), false);
            return Defaults.COERCE;

    protected int precisionStep;

    protected Boolean includeInAll;

    protected Explicit ignoreMalformed;

    protected Explicit coerce;
    private ThreadLocal tokenStream = new ThreadLocal() {
        protected NumericTokenStream initialValue() {
            return new NumericTokenStream(precisionStep);

    private static ThreadLocal tokenStream4 = new ThreadLocal() {
        protected NumericTokenStream initialValue() {
            return new NumericTokenStream(4);

    private static ThreadLocal tokenStream8 = new ThreadLocal() {
        protected NumericTokenStream initialValue() {
            return new NumericTokenStream(8);

    private static ThreadLocal tokenStreamMax = new ThreadLocal() {
        protected NumericTokenStream initialValue() {
            return new NumericTokenStream(Integer.MAX_VALUE);

    /**
     * Creates the mapper, forwarding the generic field settings to the superclass and storing the
     * numeric-specific ones.
     *
     * A {@code precisionStep} that is non-positive, or at or above {@link #maxPrecisionStep()}, is
     * normalized to {@code Integer.MAX_VALUE}.
     */
    protected NumberFieldMapper(Names names, int precisionStep, float boost, FieldType fieldType, Boolean docValues,
                                Explicit ignoreMalformed, Explicit coerce, NamedAnalyzer indexAnalyzer,
                                NamedAnalyzer searchAnalyzer, PostingsFormatProvider postingsProvider,
                                DocValuesFormatProvider docValuesProvider, SimilarityProvider similarity,
                                Loading normsLoading, @Nullable Settings fieldDataSettings, Settings indexSettings,
                                MultiFields multiFields) {
        // LUCENE 4 UPGRADE: Since we can't do anything before the super call, we have to push the boost check down to subclasses
        super(names, boost, fieldType, docValues, indexAnalyzer, searchAnalyzer, postingsProvider, docValuesProvider, 
                similarity, normsLoading, fieldDataSettings, indexSettings, multiFields);
        if (precisionStep <= 0 || precisionStep >= maxPrecisionStep()) {
            this.precisionStep = Integer.MAX_VALUE;
        } else {
            this.precisionStep = precisionStep;
        }
        this.ignoreMalformed = ignoreMalformed;
        this.coerce = coerce;
    }

    public void includeInAll(Boolean includeInAll) {
        if (includeInAll != null) {
            this.includeInAll = includeInAll;

    public void includeInAllIfNotSet(Boolean includeInAll) {
        if (includeInAll != null && this.includeInAll == null) {
            this.includeInAll = includeInAll;

    public void unsetIncludeInAll() {
        includeInAll = null;

    /**
     * Upper bound for a usable precision step. The constructor replaces any requested step that
     * is at or above this value (or non-positive) with {@code Integer.MAX_VALUE}.
     */
    protected abstract int maxPrecisionStep();

    public int precisionStep() {
        return this.precisionStep;

    protected void parseCreateField(ParseContext context, List fields) throws IOException {
        RuntimeException e = null;
        try {
            innerParseCreateField(context, fields);
        } catch (IllegalArgumentException e1) {
            e = e1;
        } catch (MapperParsingException e2) {
            e = e2;

        if (e != null && !ignoreMalformed.value()) {
            throw e;

    /**
     * Performs the type-specific parsing. Called by {@code parseCreateField}, which decides
     * whether an IllegalArgumentException or MapperParsingException thrown from here is rethrown
     * or ignored.
     */
    protected abstract void innerParseCreateField(ParseContext context, List fields) throws IOException;

    protected final void addDocValue(ParseContext context, long value) {
        CustomLongNumericDocValuesField field = (CustomLongNumericDocValuesField) context.doc().getByKey(names().indexName());
        if (field != null) {
        } else {
            field = new CustomLongNumericDocValuesField(names().indexName(), value);
            context.doc().addWithKey(names().indexName(), field);

     * Use the field query created here when matching on numbers.
    public boolean useTermQueryWithQueryString() {
        return true;

     * Numeric field level query are basically range queries with same value and included. That's the recommended
     * way to execute it.
    public Query termQuery(Object value, @Nullable QueryParseContext context) {
        return rangeQuery(value, value, true, true, context);

     * Numeric field level filter are basically range queries with same value and included. That's the recommended
     * way to execute it.
    public Filter termFilter(Object value, @Nullable QueryParseContext context) {
        return rangeFilter(value, value, true, true, context);

    /**
     * Builds a range query over this field. Also used by {@code termQuery}, which passes the same
     * value as both bounds with both ends inclusive.
     */
    public abstract Query rangeQuery(Object lowerTerm, Object upperTerm, boolean includeLower, boolean includeUpper, @Nullable QueryParseContext context);

    /**
     * Builds a range filter over this field. Also used by {@code termFilter}, which passes the
     * same value as both bounds with both ends inclusive.
     */
    public abstract Filter rangeFilter(Object lowerTerm, Object upperTerm, boolean includeLower, boolean includeUpper, @Nullable QueryParseContext context);

    /**
     * Builds a fuzzy query for {@code value} on this field; how the fuzziness and the remaining
     * arguments are interpreted is left to the concrete mapper.
     */
    public abstract Query fuzzyQuery(String value, Fuzziness fuzziness, int prefixLength, int maxExpansions, boolean transpositions);

     * A range filter based on the field data cache.
    public abstract Filter rangeFilter(IndexFieldDataService fieldData, Object lowerTerm, Object upperTerm, boolean includeLower, boolean includeUpper, @Nullable QueryParseContext context);

     * A terms filter based on the field data cache for numeric fields.
    public Filter termsFilter(IndexFieldDataService fieldDataService, List values, @Nullable QueryParseContext context) {
        IndexNumericFieldData fieldData = fieldDataService.getForField(this);
        if (fieldData.getNumericType().isFloatingPoint()) {
            // create with initial size large enough to avoid rehashing
            DoubleOpenHashSet terms =
                    new DoubleOpenHashSet((int) (values.size() * (1 + DoubleOpenHashSet.DEFAULT_LOAD_FACTOR)));
            for (int i = 0, len = values.size(); i < len; i++) {

            return FieldDataTermsFilter.newDoubles(fieldData, terms);
        } else {
            // create with initial size large enough to avoid rehashing
            LongOpenHashSet terms =
                    new LongOpenHashSet((int) (values.size() * (1 + LongOpenHashSet.DEFAULT_LOAD_FACTOR)));
            for (int i = 0, len = values.size(); i < len; i++) {

            return FieldDataTermsFilter.newLongs(fieldData, terms);

     * Converts an object value into a double
    public double parseDoubleValue(Object value) {
        if (value instanceof Number) {
            return ((Number) value).doubleValue();

        if (value instanceof BytesRef) {
            return Double.parseDouble(((BytesRef) value).utf8ToString());

        return Double.parseDouble(value.toString());

     * Converts an object value into a long
    public long parseLongValue(Object value) {
        if (value instanceof Number) {
            return ((Number) value).longValue();

        if (value instanceof BytesRef) {
            return Long.parseLong(((BytesRef) value).utf8ToString());

        return Long.parseLong(value.toString());

     * Override the default behavior (to return the string, and return the actual Number instance).
     * @param value
    public Object valueForSearch(Object value) {
        return value(value);

    public void merge(Mapper mergeWith, MergeContext mergeContext) throws MergeMappingException {
        super.merge(mergeWith, mergeContext);
        if (!this.getClass().equals(mergeWith.getClass())) {
        if (!mergeContext.mergeFlags().simulate()) {
            NumberFieldMapper nfmMergeWith = (NumberFieldMapper) mergeWith;
            this.precisionStep = nfmMergeWith.precisionStep;
            this.includeInAll = nfmMergeWith.includeInAll;
            if (nfmMergeWith.ignoreMalformed.explicit()) {
                this.ignoreMalformed = nfmMergeWith.ignoreMalformed;
            if (nfmMergeWith.coerce.explicit()) {
                this.coerce = nfmMergeWith.coerce;

    public void close() {

    protected NumericTokenStream popCachedStream() {
        if (precisionStep == 4) {
            return tokenStream4.get();
        if (precisionStep == 8) {
            return tokenStream8.get();
        if (precisionStep == Integer.MAX_VALUE) {
            return tokenStreamMax.get();
        return tokenStream.get();

    // used to we can use a numeric field in a document that is then parsed twice!
    public abstract static class CustomNumericField extends Field {

        protected final NumberFieldMapper mapper;

        public CustomNumericField(NumberFieldMapper mapper, Number value, FieldType fieldType) {
            super(mapper.names().indexName(), fieldType);
            this.mapper = mapper;
            if (value != null) {
                this.fieldsData = value;

        public String stringValue() {
            return null;

        public Reader readerValue() {
            return null;

        public abstract String numericAsString();

    /**
     * Skeleton IndexableField used to carry numeric doc values: it exposes a name and a shared
     * field type, and returns null (or a boost of 1) from the other accessors shown here.
     *
     * NOTE(review): this copy of the file appears to have been damaged by extraction -- closing
     * braces are absent, the static initializer has no visible body and the constructor's
     * assignment has lost its left-hand side. Restore from the upstream source.
     */
    public static abstract class CustomNumericDocValuesField implements IndexableField {

        public static final FieldType TYPE = new FieldType();
        // NOTE(review): initializer body is not visible; presumably it configures TYPE -- verify.
        static {

        private final String name;

        public CustomNumericDocValuesField(String  name) {
            // NOTE(review): target of the assignment is missing; presumably `this.name = name` -- confirm.
   = name;

        // Field name as passed to the constructor.
        public String name() {
            return name;

        // All instances share the static TYPE.
        public IndexableFieldType fieldType() {
            return TYPE;

        // Fixed boost of 1.
        public float boost() {
            return 1f;

        public String stringValue() {
            return null;

        public Reader readerValue() {
            return null;

        public Number numericValue() {
            return null;

        public TokenStream tokenStream(Analyzer analyzer) throws IOException {
            return null;


    /**
     * Doc-values field that accumulates long values in a LongArrayList and serializes them to a
     * single binary value (see binaryValue()).
     *
     * NOTE(review): this copy of the file appears to have been damaged by extraction -- closing
     * braces are absent and several bodies look incomplete (static initializer, constructor,
     * add). Restore from the upstream source.
     */
    public static class CustomLongNumericDocValuesField extends CustomNumericDocValuesField {

        public static final FieldType TYPE = new FieldType();
        // NOTE(review): initializer body is not visible; presumably it configures TYPE -- verify.
        static {

        private final LongArrayList values;

        // NOTE(review): neither `name` nor `value` is used in the visible body; presumably a
        // super(name) call and an initial values.add(value) were lost -- confirm.
        public CustomLongNumericDocValuesField(String  name, long value) {
            values = new LongArrayList();

        // NOTE(review): body is not visible; presumably appends `value` to `values` -- confirm.
        public void add(long value) {

        // Serializes `values` into a BytesRef: a worst-case sized buffer is allocated, the first
        // value is written zig-zag encoded, every later value is written as the delta to its
        // predecessor, and the BytesRef covers only the bytes actually written.
        // NOTE(review): values.get(0) assumes at least one value is present, and writing raw
        // deltas presumably expects `values` to be sorted ascending; no sort is visible here -- confirm.
        public BytesRef binaryValue() {

            // here is the trick:
            //  - the first value is zig-zag encoded so that eg. -5 would become positive and would be better compressed by vLong
            //  - for other values, we only encode deltas using vLong
            final byte[] bytes = new byte[values.size() * ByteUtils.MAX_BYTES_VLONG];
            final ByteArrayDataOutput out = new ByteArrayDataOutput(bytes);
            ByteUtils.writeVLong(out, ByteUtils.zigZagEncode(values.get(0)));
            for (int i = 1; i < values.size(); ++i) {
                final long delta = values.get(i) - values.get(i - 1);
                ByteUtils.writeVLong(out, delta);
            return new BytesRef(bytes, 0, out.getPosition());


    protected void doXContentBody(XContentBuilder builder, boolean includeDefaults, Params params) throws IOException {
        super.doXContentBody(builder, includeDefaults, params);

        if (includeDefaults || ignoreMalformed.explicit()) {
            builder.field("ignore_malformed", ignoreMalformed.value());
        if (includeDefaults || coerce.explicit()) {
            builder.field("coerce", coerce.value());

    public boolean isNumeric() {
        return true;

© 2015 - 2024 Weber Informatics LLC | Privacy Policy