All downloads are free. Search and download functionality uses the official Maven repository.

org.elasticsearch.search.facet.terms.strings.HashedScriptAggregator Maven / Gradle / Ivy

There is a newer version: 8.14.1
Show newest version
/*
 * Licensed to ElasticSearch and Shay Banon under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership. ElasticSearch licenses this
 * file to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */
package org.elasticsearch.search.facet.terms.strings;

import com.google.common.collect.ImmutableSet;
import org.apache.lucene.util.BytesRef;
import org.apache.lucene.util.CharsRef;
import org.apache.lucene.util.UnicodeUtil;
import org.elasticsearch.index.fielddata.BytesValues;
import org.elasticsearch.script.SearchScript;

import java.util.regex.Matcher;
import java.util.regex.Pattern;

/**
 * A {@link HashedAggregator} that filters each term before handing it to the
 * superclass, and optionally lets a script veto or replace the term.
 *
 * <p>A term is rejected when it is contained in the exclusion set, or when a
 * pattern was supplied and the term does not fully match it. When a script is
 * configured, {@link #onValue} additionally runs it for every accepted term.
 *
 * <p>The instance reuses the {@code spare} and {@code scriptSpare} buffers
 * across calls instead of allocating new ones per term.
 */
public final class HashedScriptAggregator extends HashedAggregator {

    private final ImmutableSet excluded;
    private final Matcher matcher;
    private final SearchScript script;
    // UTF-16 form of the term most recently converted by accept().
    private final CharsRef spare = new CharsRef();
    // Holds the UTF-8 form of a replacement term produced by the script.
    private final BytesRef scriptSpare = new BytesRef();
    // True when either the matcher or the script needs the UTF-16 form.
    private final boolean convert;

    /**
     * @param excluded terms to reject outright; may be {@code null} for no exclusions
     * @param pattern  pattern a term must fully match to be accepted; may be {@code null}
     * @param script   script run for every accepted term in {@link #onValue}; may be {@code null}
     */
    public HashedScriptAggregator(ImmutableSet excluded, Pattern pattern, SearchScript script) {
        this.excluded = excluded;
        if (pattern == null) {
            this.matcher = null;
        } else {
            // One matcher is created up front and reset for each term.
            this.matcher = pattern.matcher("");
        }
        this.script = script;
        // A matcher exists exactly when a pattern was supplied.
        this.convert = script != null || pattern != null;
    }

    /**
     * Forwards the value to the superclass only if it passes the exclusion
     * and pattern filters. The script is not consulted here.
     */
    @Override
    public void addValue(BytesRef value, int hashCode, BytesValues values) {
        if (!accept(value)) {
            return;
        }
        super.addValue(value, hashCode, values);
    }

    /**
     * Applies the exclusion set and the pattern to {@code value}.
     *
     * <p>Side effect: when {@code convert} is set, the UTF-16 form of
     * {@code value} is written into {@code spare}; {@link #onValue} reads it
     * afterwards to feed the script.
     *
     * @return {@code false} if the value is excluded or fails the pattern,
     *         {@code true} otherwise
     */
    private boolean accept(BytesRef value) {
        final boolean isExcluded = excluded != null && excluded.contains(value);
        if (isExcluded) {
            return false;
        }
        if (!convert) {
            // Neither the matcher nor the script needs the UTF-16 form.
            return true;
        }
        UnicodeUtil.UTF8toUTF16(value, spare);
        if (matcher == null) {
            // Conversion was only needed for the script; nothing to match.
            return true;
        }
        assert convert : "regexp: [convert == false] but should be true";
        assert value.utf8ToString().equals(spare.toString()) : "not converted";
        return matcher.reset(spare).matches();
    }

    /**
     * Filters the value and, when a script is configured, runs it with the
     * variable {@code term} set to the term's string form.
     *
     * <p>Script outcomes:
     * <ul>
     *   <li>{@code null} or {@code Boolean.FALSE}: the term is dropped;</li>
     *   <li>{@code Boolean.TRUE}: the original term is passed to the superclass;</li>
     *   <li>anything else: its {@code toString()} is passed to the superclass
     *       in place of the term, with a freshly computed hash code.</li>
     * </ul>
     */
    @Override
    protected void onValue(int docId, BytesRef value, int hashCode, BytesValues values) {
        if (!accept(value)) {
            return;
        }
        if (script == null) {
            forwardOriginal(docId, value, hashCode, values);
            return;
        }

        assert convert : "script: [convert == false] but should be true";
        assert value.utf8ToString().equals(spare.toString()) : "not converted";
        script.setNextDocId(docId);
        // LUCENE 4 UPGRADE: needs optimization -- maybe a CharSequence does
        // the job here? The string is only created when a script is present.
        script.setNextVar("term", spare.toString());

        final Object result = script.run();
        if (result == null) {
            return;
        }
        if (result instanceof Boolean) {
            if ((Boolean) result) {
                forwardOriginal(docId, value, hashCode, values);
            }
            return;
        }

        // LUCENE 4 UPGRADE: should be possible to convert directly to a BytesRef.
        scriptSpare.copyChars(result.toString());
        super.onValue(docId, scriptSpare, scriptSpare.hashCode(), values);
    }

    /** Passes the unmodified term on to the superclass. */
    private void forwardOriginal(int docId, BytesRef value, int hashCode, BytesValues values) {
        assert convert || (matcher == null && script == null);
        super.onValue(docId, value, hashCode, values);
    }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy