co.elastic.clients.elasticsearch.inference.ElserServiceSettings Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of org.apache.servicemix.bundles.elasticsearch-java
This OSGi bundle wraps ${pkgArtifactId} ${pkgVersion} jar files.
The newest version!
/*
 * Licensed to Elasticsearch B.V. under one or more contributor
 * license agreements. See the NOTICE file distributed with
 * this work for additional information regarding copyright
 * ownership. Elasticsearch B.V. licenses this file to you under
 * the Apache License, Version 2.0 (the "License"); you may
 * not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

package co.elastic.clients.elasticsearch.inference;

import co.elastic.clients.json.JsonpDeserializable;
import co.elastic.clients.json.JsonpDeserializer;
import co.elastic.clients.json.JsonpMapper;
import co.elastic.clients.json.JsonpSerializable;
import co.elastic.clients.json.JsonpUtils;
import co.elastic.clients.json.ObjectBuilderDeserializer;
import co.elastic.clients.json.ObjectDeserializer;
import co.elastic.clients.util.ApiTypeHelper;
import co.elastic.clients.util.ObjectBuilder;
import co.elastic.clients.util.WithJsonObjectBuilderBase;
import jakarta.json.stream.JsonGenerator;
import java.lang.Integer;
import java.util.Objects;
import java.util.function.Function;
import javax.annotation.Nullable;

//----------------------------------------------------------------
//       THIS CODE IS GENERATED. MANUAL EDITS WILL BE LOST.
//----------------------------------------------------------------
//
// This code is generated from the Elasticsearch API specification
// at https://github.com/elastic/elasticsearch-specification
//
// Manual updates to this file will be lost when the code is
// re-generated.
//
// If you find a property that is missing or wrongly typed, please
// open an issue or a PR on the API specification repository.
//
//----------------------------------------------------------------

// typedef: inference._types.ElserServiceSettings

/**
 *
 * @see API
 *      specification
 */
@JsonpDeserializable
public class ElserServiceSettings implements JsonpSerializable {
	@Nullable
	private final AdaptiveAllocations adaptiveAllocations;

	private final int numAllocations;

	private final int numThreads;

	// ---------------------------------------------------------------------------------------------

	private ElserServiceSettings(Builder builder) {

		this.adaptiveAllocations = builder.adaptiveAllocations;
		this.numAllocations = ApiTypeHelper.requireNonNull(builder.numAllocations, this, "numAllocations", 0);
		this.numThreads = ApiTypeHelper.requireNonNull(builder.numThreads, this, "numThreads", 0);

	}

	public static ElserServiceSettings of(Function> fn) {
		return fn.apply(new Builder()).build();
	}

	/**
	 * Adaptive allocations configuration details. If enabled is true,
	 * the number of allocations of the model is set based on the current load the
	 * process gets. When the load is high, a new model allocation is automatically
	 * created, respecting the value of max_number_of_allocations if
	 * it's set. When the load is low, a model allocation is automatically removed,
	 * respecting the value of min_number_of_allocations if it's set.
	 * If enabled is true, do not set the number of allocations
	 * manually.
	 * 
	 * API name: {@code adaptive_allocations}
	 */
	@Nullable
	public final AdaptiveAllocations adaptiveAllocations() {
		return this.adaptiveAllocations;
	}

	/**
	 * Required - The total number of allocations this model is assigned across
	 * machine learning nodes. Increasing this value generally increases the
	 * throughput. If adaptive allocations is enabled, do not set this value because
	 * it's automatically set.
	 * 

	 * API name: {@code num_allocations}
	 */
	public final int numAllocations() {
		return this.numAllocations;
	}

	/**
	 * Required - The number of threads used by each model allocation during
	 * inference. Increasing this value generally increases the speed per inference
	 * request. The inference process is a compute-bound process;
	 * threads_per_allocations must not exceed the number of available
	 * allocated processors per node. The value must be a power of 2. The maximum
	 * value is 32. 

	 * 
	 * info If you want to optimize your ELSER endpoint for ingest, set the number
	 * of threads to 1. If you want to optimize your ELSER endpoint for search, set
	 * the number of threads to greater than 1.
	 * 
	 * 
	 * 
	 * API name: {@code num_threads}
	 */
	public final int numThreads() {
		return this.numThreads;
	}

	/**
	 * Serialize this object to JSON.
	 */
	public void serialize(JsonGenerator generator, JsonpMapper mapper) {
		generator.writeStartObject();
		serializeInternal(generator, mapper);
		generator.writeEnd();
	}

	protected void serializeInternal(JsonGenerator generator, JsonpMapper mapper) {

		if (this.adaptiveAllocations != null) {
			generator.writeKey("adaptive_allocations");
			this.adaptiveAllocations.serialize(generator, mapper);

		}
		generator.writeKey("num_allocations");
		generator.write(this.numAllocations);

		generator.writeKey("num_threads");
		generator.write(this.numThreads);

	}

	@Override
	public String toString() {
		return JsonpUtils.toString(this);
	}

	// ---------------------------------------------------------------------------------------------

	/**
	 * Builder for {@link ElserServiceSettings}.
	 */

	public static class Builder extends WithJsonObjectBuilderBase
			implements
				ObjectBuilder {
		@Nullable
		private AdaptiveAllocations adaptiveAllocations;

		private Integer numAllocations;

		private Integer numThreads;

		/**
		 * Adaptive allocations configuration details. If enabled is true,
		 * the number of allocations of the model is set based on the current load the
		 * process gets. When the load is high, a new model allocation is automatically
		 * created, respecting the value of max_number_of_allocations if
		 * it's set. When the load is low, a model allocation is automatically removed,
		 * respecting the value of min_number_of_allocations if it's set.
		 * If enabled is true, do not set the number of allocations
		 * manually.
		 * 

		 * API name: {@code adaptive_allocations}
		 */
		public final Builder adaptiveAllocations(@Nullable AdaptiveAllocations value) {
			this.adaptiveAllocations = value;
			return this;
		}

		/**
		 * Adaptive allocations configuration details. If enabled is true,
		 * the number of allocations of the model is set based on the current load the
		 * process gets. When the load is high, a new model allocation is automatically
		 * created, respecting the value of max_number_of_allocations if
		 * it's set. When the load is low, a model allocation is automatically removed,
		 * respecting the value of min_number_of_allocations if it's set.
		 * If enabled is true, do not set the number of allocations
		 * manually.
		 * 

		 * API name: {@code adaptive_allocations}
		 */
		public final Builder adaptiveAllocations(
				Function> fn) {
			return this.adaptiveAllocations(fn.apply(new AdaptiveAllocations.Builder()).build());
		}

		/**
		 * Required - The total number of allocations this model is assigned across
		 * machine learning nodes. Increasing this value generally increases the
		 * throughput. If adaptive allocations is enabled, do not set this value because
		 * it's automatically set.
		 * 

		 * API name: {@code num_allocations}
		 */
		public final Builder numAllocations(int value) {
			this.numAllocations = value;
			return this;
		}

		/**
		 * Required - The number of threads used by each model allocation during
		 * inference. Increasing this value generally increases the speed per inference
		 * request. The inference process is a compute-bound process;
		 * threads_per_allocations must not exceed the number of available
		 * allocated processors per node. The value must be a power of 2. The maximum
		 * value is 32. 

		 * 
		 * info If you want to optimize your ELSER endpoint for ingest, set the number
		 * of threads to 1. If you want to optimize your ELSER endpoint for search, set
		 * the number of threads to greater than 1.
		 * 
		 * 
		 * 
		 * API name: {@code num_threads}
		 */
		public final Builder numThreads(int value) {
			this.numThreads = value;
			return this;
		}

		@Override
		protected Builder self() {
			return this;
		}

		/**
		 * Builds a {@link ElserServiceSettings}.
		 *
		 * @throws NullPointerException
		 *             if some of the required fields are null.
		 */
		public ElserServiceSettings build() {
			_checkSingleUse();

			return new ElserServiceSettings(this);
		}
	}

	// ---------------------------------------------------------------------------------------------

	/**
	 * Json deserializer for {@link ElserServiceSettings}
	 */
	public static final JsonpDeserializer _DESERIALIZER = ObjectBuilderDeserializer
			.lazy(Builder::new, ElserServiceSettings::setupElserServiceSettingsDeserializer);

	protected static void setupElserServiceSettingsDeserializer(ObjectDeserializer op) {

		op.add(Builder::adaptiveAllocations, AdaptiveAllocations._DESERIALIZER, "adaptive_allocations");
		op.add(Builder::numAllocations, JsonpDeserializer.integerDeserializer(), "num_allocations");
		op.add(Builder::numThreads, JsonpDeserializer.integerDeserializer(), "num_threads");

	}

}