
io.milvus.param.dml.SearchIteratorParam Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of milvus-sdk-java Show documentation
Show all versions of milvus-sdk-java Show documentation
Java SDK for Milvus, a distributed high-performance vector database.
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package io.milvus.param.dml;
import com.google.common.collect.Lists;
import io.milvus.common.clientenum.ConsistencyLevelEnum;
import io.milvus.exception.ParamException;
import io.milvus.grpc.PlaceholderType;
import io.milvus.param.Constant;
import io.milvus.param.MetricType;
import io.milvus.param.ParamUtils;
import lombok.Getter;
import lombok.NonNull;
import lombok.ToString;
import org.jetbrains.annotations.NotNull;
import java.nio.ByteBuffer;
import java.util.List;
import java.util.SortedMap;
import static io.milvus.param.Constant.UNLIMITED;
/**
* Parameters for searchIterator
interface.
*/
@Getter
@ToString
public class SearchIteratorParam {
private final String databaseName;
private final String collectionName;
private final List partitionNames;
private final String metricType;
private final String vectorFieldName;
private final int topK;
private final String expr;
private final List outFields;
private final List> vectors;
private final Long NQ;
private final int roundDecimal;
private final String params;
private final long travelTimestamp;
private final long guaranteeTimestamp;
private final Long gracefulTime;
private final ConsistencyLevelEnum consistencyLevel;
private final boolean ignoreGrowing;
private final String groupByFieldName;
private final PlaceholderType plType;
private final long batchSize;
private SearchIteratorParam(@NonNull Builder builder) {
this.databaseName = builder.databaseName;
this.collectionName = builder.collectionName;
this.partitionNames = builder.partitionNames;
this.metricType = builder.metricType.name();
this.vectorFieldName = builder.vectorFieldName;
this.topK = builder.topK;
this.expr = builder.expr;
this.outFields = builder.outFields;
this.vectors = builder.vectors;
this.NQ = builder.NQ;
this.roundDecimal = builder.roundDecimal;
this.params = builder.params;
this.travelTimestamp = builder.travelTimestamp;
this.guaranteeTimestamp = builder.guaranteeTimestamp;
this.gracefulTime = builder.gracefulTime;
this.consistencyLevel = builder.consistencyLevel;
this.ignoreGrowing = builder.ignoreGrowing;
this.groupByFieldName = builder.groupByFieldName;
this.plType = builder.plType;
this.batchSize = builder.batchSize;
}
public static Builder newBuilder() {
return new Builder();
}
/**
* Builder for {@link SearchIteratorParam} class.
*/
public static class Builder {
private String databaseName;
private String collectionName;
private final List partitionNames = Lists.newArrayList();
private MetricType metricType = MetricType.None;
private String vectorFieldName;
private Integer topK = UNLIMITED;
private String expr = "";
private final List outFields = Lists.newArrayList();
private List> vectors;
private Long NQ;
private Integer roundDecimal = -1;
private String params = "{}";
private Long travelTimestamp = 0L;
private Long guaranteeTimestamp = Constant.GUARANTEE_EVENTUALLY_TS;
private Long gracefulTime = 5000L;
private ConsistencyLevelEnum consistencyLevel = null;
private Boolean ignoreGrowing = Boolean.FALSE;
private String groupByFieldName;
// plType is used to distinct vector type
// for Float16Vector/BFloat16Vector and BinaryVector, user inputs ByteBuffer
// the sdk cannot distinct a ByteBuffer is a BinarVector or a Float16Vector
private PlaceholderType plType = PlaceholderType.None;
private Long batchSize = 1000L;
Builder() {
}
/**
* Sets the database name. database name can be nil.
*
* @param databaseName database name
* @return Builder
*/
public Builder withDatabaseName(String databaseName) {
this.databaseName = databaseName;
return this;
}
/**
* Sets the collection name. Collection name cannot be empty or null.
*
* @param collectionName collection name
* @return Builder
*/
public Builder withCollectionName(@NonNull String collectionName) {
this.collectionName = collectionName;
return this;
}
/**
* Sets partition names list to specify search scope (Optional).
*
* @param partitionNames partition names list
* @return Builder
*/
public Builder withPartitionNames(@NonNull List partitionNames) {
partitionNames.forEach(this::addPartitionName);
return this;
}
/**
* ConsistencyLevel of consistency level.
*
* @param consistencyLevel consistency level
* @return Builder
*/
public Builder withConsistencyLevel(ConsistencyLevelEnum consistencyLevel) {
this.consistencyLevel = consistencyLevel;
return this;
}
/**
* Adds a partition to specify search scope (Optional).
*
* @param partitionName partition name
* @return Builder
*/
public Builder addPartitionName(@NonNull String partitionName) {
if (!this.partitionNames.contains(partitionName)) {
this.partitionNames.add(partitionName);
}
return this;
}
/**
* Sets metric type of ANN searching.
*
* @param metricType metric type
* @return Builder
*/
public Builder withMetricType(@NonNull MetricType metricType) {
this.metricType = metricType;
return this;
}
/**
* Sets target vector field by name. Field name cannot be empty or null.
*
* @param vectorFieldName vector field name
* @return Builder
*/
public Builder withVectorFieldName(@NonNull String vectorFieldName) {
this.vectorFieldName = vectorFieldName;
return this;
}
/**
* Sets topK value of ANN search.
*
* @param topK topK value
* @return Builder
*/
public Builder withTopK(@NonNull Integer topK) {
this.topK = topK;
return this;
}
/**
* Sets expression to filter out entities before searching (Optional).
* @see Boolean Expression Rules
*
* @param expr filtering expression
* @return Builder
*/
public Builder withExpr(@NonNull String expr) {
this.expr = expr;
return this;
}
/**
* Specifies output fields (Optional).
*
* @param outFields output fields
* @return Builder
*/
public Builder withOutFields(@NonNull List outFields) {
outFields.forEach(this::addOutField);
return this;
}
/**
* Specifies an output field (Optional).
*
* @param fieldName filed name
* @return Builder
*/
public Builder addOutField(@NonNull String fieldName) {
if (!this.outFields.contains(fieldName)) {
this.outFields.add(fieldName);
}
return this;
}
/**
* Sets the target vectors.
* Note: Deprecated in v2.4.0, for the reason that the sdk cannot know a ByteBuffer
* is a BinarVector or Float16Vector/BFloat16Vector.
* Replaced by withFloatVectors/withBinaryVectors/withFloat16Vectors/withBFloat16Vectors/withSparseFloatVectors.
* It still works for FloatVector/BinarVector/SparseVector, don't use it for Float16Vector/BFloat16Vector.
*
* @param vectors list of target vectors:
* if vector type is FloatVector, vectors is List of List Float;
* if vector type is BinaryVector, vectors is List of ByteBuffer;
* if vector type is SparseFloatVector, values is List of SortedMap[Long, Float];
* @return Builder
*/
@Deprecated
public Builder withVectors(@NonNull List> vectors) {
this.vectors = vectors;
this.NQ = (long) vectors.size();
return this;
}
/**
* Sets the target vectors to search on FloatVector field.
*
* @param vectors target vectors to search
* @return Builder
*/
public Builder withFloatVectors(@NonNull List> vectors) {
this.vectors = vectors;
this.NQ = (long) vectors.size();
this.plType = PlaceholderType.FloatVector;
return this;
}
/**
* Sets the target vectors to search on BinaryVector field.
*
* @param vectors target vectors to search
* @return Builder
*/
public Builder withBinaryVectors(@NonNull List vectors) {
this.vectors = vectors;
this.NQ = (long) vectors.size();
this.plType = PlaceholderType.BinaryVector;
return this;
}
/**
* Sets the target vectors to search on Float16Vector field.
*
* @param vectors target vectors to search
* @return Builder
*/
public Builder withFloat16Vectors(@NonNull List vectors) {
this.vectors = vectors;
this.NQ = (long) vectors.size();
this.plType = PlaceholderType.Float16Vector;
return this;
}
/**
* Sets the target vectors to search on BFloat16Vector field.
*
* @param vectors target vectors to search
* @return Builder
*/
public Builder withBFloat16Vectors(@NonNull List vectors) {
this.vectors = vectors;
this.NQ = (long) vectors.size();
this.plType = PlaceholderType.BFloat16Vector;
return this;
}
/**
* Sets the target vectors to search on SparseFloatVector field.
*
* @param vectors target vectors to search
* @return Builder
*/
public Builder withSparseFloatVectors(@NonNull List> vectors) {
this.vectors = vectors;
this.NQ = (long) vectors.size();
this.plType = PlaceholderType.SparseFloatVector;
return this;
}
/**
* Specifies the decimal place of the returned results.
*
* @param decimal how many digits after the decimal point
* @return Builder
*/
public Builder withRoundDecimal(@NonNull Integer decimal) {
this.roundDecimal = decimal;
return this;
}
/**
* Sets the search parameters specific to the index type.
*
* For example: IVF index, the search parameters can be "{\"nprobe\":10}"
* For more information: @see Index Selection
*
* @param params extra parameters in json format
* @return Builder
*/
public Builder withParams(@NonNull String params) {
this.params = params;
return this;
}
/**
* Ignore the growing segments to get best search performance. Default is False.
* For the user case that don't require data visibility.
*
* @param ignoreGrowing Boolean.TRUE
ignore, Boolean.FALSE is not
* @return Builder
*/
public Builder withIgnoreGrowing(@NonNull Boolean ignoreGrowing) {
this.ignoreGrowing = ignoreGrowing;
return this;
}
/**
* Sets field name to do grouping.
*
* @param groupByFieldName field name to do grouping
* @return Builder
*/
public Builder withGroupByFieldName(@NonNull String groupByFieldName) {
this.groupByFieldName = groupByFieldName;
return this;
}
/**
* Specify a value to control the number of entities returned per batch. Must be a positive value.
* Default value is 1000, will return without batchSize.
*
* @param batchSize a value to define the number of entities returned per batch
* @return Builder
*/
public Builder withBatchSize(@NotNull Long batchSize) {
this.batchSize = batchSize;
return this;
}
/**
* Verifies parameters and creates a new {@link SearchIteratorParam} instance.
*
* @return {@link SearchIteratorParam}
*/
public SearchIteratorParam build() throws ParamException {
ParamUtils.CheckNullEmptyString(collectionName, "Collection name");
ParamUtils.CheckNullEmptyString(vectorFieldName, "Target field name");
if (topK != UNLIMITED && topK <= 0) {
throw new ParamException("TopK value is illegal");
}
if (travelTimestamp < 0) {
throw new ParamException("The travel timestamp must be greater than 0");
}
if (guaranteeTimestamp < 0) {
throw new ParamException("The guarantee timestamp must be greater than 0");
}
if (metricType == MetricType.None) {
throw new ParamException("must specify metricType for search iterator");
}
verifyVectors(vectors);
return new SearchIteratorParam(this);
}
}
public static void verifyVectors(List> vectors) {
if (vectors == null || vectors.isEmpty()) {
throw new ParamException("Target vectors can not be empty");
}
if (vectors.get(0) instanceof List) {
if (vectors.size() > 1) {
throw new ParamException("Not support search iteration over multiple vectors at present");
}
// float vectors
List> first = (List>) vectors.get(0);
if (!(first.get(0) instanceof Float)) {
throw new ParamException("Float vector field's value must be Lst");
}
} else if (vectors.get(0) instanceof ByteBuffer) {
// binary vectors
if (vectors.size() > 1) {
throw new ParamException("Not support search iteration over multiple vectors at present");
}
} else if (vectors.get(0) instanceof SortedMap) {
// SparseFloatVector
if (vectors.size() > 1) {
throw new ParamException("Not support search iteration over multiple vectors at present");
}
// TODO: here only check the first element, potential risk
SortedMap, ?> map = (SortedMap, ?>) vectors.get(0);
if (!(map.firstKey() instanceof Long)) {
throw new ParamException("key type of SparseFloatVector must be Long");
}
if (!(map.get(map.firstKey()) instanceof Float)) {
throw new ParamException("Value type of SparseFloatVector must be Float");
}
} else {
String msg = "Search target vector type is illegal." +
" Only allow List for FloatVector," +
" ByteBuffer for BinaryVector/Float16Vector/BFloat16Vector," +
" List> for SparseFloatVector.";
throw new ParamException(msg);
}
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy