All Downloads are FREE. Search and download functionalities are using the official Maven repository.

io.quarkiverse.langchain4j.chroma.ChromaEmbeddingStore Maven / Gradle / Ivy

package io.quarkiverse.langchain4j.chroma;

import static dev.langchain4j.internal.Utils.getOrDefault;
import static dev.langchain4j.internal.Utils.randomUUID;
import static java.time.Duration.ofSeconds;
import static java.util.Collections.singletonList;
import static java.util.stream.Collectors.joining;
import static java.util.stream.Collectors.toList;
import static java.util.stream.StreamSupport.stream;

import java.net.URI;
import java.net.URISyntaxException;
import java.time.Duration;
import java.util.ArrayList;
import java.util.List;
import java.util.Map;
import java.util.concurrent.TimeUnit;
import java.util.function.Supplier;

import jakarta.ws.rs.WebApplicationException;

import org.jboss.logging.Logger;
import org.jboss.resteasy.reactive.client.api.ClientLogger;
import org.jboss.resteasy.reactive.client.api.LoggingScope;

import dev.langchain4j.data.document.Metadata;
import dev.langchain4j.data.embedding.Embedding;
import dev.langchain4j.data.segment.TextSegment;
import dev.langchain4j.store.embedding.EmbeddingMatch;
import dev.langchain4j.store.embedding.EmbeddingStore;
import io.quarkiverse.langchain4j.chroma.runtime.AddEmbeddingsRequest;
import io.quarkiverse.langchain4j.chroma.runtime.ChromaCollectionsRestApi;
import io.quarkiverse.langchain4j.chroma.runtime.Collection;
import io.quarkiverse.langchain4j.chroma.runtime.CreateCollectionRequest;
import io.quarkiverse.langchain4j.chroma.runtime.DeleteEmbeddingsRequest;
import io.quarkiverse.langchain4j.chroma.runtime.QueryRequest;
import io.quarkiverse.langchain4j.chroma.runtime.QueryResponse;
import io.quarkus.arc.impl.LazyValue;
import io.quarkus.rest.client.reactive.QuarkusRestClientBuilder;
import io.vertx.core.buffer.Buffer;
import io.vertx.core.http.HttpClientRequest;
import io.vertx.core.http.HttpClientResponse;

/**
 * Represents a store for embeddings using the Chroma backend.
 * Always uses cosine distance as the distance metric.
 * 

* TODO: introduce an SPI in langchain4j that will allow us to provide our own client */ public class ChromaEmbeddingStore implements EmbeddingStore { private final ChromaClient chromaClient; private final LazyValue collectionId; /** * Initializes a new instance of ChromaEmbeddingStore with the specified parameters. * * @param baseUrl The base URL of the Chroma service. * @param collectionName The name of the collection in the Chroma service. If not specified, "default" will be used. * @param timeout The timeout duration for the Chroma client. If not specified, 5 seconds will be used. * @param logRequests Whether to log requests. * @param logResponses Whether to log responses. */ public ChromaEmbeddingStore(String baseUrl, String collectionName, Duration timeout, boolean logRequests, boolean logResponses) { String effectiveCollectionName = getOrDefault(collectionName, "default"); this.chromaClient = new ChromaClient(baseUrl, getOrDefault(timeout, ofSeconds(5)), logRequests, logResponses); this.collectionId = new LazyValue<>(new Supplier() { @Override public String get() { Collection collection = chromaClient.collection(effectiveCollectionName); if (collection == null) { Collection createdCollection = chromaClient .createCollection(new CreateCollectionRequest(effectiveCollectionName)); return createdCollection.getId(); } else { return collection.getId(); } } }); } public static Builder builder() { return new Builder(); } public static class Builder { private String baseUrl; private String collectionName; private Duration timeout; private boolean logRequests; private boolean logResponses; /** * @param baseUrl The base URL of the Chroma service. * @return builder */ public Builder baseUrl(String baseUrl) { this.baseUrl = baseUrl; return this; } /** * @param collectionName The name of the collection in the Chroma service. If not specified, "default" will be used. * @return builder */ public Builder collectionName(String collectionName) { this.collectionName = collectionName; return this; } /** * @param timeout The timeout duration for the Chroma client. If not specified, 5 seconds will be used. * @return builder */ public Builder timeout(Duration timeout) { this.timeout = timeout; return this; } public Builder logRequests(boolean logRequests) { this.logRequests = logRequests; return this; } public Builder logResponses(boolean logResponses) { this.logResponses = logResponses; return this; } public ChromaEmbeddingStore build() { return new ChromaEmbeddingStore(this.baseUrl, this.collectionName, this.timeout, logRequests, logResponses); } } @Override public String add(Embedding embedding) { String id = randomUUID(); add(id, embedding); return id; } @Override public void add(String id, Embedding embedding) { addInternal(id, embedding, null); } @Override public String add(Embedding embedding, TextSegment textSegment) { String id = randomUUID(); addInternal(id, embedding, textSegment); return id; } @Override public List addAll(List embeddings) { List ids = embeddings.stream() .map(embedding -> randomUUID()) .collect(toList()); addAllInternal(ids, embeddings, null); return ids; } @Override public List addAll(List embeddings, List textSegments) { List ids = embeddings.stream() .map(embedding -> randomUUID()) .collect(toList()); addAllInternal(ids, embeddings, textSegments); return ids; } @Override public void addAll(List ids, List embeddings, List embedded) { addAllInternal(ids, embeddings, embedded); } private void addInternal(String id, Embedding embedding, TextSegment textSegment) { addAllInternal(singletonList(id), singletonList(embedding), textSegment == null ? null : singletonList(textSegment)); } private void addAllInternal(List ids, List embeddings, List textSegments) { AddEmbeddingsRequest addEmbeddingsRequest = AddEmbeddingsRequest.builder() .embeddings(embeddings.stream() .map(Embedding::vector) .collect(toList())) .ids(ids) .metadatas(textSegments == null ? null : textSegments.stream() .map(TextSegment::metadata) .map(Metadata::asMap) .collect(toList())) .documents(textSegments == null ? null : textSegments.stream() .map(TextSegment::text) .collect(toList())) .build(); chromaClient.addEmbeddings(collectionId.get(), addEmbeddingsRequest); } @Override public List> findRelevant(Embedding referenceEmbedding, int maxResults, double minScore) { QueryRequest queryRequest = new QueryRequest(referenceEmbedding.vectorAsList(), maxResults); QueryResponse queryResponse = chromaClient.queryCollection(collectionId.get(), queryRequest); List> matches = toEmbeddingMatches(queryResponse); return matches.stream() .filter(match -> match.score() >= minScore) .collect(toList()); } // FIXME: we need to know the dimension to be able to construct a query that retrieves // all IDs of embeddings in the collection. Is there a better way to do this, without // having to pass the dimension explicitly? public void deleteAll(int dimension) { chromaClient.deleteAllEmbeddings(collectionId.get(), dimension); } private static List> toEmbeddingMatches(QueryResponse queryResponse) { List> embeddingMatches = new ArrayList<>(); for (int i = 0; i < queryResponse.getIds().get(0).size(); i++) { double score = distanceToScore(queryResponse.getDistances().get(0).get(i)); String embeddingId = queryResponse.getIds().get(0).get(i); Embedding embedding = Embedding.from(queryResponse.getEmbeddings().get(0).get(i)); TextSegment textSegment = toTextSegment(queryResponse, i); embeddingMatches.add(new EmbeddingMatch<>(score, embeddingId, embedding, textSegment)); } return embeddingMatches; } /** * By default, cosine distance will be used. For details: * Converts a cosine distance in the range [0, 2] to a score in the range [0, 1]. * * @param distance The distance value. * @return The converted score. */ private static double distanceToScore(double distance) { return 1 - (distance / 2); } private static TextSegment toTextSegment(QueryResponse queryResponse, int i) { String text = queryResponse.getDocuments().get(0).get(i); Map metadata = queryResponse.getMetadatas().get(0).get(i); return text == null ? null : TextSegment.from(text, metadata == null ? new Metadata() : new Metadata(metadata)); } private static class ChromaClient { private final ChromaCollectionsRestApi chromaApi; ChromaClient(String baseUrl, Duration timeout, boolean logRequests, boolean logResponses) { try { var builder = QuarkusRestClientBuilder.newBuilder() .baseUri(new URI(baseUrl)) .connectTimeout(timeout.toSeconds(), TimeUnit.SECONDS) .readTimeout(timeout.toSeconds(), TimeUnit.SECONDS); if (logRequests || logResponses) { builder.loggingScope(LoggingScope.REQUEST_RESPONSE); builder.clientLogger(new ChromaEmbeddingStore.ChromaClientLogger(logRequests, logResponses)); } chromaApi = builder.build(ChromaCollectionsRestApi.class); } catch (URISyntaxException e) { throw new RuntimeException(e); } } Collection createCollection(CreateCollectionRequest createCollectionRequest) { return chromaApi.createCollection(createCollectionRequest); } Collection collection(String collectionName) { try { return chromaApi.collection(collectionName); } catch (WebApplicationException e) { // if collection is not present, Chroma returns: Status - 500 return null; } } boolean addEmbeddings(String collectionId, AddEmbeddingsRequest addEmbeddingsRequest) { return chromaApi.addEmbeddings(collectionId, addEmbeddingsRequest); } QueryResponse queryCollection(String collectionId, QueryRequest queryRequest) { return chromaApi.queryCollection(collectionId, queryRequest); } public void deleteAllEmbeddings(String collectionId, int dimension) { List referenceEmbedding = new ArrayList<>(); for (int i = 0; i < dimension; i++) { referenceEmbedding.add(0.0f); } QueryRequest queryRequest = new QueryRequest(referenceEmbedding, Integer.MAX_VALUE); QueryResponse queryResponse = chromaApi.queryCollection(collectionId, queryRequest); if (!queryResponse.getIds().get(0).isEmpty()) { DeleteEmbeddingsRequest request = new DeleteEmbeddingsRequest(queryResponse.getIds().get(0)); List deletedIds = chromaApi.deleteEmbeddings(collectionId, request); // TODO: why do we have to do this twice? for some reason // embeddings sometimes remain in the db after the first delete, // even though the response says they were deleted chromaApi.deleteEmbeddings(collectionId, request); } } } static class ChromaClientLogger implements ClientLogger { private static final Logger log = Logger.getLogger(ChromaClientLogger.class); private final boolean logRequests; private final boolean logResponses; public ChromaClientLogger(boolean logRequests, boolean logResponses) { this.logRequests = logRequests; this.logResponses = logResponses; } @Override public void setBodySize(int bodySize) { // ignore } @Override public void logRequest(HttpClientRequest request, Buffer body, boolean omitBody) { if (!logRequests || !log.isInfoEnabled()) { return; } try { log.infof("Request:\n- method: %s\n- url: %s\n- headers: %s\n- body: %s", request.getMethod(), request.absoluteURI(), inOneLine(request.headers()), bodyToString(body)); } catch (Exception e) { log.warn("Failed to log request", e); } } @Override public void logResponse(HttpClientResponse response, boolean redirect) { if (!logResponses || !log.isInfoEnabled()) { return; } response.bodyHandler(new io.vertx.core.Handler<>() { @Override public void handle(Buffer body) { try { log.infof( "Response:\n- status code: %s\n- headers: %s\n- body: %s", response.statusCode(), inOneLine(response.headers()), bodyToString(body)); } catch (Exception e) { log.warn("Failed to log response", e); } } }); } private String bodyToString(Buffer body) { if (body == null) { return ""; } return body.toString(); } private String inOneLine(io.vertx.core.MultiMap headers) { return stream(headers.spliterator(), false) .map(header -> { String headerKey = header.getKey(); String headerValue = header.getValue(); return String.format("[%s: %s]", headerKey, headerValue); }) .collect(joining(", ")); } } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy