// com.agentsflex.llm.qwen.QwenLlm (Maven / Gradle / Ivy)
/*
* Copyright (c) 2023-2025, Agents-Flex ([email protected]).
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.agentsflex.llm.qwen;
import com.agentsflex.core.document.Document;
import com.agentsflex.core.llm.BaseLlm;
import com.agentsflex.core.llm.ChatOptions;
import com.agentsflex.core.llm.StreamResponseListener;
import com.agentsflex.core.llm.client.BaseLlmClientListener;
import com.agentsflex.core.llm.client.HttpClient;
import com.agentsflex.core.llm.client.LlmClient;
import com.agentsflex.core.llm.client.LlmClientListener;
import com.agentsflex.core.llm.client.impl.SseClient;
import com.agentsflex.core.llm.embedding.EmbeddingOptions;
import com.agentsflex.core.llm.response.AiMessageResponse;
import com.agentsflex.core.parser.AiMessageParser;
import com.agentsflex.core.prompt.Prompt;
import com.agentsflex.core.store.VectorData;
import com.agentsflex.core.util.StringUtil;
import com.alibaba.fastjson.JSON;
import com.alibaba.fastjson.JSONObject;
import com.alibaba.fastjson.JSONPath;
import java.util.HashMap;
import java.util.Map;
/**
 * LLM implementation for Qwen that sends requests to the
 * {@code /compatible-mode/v1/...} HTTP routes under the configured endpoint.
 *
 * <p>Supported operations: blocking chat ({@link #chat}), streaming chat over SSE
 * ({@link #chatStream}) and document embedding ({@link #embed}). Every request is
 * JSON and is authenticated with a {@code Bearer} token taken from the config's API key.
 *
 * <p>NOTE(review): {@code BaseLlm} is extended here without type arguments; if it is
 * declared generic over its config type, it should be parameterized — confirm against
 * the base class.
 */
public class QwenLlm extends BaseLlm {

    /** Path (relative to the configured endpoint) used for both blocking and streaming chat. */
    private static final String CHAT_COMPLETIONS_PATH = "/compatible-mode/v1/chat/completions";

    /** Path (relative to the configured endpoint) used for embedding requests. */
    private static final String EMBEDDINGS_PATH = "/compatible-mode/v1/embeddings";

    /** HTTP client used for the blocking (non-streaming) requests. */
    HttpClient httpClient = new HttpClient();

    /** Parser applied to the JSON body of a blocking chat response. */
    public AiMessageParser aiMessageParser = QwenLlmUtil.getAiMessageParser(false);

    /** Parser handed to the stream listener for streamed chat chunks. */
    public AiMessageParser streamMessageParser = QwenLlmUtil.getAiMessageParser(true);

    /**
     * Creates a client bound to the given configuration.
     *
     * @param config the Qwen configuration (endpoint, API key, debug flag, ...)
     */
    public QwenLlm(QwenLlmConfig config) {
        super(config);
    }

    /**
     * Sends the prompt as a single blocking chat request and returns the parsed reply.
     *
     * <p>If the response body is blank, or parses to JSON {@code null}, an error response is
     * returned. If the body contains a non-empty {@code error} object, the returned response
     * is flagged as an error and carries that object's {@code message}, {@code type} and
     * {@code code}.
     *
     * @param prompt  the prompt to send
     * @param options chat options forwarded to the payload builder
     * @return the response wrapping the raw body and the parsed message
     */
    @Override
    public AiMessageResponse chat(Prompt prompt, ChatOptions options) {
        Map<String, String> headers = buildJsonHeaders();
        String payload = QwenLlmUtil.promptToPayload(prompt, config, options, false);
        String url = config.getEndpoint() + CHAT_COMPLETIONS_PATH;

        String response = httpClient.post(url, headers, payload);
        printDebug(response);

        if (StringUtil.noText(response)) {
            return AiMessageResponse.error(prompt, response, "no content for response.");
        }

        JSONObject jsonObject = JSON.parseObject(response);
        if (jsonObject == null) {
            // A body consisting of the JSON literal `null` parses to a null object;
            // report it like an empty body instead of failing with a NullPointerException.
            return AiMessageResponse.error(prompt, response, "no content for response.");
        }

        JSONObject error = jsonObject.getJSONObject("error");
        AiMessageResponse messageResponse =
            new AiMessageResponse(prompt, response, aiMessageParser.parse(jsonObject));

        if (error != null && !error.isEmpty()) {
            messageResponse.setError(true);
            messageResponse.setErrorMessage(error.getString("message"));
            messageResponse.setErrorType(error.getString("type"));
            messageResponse.setErrorCode(error.getString("code"));
        }
        return messageResponse;
    }

    /**
     * Starts a streaming chat request; results are delivered through {@code listener}.
     *
     * <p>A new {@link SseClient} is created per call, and the request additionally carries
     * the {@code X-DashScope-SSE: enable} header.
     *
     * @param prompt   the prompt to send
     * @param listener receiver of streamed responses
     * @param options  chat options forwarded to the payload builder
     */
    @Override
    public void chatStream(Prompt prompt, StreamResponseListener listener, ChatOptions options) {
        LlmClient llmClient = new SseClient();

        Map<String, String> headers = buildJsonHeaders();
        headers.put("X-DashScope-SSE", "enable"); //stream

        String payload = QwenLlmUtil.promptToPayload(prompt, config, options, true);
        LlmClientListener clientListener =
            new BaseLlmClientListener(this, llmClient, listener, prompt, streamMessageParser);

        String url = config.getEndpoint() + CHAT_COMPLETIONS_PATH;
        llmClient.start(url, headers, payload, clientListener, config);
    }

    /**
     * Requests an embedding for the document and wraps it in a {@link VectorData}.
     *
     * <p>The vector is read from {@code $.data[0].embedding} of the response body.
     * NOTE(review): when that path is missing (e.g. an error payload) the returned
     * {@code VectorData} presumably carries a {@code null} vector — confirm and decide
     * whether callers need an explicit error signal.
     *
     * @param document the document to embed
     * @param options  embedding options forwarded to the payload builder
     * @return the embedding wrapper, or {@code null} when the response body is blank
     */
    @Override
    public VectorData embed(Document document, EmbeddingOptions options) {
        String payload = QwenLlmUtil.promptToEnabledPayload(document, options, config);
        Map<String, String> headers = buildJsonHeaders();
        String url = config.getEndpoint() + EMBEDDINGS_PATH;

        String response = httpClient.post(url, headers, payload);
        printDebug(response);

        if (StringUtil.noText(response)) {
            return null;
        }

        double[] embedding = JSONPath.read(response, "$.data[0].embedding", double[].class);
        VectorData vectorData = new VectorData();
        vectorData.setVector(embedding);
        return vectorData;
    }

    /**
     * Builds the headers shared by every request: JSON content type plus bearer auth.
     * A fresh mutable map is returned so callers may add request-specific headers.
     */
    private Map<String, String> buildJsonHeaders() {
        Map<String, String> headers = new HashMap<>();
        headers.put("Content-Type", "application/json");
        headers.put("Authorization", "Bearer " + getConfig().getApiKey());
        return headers;
    }

    /** Prints the raw response body to standard output when debug mode is enabled in the config. */
    private void printDebug(String response) {
        if (config.isDebug()) {
            System.out.println(">>>>receive payload:" + response);
        }
    }
}