阿里通义千问,继承 chat options

This commit is contained in:
cherishsince 2024-03-16 10:00:13 +08:00
parent 711cfcb3f6
commit 7a785b1ec0
5 changed files with 226 additions and 48 deletions

View File

@ -0,0 +1,15 @@
package cn.iocoder.yudao.framework.ai.chat;
/**
 * Unchecked exception signalling a chat failure.
 *
 * author: fansili
 * time: 2024/3/15 20:45
 */
public class ChatException extends RuntimeException {

    /**
     * Creates an exception that carries only a description of the failure.
     *
     * @param message human-readable description of what went wrong
     */
    public ChatException(String message) {
        super(message);
    }

    /**
     * Creates an exception that wraps a lower-level failure, so the original
     * stack trace is not lost when the error is re-thrown.
     *
     * @param message human-readable description of what went wrong
     * @param cause   the underlying failure; may be {@code null}
     */
    public ChatException(String message, Throwable cause) {
        super(message, cause);
    }
}

View File

@ -2,7 +2,6 @@ package cn.iocoder.yudao.framework.ai.chatqianwen;
import com.aliyun.broadscope.bailian.sdk.AccessTokenClient;
import com.aliyun.broadscope.bailian.sdk.ApplicationClient;
import com.aliyun.broadscope.bailian.sdk.models.ChatRequestMessage;
import com.aliyun.broadscope.bailian.sdk.models.CompletionsRequest;
import com.aliyun.broadscope.bailian.sdk.models.CompletionsResponse;
import lombok.Getter;
@ -10,8 +9,6 @@ import org.springframework.http.HttpStatusCode;
import org.springframework.http.ResponseEntity;
import reactor.core.publisher.Flux;
import java.util.List;
/**
* 阿里 通义千问
*
@ -35,11 +32,10 @@ public class QianWenApi {
private String token;
private ApplicationClient client;
public QianWenApi(String accessKeyId, String accessKeySecret, String agentKey, String appId, String endpoint) {
public QianWenApi(String accessKeyId, String accessKeySecret, String agentKey, String endpoint) {
this.accessKeyId = accessKeyId;
this.accessKeySecret = accessKeySecret;
this.agentKey = agentKey;
this.appId = appId;
if (endpoint != null) {
this.endpoint = endpoint;
@ -54,35 +50,14 @@ public class QianWenApi {
.build();
}
public ResponseEntity<CompletionsResponse> chatCompletionEntity(ChatRequestMessage message) {
// 创建request
CompletionsRequest request = new CompletionsRequest()
// 设置 appid
.setAppId(appId)
.setMessages(List.of(message))
// 返回choice message结果
.setParameters(new CompletionsRequest.Parameter().setResultFormat("message"));
//
public ResponseEntity<CompletionsResponse> chatCompletionEntity(CompletionsRequest request) {
// 发送请求
CompletionsResponse response = client.completions(request);
int httpCode = 200;
if (!response.isSuccess()) {
System.out.printf("failed to create completion, requestId: %s, code: %s, message: %s\n",
response.getRequestId(), response.getCode(), response.getMessage());
httpCode = 500;
}
return new ResponseEntity<>(response, HttpStatusCode.valueOf(httpCode));
// 阿里云的这个 http code 随便设置外面判断是否成功用的 CompletionsResponse.isSuccess
return new ResponseEntity<>(response, HttpStatusCode.valueOf(200));
}
public Flux<CompletionsResponse> chatCompletionStream(ChatRequestMessage message) {
return client.streamCompletions(
new CompletionsRequest()
// 设置 appid
.setAppId(appId)
// 开启 stream
.setStream(true)
.setMessages(List.of(message))
//开启增量输出模式后面输出不会包含已经输出的内容
.setParameters(new CompletionsRequest.Parameter().setIncrementalOutput(true))
);
/**
 * Sends a fully built completions request through the client's streaming call.
 *
 * The request is forwarded unchanged; this method does not set the app id,
 * the stream flag or any parameters itself.
 *
 * @param request the completions request to send
 * @return the publisher returned by the underlying client
 */
public Flux<CompletionsResponse> chatCompletionStream(CompletionsRequest request) {
    Flux<CompletionsResponse> responses = client.streamCompletions(request);
    return responses;
}
}

View File

@ -1,14 +1,13 @@
package cn.iocoder.yudao.framework.ai.chatqianwen;
import cn.iocoder.yudao.framework.ai.chat.ChatClient;
import cn.iocoder.yudao.framework.ai.chat.ChatResponse;
import cn.iocoder.yudao.framework.ai.chat.Generation;
import cn.iocoder.yudao.framework.ai.chat.StreamingChatClient;
import cn.hutool.core.util.IdUtil;
import cn.hutool.json.JSONUtil;
import cn.iocoder.yudao.framework.ai.chat.*;
import cn.iocoder.yudao.framework.ai.chat.messages.MessageType;
import cn.iocoder.yudao.framework.ai.chat.prompt.ChatOptions;
import cn.iocoder.yudao.framework.ai.chat.prompt.Prompt;
import cn.iocoder.yudao.framework.ai.chatyiyan.exception.YiYanApiException;
import com.aliyun.broadscope.bailian.sdk.models.ChatRequestMessage;
import com.aliyun.broadscope.bailian.sdk.models.ChatUserMessage;
import com.aliyun.broadscope.bailian.sdk.models.CompletionsResponse;
import com.aliyun.broadscope.bailian.sdk.models.*;
import lombok.extern.slf4j.Slf4j;
import org.springframework.http.ResponseEntity;
import org.springframework.retry.RetryCallback;
@ -19,6 +18,7 @@ import reactor.core.publisher.Flux;
import java.time.Duration;
import java.util.List;
import java.util.Optional;
import java.util.stream.Collectors;
/**
@ -34,10 +34,17 @@ public class QianWenChatClient implements ChatClient, StreamingChatClient {
private QianWenApi qianWenApi;
private ChatOptions chatOptions;
/**
 * Creates a client without client-level options; {@code chatOptions} stays {@code null}.
 *
 * @param qianWenApi the API wrapper used to send requests
 */
public QianWenChatClient(QianWenApi qianWenApi) {
    this(qianWenApi, (ChatOptions) null);
}

/**
 * Creates a client with client-level options.
 *
 * @param qianWenApi  the API wrapper used to send requests
 * @param chatOptions the options stored on this client
 */
public QianWenChatClient(QianWenApi qianWenApi, ChatOptions chatOptions) {
    this.chatOptions = chatOptions;
    this.qianWenApi = qianWenApi;
}
public final RetryTemplate retryTemplate = RetryTemplate.builder()
// 最大重试次数 10
.maxAttempts(10)
@ -58,7 +65,7 @@ public class QianWenChatClient implements ChatClient, StreamingChatClient {
return this.retryTemplate.execute(ctx -> {
// ctx 会有重试的信息
// 创建 request 请求stream模式需要供应商支持
ChatRequestMessage request = this.createRequest(prompt, false);
CompletionsRequest request = this.createRequest(prompt, false);
// 调用 callWithFunctionSupport 发送请求
ResponseEntity<CompletionsResponse> responseEntity = qianWenApi.chatCompletionEntity(request);
// 获取结果封装 chatCompletion
@ -67,21 +74,69 @@ public class QianWenChatClient implements ChatClient, StreamingChatClient {
return new ChatResponse(List.of(new Generation(String.format("failed to create completion, requestId: %s, code: %s, message: %s\n",
response.getRequestId(), response.getCode(), response.getMessage()))));
}
List<Generation> generations = response.getData().getChoices().stream()
.map(item -> new Generation(item.getMessage().getContent())).collect(Collectors.toList());
return new ChatResponse(generations);
// 转换为 Generation 返回
return new ChatResponse(List.of(new Generation(response.getData().getText())));
});
}
private ChatRequestMessage createRequest(Prompt prompt, boolean b) {
return new ChatUserMessage(prompt.getContents());
/**
 * Builds the {@link CompletionsRequest} for a prompt.
 *
 * Options carried by the prompt take precedence over the options this client
 * was constructed with. The effective options must be a {@link QianWenOptions}.
 *
 * @param prompt the prompt whose messages (and optional options) are sent
 * @param stream {@code true} to build a streaming request, {@code false} for a blocking one
 * @return the request, with a fresh request id, the app id, the converted messages,
 *         the parameters, top-p and the stream flag set
 * @throws ChatException if no options are configured, if the effective options are not
 *                       a {@link QianWenOptions}, or if a message type cannot be mapped
 */
private CompletionsRequest createRequest(Prompt prompt, boolean stream) {
    // Prefer the options on the prompt; fall back to the client-level ones.
    Object effectiveOptions = prompt.getOptions() != null ? prompt.getOptions() : chatOptions;
    // Both are null: nothing has been configured.
    if (effectiveOptions == null) {
        throw new ChatException("ChatOptions 未配置参数!");
    }
    // Fail with a descriptive error instead of a bare ClassCastException.
    if (!(effectiveOptions instanceof QianWenOptions)) {
        throw new ChatException(String.format("ChatOptions 类型不匹配, 需要 QianWenOptions, 实际为 %s",
                effectiveOptions.getClass().getName()));
    }
    QianWenOptions qianWenOptions = (QianWenOptions) effectiveOptions;

    // NOTE(review): this writes into the options instance itself, which may be the
    // client-level one shared by every request; concurrent call()/stream() invocations
    // on the same client can overwrite each other's incrementalOutput — confirm whether
    // a per-request copy is needed.
    CompletionsRequest.Parameter parameters = qianWenOptions.getParameters();
    if (parameters == null) {
        parameters = new CompletionsRequest.Parameter();
        qianWenOptions.setParameters(parameters);
    }
    // Incremental output must follow the stream flag:
    // - not streaming: false, otherwise only the last few characters are returned;
    // - streaming: true, so each chunk does not repeat the content already sent.
    parameters.setIncrementalOutput(stream);

    // Build the request.
    return new CompletionsRequest()
            // Unique request identifier; must not repeat.
            .setRequestId(IdUtil.getSnowflakeNextIdStr())
            // Application id.
            .setAppId(qianWenOptions.getAppId())
            .setMessages(prompt.getInstructions().stream().map(m -> {
                // Convert each message into the matching Qianwen request message.
                if (MessageType.USER == m.getMessageType()) {
                    return new ChatUserMessage(m.getContent());
                } else if (MessageType.SYSTEM == m.getMessageType()) {
                    return new ChatSystemMessage(m.getContent());
                } else if (MessageType.ASSISTANT == m.getMessageType()) {
                    return new ChatAssistantMessage(m.getContent());
                }
                throw new ChatException(String.format("存在不能适配的消息! %s", JSONUtil.toJsonPrettyStr(m)));
            }).collect(Collectors.toList()))
            // Model parameters (including the incremental-output flag set above).
            .setParameters(parameters)
            // Common ChatOptions value: top-p, passed through only when set.
            .setTopP(qianWenOptions.getTopP() == null ? null : qianWenOptions.getTopP().doubleValue())
            // Output mode.
            .setStream(stream);
}
@Override
public Flux<ChatResponse> stream(Prompt prompt) {
// ctx 会有重试的信息
// 创建 request 请求stream模式需要供应商支持
ChatRequestMessage request = this.createRequest(prompt, true);
CompletionsRequest request = this.createRequest(prompt, true);
// 调用 callWithFunctionSupport 发送请求
Flux<CompletionsResponse> response = this.qianWenApi.chatCompletionStream(request);
return response.map(res -> {

View File

@ -0,0 +1,128 @@
package cn.iocoder.yudao.framework.ai.chatqianwen;
import cn.iocoder.yudao.framework.ai.chat.prompt.ChatOptions;
import com.aliyun.broadscope.bailian.sdk.models.CompletionsRequest;
import lombok.Data;
import lombok.experimental.Accessors;
import java.util.List;
/**
 * Options for Alibaba Cloud Qianwen chat requests.
 *
 * Reference: https://help.aliyun.com/document_detail/2684682.html?spm=a2c4g.2621347.0.0.195117e7Ytpkyo
 *
 * Setters generated by Lombok are chainable ({@code chain = true}) so an instance can be
 * configured inline, e.g. {@code new QianWenOptions().setAppId("...")}. The setters declared
 * explicitly below keep the {@code void} signature required by {@link ChatOptions}.
 *
 * author: fansili
 * time: 2024/3/15 19:57
 */
@Data
@Accessors(chain = true)
public class QianWenOptions implements ChatOptions {

    private String appId;

    /**
     * Whether to stream the output; defaults to no.
     */
    private Boolean stream;

    /**
     * Conversation history between the user and the model.
     */
    private List<Message> messages;

    /**
     * Probability threshold for nucleus sampling during generation. For example, with 0.8 only
     * the tokens whose cumulative probability reaches 0.8 are kept as sampling candidates.
     * Range is (0, 1.0); larger values give more random output, smaller values less random.
     * Default is 0.8. The value must be less than 1.
     */
    private Float topP;

    /**
     * Model parameter settings.
     */
    private CompletionsRequest.Parameter parameters = new CompletionsRequest.Parameter();

    //
    // ChatOptions adaptation

    /**
     * Returns the temperature stored in {@link #parameters}.
     *
     * @return the temperature, or {@code null} when no parameters or no temperature are set
     */
    @Override
    public Float getTemperature() {
        if (this.parameters == null || this.parameters.getTemperature() == null) {
            return null;
        }
        // Convert through the decimal string so the value round-trips with setTemperature.
        return Float.parseFloat(this.parameters.getTemperature().toString());
    }

    /**
     * Stores the temperature in {@link #parameters}, creating the parameters when absent.
     *
     * @param temperature the temperature, or {@code null} to clear it
     */
    @Override
    public void setTemperature(Float temperature) {
        // Go through the decimal string rather than widening the float directly, so that
        // e.g. 0.8f is stored as 0.8 and not as 0.800000011920929.
        ensureParameters().setTemperature(temperature == null ? null : Double.valueOf(temperature.toString()));
    }

    @Override
    public void setTopP(Float topP) {
        this.topP = topP;
    }

    /**
     * Returns the top-k value stored in {@link #parameters}.
     *
     * @return the top-k value, or {@code null} when no parameters are set
     */
    @Override
    public Integer getTopK() {
        return this.parameters == null ? null : this.parameters.getTopK();
    }

    /**
     * Stores the top-k value in {@link #parameters}, creating the parameters when absent.
     *
     * @param topK the top-k value
     */
    @Override
    public void setTopK(Integer topK) {
        ensureParameters().setTopK(topK);
    }

    /**
     * Returns {@link #parameters}, creating an empty instance first if it was set to {@code null}.
     */
    private CompletionsRequest.Parameter ensureParameters() {
        if (this.parameters == null) {
            this.parameters = new CompletionsRequest.Parameter();
        }
        return this.parameters;
    }

    @Data
    @Accessors(chain = true)
    public static class Message {

        /**
         * Role: system, user or assistant.
         */
        private String role;

        /**
         * Prompt text or model content.
         */
        private String content;
    }

    @Data
    @Accessors(chain = true)
    public static class Parameters {

        /**
         * Output format, "text" by default.
         * "text" is the legacy text format;
         * "message" is the OpenAI-compatible message format.
         */
        private String resultFormat;

        /**
         * Size of the sampling candidate set during generation. For example, with 50 only the
         * 50 highest-scoring tokens of a single generation step form the candidate set.
         * Larger values give more random output, smaller values more deterministic output.
         * Note: if top_k is empty or greater than 100, the top_k strategy is disabled and only
         * top_p applies. Empty by default.
         */
        private Integer topK;

        /**
         * Random seed used during generation, letting the user control the randomness of the output.
         * seed supports unsigned 64-bit integers and defaults to 1234. With a seed the model tries
         * to produce the same or similar results, but identical results are not guaranteed.
         */
        private Integer seed;

        /**
         * Controls the degree of randomness and diversity: the temperature determines how much the
         * probability distribution over candidate tokens is smoothed. A higher temperature lowers
         * the peak of the distribution so more low-probability tokens are chosen and results are
         * more diverse; a lower temperature sharpens the peak so high-probability tokens are chosen
         * more often and results are more deterministic.
         * Range is [0, 2); the system default is 1.0. A value of 0 is not recommended (meaningless).
         */
        private Float temperature;

        /**
         * Limits the number of tokens the model generates. max_tokens is an upper bound; it does
         * not mean that many tokens will be generated.
         * For qwen-turbo the maximum and default are 1500; for qwen-max, qwen-max-1201,
         * qwen-max-longcontext and qwen-plus the maximum and default are 2000.
         */
        private Integer maxTokens;

        /**
         * Gives precise control over where generation stops: generation halts automatically when
         * the output is about to contain one of the given strings or token ids, and the output
         * does not include them.
         * For example, stop = "你好" stops when "你好" is about to be generated; stop = [37763, 367]
         * stops when "Observation" is about to be generated.
         */
        private List<String> stop;

        /**
         * Controls the streaming output mode. Defaults to False, meaning later chunks include the
         * content already sent. Set to True to enable incremental output, where later chunks do
         * not repeat earlier content and the caller must concatenate the full output itself.
         */
        private Boolean incrementalOutput;
    }
}

View File

@ -3,6 +3,8 @@ package cn.iocoder.yudao.framework.ai.chat;
import cn.iocoder.yudao.framework.ai.chat.prompt.Prompt;
import cn.iocoder.yudao.framework.ai.chatqianwen.QianWenApi;
import cn.iocoder.yudao.framework.ai.chatqianwen.QianWenChatClient;
import cn.iocoder.yudao.framework.ai.chatqianwen.QianWenOptions;
import com.aliyun.broadscope.bailian.sdk.models.CompletionsRequest;
import org.junit.Before;
import org.junit.Test;
import reactor.core.publisher.Flux;
@ -24,10 +26,13 @@ public class QianWenChatClientTests {
"",
"",
"",
"",
null
);
qianWenChatClient = new QianWenChatClient(qianWenApi);
qianWenChatClient = new QianWenChatClient(
qianWenApi,
new QianWenOptions()
.setAppId("5f14955f201a44eb8dbe0c57250a32ce")
);
}
@Test