|
@@ -499,6 +499,8 @@ public class GRPCController extends BaseController {
|
|
|
public void inferStreamRag(HttpServletRequest httpServletRequest, HttpServletResponse response, @RequestBody ChatReq chatReq) {
|
|
|
// public void inferStreamRag(HttpServletResponse response, ChatReq chatReq) {
|
|
|
log.info("进入了调⽤RAG+⼤模型的调⽤参数");
|
|
|
+ long time1 = System.currentTimeMillis();
|
|
|
+ log.info("开始进来的时间是{}",time1);
|
|
|
// 获取输出流
|
|
|
OutputStream outputStream = null;
|
|
|
ManagedChannel channel = null;
|
|
@@ -611,6 +613,9 @@ public class GRPCController extends BaseController {
|
|
|
//将新的问题放入集合中
|
|
|
historyDates.add(chatReq.getQuestion());
|
|
|
String headerPort = httpServletRequest.getHeader(port);
|
|
|
+ long time2 = System.currentTimeMillis();
|
|
|
+ log.info("开始调用大模型的的时间是{}",time2);
|
|
|
+ log.info("调用大模型之前,处理历史会话等操作的时间为{}", (time2 - time1)/1000);
|
|
|
try {
|
|
|
channel = ManagedChannelBuilder.forAddress(bigModelConfig.getIp(), StringUtils.isBlank(headerPort) ? bigModelConfig.getPort() : Integer.parseInt(headerPort))
|
|
|
.usePlaintext()
|
|
@@ -664,6 +669,9 @@ public class GRPCController extends BaseController {
|
|
|
outputStream.flush();
|
|
|
}
|
|
|
}
|
|
|
+ long time3 = System.currentTimeMillis();
|
|
|
+ log.info("结束调用大模型的的时间是{}",time3);
|
|
|
+ log.info("调用的时间为{}", (time3 - time2)/1000);
|
|
|
//将问答更新到数据库中
|
|
|
chatReq.setSessionId(sessionId);
|
|
|
chatReq.setAnswer(sb.toString());
|
|
@@ -680,6 +688,9 @@ public class GRPCController extends BaseController {
|
|
|
this.chatRecordMapper.insertTXinyiChatRecord(chatReq);
|
|
|
outputStream.write((DEFAULT_ID_IDENTIFIER + chatReq.getId()).getBytes());
|
|
|
outputStream.flush();
|
|
|
+ long time4 = System.currentTimeMillis();
|
|
|
+ log.info("最后操作的时间是{}",time4);
|
|
|
+ log.info("最后操作的时间是{}", (time4 - time3)/1000);
|
|
|
} catch (IOException e) {
|
|
|
throw new RuntimeException(e);
|
|
|
} finally {
|