解决查询命中缓存时流式响应未遵循Ollama规范的问题

- rag返回结果为字符串时,响应分两次发送
- 第一次发送查询内容
- 第二次发送统计信息
This commit is contained in:
yangdx
2025-01-15 23:09:50 +08:00
parent e978a15593
commit 9632a8f0dc
2 changed files with 19 additions and 4 deletions

View File

@@ -119,7 +119,7 @@ DEFAULT_CONFIG = {
"test_cases": {
"basic": {
"query": "孙悟空",
"stream_query": "孙悟空有什么法力,性格特征是什么"
"stream_query": "孙悟空"
}
}
}