Save cache_type to llm_response_cache

This commit is contained in:
yangdx
2025-02-01 22:18:59 +08:00
parent c3942077a9
commit 3bc7c4d8f1

View File

@@ -568,6 +568,7 @@ async def save_to_cache(hashing_kv, cache_data: CacheData):
mode_cache[cache_data.args_hash] = {
"return": cache_data.content,
"cache_type": cache_data.cache_data,
"embedding": cache_data.quantized.tobytes().hex()
if cache_data.quantized is not None
else None,