From 0fbbfef73015e8ffeaa75fb3fd6e8738f1c7f162 Mon Sep 17 00:00:00 2001 From: mirror <674958229@qq.com> Date: Sat, 8 Feb 2025 16:13:23 +0800 Subject: [PATCH 1/2] fix: replace incorrect function in ai-cache and ERROR_PARTIAL_MESSAGE_KEY judgement --- plugins/wasm-go/extensions/ai-cache/main.go | 11 +++-------- 1 file changed, 3 insertions(+), 8 deletions(-) diff --git a/plugins/wasm-go/extensions/ai-cache/main.go b/plugins/wasm-go/extensions/ai-cache/main.go index 0ab323de13..4bb3f2bad1 100644 --- a/plugins/wasm-go/extensions/ai-cache/main.go +++ b/plugins/wasm-go/extensions/ai-cache/main.go @@ -104,11 +104,11 @@ func onHttpRequestBody(ctx wrapper.HttpContext, c config.PluginConfig, body []by key = strings.Join(userMessages, "\n") } else if c.CacheKeyStrategy == config.CACHE_KEY_STRATEGY_DISABLED { log.Info("[onHttpRequestBody] cache key strategy is disabled") - ctx.DontReadRequestBody() + ctx.DontReadResponseBody() return types.ActionContinue } else { log.Warnf("[onHttpRequestBody] unknown cache key strategy: %s", c.CacheKeyStrategy) - ctx.DontReadRequestBody() + ctx.DontReadResponseBody() return types.ActionContinue } @@ -147,11 +147,6 @@ func onHttpResponseHeaders(ctx wrapper.HttpContext, c config.PluginConfig, log w ctx.SetResponseBodyBufferLimit(DEFAULT_MAX_BODY_BYTES) } - if ctx.GetContext(ERROR_PARTIAL_MESSAGE_KEY) != nil { - ctx.DontReadResponseBody() - return types.ActionContinue - } - return types.ActionContinue } @@ -159,7 +154,7 @@ func onHttpResponseBody(ctx wrapper.HttpContext, c config.PluginConfig, chunk [] log.Debugf("[onHttpResponseBody] is last chunk: %v", isLastChunk) log.Debugf("[onHttpResponseBody] chunk: %s", string(chunk)) - if ctx.GetContext(TOOL_CALLS_CONTEXT_KEY) != nil { + if ctx.GetContext(TOOL_CALLS_CONTEXT_KEY) != nil || ctx.GetContext(ERROR_PARTIAL_MESSAGE_KEY) != nil { return chunk } From 05e383301329f5bcbf1bd7159931b99c531e1551 Mon Sep 17 00:00:00 2001 From: mirror <674958229@qq.com> Date: Sat, 8 Feb 2025 16:15:57 +0800 Subject: [PATCH 2/2] update: update ai-cache docs --- plugins/wasm-go/extensions/ai-cache/README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/plugins/wasm-go/extensions/ai-cache/README.md b/plugins/wasm-go/extensions/ai-cache/README.md index b6e59e8e16..999f472270 100644 --- a/plugins/wasm-go/extensions/ai-cache/README.md +++ b/plugins/wasm-go/extensions/ai-cache/README.md @@ -30,7 +30,7 @@ LLM 结果缓存插件,默认配置方式可以直接用于 openai 协议的 ## 配置说明 -本插件同时支持基于向量数据库的语义化缓存和基于字符串匹配的缓存方法,如果同时配置了向量数据库和缓存数据库,优先使用向量数据库。 +本插件同时支持基于向量数据库的语义化缓存和基于字符串匹配的缓存方法,如果同时配置了向量数据库和缓存数据库,优先使用缓存数据库,未命中场景下使用向量数据库能力。 *Note*: 向量数据库(vector) 和 缓存数据库(cache) 不能同时为空,否则本插件无法提供缓存服务。