From 10121dc237a68f83ccbcea930e2a0f06d08b2804 Mon Sep 17 00:00:00 2001 From: yumoqing Date: Tue, 20 Jan 2026 18:05:35 +0800 Subject: [PATCH] bugfix: fall back to llm.model when params_kw.model is not set --- llmage/llmclient.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/llmage/llmclient.py b/llmage/llmclient.py index 5ffafc3..72ca9bc 100644 --- a/llmage/llmclient.py +++ b/llmage/llmclient.py @@ -388,6 +388,8 @@ async def inference(request, *args, params_kw=None, **kw): db = env.DBPools() async with db.sqlorContext(dbname) as sor: llm = await get_llm(llmid) + if not params_kw.model: + params_kw.model = llm.model if params_kw.nostream and llm.stream == 'stream': llm.stream = 'sync' if llm.stream == 'async':