diff --git a/llmage/llmclient.py b/llmage/llmclient.py index 2baac5a..7390063 100644 --- a/llmage/llmclient.py +++ b/llmage/llmclient.py @@ -84,5 +84,5 @@ async def inference(request, env): raise e llm = llms[0] uapi = UAPI(request, env=env, sor=sor) - return env.stream_response(request, + return await env.stream_response(request, uapi.stream_linify(llm.upappid, llm.apiname, env.user))