feat: 推理过程可视化 - websocket实时推送推理步骤到前端

- core.py: 注入 ws_push 回调，17 个推理节点实时推送事件（上下文/规划/工具调用/执行）
- wwwroot/reasoning_console.wss: 新建 WebSocket 端点，支持 connect/start_reasoning/ping
- wwwroot/reasoning_console.ui: 重写 HTML 前端，以时间线方式可视化展示推理过程
2026-05-09 15:48:12 +08:00 · 2026-05-09 15:48:12 +08:00 · ea4a9e3bd9
commit ea4a9e3bd9
parent 564084f3c8
3 changed files with 232 additions and 86 deletions
--- a/harnessed_reasoning/core.py
+++ b/harnessed_reasoning/core.py
@ -101,6 +101,9 @@ TOOL_DESCRIPTIONS = "\n".join(f"- {t['name']}: {t['desc']}" for t in AVAILABLE_T
 class HermesReasoningEngine:
    """Production reasoning engine that uses LLM and real tool execution."""
    # Websocket push callback (injected by .wss endpoint)
    ws_push = None
    DEFAULT_SAFETY_RULES = {
        "strict": [
            "rm -rf /", "format ", "dd if=/dev/", "mkfs", "chmod 777",
@ -115,6 +118,19 @@ class HermesReasoningEngine:
    def __init__(self):
        pass
    async def _push(self, event_type: str, data: Dict[str, Any] = None):
        """Push a reasoning step event via websocket."""
        if self.ws_push:
            msg = {
                'event': event_type,
                'data': data or {},
                'timestamp': time.time(),
            }
            try:
                await self.ws_push(msg)
            except Exception as e:
                error(f"ws_push failed: {e}")
    # --------------------------------------------------------
    # Config helpers
    # --------------------------------------------------------
@ -164,9 +180,12 @@ class HermesReasoningEngine:
        """Get real memory and session context from harnessed_agent."""
        context = {"user_id": user_id, "memory_entries": [], "recent_sessions": [], "skills": []}
        await self._push('context_start', {'message': '正在收集上下文...', 'user_id': user_id})
        try:
            # Intelligent memory
            max_tokens = int(config.get('max_context_tokens', 4000)) // 3
            await self._push('context_memory', {'message': '加载记忆上下文...', 'max_tokens': max_tokens})
            if hasattr(ServerEnv(), 'harnessed_get_intelligent_memory_context'):
                mem_result = await ServerEnv().harnessed_get_intelligent_memory_context(
                    current_task=request,
@ -174,6 +193,10 @@ class HermesReasoningEngine:
                )
                if mem_result.get('success'):
                    context['memory_entries'] = mem_result.get('memories', [])
                    await self._push('context_memory_done', {
                        'message': f'加载 {len(context["memory_entries"])} 条记忆',
                        'count': len(context['memory_entries'])
                    })
            # Session search
            if config.get('enable_cross_session_search', '1') == '1':
@ -292,6 +315,8 @@ class HermesReasoningEngine:
    async def _generate_plan(self, request: str, context: Dict[str, Any],
                             config: Dict[str, Any]) -> Dict[str, Any]:
        """Use LLM to analyze request and generate execution plan."""
        await self._push('plan_start', {'message': 'LLM 正在分析请求并生成执行计划...', 'request': request[:100]})
        # Build context summary
        ctx_parts = []
        if context.get('memory_entries'):
@ -327,6 +352,7 @@ class HermesReasoningEngine:
        if 'error' in result:
            error(f"LLM planning failed: {result['error'].get('message')}")
            await self._push('plan_error', {'message': f'LLM 调用失败: {result["error"].get("message")}'})
            return {
                'analysis': 'LLM 调用失败，无法生成计划',
                'steps': [],
@ -336,7 +362,16 @@ class HermesReasoningEngine:
        # Extract JSON from response
        content = result.get('choices', [{}])[0].get('message', {}).get('content', '')
-        return self._parse_plan_json(content)
+        plan = self._parse_plan_json(content)
        steps_count = len(plan.get('steps', []))
        await self._push('plan_complete', {
            'message': f'执行计划已生成，共 {steps_count} 个步骤',
            'analysis': plan.get('analysis', ''),
            'step_count': steps_count,
            'steps': plan.get('steps', [])
        })
        return plan
    def _parse_plan_json(self, text: str) -> Dict[str, Any]:
        """Extract and parse JSON plan from LLM response."""
@ -452,9 +487,20 @@ class HermesReasoningEngine:
        try:
            # Step 1: Gather real context
            info(f"Reasoning start: user={user_id}, request={request[:80]}...")
            await self._push('reasoning_start', {
                'session_id': session_id,
                'user_id': user_id,
                'request': request,
                'message': '推理引擎启动'
            })
            context = await self._get_memory_context(user_id, request, config)
            context['user_id'] = user_id  # Ensure user_id is available for tool execution
            await self._push('context_complete', {
                'message': self._context_summary(context),
                'summary': self._context_summary(context)
            })
            # Step 2: LLM-based planning
            plan = await self._generate_plan(request, context, config)
@ -465,6 +511,12 @@ class HermesReasoningEngine:
            violations = self._safety_check(plan, safety_mode)
            if violations:
                warning(f"Safety violations: {violations}")
                await self._push('safety_violation', {
                    'violations': violations,
                    'message': f'安全检查发现 {len(violations)} 个违规'
                })
            else:
                await self._push('safety_pass', {'message': '安全检查通过'})
            # Step 4: Store session
            await self._store_session(session_id, user_id, request, plan, violations, "planned")
@ -499,12 +551,21 @@ class HermesReasoningEngine:
            elapsed_total = time.time() - start_time
            info(f"Reasoning complete in {elapsed_total:.1f}s, status={result['status']}")
            self._push('reasoning_complete', {
                'status': result.get('status', 'completed'),
                'elapsed': round(elapsed_total, 1),
                'message': f'推理完成，状态: {result.get("status", "completed")}'
            })
        except Exception as e:
            exception(f"Reasoning failed: {e}")
            result["success"] = False
            result["error"] = str(e)
            result["status"] = "failed"
            await self._push('reasoning_error', {
                'error': str(e),
                'message': f'推理失败: {str(e)}'
            })
            try:
                await self._update_session_status(session_id, "failed")
@ -546,10 +607,22 @@ class HermesReasoningEngine:
        max_steps = int(config.get('max_reasoning_steps', 10))
        max_tools = int(config.get('max_tool_calls_per_step', 5))
        await self._push('execution_start', {
            'message': f'开始执行计划，共 {len(steps)} 个步骤',
            'total_steps': len(steps)
        })
        for step in steps[:max_steps]:
            step_num = step.get('step_number', '?')
            step_desc = step.get('description', '')
            step_results = []
            await self._push('step_start', {
                'step_number': step_num,
                'description': step_desc,
                'message': f'步骤 {step_num}: {step_desc}'
            })
            for action in step.get('actions', [])[:max_tools]:
                tool = action.get('tool', '')
                params = action.get('parameters', {})
@ -557,9 +630,24 @@ class HermesReasoningEngine:
                if not tool:
                    continue
                await self._push('tool_call_start', {
                    'step_number': step_num,
                    'tool': tool,
                    'parameters': params,
                    'message': f'调用工具: {tool}'
                })
                info(f"Executing step {step_num}: {tool}({json.dumps(params, ensure_ascii=False)[:100]})")
                tool_result = await self._execute_tool(tool, params, context)
                await self._push('tool_call_result', {
                    'step_number': step_num,
                    'tool': tool,
                    'success': tool_result.get('success', False),
                    'result': str(tool_result)[:1000],
                    'message': f'工具 {tool} 执行{"成功" if tool_result.get("success") else "失败"}'
                })
                step_results.append({
                    'tool': tool,
                    'parameters': params,
@ -581,6 +669,18 @@ class HermesReasoningEngine:
                'actions': step_results,
            })
            await self._push('step_complete', {
                'step_number': step_num,
                'description': step.get('description', ''),
                'action_count': len(step_results),
                'message': f'步骤 {step_num} 完成，执行了 {len(step_results)} 个操作'
            })
        await self._push('execution_complete', {
            'message': f'计划执行完成，共 {len(all_results)} 个步骤',
            'total_steps': len(all_results)
        })
        return all_results
    async def _try_recovery(self, tool: str, params: Dict, error: str,
--- a/wwwroot/reasoning_console.ui
+++ b/wwwroot/reasoning_console.ui
--- a/wwwroot/reasoning_console.wss
+++ b/wwwroot/reasoning_console.wss
@ -0,0 +1,126 @@
 """
 Reasoning Console WebSocket endpoint.
 Handles real-time push of reasoning steps to the frontend.
 """
 import json
 import asyncio
 import time
 from appPublic.uniqueID import getID
 from appPublic.log import info, debug, error, exception
 # Active sessions keyed by user_id; each value holds that user's ws_pool
 # and session_id. A later 'connect' for the same user_id replaces the entry.
 _reasoning_ws_sessions = {}
 # Strong references to in-flight reasoning tasks. The event loop keeps only
 # weak references to tasks, so a task nobody references may be
 # garbage-collected before it finishes.
 _reasoning_tasks = set()
 async def myfunc(request, **kwargs):
    """WebSocket handler for the reasoning console.

    Reads ``ws_pool`` and ``ws_data`` from ``kwargs``, decodes ``ws_data`` as
    JSON and dispatches on its ``cmd`` field:

    * ``connect`` - register ``ws_pool`` for ``user_id`` and reply with a
      ``connected`` message carrying the session id.
    * ``start_reasoning`` - reject an empty ``request`` with an ``error``
      message; otherwise push ``reasoning_start`` and run the reasoning in a
      background task so this handler returns immediately.
    * ``ping`` - reply with ``pong`` and the current timestamp.

    Empty, undecodable or non-object payloads, and unknown commands, are
    ignored without a reply.
    """
    ws_pool = kwargs.get('ws_pool')
    ws_data = kwargs.get('ws_data')
    try:
        data = json.loads(ws_data) if ws_data else {}
    except Exception as exc:
        # Client-supplied payload: anything undecodable is treated as an
        # empty command rather than failing the handler.
        debug(f"WS payload is not valid JSON: {exc}")
        data = {}
    if not isinstance(data, dict):
        # Valid JSON that is not an object (list, number, string, ...) has
        # no 'cmd' field; treat it like an empty message.
        data = {}
    cmd = data.get('cmd', '')
    if cmd == 'connect':
        # Register the session when the frontend connects.
        user_id = data.get('user_id', 'anonymous')
        session_id = data.get('session_id', getID())
        _reasoning_ws_sessions[user_id] = {
            'ws_pool': ws_pool,
            'session_id': session_id,
        }
        debug(f"WS connected: user={user_id}, session={session_id}")
        await ws_pool.sendto(json.dumps({
            'type': 'connected',
            'session_id': session_id,
            'message': 'WebSocket 连接成功'
        }))
    elif cmd == 'start_reasoning':
        # The frontend submits a reasoning request.
        user_id = data.get('user_id', 'anonymous')
        request_text = data.get('request', '')
        if not request_text:
            await ws_pool.sendto(json.dumps({
                'type': 'error',
                'message': '请求内容为空'
            }))
            return
        # Announce that reasoning has started.
        await _ws_push(user_id, {
            'type': 'reasoning_start',
            'data': {
                'request': request_text,
                'message': '推理引擎启动',
                'timestamp': time.time()
            }
        })
        # Run the engine in the background so the websocket is not blocked.
        # Keep a reference until the task completes, then drop it.
        task = asyncio.create_task(
            _run_reasoning(user_id, request_text)
        )
        _reasoning_tasks.add(task)
        task.add_done_callback(_reasoning_tasks.discard)
    elif cmd == 'ping':
        await ws_pool.sendto(json.dumps({
            'type': 'pong',
            'timestamp': time.time()
        }))
 async def _ws_push(user_id, message):
    """Send ``message`` as JSON to the websocket registered for ``user_id``.

    Does nothing when the user has no registered session or the session has
    no ``ws_pool``. Serialization and send failures are logged and swallowed.
    """
    entry = _reasoning_ws_sessions.get(user_id)
    pool = entry.get('ws_pool') if entry else None
    if not pool:
        return
    try:
        await pool.sendto(json.dumps(message))
    except Exception as exc:
        error(f"WS push failed for user {user_id}: {exc}")
 async def _run_reasoning(user_id, request_text):
    """Run one reasoning request and stream its steps to the user's websocket.

    Installs a push callback on the engine that forwards each engine event to
    ``_ws_push`` for ``user_id``, then awaits ``engine.reason_and_execute``.
    On success a ``reasoning_complete`` message carrying the result is
    pushed; on any exception the failure is logged and an ``error`` message
    is pushed instead. The callback is removed again when the run ends.
    """
    from harnessed_reasoning.core import get_harnessed_reasoning_engine
    engine = get_harnessed_reasoning_engine()

    # Inject the ws_push callback into the engine instance.
    # NOTE(review): if get_harnessed_reasoning_engine() returns a shared
    # instance, overlapping runs overwrite each other's callback and events
    # may be routed to the wrong user - confirm, and consider a per-request
    # engine or callback.
    async def push_callback(msg):
        await _ws_push(user_id, msg)

    engine.ws_push = push_callback
    try:
        result = await engine.reason_and_execute(
            request=request_text,
            execute_immediately=True,
            user_id=user_id,
        )
        # Push the final result.
        await _ws_push(user_id, {
            'type': 'reasoning_complete',
            'data': {
                'result': result,
                'message': '推理完成',
                'timestamp': time.time()
            }
        })
    except Exception as e:
        exception(f"Reasoning failed for user {user_id}")
        await _ws_push(user_id, {
            'type': 'error',
            'data': {
                'error': str(e),
                'message': f'推理失败: {str(e)}',
                'timestamp': time.time()
            }
        })
    finally:
        # Remove only our own callback: if another run has replaced it in
        # the meantime, clearing it here would silence that run's events.
        if engine.ws_push is push_callback:
            engine.ws_push = None