feat(ai): 添加工具调用的流式处理支持并限制输出大小

No-Github · No-Github · commit 6747a4e0f960 · 2026-03-13T13:54:23.000+08:00
添加流式工具调用接口以实时显示AI思考过程
限制命令输出大小防止内存溢出
处理流式JSON参数不完整的情况
diff --git a/app_ai_chat.go b/app_ai_chat.go
@@ -249,10 +249,16 @@ func (a *App) runAgentLoop(conversationId string, messages []AIChatMessage, prom
 			return nil
 		}
 
-		resp, err := client.ChatWithTools(ctx, aiMessages, toolDefs)
+		// Use streaming tool call so users can see AI thinking in real-time
+		resp, err := client.ChatWithToolsStream(ctx, aiMessages, toolDefs, func(chunk string) error {
+			a.emitEvent("ai-chat-chunk", map[string]string{
+				"conversationId": conversationId,
+				"chunk":          chunk,
+			})
+			return nil
+		})
 		if err != nil {
 			if ctx.Err() != nil {
-				// Cancelled by user or timeout
 				a.emitEvent("ai-chat-chunk", map[string]string{
 					"conversationId": conversationId,
 					"chunk":          "\n\n⏹️ 操作已被用户停止。",
@@ -263,30 +269,17 @@ func (a *App) runAgentLoop(conversationId string, messages []AIChatMessage, prom
 				})
 				return nil
 			}
-			a.emitEvent( "ai-chat-complete", map[string]interface{}{
+			a.emitEvent("ai-chat-complete", map[string]interface{}{
 				"conversationId": conversationId,
 				"success":        false,
 			})
 			return fmt.Errorf(i18n.Tf("app_ai_analysis_failed", err))
 		}
 
-		// No tool calls → stream the final answer
+		// No tool calls → final answer (already streamed via callback)
 		if len(resp.ToolCalls) == 0 {
 			aiMessages = append(aiMessages, ai.Message{Role: "assistant", Content: resp.Content})
-
-			words := strings.Split(resp.Content, "")
-			chunkSize := 8
-			for i := 0; i < len(words); i += chunkSize {
-				end := i + chunkSize
-				if end > len(words) {
-					end = len(words)
-				}
-				a.emitEvent( "ai-chat-chunk", map[string]string{
-					"conversationId": conversationId,
-					"chunk":          strings.Join(words[i:end], ""),
-				})
-			}
-			a.emitEvent( "ai-chat-complete", map[string]interface{}{
+			a.emitEvent("ai-chat-complete", map[string]interface{}{
 				"conversationId": conversationId,
 				"success":        true,
 			})
@@ -303,30 +296,46 @@ func (a *App) runAgentLoop(conversationId string, messages []AIChatMessage, prom
 		// Execute each tool call
 		for _, tc := range resp.ToolCalls {
 			var args map[string]interface{}
+			var jsonParseErr error
 			if tc.Function.Arguments != "" {
 				if jsonErr := json.Unmarshal([]byte(tc.Function.Arguments), &args); jsonErr != nil {
-					args = map[string]interface{}{}
+					// Streaming may produce incomplete JSON for no-arg tools; treat as empty
+					trimmed := strings.TrimSpace(tc.Function.Arguments)
+					if trimmed == "{" || trimmed == "" {
+						args = map[string]interface{}{}
+					} else {
+						jsonParseErr = jsonErr
+						args = map[string]interface{}{}
+					}
 				}
 			}
 
-			a.emitEvent( "ai-agent-tool-call", map[string]interface{}{
+			a.emitEvent("ai-agent-tool-call", map[string]interface{}{
 				"conversationId": conversationId,
 				"toolCallId":     tc.ID,
 				"toolName":       tc.Function.Name,
 				"toolArgs":       args,
 			})
 
-			result, execErr := mcpServer.ExecuteTool(tc.Function.Name, args)
 			var resultContent string
-			success := execErr == nil
-			if execErr != nil {
-				resultContent = fmt.Sprintf("工具执行失败: %v", execErr)
-			} else if len(result.Content) > 0 {
-				var parts []string
-				for _, item := range result.Content {
-					parts = append(parts, item.Text)
+			var success bool
+
+			if jsonParseErr != nil {
+				// Report JSON parse failure as tool result so AI knows the root cause
+				resultContent = fmt.Sprintf("工具参数 JSON 解析失败: %v\n原始参数: %s", jsonParseErr, tc.Function.Arguments)
+				success = false
+			} else {
+				result, execErr := mcpServer.ExecuteTool(tc.Function.Name, args)
+				success = execErr == nil
+				if execErr != nil {
+					resultContent = fmt.Sprintf("工具执行失败: %v", execErr)
+				} else if len(result.Content) > 0 {
+					var parts []string
+					for _, item := range result.Content {
+						parts = append(parts, item.Text)
+					}
+					resultContent = strings.Join(parts, "\n")
 				}
-				resultContent = strings.Join(parts, "\n")
 			}
 
 			// Truncate large tool results to prevent context window overflow
@@ -335,7 +344,7 @@ func (a *App) runAgentLoop(conversationId string, messages []AIChatMessage, prom
 				resultContent = resultContent[:maxToolResultLen] + "\n\n... (output truncated, total " + fmt.Sprintf("%d", len(resultContent)) + " bytes)"
 			}
 
-			a.emitEvent( "ai-agent-tool-result", map[string]interface{}{
+			a.emitEvent("ai-agent-tool-result", map[string]interface{}{
 				"conversationId": conversationId,
 				"toolCallId":     tc.ID,
 				"toolName":       tc.Function.Name,
diff --git a/mod/ai/client.go b/mod/ai/client.go
@@ -114,6 +114,162 @@ type ToolCallResponse struct {
 // StreamCallback is called for each chunk of the stream
 type StreamCallback func(chunk string) error
 
+// ToolStreamCallback receives each assistant content chunk as it arrives during
+// a streaming tool-call request. Returning a non-nil error aborts the stream.
+type ToolStreamCallback func(chunk string) error
+
+// ChatWithToolsStream sends a streaming chat request with tool definitions.
+//
+// Content deltas are passed to callback (when non-nil) as they arrive, and
+// tool-call deltas are accumulated per index. The returned response holds the
+// concatenated content and the tool calls in ascending index order. Tool calls
+// whose arguments arrive empty or as a lone "{" are normalized to "{}".
+//
+// An error is returned when the request cannot be built or sent, the server
+// answers with a non-200 status, the stream cannot be read, or callback
+// returns an error. Stream lines that fail to decode as JSON are skipped.
+func (c *Client) ChatWithToolsStream(ctx context.Context, messages []Message, tools []ToolDefinition, callback ToolStreamCallback) (*ToolCallResponse, error) {
+	reqBody := map[string]interface{}{
+		"model":       c.Model,
+		"messages":    messages,
+		"tools":       tools,
+		"tool_choice": "auto",
+		"stream":      true,
+	}
+
+	bodyBytes, err := json.Marshal(reqBody)
+	if err != nil {
+		return nil, fmt.Errorf("failed to marshal request: %w", err)
+	}
+
+	req, err := http.NewRequestWithContext(ctx, "POST", c.BaseURL+"/chat/completions", bytes.NewReader(bodyBytes))
+	if err != nil {
+		return nil, fmt.Errorf("failed to create request: %w", err)
+	}
+	req.Header.Set("Content-Type", "application/json")
+	req.Header.Set("Authorization", "Bearer "+c.APIKey)
+
+	resp, err := c.client.Do(req)
+	if err != nil {
+		return nil, fmt.Errorf("failed to send request: %w", err)
+	}
+	defer resp.Body.Close()
+
+	if resp.StatusCode != http.StatusOK {
+		// Best effort: the body only enriches the error message.
+		body, _ := io.ReadAll(resp.Body)
+		return nil, fmt.Errorf("API error (status %d): %s", resp.StatusCode, string(body))
+	}
+
+	var contentBuilder strings.Builder
+	toolCallMap := make(map[int]*ToolCall) // index → accumulated tool call
+	// indexOrder lists the tool-call indices seen so far, kept ascending.
+	var indexOrder []int
+
+	reader := bufio.NewReader(resp.Body)
+	eof := false
+	for !eof {
+		line, readErr := reader.ReadBytes('\n')
+		if readErr != nil {
+			if readErr != io.EOF {
+				return nil, fmt.Errorf("failed to read stream: %w", readErr)
+			}
+			// EOF can still deliver a final line without a trailing newline;
+			// process it below, then leave the loop.
+			eof = true
+		}
+
+		// Only SSE data lines matter; the space after "data:" is optional.
+		line = bytes.TrimSpace(line)
+		if !bytes.HasPrefix(line, []byte("data:")) {
+			continue
+		}
+		data := bytes.TrimSpace(bytes.TrimPrefix(line, []byte("data:")))
+		if bytes.Equal(data, []byte("[DONE]")) {
+			break
+		}
+
+		var chunk struct {
+			Choices []struct {
+				Delta struct {
+					Content   string `json:"content"`
+					ToolCalls []struct {
+						Index    int    `json:"index"`
+						ID       string `json:"id"`
+						Type     string `json:"type"`
+						Function struct {
+							Name      string `json:"name"`
+							Arguments string `json:"arguments"`
+						} `json:"function"`
+					} `json:"tool_calls"`
+				} `json:"delta"`
+			} `json:"choices"`
+		}
+		if err := json.Unmarshal(data, &chunk); err != nil {
+			continue // skip lines that are not valid JSON chunks
+		}
+		if len(chunk.Choices) == 0 {
+			continue
+		}
+
+		delta := chunk.Choices[0].Delta
+
+		// Stream content chunks to callback
+		if delta.Content != "" {
+			contentBuilder.WriteString(delta.Content)
+			if callback != nil {
+				if cbErr := callback(delta.Content); cbErr != nil {
+					return nil, fmt.Errorf("stream callback failed: %w", cbErr)
+				}
+			}
+		}
+
+		// Accumulate tool calls
+		for _, dtc := range delta.ToolCalls {
+			tc, ok := toolCallMap[dtc.Index]
+			if !ok {
+				tc = &ToolCall{Type: "function"}
+				toolCallMap[dtc.Index] = tc
+
+				// Insert the new index so indexOrder stays ascending.
+				pos := len(indexOrder)
+				for pos > 0 && indexOrder[pos-1] > dtc.Index {
+					pos--
+				}
+				indexOrder = append(indexOrder, 0)
+				copy(indexOrder[pos+1:], indexOrder[pos:])
+				indexOrder[pos] = dtc.Index
+			}
+			if dtc.ID != "" {
+				tc.ID = dtc.ID
+			}
+			if dtc.Function.Name != "" {
+				tc.Function.Name = dtc.Function.Name
+			}
+			tc.Function.Arguments += dtc.Function.Arguments
+		}
+	}
+
+	// Emit tool calls in ascending index order. Walking the recorded indices
+	// (rather than counting 0..len-1) keeps calls whose indices are sparse or
+	// do not start at zero.
+	var toolCalls []ToolCall
+	for _, idx := range indexOrder {
+		tc := toolCallMap[idx]
+		// Fix incomplete arguments from streaming (e.g., "{" without closing "}")
+		args := strings.TrimSpace(tc.Function.Arguments)
+		if args == "" || args == "{" {
+			tc.Function.Arguments = "{}"
+		}
+		toolCalls = append(toolCalls, *tc)
+	}
+
+	return &ToolCallResponse{
+		Content:   contentBuilder.String(),
+		ToolCalls: toolCalls,
+	}, nil
+}
+
 // ChatWithTools sends a non-streaming chat request with tool definitions, returns full response
 func (c *Client) ChatWithTools(ctx context.Context, messages []Message, tools []ToolDefinition) (*ToolCallResponse, error) {
 	reqBody := map[string]interface{}{
diff --git a/mod/mcp/mcp.go b/mod/mcp/mcp.go
@@ -1265,8 +1265,11 @@ func (s *MCPServer) toolExecCommand(caseID string, command string) (ToolResult,
 	}
 	defer session.Close()
 
-	session.Stdout = &outputBuf
-	session.Stderr = &outputBuf
+	// Limit captured output to prevent memory/context explosion
+	const maxOutputBytes = 32 * 1024 // 32KB
+	lw := &limitedWriter{w: &outputBuf, limit: maxOutputBytes}
+	session.Stdout = lw
+	session.Stderr = lw
 
 	// Run with timeout to prevent hanging on blocking commands
 	const execTimeout = 120 * time.Second
@@ -1275,8 +1278,10 @@ func (s *MCPServer) toolExecCommand(caseID string, command string) (ToolResult,
 		done <- session.Run(command)
 	}()
 
+	var truncated bool
 	select {
 	case err := <-done:
+		truncated = lw.truncated
 		if err != nil {
 			return ToolResult{}, fmt.Errorf("command failed: %v\nOutput: %s", err, outputBuf.String())
 		}
@@ -1287,6 +1292,9 @@ func (s *MCPServer) toolExecCommand(caseID string, command string) (ToolResult,
 
 	output := fmt.Sprintf("Command executed on case '%s' (%s):\n", c.Name, c.GetId())
 	output += fmt.Sprintf("\nOutput:\n%s", outputBuf.String())
+	if truncated {
+		output += fmt.Sprintf("\n\n... (output truncated at %d bytes, total output exceeded limit)", maxOutputBytes)
+	}
 
 	return ToolResult{
 		Content: []ContentItem{{
@@ -1971,3 +1979,54 @@ func (m *MCPServerManager) runSSEServer(ctx context.Context, addr string) error
 
 	return nil
 }
+
+// limitedWriter wraps an io.Writer and forwards at most limit bytes to it.
+// Input beyond the limit is dropped but still reported as consumed, so a
+// producer such as io.Copy keeps draining its source instead of aborting with
+// io.ErrShortWrite.
+//
+// NOTE(review): limitedWriter does no locking, and toolExecCommand assigns one
+// instance to both session.Stdout and session.Stderr. If the session writes
+// those streams from separate goroutines the counters need a mutex — confirm.
+type limitedWriter struct {
+	w         io.Writer // destination for the bytes that fit under the limit
+	limit     int       // maximum number of bytes forwarded to w
+	written   int       // number of bytes forwarded to w so far
+	truncated bool      // set once at least one input byte has been dropped
+}
+
+// Write implements io.Writer. It forwards as much of p as still fits under the
+// limit and drops the rest, setting truncated when anything is dropped.
+//
+// On success it returns len(p) even when bytes were dropped: io.Writer requires
+// a non-nil error whenever fewer than len(p) bytes are reported, and io.Copy
+// turns a short count into io.ErrShortWrite. If the underlying writer fails or
+// accepts fewer bytes than offered, the count it accepted is returned with the
+// error.
+func (lw *limitedWriter) Write(p []byte) (int, error) {
+	total := len(p)
+
+	remaining := lw.limit - lw.written
+	if remaining < 0 {
+		remaining = 0
+	}
+
+	keep := p
+	if total > remaining {
+		keep = p[:remaining]
+		lw.truncated = true
+	}
+	if len(keep) == 0 {
+		return total, nil // nothing to forward; the dropped bytes count as consumed
+	}
+
+	n, err := lw.w.Write(keep)
+	lw.written += n
+	if err != nil {
+		return n, err
+	}
+	if n < len(keep) {
+		return n, io.ErrShortWrite
+	}
+	return total, nil
+}