fix: 修复流式聊天部分问题

This commit is contained in:
ViperEkura 2026-04-16 16:12:59 +08:00
parent 22a4b8a4bb
commit 9edf4dac9c
2 changed files with 68 additions and 82 deletions

View File

@@ -213,81 +213,74 @@ class ChatService:
# Get delta
choices = chunk.get("choices", [])
if not choices:
delta = None
if choices:
delta = choices[0].get("delta", {})
# If no delta but has message (non-streaming response)
if not delta:
message = choices[0].get("message", {})
if message.get("content"):
delta = {"content": message["content"]}
if not delta:
# Check if there's any content in the response (for non-standard LLM responses)
if chunk.get("content") or chunk.get("message"):
content = chunk.get("content") or chunk.get("message", {}).get("content", "")
if content:
# BUG FIX: Update full_content so it gets saved to database
prev_content_len = len(full_content)
full_content += content
if prev_content_len == 0: # New text stream started
text_step_idx = step_index
text_step_id = f"step-{step_index}"
step_index += 1
yield _sse_event("process_step", {
"step": {
"id": text_step_id if prev_content_len == 0 else f"step-{step_index - 1}",
"index": text_step_idx if prev_content_len == 0 else step_index - 1,
"type": "text",
"content": full_content # Always send accumulated content
}
})
continue
content = chunk.get("content") or chunk.get("message", {}).get("content", "")
if content:
delta = {"content": content}
delta = choices[0].get("delta", {})
# Handle reasoning (thinking)
reasoning = delta.get("reasoning_content", "")
if reasoning:
prev_thinking_len = len(full_thinking)
full_thinking += reasoning
if prev_thinking_len == 0: # New thinking stream started
thinking_step_idx = step_index
thinking_step_id = f"step-{step_index}"
step_index += 1
yield _sse_event("process_step", {
"step": {
"id": thinking_step_id,
"index": thinking_step_idx,
"type": "thinking",
"content": full_thinking
}
})
# Handle content
content = delta.get("content", "")
if content:
prev_content_len = len(full_content)
full_content += content
if prev_content_len == 0: # New text stream started
text_step_idx = step_index
text_step_id = f"step-{step_index}"
step_index += 1
yield _sse_event("process_step", {
"step": {
"id": text_step_id,
"index": text_step_idx,
"type": "text",
"content": full_content
}
})
# Accumulate tool calls
tool_calls_delta = delta.get("tool_calls", [])
for tc in tool_calls_delta:
idx = tc.get("index", 0)
if idx >= len(tool_calls_list):
tool_calls_list.append({
"id": tc.get("id", ""),
"type": "function",
"function": {"name": "", "arguments": ""}
if delta:
# Handle reasoning (thinking)
reasoning = delta.get("reasoning_content", "")
if reasoning:
prev_thinking_len = len(full_thinking)
full_thinking += reasoning
if prev_thinking_len == 0: # New thinking stream started
thinking_step_idx = step_index
thinking_step_id = f"step-{step_index}"
step_index += 1
yield _sse_event("process_step", {
"step": {
"id": thinking_step_id,
"index": thinking_step_idx,
"type": "thinking",
"content": full_thinking
}
})
func = tc.get("function", {})
if func.get("name"):
tool_calls_list[idx]["function"]["name"] += func["name"]
if func.get("arguments"):
tool_calls_list[idx]["function"]["arguments"] += func["arguments"]
# Handle content
content = delta.get("content", "")
if content:
prev_content_len = len(full_content)
full_content += content
if prev_content_len == 0: # New text stream started
text_step_idx = step_index
text_step_id = f"step-{step_index}"
step_index += 1
yield _sse_event("process_step", {
"step": {
"id": text_step_id,
"index": text_step_idx,
"type": "text",
"content": full_content
}
})
# Accumulate tool calls
tool_calls_delta = delta.get("tool_calls", [])
for tc in tool_calls_delta:
idx = tc.get("index", 0)
if idx >= len(tool_calls_list):
tool_calls_list.append({
"id": tc.get("id", ""),
"type": "function",
"function": {"name": "", "arguments": ""}
})
func = tc.get("function", {})
if func.get("name"):
tool_calls_list[idx]["function"]["name"] += func["name"]
if func.get("arguments"):
tool_calls_list[idx]["function"]["arguments"] += func["arguments"]
# Save thinking step
if thinking_step_id is not None:

View File

@@ -143,30 +143,23 @@ class LLMClient:
tools: Optional[List[Dict]] = None,
**kwargs
) -> AsyncGenerator[str, None]:
"""Stream call LLM API - yields raw SSE event lines
Yields:
str: Raw SSE event lines for direct forwarding
"""
"""Stream call LLM API - yields raw SSE event lines"""
body = self._build_body(model, messages, tools, stream=True, **kwargs)
logger.info(f"Starting stream_call for model: {model}, messages count: {len(messages)}")
try:
async with httpx.AsyncClient(timeout=120.0) as client:
logger.info(f"Sending request to {self.api_url}")
async with client.stream(
"POST",
self.api_url,
headers=self._build_headers(),
json=body
) as response:
logger.info(f"Response status: {response.status_code}")
response.raise_for_status()
async for line in response.aiter_lines():
if line.strip():
yield line + "\n"
logger.info(f"response finish with : {response.status_code}")
except httpx.HTTPStatusError as e:
status_code = e.response.status_code if e.response else "?"
logger.error(f"HTTP error: {status_code}")