feat: 增加 token 统计

This commit is contained in:
ViperEkura 2026-04-13 23:04:41 +08:00
parent 30fc1779f4
commit 6f9bff1f1f
6 changed files with 95 additions and 10 deletions

View File

@ -26,7 +26,12 @@
</template>
</div>
<div class="message-footer">
<span class="token-count" v-if="tokenCount">{{ tokenCount }} tokens</span>
<span class="token-info" v-if="usage">
<span class="token-item" v-if="usage.prompt_tokens">输入: {{ usage.prompt_tokens }}</span>
<span class="token-item" v-if="usage.completion_tokens">输出: {{ usage.completion_tokens }}</span>
<span class="token-item total" v-if="usage.total_tokens">总计: {{ usage.total_tokens }}</span>
</span>
<span class="token-count" v-else-if="tokenCount">{{ tokenCount }} tokens</span>
<span class="message-time">{{ formatTime(createdAt) }}</span>
<button v-if="role === 'assistant'" class="ghost-btn accent" @click="copyContent" title="复制">
<span v-html="copyIcon"></span>
@ -50,6 +55,7 @@ const props = defineProps({
toolCalls: { type: Array, default: () => [] },
processSteps: { type: Array, default: () => [] },
tokenCount: { type: Number, default: 0 },
usage: { type: Object, default: null },
createdAt: { type: String, default: '' },
deletable: { type: Boolean, default: false },
attachments: { type: Array, default: () => [] },
@ -131,6 +137,25 @@ const trashIcon = `<svg viewBox="0 0 24 24" width="14" height="14" fill="none" s
font-size: 12px;
}
.token-info {
display: flex;
align-items: center;
gap: 6px;
font-size: 11px;
color: var(--text-tertiary);
}
.token-item {
padding: 2px 6px;
background: var(--bg-code);
border-radius: 4px;
}
.token-item.total {
font-weight: 600;
color: var(--accent-primary);
}
.token-count,
.message-time {
font-size: 12px;

View File

@ -276,6 +276,8 @@ const alertIcon = `<svg viewBox="0 0 24 24" width="16" height="16" fill="none" s
cursor: pointer;
font-size: 13px;
transition: background 0.15s;
width: 100%;
box-sizing: border-box;
}
.thinking .step-header:hover,
@ -370,8 +372,9 @@ const alertIcon = `<svg viewBox="0 0 24 24" width="16" height="16" fill="none" s
overflow: hidden;
text-overflow: ellipsis;
white-space: nowrap;
flex: 1;
flex: 1 1 auto;
min-width: 0;
max-width: 300px;
}
.arrow.open {

View File

@ -41,6 +41,7 @@
:tool-calls="msg.tool_calls"
:process-steps="msg.process_steps"
:token-count="msg.token_count"
:usage="msg.usage"
:created-at="msg.created_at"
:deletable="msg.role === 'user'"
:attachments="msg.attachments"
@ -233,13 +234,15 @@ const sendMessage = async () => {
streamingMessage.value.process_steps.push(step)
}
},
onDone: () => {
onDone: (data) => {
//
autoScroll.value = true
if (streamingMessage.value) {
messages.value.push({
...streamingMessage.value,
created_at: new Date().toISOString()
created_at: new Date().toISOString(),
token_count: data.token_count,
usage: data.usage
})
//

View File

@ -167,6 +167,7 @@ class Message(Base):
role: Mapped[str] = mapped_column(String(16), nullable=False) # user, assistant, system, tool
content: Mapped[str] = mapped_column(Text, nullable=False, default="")
token_count: Mapped[int] = mapped_column(Integer, default=0)
usage: Mapped[Optional[str]] = mapped_column(Text, nullable=True) # JSON string for usage info
created_at: Mapped[datetime] = mapped_column(DateTime, default=local_now)
# Relationships
@ -184,6 +185,13 @@ class Message(Base):
"created_at": self.created_at.isoformat() if self.created_at else None
}
# Parse usage JSON
if self.usage:
try:
result["usage"] = json.loads(self.usage)
except json.JSONDecodeError:
result["usage"] = None
# Parse content JSON
try:
content_obj = json.loads(self.content) if self.content else {}

View File

@ -43,6 +43,7 @@ def list_conversations(
db: Session = Depends(get_db)
):
"""Get conversation list"""
import json
query = db.query(Conversation).filter(Conversation.user_id == current_user.id)
result = paginate(query.order_by(Conversation.updated_at.desc()), page, page_size)
@ -56,6 +57,23 @@ def list_conversations(
).order_by(Message.created_at).first()
if first_msg:
conv_dict['first_message'] = first_msg.content[:50] + ('...' if len(first_msg.content) > 50 else '')
# Calculate total tokens from all assistant messages in this conversation
assistant_messages = db.query(Message).filter(
Message.conversation_id == c.id,
Message.role == 'assistant'
).all()
total_tokens = 0
for msg in assistant_messages:
total_tokens += msg.token_count or 0
# Also try to get usage from the usage field
if msg.usage:
try:
usage_obj = json.loads(msg.usage)
total_tokens = usage_obj.get("total_tokens", total_tokens)
except:
pass
conv_dict['token_count'] = total_tokens
items.append(conv_dict)
return success_response(data={

View File

@ -1,6 +1,7 @@
"""Chat service module"""
import json
import uuid
import logging
from typing import List, Dict, Any, AsyncGenerator, Optional
from luxx.models import Conversation, Message
@ -9,7 +10,7 @@ from luxx.tools.core import registry
from luxx.services.llm_client import LLMClient
from luxx.config import config
logger = logging.getLogger(__name__)
# Maximum iterations to prevent infinite loops
MAX_ITERATIONS = 10
@ -130,6 +131,13 @@ class ChatService:
all_tool_results = []
step_index = 0
# Token usage tracking
total_usage = {
"prompt_tokens": 0,
"completion_tokens": 0,
"total_tokens": 0
}
# Global step IDs for thinking and text (persist across iterations)
thinking_step_id = None
thinking_step_idx = None
@ -186,6 +194,13 @@ class ChatService:
yield _sse_event("error", {"content": f"Failed to parse response: {data_str}"})
return
# 提取 API 返回的 usage 信息
if "usage" in chunk:
usage = chunk["usage"]
total_usage["prompt_tokens"] = usage.get("prompt_tokens", 0)
total_usage["completion_tokens"] = usage.get("completion_tokens", 0)
total_usage["total_tokens"] = usage.get("total_tokens", 0)
# Check for error in response
if "error" in chunk:
error_msg = chunk["error"].get("message", str(chunk["error"]))
@ -362,18 +377,26 @@ class ChatService:
# No tool calls - final iteration, save message
msg_id = str(uuid.uuid4())
# 使用 API 返回的真实 completion_tokens，如果 API 没返回则降级使用估算值
actual_token_count = total_usage.get("completion_tokens", 0) or len(full_content) // 4
logger.info(f"[TOKEN] total_usage: {total_usage}, actual_token_count: {actual_token_count}")
self._save_message(
conversation.id,
msg_id,
full_content,
all_tool_calls,
all_tool_results,
all_steps
all_steps,
actual_token_count,
total_usage
)
yield _sse_event("done", {
"message_id": msg_id,
"token_count": len(full_content) // 4
"token_count": actual_token_count,
"usage": total_usage
})
return
@ -386,7 +409,9 @@ class ChatService:
full_content,
all_tool_calls,
all_tool_results,
all_steps
all_steps,
actual_token_count,
total_usage
)
yield _sse_event("error", {"content": "Exceeded maximum tool call iterations"})
@ -400,7 +425,9 @@ class ChatService:
full_content: str,
all_tool_calls: list,
all_tool_results: list,
all_steps: list
all_steps: list,
token_count: int = 0,
usage: dict = None
):
"""Save the assistant message to database."""
from luxx.database import SessionLocal
@ -420,7 +447,8 @@ class ChatService:
conversation_id=conversation_id,
role="assistant",
content=json.dumps(content_json, ensure_ascii=False),
token_count=len(full_content) // 4
token_count=token_count,
usage=json.dumps(usage) if usage else None
)
db.add(msg)
db.commit()