修复bug

RhythmicWave · RhythmicWave · commit 02c213b1b6bb · 2025-12-21T13:36:59.000+08:00
diff --git a/README.md b/README.md
@@ -55,6 +55,7 @@
 <summary>v0.8.5</summary>
 
 - 使用新的agent框架进行了全面替换；优化灵感助手功能、UI
+- 增加了灵感助手相关设置（采样温度、最大输出 Token 数、超时时间）
 - 重新实现了React模式来为模型实现文本格式工具调用，适用工具调用能力不强的模型。可在设置-灵感助手处开启（默认关闭）
 - 兼容了推理模型，增加了thinking模式
 - 建议将DeepSeek、Qwen之类的模型选择/修改提供商为OpenAI兼容，而OpenAI则仅设置为GPT 5等官方模型。
@@ -75,7 +76,6 @@
   - 引用卡片区域重构：固定布局、始终可见的 `...(N)` 按钮，使用 Popover 替代 Modal
   - 优化工具调用结果展示：显示成功/失败状态、支持跳转卡片、可折叠查看完整 JSON
   - 修复引用卡片与模型选择重叠问题，调整输入框高度
-
 - 代码优化与修复bug
 
 </details>
diff --git a/backend/app/bootstrap/init_app.py b/backend/app/bootstrap/init_app.py
@@ -44,7 +44,8 @@ def init_prompts(db: Session):
     """初始化默认提示词。
     行为受环境变量 BOOTSTRAP_OVERWRITE 控制：
     """
-    overwrite = str(os.getenv('BOOTSTRAP_OVERWRITE', '')).lower() in ('1', 'true', 'yes', 'on')
+    # 未设置环境变量时默认开启覆盖更新；若被设置为 1/true/yes/on（不区分大小写）之外的任何值（包括空字符串），则关闭覆盖
+    overwrite = str(os.getenv('BOOTSTRAP_OVERWRITE', 'true')).lower() in ('1', 'true', 'yes', 'on')
     existing_prompts = db.exec(select(Prompt)).all()
     existing_names = {p.name for p in existing_prompts}
 
@@ -268,7 +269,8 @@ def init_knowledge(db: Session):
     created = 0
     updated = 0
     skipped = 0
-    overwrite = str(os.getenv('BOOTSTRAP_OVERWRITE', '')).lower() in ('1', 'true', 'yes', 'on')
+    # 未设置环境变量时默认开启覆盖更新；若被设置为 1/true/yes/on（不区分大小写）之外的任何值（包括空字符串），则关闭覆盖
+    overwrite = str(os.getenv('BOOTSTRAP_OVERWRITE', 'true')).lower() in ('1', 'true', 'yes', 'on')
 
     for filename in os.listdir(knowledge_dir):
         if not filename.lower().endswith(('.txt', '.md')):
@@ -381,7 +383,8 @@ def init_workflows(db: Session):
             2.1) Card.UpsertChildByTitle（cardType=组织卡，title={item.name}，useItemAsContent=true）
             2.2) Card.ModifyContent（setPath=world_view.social_system.major_power_camps，setValue=[]）
     """
-    overwrite = str(os.getenv('BOOTSTRAP_OVERWRITE', '')).lower() in ('1', 'true', 'yes', 'on')
+    # 未设置环境变量时默认开启覆盖更新；若被设置为 1/true/yes/on（不区分大小写）之外的任何值（包括空字符串），则关闭覆盖
+    overwrite = str(os.getenv('BOOTSTRAP_OVERWRITE', 'true')).lower() in ('1', 'true', 'yes', 'on')
     total_created = total_updated = total_skipped = 0
     name = "世界观"
     dsl = {
diff --git a/backend/app/bootstrap/prompts/灵感对话-React.txt b/backend/app/bootstrap/prompts/灵感对话-React.txt
@@ -1,11 +1,14 @@
 你是一个智能创作助手，当前工作在文本工具协议模式下。你的核心目标是成为用户的创作伙伴，通过主动理解意图、合理使用工具、给出清晰可靠的建议，来为作者提供结构化的创作协助。
 
+修改测试……
+
 ## ⚙️ 文本协议要求（务必遵守）
 1. **正常对话**：大部分时候，你可以像平常一样自然地思考和回复，无需特殊格式。
 2. **工具调用**：当需要调用工具时，使用 `<Action>{"tool": "工具名", "input": {…}}</Action>` 格式。其中：
    - `tool` (或 `tool_name`) 必须是系统提供的工具名。
    - `input` 必须是一个 JSON 对象，其字段需与工具定义的参数完全匹配。
    - Action 标签内的内容必须是纯粹、有效的 JSON，不应包含任何额外说明文字。
+   - **每次输出 `<Action>` 之前，尽量先用 1～2 句自然语言向用户说明你要做什么；工具执行完成后，再用 1～3 句自然语言总结你做了什么以及得到的关键信息。最好不要只输出一个 `<Action>` 而没有任何解释性文字。**
 3. **工具结果**：系统会以 Observation (工具执行结果) 的形式反馈信息。收到后你可以继续对话或调用更多工具。
 4. **禁止事项**：
    - 不要猜测工具的执行结果；如果工具调用失败，应分析原因并决定是否重试或改变策略。
diff --git a/backend/app/services/langchain_assistant.py b/backend/app/services/langchain_assistant.py
@@ -1,13 +1,3 @@
-"""LangChain-based assistant backend.
-
-This module provides:
-- Factory to build LangChain ChatModel from LLMConfig.
-- A simple streaming generator that yields JSON-line events compatible with
-  the existing assistant event protocol (currently only `token` events).
-
-It is intentionally minimal for the first migration step and does not yet
-implement tools / ReAct. Those will be added incrementally on top.
-"""
 
 from __future__ import annotations
 
@@ -57,7 +47,8 @@
 _ACTION_TAG_RE = re.compile(r"<Action>(.*?)</Action>", re.IGNORECASE | re.DOTALL)
 _CODE_FENCE_RE = re.compile(r"```(?:json)?\s*(.*?)```", re.IGNORECASE | re.DOTALL)
 _JSON_BLOCK_RE = re.compile(r"Action\s*:?\s*(\{.*\})", re.IGNORECASE | re.DOTALL)
-_PROTOCOL_TAGS = ("action", "thought", "finalanswer")
+# React 文本协议仅保留 Action，一律使用 <Action>{...}</Action> 格式声明工具调用
+_PROTOCOL_TAGS = ("action",)
 
 MAX_REACT_STEPS = 8
 
@@ -135,22 +126,6 @@ def _parse_action_payload(text: str) -> Optional[Tuple[str, Dict[str, Any]]]:
     return tool_name.strip(), args
 
 
-def _clean_react_output(text: str) -> str:
-    """清理 React 输出中的残留协议标记，但保留必要的空白字符。"""
-    
-    if not text:
-        return text
-    
-    # 移除 Action 标签（已被系统处理）
-    cleaned = _ACTION_TAG_RE.sub("", text)
-    
-    # 移除其他可能的协议标签，但保留换行符
-    cleaned = re.sub(r"</?(?:Thought|FinalAnswer|Action).*?>", "", cleaned, flags=re.IGNORECASE | re.DOTALL)
-    
-    # 只移除首尾空白，保留中间的换行符和缩进
-    return cleaned.strip()
-
-
 def _process_react_stream_text(state: dict[str, str], new_text: str) -> str:
     """在流式阶段移除协议标签，但保留换行符和空白字符以维护 Markdown 格式。"""
 
@@ -215,12 +190,9 @@ def _process_react_stream_text(state: dict[str, str], new_text: str) -> str:
             state["buffer"] = buffer
             return "".join(output_parts)
              
-        content = block[inner_start + 1 : close_idx]
-        
-        if potential_tag == "finalanswer":
-            # 保留 FinalAnswer 的内容，包括换行符
-            output_parts.append(content)
-        # Action 和 Thought 直接丢弃，但不影响前后的空白字符
+        # 提取标签内部内容（目前仅用于完整跳过 <Action> ... </Action>）
+        # 注意：这里不直接拼接任何协议标签内部的文本，保证前端只看到清洗后的可见正文。
+        _ = block[inner_start + 1 : close_idx]
         
         # 推进 buffer
         buffer = buffer[block_end:]
@@ -525,7 +497,7 @@ async def stream_chat_with_react(
         llm_config_id=request.llm_config_id,
         temperature=request.temperature or 0.6,
         max_tokens=request.max_tokens or 8192,
-        timeout=request.timeout or 60,
+        timeout=request.timeout or 90,
         thinking_enabled=getattr(request, "thinking_enabled", None),
     )
 
@@ -607,9 +579,12 @@ async def stream_chat_with_react(
                 usage_in_total += in_tokens
                 usage_out_total += out_tokens
 
-            # 仅在本轮已经产生过面向用户的正文文本时，才解析 Action 协议。
-            # 这样可以避免模型在纯思考/Reasoning 阶段输出的 <Action> 触发前端提前进入工具调用状态。
-            action_payload = _parse_action_payload(step_text) if has_visible_text else None
+            # 直接从本轮累计的文本中解析 Action 协议。
+            # 早期实现曾经要求 has_visible_text 才允许解析，为的是避免模型在纯思考阶段输出 <Action>。
+            # 但在当前提示词下，我们只约定了 <Action>{...}</Action>，没有显式的 Thought/FinalAnswer 标签，
+            # 严格依赖 has_visible_text 会导致"只输出 Action、不输出正文"的情况完全被忽略，前端看到的是空回复。
+            # 因此这里放宽限制：总是尝试从 step_text 中解析 Action，由上游提示词约束模型行为。
+            action_payload = _parse_action_payload(step_text)
 
             if action_payload:
                 tool_name, args = action_payload
@@ -657,6 +632,7 @@ async def stream_chat_with_react(
             raise RuntimeError("React 模式未能产生最终回复")
 
     except asyncio.CancelledError:
+        logger.warning(f"[React-Agent] 请求被客户端取消 (CancelledError)")
         if usage_in_total and usage_out_total:
             in_tokens = usage_in_total
             out_tokens = usage_out_total
@@ -671,7 +647,8 @@ async def stream_chat_with_react(
             calls=1,
             aborted=True,
         )
-        return
+        # 必须重新抛出 CancelledError 以便上层协程正确感知取消
+        raise
     except Exception as e:
         logger.error(f"[React-Agent] 执行失败: {e}")
         raise
@@ -728,7 +705,7 @@ async def stream_chat_with_tools(
         llm_config_id=request.llm_config_id,
         temperature=request.temperature or 0.6,
         max_tokens=request.max_tokens or 8192,
-        timeout=request.timeout or 60,
+        timeout=request.timeout or 90,
         thinking_enabled=getattr(request, "thinking_enabled", None),
     )
 
diff --git a/frontend/src/renderer/src/components/assistants/AssistantPanel.vue b/frontend/src/renderer/src/components/assistants/AssistantPanel.vue
@@ -760,6 +760,9 @@ function buildAssistantChatRequest() {
     context_summarization_enabled: assistantPrefs.contextSummaryEnabled.value || undefined,
     context_summarization_threshold: assistantPrefs.contextSummaryThreshold.value || undefined,
     react_mode_enabled: assistantPrefs.reactModeEnabled.value || undefined,
+    temperature: assistantPrefs.assistantTemperature.value || undefined,
+    max_tokens: assistantPrefs.assistantMaxTokens.value || undefined,
+    timeout: assistantPrefs.assistantTimeout.value || undefined,
   }
 
   return {
@@ -787,9 +790,6 @@ function startStreaming(_prev: string, _tail: string, targetIdx: number) {
     prompt_name: promptName,
     project_id: projectStore.currentProject?.id as number,
     stream: true,
-    temperature: props.temperature ?? 0.7,
-    max_tokens: props.max_tokens ?? 8192,
-    timeout: props.timeout ?? undefined,
     thinking_enabled: useThinkingMode.value
   } as any, (chunk) => {
     // 优先尝试解析为结构化事件（JSON-line）
diff --git a/frontend/src/renderer/src/components/setting/AssistantSettings.vue b/frontend/src/renderer/src/components/setting/AssistantSettings.vue
@@ -1,5 +1,6 @@
 <script setup lang="ts">
 import { computed } from 'vue'
+import { QuestionFilled } from '@element-plus/icons-vue'
 import { useAssistantPreferences } from '@renderer/composables/useAssistantPreferences'
 
 // 通过组合式统一管理灵感助手偏好，方便在设置页与助手面板之间复用
@@ -19,6 +20,21 @@ const reactModeEnabled = computed({
   get: () => prefs.reactModeEnabled.value,
   set: (val: boolean) => prefs.setReactModeEnabled(val)
 })
+
+const assistantTemperature = computed({
+  get: () => prefs.assistantTemperature.value,
+  set: (val: number | null) => prefs.setAssistantTemperature(val)
+})
+
+const assistantMaxTokens = computed({
+  get: () => prefs.assistantMaxTokens.value,
+  set: (val: number | null) => prefs.setAssistantMaxTokens(val)
+})
+
+const assistantTimeout = computed({
+  get: () => prefs.assistantTimeout.value,
+  set: (val: number | null) => prefs.setAssistantTimeout(val)
+})
 </script>
 
 <template>
@@ -28,14 +44,99 @@ const reactModeEnabled = computed({
       配置灵感助手的高级能力，目前仅开放 React 工具解析协议。上下文摘要功能尚未启用。
     </p>
 
-    <el-form label-width="140px" class="assistant-form" size="small">
-      <el-form-item label="React 模式">
+    <el-form label-width="160px" class="assistant-form" size="small">
+      <!-- 参数配置组 -->
+      <div class="group-title">参数设置</div>
+
+      <el-form-item>
+        <template #label>
+          <span>
+            采样温度 (temperature)
+            <el-tooltip placement="top" effect="dark">
+              <template #content>
+                控制输出的随机性，数值越大越有创意、越发散，越小越保守、越稳定。<br/>
+                建议范围 0.4 ~ 0.9。默认值为 0.6。
+              </template>
+              <el-icon class="field-help-icon"><QuestionFilled /></el-icon>
+            </el-tooltip>
+          </span>
+        </template>
+        <el-input-number
+          v-model="assistantTemperature"
+          :min="0.1"
+          :max="2"
+          :step="0.1"
+          :precision="2"
+          controls-position="right"
+          placeholder="0.6"
+        />
+      </el-form-item>
+
+      <el-form-item>
+        <template #label>
+          <span>
+            最大输出 Token 数
+            <el-tooltip placement="top" effect="dark">
+              <template #content>
+                控制单次回复的最大长度。值越大，回复可以越长，但也会增加响应时间和费用。<br/>
+                默认值为 8192。
+              </template>
+              <el-icon class="field-help-icon"><QuestionFilled /></el-icon>
+            </el-tooltip>
+          </span>
+        </template>
+        <el-input-number
+          v-model="assistantMaxTokens"
+          :min="256"
+          :max="65536"
+          :step="512"
+          controls-position="right"
+          placeholder="8192"
+        />
+      </el-form-item>
+
+      <el-form-item>
+        <template #label>
+          <span>
+            超时 (秒)
+            <el-tooltip placement="top" effect="dark">
+              <template #content>
+                限制单次调用的最长等待时间，避免请求长时间挂起。<br/>
+                默认值为 90 秒。
+              </template>
+              <el-icon class="field-help-icon"><QuestionFilled /></el-icon>
+            </el-tooltip>
+          </span>
+        </template>
+        <el-input-number
+          v-model="assistantTimeout"
+          :min="10"
+          :max="600"
+          :step="10"
+          controls-position="right"
+          placeholder="90"
+        />
+      </el-form-item>
+
+      <el-divider />
+
+      <!-- React 配置组 -->
+      <div class="group-title">模式设置</div>
+      <el-form-item>
+        <template #label>
+          <span>
+            React 模式
+            <el-tooltip placement="top" effect="dark">
+              <template #content>
+                让模型通过文本协议输出工具调用指令（&lt;Action&gt;{...}&lt;/Action&gt;），
+                系统解析后真正调用工具，适合不支持函数调用的模型。
+              </template>
+              <el-icon class="field-help-icon"><QuestionFilled /></el-icon>
+            </el-tooltip>
+          </span>
+        </template>
         <el-switch v-model="reactModeEnabled" />
       </el-form-item>
-      <div class="field-hint">
-        React 模式要求模型按照通过文本协议输出工具调用，
-        系统会解析 Action 并真正调用工具，适合不支持函数调用的模型。
-      </div>
     </el-form>
   </div>
 </template>
@@ -70,4 +171,16 @@ const reactModeEnabled = computed({
 .hint-alert {
   margin-top: 12px;
 }
+
+.group-title {
+  margin: 8px 0 4px 0;
+  font-size: 13px;
+  font-weight: 600;
+  color: var(--el-text-color-regular);
+}
+
+.field-help-icon {
+  margin-left: 4px;
+  cursor: help;
+}
 </style>
diff --git a/frontend/src/renderer/src/composables/useAssistantPreferences.ts b/frontend/src/renderer/src/composables/useAssistantPreferences.ts
diff --git a/frontend/src/renderer/src/stores/useAIParamCardStore.ts b/frontend/src/renderer/src/stores/useAIParamCardStore.ts