npm - union-app-chat-stream - Versions diffs - 1.0.3 → 1.0.5 - Mend

union-app-chat-stream 1.0.3 → 1.0.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (47)

package/PROJECT_OVERVIEW.md +16 -0
package/app/.env +14 -14
package/app/.env.dev +14 -14
package/app/.env.prod.bj11 +14 -14
package/app/.env.prod.sh20 +14 -14
package/app/.env.prod.sz31 +14 -14
package/app/.env.test.bj12 +14 -14
package/app/config/env_config.py +6 -0
package/app/manager/chatstream_manager.py +47 -15
package/app/models/schemas.py +5 -3
package/app/service/chat_service.py +119 -2
package/app/service/union_service.py +7 -0
package/app/utils/common_utils.py +1 -1
package/app/views/view_chatstream.py +62 -5
package/app/wsgi.py +1 -1
package/package.json +3 -1
package/tools/prompts.yaml +2 -0
package/app/__pycache__/__init__.cpython-312.pyc +0 -0
package/app/__pycache__/authenticated_user.cpython-312.pyc +0 -0
package/app/__pycache__/extensions.cpython-312.pyc +0 -0
package/app/__pycache__/wsgi.cpython-312.pyc +0 -0
package/app/config/__pycache__/config_loader.cpython-312.pyc +0 -0
package/app/config/__pycache__/env_config.cpython-312.pyc +0 -0
package/app/config/__pycache__/logger_config.cpython-312.pyc +0 -0
package/app/manager/__init__.py +0 -4
package/app/manager/__pycache__/__init__.cpython-312.pyc +0 -0
package/app/manager/__pycache__/chatstream_manager.cpython-312.pyc +0 -0
package/app/manager/__pycache__/prompts.cpython-312.pyc +0 -0
package/app/manager/__pycache__/runtime_manager.cpython-312.pyc +0 -0
package/app/manager/__pycache__/toolcall_manager.cpython-312.pyc +0 -0
package/app/models/__pycache__/schemas.cpython-312.pyc +0 -0
package/app/service/__init__.py +0 -4
package/app/service/__pycache__/__init__.cpython-312.pyc +0 -0
package/app/service/__pycache__/chat_service.cpython-312.pyc +0 -0
package/app/service/__pycache__/llm_service.cpython-312.pyc +0 -0
package/app/service/__pycache__/rag_service.cpython-312.pyc +0 -0
package/app/service/__pycache__/tool_call_service.cpython-312.pyc +0 -0
package/app/service/__pycache__/union_service.cpython-312.pyc +0 -0
package/app/utils/__pycache__/__init__.cpython-312.pyc +0 -0
package/app/utils/__pycache__/common_utils.cpython-312.pyc +0 -0
package/app/utils/__pycache__/debug_context.cpython-312.pyc +0 -0
package/app/utils/__pycache__/function_utils.cpython-312.pyc +0 -0
package/app/utils/__pycache__/jwt_utils.cpython-312.pyc +0 -0
package/app/views/__pycache__/__init__.cpython-312.pyc +0 -0
package/app/views/__pycache__/view_chatstream.cpython-312.pyc +0 -0
package/app/views/__pycache__/view_healthcheck.cpython-312.pyc +0 -0
package/app/views/__pycache__/view_runtime.cpython-312.pyc +0 -0

package/PROJECT_OVERVIEW.md CHANGED Viewed

@@ -162,6 +162,22 @@ Deployment files are organized under `deploy/`:
   treat knowledge-base "related functions" as routing hints unless code
   explicitly promotes them to executable tools.
+## Streaming Tool-Call Contract
+- External tool calls may run for minutes or longer because some tools query
+  large data platforms such as Hive. Do not treat a long-running tool call as a
+  timeout by default.
+- During tool execution, `/chatstream/v1/chat/stream` emits SSE `heartbeat`
+  events every `TOOL_CALL_HEARTBEAT_INTERVAL` seconds. The payload is the normal
+  chat response JSON with a `heartbeat` object, including `type`, `tool`,
+  `elapsedSeconds`, and `message`.
+- Frontends should listen for both `message` and `heartbeat` SSE events.
+  Heartbeat events mean the stream is alive and the current tool is still
+  running; they are not model content and should not be rendered as answer text.
+- Tool execution failures return a `message` event with `finish_reason="error"`
+  and `errorMsg`. If tool-calling reaches `TOOLS_MAX_ROUNDS`, return
+  `finish_reason="error"` and `errorMsg="工具调用轮数达到上限（N轮）"`.
 ## Validation
 Use the smallest reliable checks that cover the change:

package/app/.env CHANGED Viewed

@@ -1,16 +1,16 @@
 # Flask and request authentication
-SECRET_KEY=<MASKED_SECRET>
+SECRET_KEY=<SECRET_KEY>
 # External API endpoints
-GET_USE_INFO_URL=<MASKED_URL>
-GET_ORG_INFO_URL=<MASKED_URL>
-GET_JIRA_INFO_URL=<MASKED_URL>
-GET_BIGDATA_URL=<MASKED_URL>
-GET_UNION_BASE_URL=<MASKED_URL>
+GET_USE_INFO_URL=https://10.47.214.188:8443/common/getUserInfo
+GET_ORG_INFO_URL=https://10.47.214.188:8443/api/getOrgInfoByOrgCode
+GET_JIRA_INFO_URL=https://10.47.214.188:8443/api/getjiraData
+GET_BIGDATA_URL=http://172.31.3.134:8080/vmock/ai/fullLinkData
+GET_UNION_BASE_URL=http://127.0.0.1:8089/
 # Legacy external API tokens
-GET_ORG_INFO_URL_TOKEN=<MASKED_TOKEN>
-GET_JIRA_INFO_URL_TOKEN=<MASKED_TOKEN>
+GET_ORG_INFO_URL_TOKEN=<GET_ORG_INFO_URL_TOKEN>
+GET_JIRA_INFO_URL_TOKEN=<GET_JIRA_INFO_URL_TOKEN>
 # Authorization and logging
 PERMISSIONS=
@@ -20,25 +20,25 @@ LOG_DIR=/data/appLogs
 # Runtime environment and JWT
 FLASK_ENV=dev
-JWT_SECRET_KEY=<MASKED_SECRET>
+JWT_SECRET_KEY=<JWT_SECRET_KEY>
 JWT_EXPIRATION_SECOND=900
 JWT_RENEW_SECOND=700
 # LLM provider
-LLM_URL=<MASKED_URL>
-LLM_KEY=<MASKED_KEY>
+LLM_URL=https://open.bigmodel.cn/api/paas/v4/
+LLM_KEY=f024b21a682248999b42f696a42dfaad.PIySxpJN8xM1evpZ
 LLM_MODEL=GLM-4.7-Flash
 LLM_MAX_TOKENS=4096
 LLM_TEMPERATURE=0.7
 LLM_TOP_P=0.9
 # Chat behavior
-SYSTEM_PROMPT=<MASKED_BUSINESS_VALUE>
+SYSTEM_PROMPT=你是网络支付清算平台（网联平台）联合运维的智能客服助手，面向联合运维成员单位提供咨询与指引服务。
 # Business filter
 FILTER_ENABLED=false
-FILTER_ALLOWED_KEYWORDS=<MASKED_BUSINESS_VALUE>
-FILTER_REJECTION_MESSAGE=<MASKED_BUSINESS_VALUE>
+FILTER_ALLOWED_KEYWORDS=网联,联合运维,运维,生产变更,变更,生产运行,运行,系统成功率,业务成功率,异常,故障,定级,关闭渠道,联合处置,大型单位,中型单位,小型单位,银行,支付,清算
+FILTER_REJECTION_MESSAGE=抱歉，我是联合运维智能客服，只能回答与联合运维相关的问题，例如生产变更、生产运行、故障定级、周期评价、业务范围等。请重新描述您的问题。
 # Tool and conversation settings
 TOOLS_MAX_ROUNDS=5

package/app/.env.dev CHANGED Viewed

@@ -1,16 +1,16 @@
 # Flask and request authentication
-SECRET_KEY=<MASKED_SECRET>
+SECRET_KEY=<SECRET_KEY>
 # External API endpoints
-GET_USE_INFO_URL=<MASKED_URL>
-GET_ORG_INFO_URL=<MASKED_URL>
-GET_JIRA_INFO_URL=<MASKED_URL>
-GET_BIGDATA_URL=<MASKED_URL>
-GET_UNION_BASE_URL=<MASKED_URL>
+GET_USE_INFO_URL=https://10.47.214.188:8443/common/getUserInfo
+GET_ORG_INFO_URL=https://10.47.214.188:8443/api/getOrgInfoByOrgCode
+GET_JIRA_INFO_URL=http://172.31.3.134:8080/vmock/jira-data
+GET_BIGDATA_URL=http://172.31.3.134:8080/vmock/ai/fullLinkData
+GET_UNION_BASE_URL=http://127.0.0.1:8089/
 # Legacy external API tokens
-GET_ORG_INFO_URL_TOKEN=<MASKED_TOKEN>
-GET_JIRA_INFO_URL_TOKEN=<MASKED_TOKEN>
+GET_ORG_INFO_URL_TOKEN=<GET_ORG_INFO_URL_TOKEN>
+GET_JIRA_INFO_URL_TOKEN=<GET_JIRA_INFO_URL_TOKEN>
 # Authorization and logging
 PERMISSIONS=
@@ -20,25 +20,25 @@ LOG_DIR=/Users/simon/code/union-py-app/data/appLogs
 # Runtime environment and JWT
 FLASK_ENV=dev
-JWT_SECRET_KEY=<MASKED_SECRET>
+JWT_SECRET_KEY=<JWT_SECRET_KEY>
 JWT_EXPIRATION_SECOND=900
 JWT_RENEW_SECOND=700
 # LLM provider
-LLM_URL=<MASKED_URL>
-LLM_KEY=<MASKED_KEY>
+LLM_URL=https://open.bigmodel.cn/api/paas/v4/
+LLM_KEY=f024b21a682248999b42f696a42dfaad.PIySxpJN8xM1evpZ
 LLM_MODEL=GLM-4.7-Flash
 LLM_MAX_TOKENS=4096
 LLM_TEMPERATURE=0.7
 LLM_TOP_P=0.9
 # Chat behavior
-SYSTEM_PROMPT=<MASKED_BUSINESS_VALUE>
+SYSTEM_PROMPT=你是网络支付清算平台（网联平台）联合运维的智能客服助手，面向联合运维成员单位提供咨询与指引服务。
 # Business filter
 FILTER_ENABLED=false
-FILTER_ALLOWED_KEYWORDS=<MASKED_BUSINESS_VALUE>
-FILTER_REJECTION_MESSAGE=<MASKED_BUSINESS_VALUE>
+FILTER_ALLOWED_KEYWORDS=网联,联合运维,运维,生产变更,变更,生产运行,运行,系统成功率,业务成功率,异常,故障,定级,关闭渠道,联合处置,大型单位,中型单位,小型单位,银行,支付,清算
+FILTER_REJECTION_MESSAGE=抱歉，我是联合运维智能客服，只能回答与联合运维相关的问题，例如生产变更、生产运行、故障定级、周期评价、业务范围等。请重新描述您的问题。
 # Tool and conversation settings
 TOOLS_MAX_ROUNDS=5

package/app/.env.prod.bj11 CHANGED Viewed

@@ -1,16 +1,16 @@
 # Flask and request authentication
-SECRET_KEY=<MASKED_SECRET>
+SECRET_KEY=<SECRET_KEY>
 # External API endpoints
-GET_USE_INFO_URL=<MASKED_URL>
-GET_ORG_INFO_URL=<MASKED_URL>
-GET_JIRA_INFO_URL=<MASKED_URL>
-GET_BIGDATA_URL=<MASKED_URL>
-GET_UNION_BASE_URL=<MASKED_URL>
+GET_USE_INFO_URL=https://10.16.100.236:8443/common/getUserInfo
+GET_ORG_INFO_URL=https://10.16.100.236:8443/api/getOrgInfoByOrgCode
+GET_JIRA_INFO_URL=https://10.16.100.236:8443/api/getjiraData
+GET_BIGDATA_URL=https://10.16.100.236:8443/union-op/bigdata/query
+GET_UNION_BASE_URL=https://10.16.100.236:8443/
 # Legacy external API tokens
-GET_ORG_INFO_URL_TOKEN=<MASKED_TOKEN>
-GET_JIRA_INFO_URL_TOKEN=<MASKED_TOKEN>
+GET_ORG_INFO_URL_TOKEN=<GET_ORG_INFO_URL_TOKEN>
+GET_JIRA_INFO_URL_TOKEN=<GET_JIRA_INFO_URL_TOKEN>
 # Authorization and logging
 PERMISSIONS=
@@ -20,25 +20,25 @@ LOG_DIR=/data/appLogs
 # Runtime environment and JWT
 FLASK_ENV=prod.bj11
-JWT_SECRET_KEY=<MASKED_SECRET>
+JWT_SECRET_KEY=<JWT_SECRET_KEY>
 JWT_EXPIRATION_SECOND=900
 JWT_RENEW_SECOND=700
 # LLM provider
-LLM_URL=<MASKED_URL>
-LLM_KEY=<MASKED_KEY>
+LLM_URL=<LLM_URL>
+LLM_KEY=<LLM_KEY>
 LLM_MODEL=glm-5
 LLM_MAX_TOKENS=4096
 LLM_TEMPERATURE=0.7
 LLM_TOP_P=0.9
 # Chat behavior
-SYSTEM_PROMPT=<MASKED_BUSINESS_VALUE>
+SYSTEM_PROMPT=你是网络支付清算平台（网联平台）联合运维的智能客服助手，面向联合运维成员单位提供咨询与指引服务。
 # Business filter
 FILTER_ENABLED=false
-FILTER_ALLOWED_KEYWORDS=<MASKED_BUSINESS_VALUE>
-FILTER_REJECTION_MESSAGE=<MASKED_BUSINESS_VALUE>
+FILTER_ALLOWED_KEYWORDS=网联,联合运维,运维,生产变更,变更,生产运行,运行,系统成功率,业务成功率,异常,故障,定级,关闭渠道,联合处置,大型单位,中型单位,小型单位,银行,支付,清算
+FILTER_REJECTION_MESSAGE=抱歉，我是联合运维智能客服，只能回答与联合运维相关的问题，例如生产变更、生产运行、故障定级、周期评价、业务范围等。请重新描述您的问题。
 # Tool and conversation settings
 TOOLS_MAX_ROUNDS=5

package/app/.env.prod.sh20 CHANGED Viewed

@@ -1,16 +1,16 @@
 # Flask and request authentication
-SECRET_KEY=<MASKED_SECRET>
+SECRET_KEY=<SECRET_KEY>
 # External API endpoints
-GET_USE_INFO_URL=<MASKED_URL>
-GET_ORG_INFO_URL=<MASKED_URL>
-GET_JIRA_INFO_URL=<MASKED_URL>
-GET_BIGDATA_URL=<MASKED_URL>
-GET_UNION_BASE_URL=<MASKED_URL>
+GET_USE_INFO_URL=https://10.32.100.236:8443/common/getUserInfo
+GET_ORG_INFO_URL=https://10.32.100.236:8443/api/getOrgInfoByOrgCode
+GET_JIRA_INFO_URL=https://10.32.100.236:8443/api/getjiraData
+GET_BIGDATA_URL=https://10.32.100.236:8443/union-op/bigdata/query
+GET_UNION_BASE_URL=https://10.16.100.236:8443/
 # Legacy external API tokens
-GET_ORG_INFO_URL_TOKEN=<MASKED_TOKEN>
-GET_JIRA_INFO_URL_TOKEN=<MASKED_TOKEN>
+GET_ORG_INFO_URL_TOKEN=<GET_ORG_INFO_URL_TOKEN>
+GET_JIRA_INFO_URL_TOKEN=<GET_JIRA_INFO_URL_TOKEN>
 # Authorization and logging
 PERMISSIONS=
@@ -20,25 +20,25 @@ LOG_DIR=/data/appLogs
 # Runtime environment and JWT
 FLASK_ENV=prod.sh20
-JWT_SECRET_KEY=<MASKED_SECRET>
+JWT_SECRET_KEY=<JWT_SECRET_KEY>
 JWT_EXPIRATION_SECOND=900
 JWT_RENEW_SECOND=700
 # LLM provider
-LLM_URL=<MASKED_URL>
-LLM_KEY=<MASKED_KEY>
+LLM_URL=<LLM_URL>
+LLM_KEY=<LLM_KEY>
 LLM_MODEL=glm-5
 LLM_MAX_TOKENS=4096
 LLM_TEMPERATURE=0.7
 LLM_TOP_P=0.9
 # Chat behavior
-SYSTEM_PROMPT=<MASKED_BUSINESS_VALUE>
+SYSTEM_PROMPT=你是网络支付清算平台（网联平台）联合运维的智能客服助手，面向联合运维成员单位提供咨询与指引服务。
 # Business filter
 FILTER_ENABLED=false
-FILTER_ALLOWED_KEYWORDS=<MASKED_BUSINESS_VALUE>
-FILTER_REJECTION_MESSAGE=<MASKED_BUSINESS_VALUE>
+FILTER_ALLOWED_KEYWORDS=网联,联合运维,运维,生产变更,变更,生产运行,运行,系统成功率,业务成功率,异常,故障,定级,关闭渠道,联合处置,大型单位,中型单位,小型单位,银行,支付,清算
+FILTER_REJECTION_MESSAGE=抱歉，我是联合运维智能客服，只能回答与联合运维相关的问题，例如生产变更、生产运行、故障定级、周期评价、业务范围等。请重新描述您的问题。
 # Tool and conversation settings
 TOOLS_MAX_ROUNDS=5

package/app/.env.prod.sz31 CHANGED Viewed

@@ -1,16 +1,16 @@
 # Flask and request authentication
-SECRET_KEY=<MASKED_SECRET>
+SECRET_KEY=<SECRET_KEY>
 # External API endpoints
-GET_USE_INFO_URL=<MASKED_URL>
-GET_ORG_INFO_URL=<MASKED_URL>
-GET_JIRA_INFO_URL=<MASKED_URL>
-GET_BIGDATA_URL=<MASKED_URL>
-GET_UNION_BASE_URL=<MASKED_URL>
+GET_USE_INFO_URL=https://10.80.100.236:8443/common/getUserInfo
+GET_ORG_INFO_URL=https://10.80.100.236:8443/api/getOrgInfoByOrgCode
+GET_JIRA_INFO_URL=https://10.80.100.236:8443/api/getjiraData
+GET_BIGDATA_URL=https://10.80.100.236:8443/union-op/bigdata/query
+GET_UNION_BASE_URL=https://10.16.100.236:8443/
 # Legacy external API tokens
-GET_ORG_INFO_URL_TOKEN=<MASKED_TOKEN>
-GET_JIRA_INFO_URL_TOKEN=<MASKED_TOKEN>
+GET_ORG_INFO_URL_TOKEN=<GET_ORG_INFO_URL_TOKEN>
+GET_JIRA_INFO_URL_TOKEN=<GET_JIRA_INFO_URL_TOKEN>
 # Authorization and logging
 PERMISSIONS=
@@ -20,25 +20,25 @@ LOG_DIR=/data/appLogs
 # Runtime environment and JWT
 FLASK_ENV=prod.sz31
-JWT_SECRET_KEY=<MASKED_SECRET>
+JWT_SECRET_KEY=<JWT_SECRET_KEY>
 JWT_EXPIRATION_SECOND=900
 JWT_RENEW_SECOND=700
 # LLM provider
-LLM_URL=<MASKED_URL>
-LLM_KEY=<MASKED_KEY>
+LLM_URL=<LLM_URL>
+LLM_KEY=<LLM_KEY>
 LLM_MODEL=glm-5
 LLM_MAX_TOKENS=4096
 LLM_TEMPERATURE=0.7
 LLM_TOP_P=0.9
 # Chat behavior
-SYSTEM_PROMPT=<MASKED_BUSINESS_VALUE>
+SYSTEM_PROMPT=你是网络支付清算平台（网联平台）联合运维的智能客服助手，面向联合运维成员单位提供咨询与指引服务。
 # Business filter
 FILTER_ENABLED=false
-FILTER_ALLOWED_KEYWORDS=<MASKED_BUSINESS_VALUE>
-FILTER_REJECTION_MESSAGE=<MASKED_BUSINESS_VALUE>
+FILTER_ALLOWED_KEYWORDS=网联,联合运维,运维,生产变更,变更,生产运行,运行,系统成功率,业务成功率,异常,故障,定级,关闭渠道,联合处置,大型单位,中型单位,小型单位,银行,支付,清算
+FILTER_REJECTION_MESSAGE=抱歉，我是联合运维智能客服，只能回答与联合运维相关的问题，例如生产变更、生产运行、故障定级、周期评价、业务范围等。请重新描述您的问题。
 # Tool and conversation settings
 TOOLS_MAX_ROUNDS=5

package/app/.env.test.bj12 CHANGED Viewed

@@ -1,16 +1,16 @@
 # Flask and request authentication
-SECRET_KEY=<MASKED_SECRET>
+SECRET_KEY=<SECRET_KEY>
 # External API endpoints
-GET_USE_INFO_URL=<MASKED_URL>
-GET_ORG_INFO_URL=<MASKED_URL>
-GET_JIRA_INFO_URL=<MASKED_URL>
-GET_BIGDATA_URL=<MASKED_URL>
-GET_UNION_BASE_URL=<MASKED_URL>
+GET_USE_INFO_URL=https://10.47.214.188:8443/common/getUserInfo
+GET_ORG_INFO_URL=https://10.47.214.188:8443/api/getOrgInfoByOrgCode
+GET_JIRA_INFO_URL=http://172.31.3.134:8080/vmock/jira-data
+GET_BIGDATA_URL=http://172.31.3.134:8080/vmock/ai/fullLinkData
+GET_UNION_BASE_URL=http://172.31.3.134:8080/
 # Legacy external API tokens
-GET_ORG_INFO_URL_TOKEN=<MASKED_TOKEN>
-GET_JIRA_INFO_URL_TOKEN=<MASKED_TOKEN>
+GET_ORG_INFO_URL_TOKEN=<GET_ORG_INFO_URL_TOKEN>
+GET_JIRA_INFO_URL_TOKEN=<GET_JIRA_INFO_URL_TOKEN>
 # Authorization and logging
 PERMISSIONS=
@@ -20,25 +20,25 @@ LOG_DIR=/data/appLogs
 # Runtime environment and JWT
 FLASK_ENV=test.prod.bj12
-JWT_SECRET_KEY=<MASKED_SECRET>
+JWT_SECRET_KEY=<JWT_SECRET_KEY>
 JWT_EXPIRATION_SECOND=900
 JWT_RENEW_SECOND=700
 # LLM provider
-LLM_URL=<MASKED_URL>
-LLM_KEY=<MASKED_KEY>
+LLM_URL=<LLM_URL>
+LLM_KEY=<LLM_KEY>
 LLM_MODEL=glm-5
 LLM_MAX_TOKENS=4096
 LLM_TEMPERATURE=0.7
 LLM_TOP_P=0.9
 # Chat behavior
-SYSTEM_PROMPT=<MASKED_BUSINESS_VALUE>
+SYSTEM_PROMPT=你是网络支付清算平台（网联平台）联合运维的智能客服助手，面向联合运维成员单位提供咨询与指引服务。
 # Business filter
 FILTER_ENABLED=false
-FILTER_ALLOWED_KEYWORDS=<MASKED_BUSINESS_VALUE>
-FILTER_REJECTION_MESSAGE=<MASKED_BUSINESS_VALUE>
+FILTER_ALLOWED_KEYWORDS=网联,联合运维,运维,生产变更,变更,生产运行,运行,系统成功率,业务成功率,异常,故障,定级,关闭渠道,联合处置,大型单位,中型单位,小型单位,银行,支付,清算
+FILTER_REJECTION_MESSAGE=抱歉，我是联合运维智能客服，只能回答与联合运维相关的问题，例如生产变更、生产运行、故障定级、周期评价、业务范围等。请重新描述您的问题。
 # Tool and conversation settings
 TOOLS_MAX_ROUNDS=5

package/app/config/env_config.py CHANGED Viewed

@@ -71,6 +71,12 @@ class Config:
     )
     TOOLS_MAX_ROUNDS = _env_int("TOOLS_MAX_ROUNDS", 5)
+    TOOL_CALL_HEARTBEAT_INTERVAL = _env_float("TOOL_CALL_HEARTBEAT_INTERVAL", 15.0)
+    CHAT_OPENING_QUESTIONS = _env_list("CHAT_OPENING_QUESTIONS", [
+        "上周全链路运行质量如何",
+        "最近有哪些成员机构交易异常",
+        "当前系统运行风险点有哪些",
+    ])
     CONVERSATION_MAX_HISTORY = _env_int("CONVERSATION_MAX_HISTORY", 20)
     CONVERSATION_TTL = _env_int("CONVERSATION_TTL", 3600)

package/app/manager/chatstream_manager.py CHANGED Viewed

@@ -14,6 +14,8 @@ class ChatstreamManager:
         self._chat_service = chat_service
         self._rag_service = rag_service
         self._conversations: Dict[str, Dict] = {}
+        # ponytail: process-local guard; use shared storage only if workers need cross-process cancellation.
+        self._active_streams: Dict[str, Dict] = {}
         self._max_history = config["CONVERSATION_MAX_HISTORY"]
         self._ttl = config["CONVERSATION_TTL"]
         self._lock = threading.Lock()
@@ -62,6 +64,24 @@ class ChatstreamManager:
             if len(conversation["messages"]) > max_messages:
                 conversation["messages"] = conversation["messages"][-max_messages:]
+    def _start_stream(self, jsessionid: str, conversation_id: str) -> threading.Event:
+        abort_event = threading.Event()
+        with self._lock:
+            active = self._active_streams.get(jsessionid)
+            if active and active["conversation_id"] != conversation_id:
+                active["abort_event"].set()
+            self._active_streams[jsessionid] = {
+                "conversation_id": conversation_id,
+                "abort_event": abort_event,
+            }
+        return abort_event
+    def _finish_stream(self, jsessionid: str, abort_event: threading.Event):
+        with self._lock:
+            active = self._active_streams.get(jsessionid)
+            if active and active["abort_event"] is abort_event:
+                del self._active_streams[jsessionid]
     def chat_stream(
         self,
         conversation_id: Optional[str],
@@ -69,22 +89,34 @@ class ChatstreamManager:
         jsessionid: str,
     ) -> Generator[ChatResponse, None, None]:
         normalized_conversation_id = self.normalize_conversation_id(conversation_id)
+        abort_event = self._start_stream(jsessionid, normalized_conversation_id)
         history = self._get_history(normalized_conversation_id)
         answer_parts: List[str] = []
-        stopped = False
+        saved = False
-        for chunk in self._chat_service.tool_call_stream(
-            normalized_conversation_id,
-            question,
-            tools,
-            history,
-            jsessionid,
-        ):
-            if chunk.content:
-                answer_parts.append(chunk.content)
-            if chunk.finish_reason == "stop":
-                stopped = True
-            yield chunk
+        try:
+            for chunk in self._chat_service.tool_call_stream(
+                normalized_conversation_id,
+                question,
+                tools,
+                history,
+                jsessionid,
+            ):
+                if abort_event.is_set():
+                    yield ChatResponse(
+                        conversationId=normalized_conversation_id,
+                        content="当前对话已被新的对话替换，已停止。",
+                        finish_reason="abort",
+                    )
+                    return
+                if chunk.content:
+                    answer_parts.append(chunk.content)
+                if chunk.finish_reason and answer_parts and not saved:
+                    self._append_exchange(normalized_conversation_id, question, "".join(answer_parts))
+                    saved = True
+                yield chunk
-        if stopped:
-            self._append_exchange(normalized_conversation_id, question, "".join(answer_parts))
+            if answer_parts and not saved:
+                self._append_exchange(normalized_conversation_id, question, "".join(answer_parts))
+        finally:
+            self._finish_stream(jsessionid, abort_event)

package/app/models/schemas.py CHANGED Viewed

@@ -1,11 +1,11 @@
-from typing import Literal, Optional
+from typing import Any, Dict, Literal, Optional
 from pydantic import BaseModel, ConfigDict, Field
 class ChatRequest(BaseModel):
     """聊天请求模型"""
-    model_config = ConfigDict(extra="forbid")
+    model_config = ConfigDict(extra="ignore")
     conversation_id: Optional[str] = Field(
         default=None,
@@ -24,7 +24,9 @@ class ChatResponse(BaseModel):
     reasoning_content: Optional[str] = Field(default=None, description="模型推理内容增量")
     tool_call: Optional[str] = Field(default=None, description="工具调用信息")
     tool_result: Optional[str] = Field(default=None, description="工具执行结果")
-    finish_reason: Optional[Literal["stop", "error", "rejected", "done"]] = Field(
+    heartbeat: Optional[Dict[str, Any]] = Field(default=None, description="长耗时工具调用心跳")
+    error_msg: Optional[str] = Field(default=None, alias="errorMsg", description="错误信息")
+    finish_reason: Optional[Literal["stop", "error", "rejected", "done", "abort"]] = Field(
         default=None,
         description="结束原因；中间流式增量为空",
     )

package/app/service/chat_service.py CHANGED Viewed

@@ -1,3 +1,7 @@
+import json
+import time
+from concurrent.futures import ThreadPoolExecutor, TimeoutError as FutureTimeoutError
+from datetime import datetime, timedelta, timezone
 from pathlib import Path
 from typing import Dict, Generator, List
@@ -14,6 +18,36 @@ def _preview(text: str, limit: int = 300) -> str:
     return str(text).replace("\n", " ")[:limit]
+PUBLIC_TOOL_RESULT_FIELDS = ("tool_name", "display_name", "arguments", "status", "message")
+def _public_tool_result(tool_result: str) -> str:
+    try:
+        payload = json.loads(tool_result)
+    except json.JSONDecodeError:
+        payload = {}
+    if not isinstance(payload, dict):
+        payload = {}
+    public_payload = {key: payload[key] for key in PUBLIC_TOOL_RESULT_FIELDS if key in payload}
+    public_payload.setdefault("message", "工具调用完成")
+    return json.dumps(public_payload, ensure_ascii=False)
+def _time_context() -> str:
+    now = datetime.now(timezone.utc).astimezone(timezone(timedelta(hours=8)))
+    return (
+        "当前基准时间："
+        f"{now:%Y-%m-%d %H:%M:%S} UTC+8。"
+        "用户问题中的“当前、近期、上周、昨天、今天”等相对时间，均按该基准时间计算。"
+    )
 def _load_prompts() -> Dict[str, str]:
     path = Path(__file__).resolve().parents[2] / "tools" / "prompts.yaml"
     if not path.exists():
@@ -55,6 +89,7 @@ class ChatService:
         self._top_p = config["LLM_TOP_P"]
         self._system_prompt = config["SYSTEM_PROMPT"]
         self._tools_max_rounds = config["TOOLS_MAX_ROUNDS"]
+        self._tool_heartbeat_interval = float(config.get("TOOL_CALL_HEARTBEAT_INTERVAL", 15.0))
         self._rag = rag_service
         self._union_service = union_service
@@ -76,6 +111,7 @@ class ChatService:
         messages = []
         if self._system_prompt:
             messages.append({"role": "system", "content": self._system_prompt})
+        messages.append({"role": "system", "content": _time_context()})
         messages.extend(history)
         messages.append({"role": "user", "content": user_question})
         return messages
@@ -118,12 +154,32 @@ class ChatService:
             return ChatResponse(conversationId=conversation_id, tool_call=tool_call)
         def tool_result_event(tool_result: str) -> ChatResponse:
-            return ChatResponse(conversationId=conversation_id, tool_result=tool_result)
+            return ChatResponse(conversationId=conversation_id, tool_result=_public_tool_result(tool_result))
+        def heartbeat_event(tool_name: str, elapsed_seconds: float) -> ChatResponse:
+            return ChatResponse(
+                conversationId=conversation_id,
+                heartbeat={
+                    "type": "tool_call_running",
+                    "tool": tool_name,
+                    "elapsedSeconds": round(elapsed_seconds, 3),
+                    "message": f"工具 {tool_name} 仍在执行，请继续等待。",
+                },
+            )
+        def error_event(error_msg: str) -> ChatResponse:
+            return ChatResponse(
+                conversationId=conversation_id,
+                content=f"[错误] {error_msg}",
+                errorMsg=error_msg,
+                finish_reason="error",
+            )
         try:
             messages = self._build_tool_messages(history, question)
             max_rounds = self._tools_max_rounds
             final_answer = ""
+            completed_without_tool_call = False
             logger.info(f"开始模型流式调用。conversation_id={conversation_id} model={self._model} question={_preview(question, 120)}")
             for round_idx in range(max_rounds):
@@ -168,6 +224,7 @@ class ChatService:
                 if not tool_calls_map:
                     final_answer = current_content
+                    completed_without_tool_call = True
                     break
                 assistant_tool_calls = [tool_calls_map[i] for i in sorted(tool_calls_map)]
@@ -189,16 +246,33 @@ class ChatService:
                         rag_service=self._rag,
                         jsessionid=jsessionid,
                     )
-                    result = call_function(name, args, tool_context)
+                    result = yield from self._call_function_with_heartbeats(
+                        name,
+                        args,
+                        tool_context,
+                        heartbeat_event,
+                    )
                     logger.info(f"工具调用完成。conversation_id={conversation_id} tool={name} result_preview={_preview(result, 300)}")
                     yield tool_result_event(result)
+                    tool_error = self._extract_tool_error(result)
+                    if tool_error:
+                        logger.error(f"工具调用失败。conversation_id={conversation_id} tool={name} error={tool_error}")
+                        yield error_event(f"工具调用失败: {tool_error}")
+                        return
                     messages.append({
                         "role": "tool",
                         "content": result,
                         "tool_call_id": tc["id"],
                     })
+            if not completed_without_tool_call:
+                error_msg = f"工具调用轮数达到上限（{max_rounds}轮）"
+                logger.error(f"对话异常结束。conversation_id={conversation_id} error={error_msg}")
+                yield error_event(error_msg)
+                return
             logger.info(f"对话完成。conversation_id={conversation_id} final_answer_chars={len(final_answer)} final_answer_preview={_preview(final_answer)}")
             yield ChatResponse(conversationId=conversation_id, finish_reason="stop")
@@ -207,9 +281,52 @@ class ChatService:
             yield ChatResponse(
                 conversationId=conversation_id,
                 content=f"[错误] 模型调用异常: {str(e)}",
+                errorMsg=f"模型调用异常: {str(e)}",
                 finish_reason="error",
             )
+    def _call_function_with_heartbeats(
+        self,
+        name: str,
+        args: str,
+        tool_context: ToolContext,
+        heartbeat_event,
+    ) -> Generator[ChatResponse, None, str]:
+        interval = self._tool_heartbeat_interval
+        if interval <= 0:
+            return call_function(name, args, tool_context)
+        executor = ThreadPoolExecutor(max_workers=1)
+        future = executor.submit(call_function, name, args, tool_context)
+        started_at = time.monotonic()
+        try:
+            while True:
+                try:
+                    return future.result(timeout=interval)
+                except FutureTimeoutError:
+                    yield heartbeat_event(name, time.monotonic() - started_at)
+        finally:
+            executor.shutdown(wait=False, cancel_futures=True)
+    @staticmethod
+    def _extract_tool_error(result: str) -> str:
+        try:
+            payload = json.loads(result)
+        except json.JSONDecodeError:
+            return ""
+        if not isinstance(payload, dict):
+            return ""
+        error = payload.get("error")
+        if error:
+            return str(error)
+        status = payload.get("status")
+        if status and status != "success":
+            message = payload.get("message") or f"工具返回状态: {status}"
+            return str(message)
+        return ""
     @staticmethod
     def _merge_tool_call_delta(tool_calls_map: Dict[int, Dict], tc) -> None:
         """将单个流式 tool_call 增量按 index 合并到累积字典中"""

package/app/service/union_service.py CHANGED Viewed

@@ -12,6 +12,7 @@ class UnionService:
     # 常量定义
     API_MAX_RETRIES = 10  # API最大重试次数
+    BIGDATA_API_TIMEOUT = 300
     BIGDATA_INTERFACE_FULL_LINK = "running_cnt.full_link_monthly"
     BIGDATA_INTERFACE_BANK_MONTHLY = "running_cnt.bank_monthly"
@@ -84,8 +85,14 @@ class UnionService:
                 url=url,
                 headers=self._get_union_headers(jsessionid),
                 json_data=payload,
+                timeout=self.BIGDATA_API_TIMEOUT,
                 max_retries=self.API_MAX_RETRIES,
             )
+            if not response.get("success", True):
+                raise RuntimeError(response.get("error_msg", "请求失败"))
+            status_code = response.get("status_code")
+            if status_code and status_code >= 400:
+                raise RuntimeError(f"请求失败：HTTP {status_code}")
             logger.info(f"{description}成功")
             return self._extract_response_data(response), "success"
         except Exception as e:

package/app/utils/common_utils.py CHANGED Viewed

@@ -30,7 +30,7 @@ def call_https_api(
         data: Optional[Dict[str, Any]] = None,
         json_data: Optional[Dict[str, Any]] = None,
         headers: Optional[Dict[str, str]] = None,
-        timeout: int = 30,
+    timeout: int = 10,
         verify_ssl: bool = False,
         auth: Optional[tuple] = None,
         proxies: Optional[Dict[str, Any]] = None,

package/app/views/view_chatstream.py CHANGED Viewed

@@ -1,3 +1,6 @@
+import re
+from itertools import chain
 from pydantic import ValidationError
 from flask import Blueprint, current_app, request, Response, jsonify, stream_with_context, g
@@ -10,6 +13,25 @@ def _sse_event(event: str, data: str) -> str:
     return f"event: {event}\ndata: {data}\n\n"
+def _error_status(error_msg: str) -> int:
+    match = re.search(r"Error code: (\d{3})", error_msg)
+    if match:
+        status = int(match.group(1))
+        if 400 <= status <= 599:
+            return status
+    return 500
+def _error_payload(chunk: ChatResponse) -> dict:
+    error_msg = chunk.error_msg or chunk.content or "聊天流异常"
+    return {
+        "conversationId": chunk.conversation_id,
+        "detail": error_msg,
+        "errorMsg": error_msg,
+        "finish_reason": "error",
+    }
 def _chatstream_manager():
     return current_app.extensions["chatstream_manager"]
@@ -27,6 +49,13 @@ def rag_force_rebuild():
         return jsonify({"detail": str(exc)}), 500
+@chatstream.post("/chat/opening")
+def chat_opening():
+    return jsonify({
+        "suggestedQuestions": current_app.config.get("CHAT_OPENING_QUESTIONS", [])
+    })
 @chatstream.route("/chat/stream", methods=["OPTIONS", "POST"])
 def chat_stream_endpoint():
     if request.method == "OPTIONS":
@@ -37,12 +66,40 @@ def chat_stream_endpoint():
     except ValidationError as exc:
         return jsonify({"detail": exc.errors()}), 422
+    conversation_id = chat_request.conversation_id
+    jsessionid = g.current_user["jsessionid"]
+    stream = _chatstream_manager().chat_stream(conversation_id, chat_request.question, jsessionid)
+    try:
+        first_chunk = next(stream)
+    except StopIteration:
+        first_chunk = ChatResponse(conversationId=conversation_id, finish_reason="done")
+    except Exception as exc:
+        error_msg = f"聊天流异常: {exc}"
+        return jsonify({"detail": error_msg, "errorMsg": error_msg, "finish_reason": "error"}), 500
+    if first_chunk.finish_reason == "error":
+        return jsonify(_error_payload(first_chunk)), _error_status(first_chunk.error_msg or first_chunk.content or "")
     def event_generator():
-        conversation_id = chat_request.conversation_id
-        jsessionid = g.current_user["jsessionid"]
-        for chunk in _chatstream_manager().chat_stream(conversation_id, chat_request.question, jsessionid):
-            conversation_id = chunk.conversation_id
-            yield _sse_event("message", chunk.model_dump_json(by_alias=True))
+        nonlocal conversation_id
+        try:
+            for chunk in chain([first_chunk], stream):
+                conversation_id = chunk.conversation_id
+                event = "heartbeat" if chunk.heartbeat else "message"
+                yield _sse_event(event, chunk.model_dump_json(by_alias=True))
+                if chunk.finish_reason == "error":
+                    return
+        except Exception as exc:
+            error_msg = f"聊天流异常: {exc}"
+            error = ChatResponse(
+                conversationId=conversation_id,
+                content=f"[错误] {error_msg}",
+                errorMsg=error_msg,
+                finish_reason="error",
+            )
+            yield _sse_event("message", error.model_dump_json(by_alias=True))
+            return
         done = ChatResponse(conversationId=conversation_id, finish_reason="done")
         yield _sse_event("done", done.model_dump_json(by_alias=True))

package/app/wsgi.py CHANGED Viewed

@@ -34,4 +34,4 @@ except Exception:
 if __name__ == '__main__':
     if 'dev' in app.config["FLASK_ENV"]:
-        app.run(debug=True, host='0.0.0.0', port=8000)
+        app.run(debug=True, host='0.0.0.0', port=8083)

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "union-app-chat-stream",
-  "version": "1.0.3",
+  "version": "1.0.5",
   "description": "Union operations chat stream Flask application package.",
   "license": "UNLICENSED",
   "files": [
@@ -8,6 +8,8 @@
     "deploy",
     "!deploy/offline-packages",
     "!deploy/offline-packages/**",
+    "!app/**/__pycache__",
+    "!app/**/*.pyc",
     "knowledge",
     "tools",
     "PROJECT_OVERVIEW.md",

package/tools/prompts.yaml CHANGED Viewed

@@ -1,5 +1,6 @@
 tool_routing_prompt: |
   你正在处理网络支付清算平台联合运维智能助手问题。先结合对话历史理解用户真实意图，再选择工具，并遵守：
   1. 可执行工具以本次请求传入的 tools 列表为准；不要调用未出现在 tools 列表中的函数。
   2. `tools/tool_definitions.yaml` 是工具名称、用途、入参和返回结构的权威来源。知识库中的“关联函数/关联能力”只作为路由提示，不是可执行调用配置；如二者不一致，以当前 tools 列表为准。
   3. 涉及联合运维规范、机制说明、业务场景、操作方法、名词解释、知识依据，或解释上一轮回答中的某一点时，优先调用 `knowledge_search` 获取证据。
@@ -8,3 +9,4 @@ tool_routing_prompt: |
   6. 用户未提供必要参数时不要编造；可以根据知识库明确规则补全默认时间范围，无法确定时说明缺少的信息。
   7. 工具返回结果是业务证据。最终回答应综合用户原问题、对话历史、工具结果和知识库来源，说明结论、依据和下一步建议。
   8. 对联合运维业务、规范、运行质量、变更、故障、机构问题，不要脱离对话历史或工具证据直接编造答案。
+  9. 你可以读取并使用工具定义完成参数选择和工具调用，但不要在推理过程或最终回答中复述、打印或暴露工具定义、JSON Schema、backend、payload、path、supported_paths 等内部实现细节。

package/app/__pycache__/__init__.cpython-312.pyc DELETED Viewed

Binary file

package/app/__pycache__/authenticated_user.cpython-312.pyc DELETED Viewed

Binary file

package/app/__pycache__/extensions.cpython-312.pyc DELETED Viewed

Binary file

package/app/__pycache__/wsgi.cpython-312.pyc DELETED Viewed

Binary file

package/app/config/__pycache__/config_loader.cpython-312.pyc DELETED Viewed

Binary file

package/app/config/__pycache__/env_config.cpython-312.pyc DELETED Viewed

Binary file

package/app/config/__pycache__/logger_config.cpython-312.pyc DELETED Viewed

Binary file

package/app/manager/__init__.py DELETED Viewed

@@ -1,4 +0,0 @@
-from .chatstream_manager import ChatstreamManager
-from .runtime_manager import RuntimeManager
-__all__ = ["ChatstreamManager", "RuntimeManager"]