botrun-flow-lang 5.12.263__py3-none-any.whl → 5.12.264__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- botrun_flow_lang/api/auth_api.py +39 -39
- botrun_flow_lang/api/auth_utils.py +183 -183
- botrun_flow_lang/api/botrun_back_api.py +65 -65
- botrun_flow_lang/api/flow_api.py +3 -3
- botrun_flow_lang/api/hatch_api.py +508 -508
- botrun_flow_lang/api/langgraph_api.py +811 -811
- botrun_flow_lang/api/line_bot_api.py +1484 -1484
- botrun_flow_lang/api/model_api.py +300 -300
- botrun_flow_lang/api/rate_limit_api.py +32 -32
- botrun_flow_lang/api/routes.py +79 -79
- botrun_flow_lang/api/search_api.py +53 -53
- botrun_flow_lang/api/storage_api.py +395 -395
- botrun_flow_lang/api/subsidy_api.py +290 -290
- botrun_flow_lang/api/subsidy_api_system_prompt.txt +109 -109
- botrun_flow_lang/api/user_setting_api.py +70 -70
- botrun_flow_lang/api/version_api.py +31 -31
- botrun_flow_lang/api/youtube_api.py +26 -26
- botrun_flow_lang/constants.py +13 -13
- botrun_flow_lang/langgraph_agents/agents/agent_runner.py +178 -178
- botrun_flow_lang/langgraph_agents/agents/agent_tools/step_planner.py +77 -77
- botrun_flow_lang/langgraph_agents/agents/checkpointer/firestore_checkpointer.py +666 -666
- botrun_flow_lang/langgraph_agents/agents/gov_researcher/GOV_RESEARCHER_PRD.md +192 -192
- botrun_flow_lang/langgraph_agents/agents/gov_researcher/gemini_subsidy_graph.py +460 -460
- botrun_flow_lang/langgraph_agents/agents/gov_researcher/gov_researcher_2_graph.py +1002 -1002
- botrun_flow_lang/langgraph_agents/agents/gov_researcher/gov_researcher_graph.py +822 -822
- botrun_flow_lang/langgraph_agents/agents/langgraph_react_agent.py +723 -723
- botrun_flow_lang/langgraph_agents/agents/search_agent_graph.py +864 -864
- botrun_flow_lang/langgraph_agents/agents/tools/__init__.py +4 -4
- botrun_flow_lang/langgraph_agents/agents/tools/gemini_code_execution.py +376 -376
- botrun_flow_lang/langgraph_agents/agents/util/gemini_grounding.py +66 -66
- botrun_flow_lang/langgraph_agents/agents/util/html_util.py +316 -316
- botrun_flow_lang/langgraph_agents/agents/util/img_util.py +294 -294
- botrun_flow_lang/langgraph_agents/agents/util/local_files.py +419 -419
- botrun_flow_lang/langgraph_agents/agents/util/mermaid_util.py +86 -86
- botrun_flow_lang/langgraph_agents/agents/util/model_utils.py +143 -143
- botrun_flow_lang/langgraph_agents/agents/util/pdf_analyzer.py +486 -486
- botrun_flow_lang/langgraph_agents/agents/util/pdf_cache.py +250 -250
- botrun_flow_lang/langgraph_agents/agents/util/pdf_processor.py +204 -204
- botrun_flow_lang/langgraph_agents/agents/util/perplexity_search.py +464 -464
- botrun_flow_lang/langgraph_agents/agents/util/plotly_util.py +59 -59
- botrun_flow_lang/langgraph_agents/agents/util/tavily_search.py +199 -199
- botrun_flow_lang/langgraph_agents/agents/util/youtube_util.py +90 -90
- botrun_flow_lang/langgraph_agents/cache/langgraph_botrun_cache.py +197 -197
- botrun_flow_lang/llm_agent/llm_agent.py +19 -19
- botrun_flow_lang/llm_agent/llm_agent_util.py +83 -83
- botrun_flow_lang/log/.gitignore +2 -2
- botrun_flow_lang/main.py +61 -61
- botrun_flow_lang/main_fast.py +51 -51
- botrun_flow_lang/mcp_server/__init__.py +10 -10
- botrun_flow_lang/mcp_server/default_mcp.py +744 -744
- botrun_flow_lang/models/nodes/utils.py +205 -205
- botrun_flow_lang/models/token_usage.py +34 -34
- botrun_flow_lang/requirements.txt +21 -21
- botrun_flow_lang/services/base/firestore_base.py +30 -30
- botrun_flow_lang/services/hatch/hatch_factory.py +11 -11
- botrun_flow_lang/services/hatch/hatch_fs_store.py +419 -419
- botrun_flow_lang/services/storage/storage_cs_store.py +206 -206
- botrun_flow_lang/services/storage/storage_factory.py +12 -12
- botrun_flow_lang/services/storage/storage_store.py +65 -65
- botrun_flow_lang/services/user_setting/user_setting_factory.py +9 -9
- botrun_flow_lang/services/user_setting/user_setting_fs_store.py +66 -66
- botrun_flow_lang/static/docs/tools/index.html +926 -926
- botrun_flow_lang/tests/api_functional_tests.py +1525 -1525
- botrun_flow_lang/tests/api_stress_test.py +357 -357
- botrun_flow_lang/tests/shared_hatch_tests.py +333 -333
- botrun_flow_lang/tests/test_botrun_app.py +46 -46
- botrun_flow_lang/tests/test_html_util.py +31 -31
- botrun_flow_lang/tests/test_img_analyzer.py +190 -190
- botrun_flow_lang/tests/test_img_util.py +39 -39
- botrun_flow_lang/tests/test_local_files.py +114 -114
- botrun_flow_lang/tests/test_mermaid_util.py +103 -103
- botrun_flow_lang/tests/test_pdf_analyzer.py +104 -104
- botrun_flow_lang/tests/test_plotly_util.py +151 -151
- botrun_flow_lang/tests/test_run_workflow_engine.py +65 -65
- botrun_flow_lang/tools/generate_docs.py +133 -133
- botrun_flow_lang/tools/templates/tools.html +153 -153
- botrun_flow_lang/utils/__init__.py +7 -7
- botrun_flow_lang/utils/botrun_logger.py +344 -344
- botrun_flow_lang/utils/clients/rate_limit_client.py +209 -209
- botrun_flow_lang/utils/clients/token_verify_client.py +153 -153
- botrun_flow_lang/utils/google_drive_utils.py +654 -654
- botrun_flow_lang/utils/langchain_utils.py +324 -324
- botrun_flow_lang/utils/yaml_utils.py +9 -9
- {botrun_flow_lang-5.12.263.dist-info → botrun_flow_lang-5.12.264.dist-info}/METADATA +1 -1
- botrun_flow_lang-5.12.264.dist-info/RECORD +102 -0
- botrun_flow_lang-5.12.263.dist-info/RECORD +0 -102
- {botrun_flow_lang-5.12.263.dist-info → botrun_flow_lang-5.12.264.dist-info}/WHEEL +0 -0
|
@@ -1,250 +1,250 @@
|
|
|
1
|
-
"""
|
|
2
|
-
PDF 快取模組
|
|
3
|
-
|
|
4
|
-
提供 PDF 切片的 GCS 快取功能,避免重複切割相同的 PDF 檔案。
|
|
5
|
-
快取會自動在 7 天後過期(透過 GCS Lifecycle Rule)。
|
|
6
|
-
"""
|
|
7
|
-
|
|
8
|
-
import hashlib
|
|
9
|
-
import json
|
|
10
|
-
from io import BytesIO
|
|
11
|
-
from typing import List, Tuple, Optional
|
|
12
|
-
from datetime import datetime
|
|
13
|
-
|
|
14
|
-
from botrun_flow_lang.services.storage.storage_factory import storage_store_factory
|
|
15
|
-
|
|
16
|
-
# 快取目錄前綴
|
|
17
|
-
PDF_CACHE_PREFIX = "pdf-cache"
|
|
18
|
-
|
|
19
|
-
# 快取過期天數(用於 lifecycle rule)
|
|
20
|
-
PDF_CACHE_EXPIRY_DAYS = 7
|
|
21
|
-
|
|
22
|
-
|
|
23
|
-
def get_cache_key(pdf_url: str) -> str:
|
|
24
|
-
"""
|
|
25
|
-
根據 PDF URL 產生快取 key(hash)
|
|
26
|
-
|
|
27
|
-
Args:
|
|
28
|
-
pdf_url: PDF 檔案的 URL
|
|
29
|
-
|
|
30
|
-
Returns:
|
|
31
|
-
str: 32 字元的 MD5 hash
|
|
32
|
-
"""
|
|
33
|
-
return hashlib.md5(pdf_url.encode()).hexdigest()
|
|
34
|
-
|
|
35
|
-
|
|
36
|
-
def _get_cache_path(cache_key: str) -> str:
|
|
37
|
-
"""
|
|
38
|
-
取得快取目錄路徑
|
|
39
|
-
|
|
40
|
-
Args:
|
|
41
|
-
cache_key: 快取 key
|
|
42
|
-
|
|
43
|
-
Returns:
|
|
44
|
-
str: GCS 路徑,格式為 "pdf-cache/{cache_key}"
|
|
45
|
-
"""
|
|
46
|
-
return f"{PDF_CACHE_PREFIX}/{cache_key}"
|
|
47
|
-
|
|
48
|
-
|
|
49
|
-
def _get_metadata_path(cache_key: str) -> str:
|
|
50
|
-
"""取得 metadata 檔案路徑"""
|
|
51
|
-
return f"{_get_cache_path(cache_key)}/metadata.json"
|
|
52
|
-
|
|
53
|
-
|
|
54
|
-
def _get_chunk_path(cache_key: str, chunk_index: int) -> str:
|
|
55
|
-
"""取得切片檔案路徑"""
|
|
56
|
-
return f"{_get_cache_path(cache_key)}/chunk-{chunk_index:03d}.pdf"
|
|
57
|
-
|
|
58
|
-
|
|
59
|
-
async def check_cache(cache_key: str) -> Optional[List[Tuple[bytes, str]]]:
    """Look up a cached set of PDF chunks in GCS.

    Args:
        cache_key: Cache key produced by get_cache_key().

    Returns:
        Optional[List[Tuple[bytes, str]]]: List of (chunk_bytes, page_range)
        tuples when a complete cache entry exists, otherwise None.
    """
    try:
        store = storage_store_factory()
        meta_path = _get_metadata_path(cache_key)

        # No metadata file means there is no cache entry at all.
        if not await store.file_exists(meta_path):
            print(f"[pdf_cache] 快取不存在: {cache_key}")
            return None

        meta_buf = await store.retrieve_file(meta_path)
        if not meta_buf:
            print(f"[pdf_cache] 無法讀取 metadata: {cache_key}")
            return None

        meta = json.loads(meta_buf.getvalue().decode("utf-8"))
        chunk_count = meta.get("chunk_count", 0)
        page_ranges = meta.get("page_ranges", [])

        if chunk_count == 0:
            print(f"[pdf_cache] 快取無切片: {cache_key}")
            return None

        print(f"[pdf_cache] 找到快取: {cache_key}, {chunk_count} 個切片")

        # Load every chunk; a single missing chunk invalidates the whole entry.
        result: List[Tuple[bytes, str]] = []
        for idx in range(chunk_count):
            chunk_buf = await store.retrieve_file(_get_chunk_path(cache_key, idx))

            if not chunk_buf:
                print(f"[pdf_cache] 無法讀取切片 {idx}: {cache_key}")
                return None  # incomplete cache entry — do not use it

            if idx < len(page_ranges):
                page_range = page_ranges[idx]
            else:
                page_range = f"chunk-{idx:03d}"
            result.append((chunk_buf.getvalue(), page_range))

        print(f"[pdf_cache] 成功載入快取: {cache_key}")
        return result

    except Exception as e:
        print(f"[pdf_cache] 檢查快取時發生錯誤: {e}")
        return None
|
|
114
|
-
|
|
115
|
-
|
|
116
|
-
async def save_to_cache(
    cache_key: str,
    chunks: List[Tuple[bytes, str]],
    original_url: str,
    original_size_mb: float,
    total_pages: int,
) -> bool:
    """Store PDF chunks and their metadata in the GCS cache.

    Args:
        cache_key: Cache key produced by get_cache_key().
        chunks: List of (chunk_bytes, page_range) tuples to store.
        original_url: URL of the original PDF.
        original_size_mb: Size of the original file in MB.
        total_pages: Total page count of the original PDF.

    Returns:
        bool: True when every chunk and the metadata were stored successfully.
    """
    # Local import: the module header only imports `datetime` itself.
    from datetime import timezone

    try:
        storage = storage_store_factory()

        # 1. Store every chunk first; abort on the first failure so we never
        #    write a metadata file that points at missing chunks.
        page_ranges = []
        for i, (chunk_bytes, page_range) in enumerate(chunks):
            chunk_path = _get_chunk_path(cache_key, i)
            chunk_file = BytesIO(chunk_bytes)

            success, _ = await storage.store_file(
                chunk_path, chunk_file, public=False, content_type="application/pdf"
            )

            if not success:
                print(f"[pdf_cache] 無法存入切片 {i}: {cache_key}")
                return False

            page_ranges.append(page_range)

        # 2. Store the metadata last, so its presence implies a complete entry.
        metadata = {
            "original_url": original_url,
            "cache_key": cache_key,
            "chunk_count": len(chunks),
            "page_ranges": page_ranges,
            "original_size_mb": original_size_mb,
            "total_pages": total_pages,
            # Fix: datetime.utcnow() is deprecated (Python 3.12) and returns a
            # naive datetime. Use an explicit UTC-aware timestamp; the ISO
            # string now carries a "+00:00" offset, which remains valid ISO 8601.
            "created_at": datetime.now(timezone.utc).isoformat(),
        }

        metadata_path = _get_metadata_path(cache_key)
        metadata_file = BytesIO(json.dumps(metadata, ensure_ascii=False).encode("utf-8"))

        success, _ = await storage.store_file(
            metadata_path, metadata_file, public=False, content_type="application/json"
        )

        if not success:
            print(f"[pdf_cache] 無法存入 metadata: {cache_key}")
            return False

        print(
            f"[pdf_cache] 成功存入快取: {cache_key}, "
            f"{len(chunks)} 個切片, {total_pages} 頁"
        )
        return True

    except Exception as e:
        print(f"[pdf_cache] 存入快取時發生錯誤: {e}")
        return False
|
|
186
|
-
|
|
187
|
-
|
|
188
|
-
async def get_cache_metadata(cache_key: str) -> Optional[dict]:
    """Fetch only the metadata of a cache entry, without loading any chunks.

    Args:
        cache_key: Cache key produced by get_cache_key().

    Returns:
        Optional[dict]: Parsed metadata dictionary, or None when the entry
        is absent or unreadable.
    """
    try:
        store = storage_store_factory()
        meta_path = _get_metadata_path(cache_key)

        if not await store.file_exists(meta_path):
            return None

        meta_buf = await store.retrieve_file(meta_path)
        if not meta_buf:
            return None

        raw = meta_buf.getvalue().decode("utf-8")
        return json.loads(raw)

    except Exception as e:
        print(f"[pdf_cache] 讀取 metadata 時發生錯誤: {e}")
        return None
|
|
214
|
-
|
|
215
|
-
|
|
216
|
-
async def delete_cache(cache_key: str) -> bool:
    """Remove a cache entry (all chunks plus the metadata file) from GCS.

    Args:
        cache_key: Cache key produced by get_cache_key().

    Returns:
        bool: True when the entry was deleted or did not exist.
    """
    try:
        store = storage_store_factory()

        # The metadata tells us how many chunk files there are to remove.
        meta = await get_cache_metadata(cache_key)
        if not meta:
            return True  # nothing cached — treat as success

        # Delete every chunk, then the metadata file last.
        for idx in range(meta.get("chunk_count", 0)):
            await store.delete_file(_get_chunk_path(cache_key, idx))

        await store.delete_file(_get_metadata_path(cache_key))

        print(f"[pdf_cache] 已刪除快取: {cache_key}")
        return True

    except Exception as e:
        print(f"[pdf_cache] 刪除快取時發生錯誤: {e}")
        return False
|
|
1
|
+
"""
|
|
2
|
+
PDF 快取模組
|
|
3
|
+
|
|
4
|
+
提供 PDF 切片的 GCS 快取功能,避免重複切割相同的 PDF 檔案。
|
|
5
|
+
快取會自動在 7 天後過期(透過 GCS Lifecycle Rule)。
|
|
6
|
+
"""
|
|
7
|
+
|
|
8
|
+
import hashlib
|
|
9
|
+
import json
|
|
10
|
+
from io import BytesIO
|
|
11
|
+
from typing import List, Tuple, Optional
|
|
12
|
+
from datetime import datetime
|
|
13
|
+
|
|
14
|
+
from botrun_flow_lang.services.storage.storage_factory import storage_store_factory
|
|
15
|
+
|
|
16
|
+
# 快取目錄前綴
|
|
17
|
+
PDF_CACHE_PREFIX = "pdf-cache"
|
|
18
|
+
|
|
19
|
+
# 快取過期天數(用於 lifecycle rule)
|
|
20
|
+
PDF_CACHE_EXPIRY_DAYS = 7
|
|
21
|
+
|
|
22
|
+
|
|
23
|
+
def get_cache_key(pdf_url: str) -> str:
|
|
24
|
+
"""
|
|
25
|
+
根據 PDF URL 產生快取 key(hash)
|
|
26
|
+
|
|
27
|
+
Args:
|
|
28
|
+
pdf_url: PDF 檔案的 URL
|
|
29
|
+
|
|
30
|
+
Returns:
|
|
31
|
+
str: 32 字元的 MD5 hash
|
|
32
|
+
"""
|
|
33
|
+
return hashlib.md5(pdf_url.encode()).hexdigest()
|
|
34
|
+
|
|
35
|
+
|
|
36
|
+
def _get_cache_path(cache_key: str) -> str:
|
|
37
|
+
"""
|
|
38
|
+
取得快取目錄路徑
|
|
39
|
+
|
|
40
|
+
Args:
|
|
41
|
+
cache_key: 快取 key
|
|
42
|
+
|
|
43
|
+
Returns:
|
|
44
|
+
str: GCS 路徑,格式為 "pdf-cache/{cache_key}"
|
|
45
|
+
"""
|
|
46
|
+
return f"{PDF_CACHE_PREFIX}/{cache_key}"
|
|
47
|
+
|
|
48
|
+
|
|
49
|
+
def _get_metadata_path(cache_key: str) -> str:
|
|
50
|
+
"""取得 metadata 檔案路徑"""
|
|
51
|
+
return f"{_get_cache_path(cache_key)}/metadata.json"
|
|
52
|
+
|
|
53
|
+
|
|
54
|
+
def _get_chunk_path(cache_key: str, chunk_index: int) -> str:
|
|
55
|
+
"""取得切片檔案路徑"""
|
|
56
|
+
return f"{_get_cache_path(cache_key)}/chunk-{chunk_index:03d}.pdf"
|
|
57
|
+
|
|
58
|
+
|
|
59
|
+
async def check_cache(cache_key: str) -> Optional[List[Tuple[bytes, str]]]:
    """Look up a cached set of PDF chunks in GCS.

    Args:
        cache_key: Cache key produced by get_cache_key().

    Returns:
        Optional[List[Tuple[bytes, str]]]: List of (chunk_bytes, page_range)
        tuples when a complete cache entry exists, otherwise None.
    """
    try:
        store = storage_store_factory()
        meta_path = _get_metadata_path(cache_key)

        # No metadata file means there is no cache entry at all.
        if not await store.file_exists(meta_path):
            print(f"[pdf_cache] 快取不存在: {cache_key}")
            return None

        meta_buf = await store.retrieve_file(meta_path)
        if not meta_buf:
            print(f"[pdf_cache] 無法讀取 metadata: {cache_key}")
            return None

        meta = json.loads(meta_buf.getvalue().decode("utf-8"))
        chunk_count = meta.get("chunk_count", 0)
        page_ranges = meta.get("page_ranges", [])

        if chunk_count == 0:
            print(f"[pdf_cache] 快取無切片: {cache_key}")
            return None

        print(f"[pdf_cache] 找到快取: {cache_key}, {chunk_count} 個切片")

        # Load every chunk; a single missing chunk invalidates the whole entry.
        result: List[Tuple[bytes, str]] = []
        for idx in range(chunk_count):
            chunk_buf = await store.retrieve_file(_get_chunk_path(cache_key, idx))

            if not chunk_buf:
                print(f"[pdf_cache] 無法讀取切片 {idx}: {cache_key}")
                return None  # incomplete cache entry — do not use it

            if idx < len(page_ranges):
                page_range = page_ranges[idx]
            else:
                page_range = f"chunk-{idx:03d}"
            result.append((chunk_buf.getvalue(), page_range))

        print(f"[pdf_cache] 成功載入快取: {cache_key}")
        return result

    except Exception as e:
        print(f"[pdf_cache] 檢查快取時發生錯誤: {e}")
        return None
|
|
114
|
+
|
|
115
|
+
|
|
116
|
+
async def save_to_cache(
    cache_key: str,
    chunks: List[Tuple[bytes, str]],
    original_url: str,
    original_size_mb: float,
    total_pages: int,
) -> bool:
    """Store PDF chunks and their metadata in the GCS cache.

    Args:
        cache_key: Cache key produced by get_cache_key().
        chunks: List of (chunk_bytes, page_range) tuples to store.
        original_url: URL of the original PDF.
        original_size_mb: Size of the original file in MB.
        total_pages: Total page count of the original PDF.

    Returns:
        bool: True when every chunk and the metadata were stored successfully.
    """
    # Local import: the module header only imports `datetime` itself.
    from datetime import timezone

    try:
        storage = storage_store_factory()

        # 1. Store every chunk first; abort on the first failure so we never
        #    write a metadata file that points at missing chunks.
        page_ranges = []
        for i, (chunk_bytes, page_range) in enumerate(chunks):
            chunk_path = _get_chunk_path(cache_key, i)
            chunk_file = BytesIO(chunk_bytes)

            success, _ = await storage.store_file(
                chunk_path, chunk_file, public=False, content_type="application/pdf"
            )

            if not success:
                print(f"[pdf_cache] 無法存入切片 {i}: {cache_key}")
                return False

            page_ranges.append(page_range)

        # 2. Store the metadata last, so its presence implies a complete entry.
        metadata = {
            "original_url": original_url,
            "cache_key": cache_key,
            "chunk_count": len(chunks),
            "page_ranges": page_ranges,
            "original_size_mb": original_size_mb,
            "total_pages": total_pages,
            # Fix: datetime.utcnow() is deprecated (Python 3.12) and returns a
            # naive datetime. Use an explicit UTC-aware timestamp; the ISO
            # string now carries a "+00:00" offset, which remains valid ISO 8601.
            "created_at": datetime.now(timezone.utc).isoformat(),
        }

        metadata_path = _get_metadata_path(cache_key)
        metadata_file = BytesIO(json.dumps(metadata, ensure_ascii=False).encode("utf-8"))

        success, _ = await storage.store_file(
            metadata_path, metadata_file, public=False, content_type="application/json"
        )

        if not success:
            print(f"[pdf_cache] 無法存入 metadata: {cache_key}")
            return False

        print(
            f"[pdf_cache] 成功存入快取: {cache_key}, "
            f"{len(chunks)} 個切片, {total_pages} 頁"
        )
        return True

    except Exception as e:
        print(f"[pdf_cache] 存入快取時發生錯誤: {e}")
        return False
|
|
186
|
+
|
|
187
|
+
|
|
188
|
+
async def get_cache_metadata(cache_key: str) -> Optional[dict]:
    """Fetch only the metadata of a cache entry, without loading any chunks.

    Args:
        cache_key: Cache key produced by get_cache_key().

    Returns:
        Optional[dict]: Parsed metadata dictionary, or None when the entry
        is absent or unreadable.
    """
    try:
        store = storage_store_factory()
        meta_path = _get_metadata_path(cache_key)

        if not await store.file_exists(meta_path):
            return None

        meta_buf = await store.retrieve_file(meta_path)
        if not meta_buf:
            return None

        raw = meta_buf.getvalue().decode("utf-8")
        return json.loads(raw)

    except Exception as e:
        print(f"[pdf_cache] 讀取 metadata 時發生錯誤: {e}")
        return None
|
|
214
|
+
|
|
215
|
+
|
|
216
|
+
async def delete_cache(cache_key: str) -> bool:
    """Remove a cache entry (all chunks plus the metadata file) from GCS.

    Args:
        cache_key: Cache key produced by get_cache_key().

    Returns:
        bool: True when the entry was deleted or did not exist.
    """
    try:
        store = storage_store_factory()

        # The metadata tells us how many chunk files there are to remove.
        meta = await get_cache_metadata(cache_key)
        if not meta:
            return True  # nothing cached — treat as success

        # Delete every chunk, then the metadata file last.
        for idx in range(meta.get("chunk_count", 0)):
            await store.delete_file(_get_chunk_path(cache_key, idx))

        await store.delete_file(_get_metadata_path(cache_key))

        print(f"[pdf_cache] 已刪除快取: {cache_key}")
        return True

    except Exception as e:
        print(f"[pdf_cache] 刪除快取時發生錯誤: {e}")
        return False
|