flowllm 0.1.0__py3-none-any.whl → 0.1.2__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- flowllm/__init__.py +21 -0
- flowllm/app.py +15 -0
- flowllm/client/__init__.py +25 -0
- flowllm/client/async_http_client.py +81 -0
- flowllm/client/http_client.py +81 -0
- flowllm/client/mcp_client.py +133 -0
- flowllm/client/sync_mcp_client.py +116 -0
- flowllm/config/__init__.py +1 -0
- flowllm/config/default.yaml +77 -0
- flowllm/config/empty.yaml +37 -0
- flowllm/config/pydantic_config_parser.py +242 -0
- flowllm/context/base_context.py +79 -0
- flowllm/context/flow_context.py +16 -0
- llmflow/op/prompt_mixin.py → flowllm/context/prompt_handler.py +25 -14
- flowllm/context/registry.py +30 -0
- flowllm/context/service_context.py +147 -0
- flowllm/embedding_model/__init__.py +1 -0
- {llmflow → flowllm}/embedding_model/base_embedding_model.py +93 -2
- {llmflow → flowllm}/embedding_model/openai_compatible_embedding_model.py +71 -13
- flowllm/flow/__init__.py +1 -0
- flowllm/flow/base_flow.py +72 -0
- flowllm/flow/base_tool_flow.py +15 -0
- flowllm/flow/gallery/__init__.py +8 -0
- flowllm/flow/gallery/cmd_flow.py +11 -0
- flowllm/flow/gallery/code_tool_flow.py +30 -0
- flowllm/flow/gallery/dashscope_search_tool_flow.py +34 -0
- flowllm/flow/gallery/deepsearch_tool_flow.py +39 -0
- flowllm/flow/gallery/expression_tool_flow.py +18 -0
- flowllm/flow/gallery/mock_tool_flow.py +67 -0
- flowllm/flow/gallery/tavily_search_tool_flow.py +30 -0
- flowllm/flow/gallery/terminate_tool_flow.py +30 -0
- flowllm/flow/parser/expression_parser.py +171 -0
- flowllm/llm/__init__.py +2 -0
- {llmflow → flowllm}/llm/base_llm.py +100 -18
- flowllm/llm/litellm_llm.py +455 -0
- flowllm/llm/openai_compatible_llm.py +439 -0
- flowllm/op/__init__.py +11 -0
- llmflow/op/react/react_v1_op.py → flowllm/op/agent/react_op.py +17 -22
- flowllm/op/akshare/__init__.py +3 -0
- flowllm/op/akshare/get_ak_a_code_op.py +108 -0
- flowllm/op/akshare/get_ak_a_code_prompt.yaml +21 -0
- flowllm/op/akshare/get_ak_a_info_op.py +140 -0
- flowllm/op/base_llm_op.py +64 -0
- flowllm/op/base_op.py +148 -0
- flowllm/op/base_ray_op.py +313 -0
- flowllm/op/code/__init__.py +1 -0
- flowllm/op/code/execute_code_op.py +42 -0
- flowllm/op/gallery/__init__.py +2 -0
- flowllm/op/gallery/mock_op.py +42 -0
- flowllm/op/gallery/terminate_op.py +29 -0
- flowllm/op/parallel_op.py +23 -0
- flowllm/op/search/__init__.py +3 -0
- flowllm/op/search/dashscope_deep_research_op.py +260 -0
- flowllm/op/search/dashscope_search_op.py +179 -0
- flowllm/op/search/dashscope_search_prompt.yaml +13 -0
- flowllm/op/search/tavily_search_op.py +102 -0
- flowllm/op/sequential_op.py +21 -0
- flowllm/schema/flow_request.py +12 -0
- flowllm/schema/flow_response.py +12 -0
- flowllm/schema/message.py +35 -0
- flowllm/schema/service_config.py +72 -0
- flowllm/schema/tool_call.py +118 -0
- {llmflow → flowllm}/schema/vector_node.py +1 -0
- flowllm/service/__init__.py +3 -0
- flowllm/service/base_service.py +68 -0
- flowllm/service/cmd_service.py +15 -0
- flowllm/service/http_service.py +79 -0
- flowllm/service/mcp_service.py +47 -0
- flowllm/storage/__init__.py +1 -0
- flowllm/storage/cache/__init__.py +1 -0
- flowllm/storage/cache/cache_data_handler.py +104 -0
- flowllm/storage/cache/data_cache.py +375 -0
- flowllm/storage/vector_store/__init__.py +3 -0
- flowllm/storage/vector_store/base_vector_store.py +44 -0
- {llmflow → flowllm/storage}/vector_store/chroma_vector_store.py +11 -10
- {llmflow → flowllm/storage}/vector_store/es_vector_store.py +11 -11
- llmflow/vector_store/file_vector_store.py → flowllm/storage/vector_store/local_vector_store.py +110 -11
- flowllm/utils/common_utils.py +52 -0
- flowllm/utils/fetch_url.py +117 -0
- flowllm/utils/llm_utils.py +28 -0
- flowllm/utils/ridge_v2.py +54 -0
- {llmflow → flowllm}/utils/timer.py +5 -4
- {flowllm-0.1.0.dist-info → flowllm-0.1.2.dist-info}/METADATA +45 -388
- flowllm-0.1.2.dist-info/RECORD +99 -0
- flowllm-0.1.2.dist-info/entry_points.txt +2 -0
- {flowllm-0.1.0.dist-info → flowllm-0.1.2.dist-info}/licenses/LICENSE +1 -1
- flowllm-0.1.2.dist-info/top_level.txt +1 -0
- flowllm-0.1.0.dist-info/RECORD +0 -66
- flowllm-0.1.0.dist-info/entry_points.txt +0 -3
- flowllm-0.1.0.dist-info/top_level.txt +0 -1
- llmflow/app.py +0 -53
- llmflow/config/config_parser.py +0 -80
- llmflow/config/mock_config.yaml +0 -58
- llmflow/embedding_model/__init__.py +0 -5
- llmflow/enumeration/agent_state.py +0 -8
- llmflow/llm/__init__.py +0 -5
- llmflow/llm/openai_compatible_llm.py +0 -283
- llmflow/mcp_server.py +0 -110
- llmflow/op/__init__.py +0 -10
- llmflow/op/base_op.py +0 -125
- llmflow/op/mock_op.py +0 -40
- llmflow/op/vector_store/__init__.py +0 -13
- llmflow/op/vector_store/recall_vector_store_op.py +0 -48
- llmflow/op/vector_store/update_vector_store_op.py +0 -28
- llmflow/op/vector_store/vector_store_action_op.py +0 -46
- llmflow/pipeline/pipeline.py +0 -94
- llmflow/pipeline/pipeline_context.py +0 -37
- llmflow/schema/app_config.py +0 -69
- llmflow/schema/experience.py +0 -144
- llmflow/schema/message.py +0 -68
- llmflow/schema/request.py +0 -32
- llmflow/schema/response.py +0 -29
- llmflow/service/__init__.py +0 -0
- llmflow/service/llmflow_service.py +0 -96
- llmflow/tool/__init__.py +0 -9
- llmflow/tool/base_tool.py +0 -80
- llmflow/tool/code_tool.py +0 -43
- llmflow/tool/dashscope_search_tool.py +0 -162
- llmflow/tool/mcp_tool.py +0 -77
- llmflow/tool/tavily_search_tool.py +0 -109
- llmflow/tool/terminate_tool.py +0 -23
- llmflow/utils/__init__.py +0 -0
- llmflow/utils/common_utils.py +0 -17
- llmflow/utils/file_handler.py +0 -25
- llmflow/utils/http_client.py +0 -156
- llmflow/utils/op_utils.py +0 -102
- llmflow/utils/registry.py +0 -33
- llmflow/vector_store/__init__.py +0 -7
- llmflow/vector_store/base_vector_store.py +0 -136
- {llmflow → flowllm/context}/__init__.py +0 -0
- {llmflow/config → flowllm/enumeration}/__init__.py +0 -0
- {llmflow → flowllm}/enumeration/chunk_enum.py +0 -0
- {llmflow → flowllm}/enumeration/http_enum.py +0 -0
- {llmflow → flowllm}/enumeration/role.py +0 -0
- {llmflow/enumeration → flowllm/flow/parser}/__init__.py +0 -0
- {llmflow/op/react → flowllm/op/agent}/__init__.py +0 -0
- /llmflow/op/react/react_v1_prompt.yaml → /flowllm/op/agent/react_prompt.yaml +0 -0
- {llmflow/pipeline → flowllm/schema}/__init__.py +0 -0
- {llmflow/schema → flowllm/utils}/__init__.py +0 -0
- {llmflow → flowllm}/utils/singleton.py +0 -0
- {flowllm-0.1.0.dist-info → flowllm-0.1.2.dist-info}/WHEEL +0 -0
flowllm/storage/cache/cache_data_handler.py
@@ -0,0 +1,104 @@
+import json
+from abc import ABC, abstractmethod
+from pathlib import Path
+from typing import Dict, Any
+
+import pandas as pd
+
+
+class CacheDataHandler(ABC):
+    """Abstract base class for data type handlers"""
+
+    @abstractmethod
+    def save(self, data: Any, file_path: Path, **kwargs) -> Dict[str, Any]:
+        """
+        Save data to file and return metadata
+
+        Args:
+            data: Data to save
+            file_path: File path to save to
+            **kwargs: Additional parameters
+
+        Returns:
+            Dict containing metadata about the saved data
+        """
+        pass
+
+    @abstractmethod
+    def load(self, file_path: Path, **kwargs) -> Any:
+        """
+        Load data from file
+
+        Args:
+            file_path: File path to load from
+            **kwargs: Additional parameters
+
+        Returns:
+            Loaded data
+        """
+        pass
+
+    @abstractmethod
+    def get_file_extension(self) -> str:
+        """Get the file extension for this data type"""
+        pass
+
+
+class DataFrameHandler(CacheDataHandler):
+    """Handler for pandas DataFrame data type"""
+
+    def save(self, data: pd.DataFrame, file_path: Path, **kwargs) -> Dict[str, Any]:
+        """Save DataFrame as CSV"""
+        csv_params = {
+            "index": False,
+            "encoding": "utf-8"
+        }
+        csv_params.update(kwargs)
+
+        data.to_csv(file_path, **csv_params)
+
+        return {
+            'row_count': len(data),
+            'column_count': len(data.columns),
+            'file_size': file_path.stat().st_size
+        }
+
+    def load(self, file_path: Path, **kwargs) -> pd.DataFrame:
+        """Load DataFrame from CSV"""
+        csv_params = {
+            'encoding': 'utf-8'
+        }
+        csv_params.update(kwargs)
+
+        return pd.read_csv(file_path, **csv_params)
+
+    def get_file_extension(self) -> str:
+        return ".csv"
+
+
+class DictHandler(CacheDataHandler):
+    """Handler for dict data type"""
+
+    def save(self, data: dict, file_path: Path, **kwargs) -> Dict[str, Any]:
+        """Save dict as JSON"""
+        json_params = {
+            "ensure_ascii": False,
+            "indent": 2
+        }
+        json_params.update(kwargs)
+
+        with open(file_path, 'w', encoding='utf-8') as f:
+            json.dump(data, f, **json_params)
+
+        return {
+            'key_count': len(data),
+            'file_size': file_path.stat().st_size
+        }
+
+    def load(self, file_path: Path, **kwargs) -> dict:
+        """Load dict from JSON"""
+        with open(file_path, 'r', encoding='utf-8') as f:
+            return json.load(f)
+
+    def get_file_extension(self) -> str:
+        return ".json"
flowllm/storage/cache/data_cache.py
@@ -0,0 +1,375 @@
+"""
+DataCache utility that supports multiple data types with local storage and data expiration functionality
+"""
+
+import json
+from datetime import datetime, timedelta
+from pathlib import Path
+from typing import Optional, Dict, Any, Union, Type
+
+import pandas as pd
+
+from flowllm.storage.cache.cache_data_handler import CacheDataHandler, DataFrameHandler, DictHandler
+
+
+class DataCache:
+    """
+    Generic data cache utility class
+
+    Features:
+    - Support for multiple data types (DataFrame, dict, and extensible for others)
+    - Support for data expiration time settings
+    - Automatic cleanup of expired data
+    - Recording and managing update timestamps
+    - Type-specific storage formats (CSV for DataFrame, JSON for dict)
+    """
+
+    def __init__(self, cache_dir: str = "cache"):
+        self.cache_dir = Path(cache_dir)
+        self.cache_dir.mkdir(parents=True, exist_ok=True)
+        self.metadata_file = self.cache_dir / "metadata.json"
+        self.metadata = {}
+
+        # Register default handlers
+        self.handlers: Dict[Type, CacheDataHandler] = {
+            pd.DataFrame: DataFrameHandler(),
+            dict: DictHandler()
+        }
+
+        self._load_metadata()
+
+    def register_handler(self, data_type: Type, handler: CacheDataHandler):
+        """
+        Register a custom data handler for a specific data type
+
+        Args:
+            data_type: The data type to handle
+            handler: The handler instance
+        """
+        self.handlers[data_type] = handler
+
+    def _get_handler(self, data_type: Type) -> CacheDataHandler:
+        """Get the appropriate handler for a data type"""
+        if data_type in self.handlers:
+            return self.handlers[data_type]
+
+        # Try to find a handler for parent classes
+        for registered_type, handler in self.handlers.items():
+            if issubclass(data_type, registered_type):
+                return handler
+
+        raise ValueError(f"No handler registered for data type: {data_type}")
+
+    def _load_metadata(self):
+        """Load metadata"""
+        if self.metadata_file.exists():
+            with open(self.metadata_file) as f:
+                self.metadata = json.load(f)
+
+    def _save_metadata(self):
+        """Save metadata"""
+        with open(self.metadata_file, "w") as f:
+            json.dump(self.metadata, f, ensure_ascii=False, indent=2)
+
+    def _get_file_path(self, key: str, data_type: Type = None) -> Path:
+        """Get data file path with appropriate extension"""
+        if data_type is None:
+            # Try to get extension from metadata
+            if key in self.metadata and 'data_type' in self.metadata[key]:
+                stored_type_name = self.metadata[key]['data_type']
+                if stored_type_name == 'DataFrame':
+                    extension = '.csv'
+                elif stored_type_name == 'dict':
+                    extension = '.json'
+                elif stored_type_name == 'str':
+                    extension = '.txt'
+                else:
+                    # Try to find extension from registered handlers
+                    extension = '.dat'  # Default extension
+                    for registered_type, handler in self.handlers.items():
+                        if registered_type.__name__ == stored_type_name:
+                            extension = handler.get_file_extension()
+                            break
+            else:
+                extension = '.dat'  # Default extension
+        else:
+            try:
+                handler = self._get_handler(data_type)
+                extension = handler.get_file_extension()
+            except ValueError:
+                extension = '.dat'  # Default extension
+
+        return self.cache_dir / f"{key}{extension}"
+
+    def _is_expired(self, key: str) -> bool:
+        """Check if data is expired"""
+        if key not in self.metadata:
+            return True
+
+        expire_time_str = self.metadata[key].get('expire_time')
+        if not expire_time_str:
+            return False  # No expiration time set, never expires
+
+        expire_time = datetime.fromisoformat(expire_time_str)
+        return datetime.now() > expire_time
+
+    def save(self, key: str, data: Union[pd.DataFrame, dict, Any], expire_hours: Optional[float] = None,
+             **handler_kwargs) -> bool:
+        """
+        Save data to cache
+
+        Args:
+            key: Cache key name
+            data: Data to save (DataFrame, dict, or other supported types)
+            expire_hours: Expiration time in hours, None means never expires
+            **handler_kwargs: Additional parameters passed to the data handler
+
+        Returns:
+            bool: Whether save was successful
+        """
+        try:
+            data_type = type(data)
+            handler = self._get_handler(data_type)
+            file_path = self._get_file_path(key, data_type)
+
+            # Save data using appropriate handler
+            handler_metadata = handler.save(data, file_path, **handler_kwargs)
+
+            # Update metadata
+            current_time = datetime.now()
+            self.metadata[key] = {
+                'created_time': current_time.isoformat(),
+                'updated_time': current_time.isoformat(),
+                'expire_time': (current_time + timedelta(hours=expire_hours)).isoformat() if expire_hours else None,
+                'data_type': data_type.__name__,
+                **handler_metadata
+            }
+
+            self._save_metadata()
+            return True
+
+        except Exception as e:
+            print(f"Failed to save data: {e}")
+            return False
+
+    def load(self, key: str, auto_clean_expired: bool = True, **handler_kwargs) -> Optional[Any]:
+        """
+        Load data from cache
+
+        Args:
+            key: Cache key name
+            auto_clean_expired: Whether to automatically clean expired data
+            **handler_kwargs: Additional parameters passed to the data handler
+
+        Returns:
+            Optional[Any]: Loaded data, returns None if not exists or expired
+        """
+        try:
+            # Check if expired
+            if self._is_expired(key):
+                if auto_clean_expired:
+                    self.delete(key)
+                    print(f"Cache '{key}' has expired and was automatically cleaned")
+                return None
+
+            file_path = self._get_file_path(key)
+            if not file_path.exists():
+                return None
+
+            # Get data type from metadata
+            if key not in self.metadata or 'data_type' not in self.metadata[key]:
+                print(f"No data type information found for key '{key}'")
+                return None
+
+            data_type_name = self.metadata[key]['data_type']
+
+            # Map type name back to actual type
+            if data_type_name == 'DataFrame':
+                data_type = pd.DataFrame
+            elif data_type_name == 'dict':
+                data_type = dict
+            elif data_type_name == 'str':
+                data_type = str
+            else:
+                # For other custom types, try to find a handler by checking registered types
+                data_type = None
+                for registered_type in self.handlers.keys():
+                    if registered_type.__name__ == data_type_name:
+                        data_type = registered_type
+                        break
+
+                if data_type is None:
+                    print(f"Unknown data type: {data_type_name}")
+                    return None
+
+            handler = self._get_handler(data_type)
+
+            # Load data using appropriate handler
+            data = handler.load(file_path, **handler_kwargs)
+
+            # Update last access time
+            if key in self.metadata:
+                self.metadata[key]['last_accessed'] = datetime.now().isoformat()
+                self._save_metadata()
+
+            return data
+
+        except Exception as e:
+            print(f"Failed to load data: {e}")
+            return None
+
+    def exists(self, key: str, check_expired: bool = True) -> bool:
+        """
+        Check if cache exists
+
+        Args:
+            key: Cache key name
+            check_expired: Whether to check expiration status
+
+        Returns:
+            bool: Whether cache exists and is not expired
+        """
+        if check_expired and self._is_expired(key):
+            return False
+
+        file_path = self._get_file_path(key)
+        return file_path.exists() and key in self.metadata
+
+    def delete(self, key: str) -> bool:
+        """
+        Delete cache
+
+        Args:
+            key: Cache key name
+
+        Returns:
+            bool: Whether deletion was successful
+        """
+        try:
+            file_path = self._get_file_path(key)
+
+            # Delete data file
+            if file_path.exists():
+                file_path.unlink()
+
+            # Delete metadata
+            if key in self.metadata:
+                del self.metadata[key]
+                self._save_metadata()
+
+            return True
+
+        except Exception as e:
+            print(f"Failed to delete cache: {e}")
+            return False
+
+    def clean_expired(self) -> int:
+        """
+        Clean all expired caches
+
+        Returns:
+            int: Number of cleaned caches
+        """
+        expired_keys = []
+
+        for key in list(self.metadata.keys()):
+            if self._is_expired(key):
+                expired_keys.append(key)
+
+        cleaned_count = 0
+        for key in expired_keys:
+            if self.delete(key):
+                cleaned_count += 1
+
+        return cleaned_count
+
+    def get_info(self, key: str) -> Optional[Dict[str, Any]]:
+        """
+        Get cache information
+
+        Args:
+            key: Cache key name
+
+        Returns:
+            Optional[Dict]: Cache information including creation time, update time, expiration time, etc.
+        """
+        if key not in self.metadata:
+            return None
+
+        info = self.metadata[key].copy()
+        info['key'] = key
+        info['is_expired'] = self._is_expired(key)
+        info['file_path'] = str(self._get_file_path(key))
+
+        return info
+
+    def list_all(self, include_expired: bool = False) -> Dict[str, Dict[str, Any]]:
+        """
+        List all caches
+
+        Args:
+            include_expired: Whether to include expired caches
+
+        Returns:
+            Dict: Information of all caches
+        """
+        result = {}
+
+        for key in self.metadata:
+            if not include_expired and self._is_expired(key):
+                continue
+
+            info = self.get_info(key)
+            if info:
+                result[key] = info
+
+        return result
+
+    def get_cache_stats(self) -> Dict[str, Any]:
+        """
+        Get cache statistics
+
+        Returns:
+            Dict: Cache statistics information
+        """
+        total_count = len(self.metadata)
+        expired_count = sum(1 for key in self.metadata if self._is_expired(key))
+        active_count = total_count - expired_count
+
+        total_size = 0
+        for key in self.metadata:
+            file_path = self._get_file_path(key)
+            if file_path.exists():
+                total_size += file_path.stat().st_size
+
+        return {
+            'total_count': total_count,
+            'active_count': active_count,
+            'expired_count': expired_count,
+            'total_size_bytes': total_size,
+            'total_size_mb': round(total_size / (1024 * 1024), 2),
+            'cache_dir': str(self.cache_dir)
+        }
+
+    def clear_all(self) -> bool:
+        """
+        Clear all caches
+
+        Returns:
+            bool: Whether clearing was successful
+        """
+        try:
+            # Delete all data files (CSV, JSON, and other supported formats)
+            for data_file in self.cache_dir.glob("*"):
+                if data_file.is_file() and data_file.name != "metadata.json":
+                    data_file.unlink()
+
+            # Clear metadata
+            self.metadata = {}
+            self._save_metadata()
+
+            return True
+
+        except Exception as e:
+            print(f"Failed to clear cache: {e}")
+            return False
flowllm/storage/vector_store/base_vector_store.py
@@ -0,0 +1,44 @@
+from abc import ABC
+from pathlib import Path
+from typing import List, Iterable
+
+from pydantic import BaseModel, Field
+
+from flowllm.embedding_model.base_embedding_model import BaseEmbeddingModel
+from flowllm.schema.vector_node import VectorNode
+
+
+class BaseVectorStore(BaseModel, ABC):
+    embedding_model: BaseEmbeddingModel | None = Field(default=None)
+    batch_size: int = Field(default=1024)
+
+    def exist_workspace(self, workspace_id: str, **kwargs) -> bool:
+        raise NotImplementedError
+
+    def delete_workspace(self, workspace_id: str, **kwargs):
+        raise NotImplementedError
+
+    def create_workspace(self, workspace_id: str, **kwargs):
+        raise NotImplementedError
+
+    def _iter_workspace_nodes(self, workspace_id: str, **kwargs) -> Iterable[VectorNode]:
+        raise NotImplementedError
+
+    def dump_workspace(self, workspace_id: str, path: str | Path = "", callback_fn=None, **kwargs):
+        raise NotImplementedError
+
+    def load_workspace(self, workspace_id: str, path: str | Path = "", nodes: List[VectorNode] = None, callback_fn=None,
+                       **kwargs):
+        raise NotImplementedError
+
+    def copy_workspace(self, src_workspace_id: str, dest_workspace_id: str, **kwargs):
+        raise NotImplementedError
+
+    def search(self, query: str, workspace_id: str, top_k: int = 1, **kwargs) -> List[VectorNode]:
+        raise NotImplementedError
+
+    def insert(self, nodes: VectorNode | List[VectorNode], workspace_id: str, **kwargs):
+        raise NotImplementedError
+
+    def delete(self, node_ids: str | List[str], workspace_id: str, **kwargs):
+        raise NotImplementedError
{llmflow → flowllm/storage}/vector_store/chroma_vector_store.py
@@ -6,17 +6,16 @@ from chromadb.config import Settings
 from loguru import logger
 from pydantic import Field, PrivateAttr, model_validator
 
-from 
-from 
-from 
-from llmflow.vector_store.base_vector_store import BaseVectorStore
+from flowllm.context.service_context import C
+from flowllm.schema.vector_node import VectorNode
+from flowllm.storage.vector_store.local_vector_store import LocalVectorStore
 
 
-@
-class ChromaVectorStore(
+@C.register_vector_store("chroma")
+class ChromaVectorStore(LocalVectorStore):
     store_dir: str = Field(default="./chroma_vector_store")
     collections: dict = Field(default_factory=dict)
-    _client: chromadb.
+    _client: chromadb.ClientAPI = PrivateAttr()
 
     @model_validator(mode="after")
     def init_client(self):
@@ -97,8 +96,10 @@ class ChromaVectorStore(BaseVectorStore):
 
 
 def main():
-    from 
-
+    from flowllm.utils.common_utils import load_env
+    from flowllm.embedding_model import OpenAICompatibleEmbeddingModel
+
+    load_env()
 
     embedding_model = OpenAICompatibleEmbeddingModel(dimensions=64, model_name="text-embedding-v4")
     workspace_id = "chroma_test_index"
@@ -185,4 +186,4 @@ def main():
 
 if __name__ == "__main__":
     main()
-# launch with: python -m
+# launch with: python -m flowllm.storage.chroma_vector_store
{llmflow → flowllm/storage}/vector_store/es_vector_store.py
@@ -6,15 +6,14 @@ from elasticsearch.helpers import bulk
 from loguru import logger
 from pydantic import Field, PrivateAttr, model_validator
 
-from 
-from 
-from 
-from llmflow.vector_store.base_vector_store import BaseVectorStore
+from flowllm.context.service_context import C
+from flowllm.schema.vector_node import VectorNode
+from flowllm.storage.vector_store.local_vector_store import LocalVectorStore
 
 
-@
-class EsVectorStore(
-    hosts: str | List[str] = Field(default_factory=lambda: os.getenv("
+@C.register_vector_store("elasticsearch")
+class EsVectorStore(LocalVectorStore):
+    hosts: str | List[str] = Field(default_factory=lambda: os.getenv("FLOW_ES_HOSTS", "http://localhost:9200"))
     basic_auth: str | Tuple[str, str] | None = Field(default=None)
     retrieve_filters: List[dict] = []
     _client: Elasticsearch = PrivateAttr()
@@ -24,6 +23,7 @@ class EsVectorStore(BaseVectorStore):
         if isinstance(self.hosts, str):
             self.hosts = [self.hosts]
         self._client = Elasticsearch(hosts=self.hosts, basic_auth=self.basic_auth)
+        logger.info(f"Elasticsearch client initialized with hosts: {self.hosts}")
         return self
 
     def exist_workspace(self, workspace_id: str, **kwargs) -> bool:
@@ -160,10 +160,11 @@ class EsVectorStore(BaseVectorStore):
         if refresh:
             self.refresh(workspace_id=workspace_id)
 
-
 def main():
-    from 
-
+    from flowllm.utils.common_utils import load_env
+    from flowllm.embedding_model import OpenAICompatibleEmbeddingModel
+
+    load_env()
 
     embedding_model = OpenAICompatibleEmbeddingModel(dimensions=64, model_name="text-embedding-v4")
     workspace_id = "rag_nodes_index"
@@ -224,4 +225,3 @@ def main():
 
 if __name__ == "__main__":
     main()
-# launch with: python -m llmflow.storage.es_vector_store