PyPI - crewplus - Versions diffs - 0.2.34__tar.gz → 0.2.37__tar.gz - Mend

crewplus-0.2.34.tar.gz → crewplus-0.2.37.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of crewplus might be problematic. Click here for more details.

Files changed (22)

{crewplus-0.2.34 → crewplus-0.2.37}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: crewplus
-Version: 0.2.34
+Version: 0.2.37
 Summary: Base services for CrewPlus AI applications
 Author-Email: Tim Liu <tim@opsmateai.com>
 License: MIT

{crewplus-0.2.34 → crewplus-0.2.37}/crewplus/services/gemini_chat_model.py RENAMED Viewed

@@ -294,6 +294,7 @@ class GeminiChatModel(BaseChatModel):
         if creds is None:
             # Get service account file from env if not provided
             sa_file = self.service_account_file or os.getenv("GCP_SERVICE_ACCOUNT_FILE")
+            self.logger.debug(f"Service account file: {sa_file}")
             if sa_file:
                 try:
                     creds = service_account.Credentials.from_service_account_file(
@@ -307,15 +308,21 @@ class GeminiChatModel(BaseChatModel):
         # If creds is still None, the client will use Application Default Credentials (ADC).
-        self._client = genai.Client(
-            project=self.project_id,
-            location=self.location,
-            credentials=creds,
-        )
-        self.logger.info(
-            f"Initialized GeminiChatModel with model: {self.model_name} for Vertex AI "
-            f"(Project: {self.project_id}, Location: {self.location})"
-        )
+        try:
+            self._client = genai.Client(
+                vertexai=True,
+                project=self.project_id,
+                location=self.location,
+                credentials=creds,
+            )
+            self.logger.info(
+                f"Initialized GeminiChatModel with model: {self.model_name} for Vertex AI "
+                f"(Project: {self.project_id}, Location: {self.location})"
+            )
+        except Exception as e:
+            error_msg = f"Failed to initialize GenAI Client for Vertex AI: {e}"
+            self.logger.error(error_msg, exc_info=True)
+            raise ValueError(error_msg)
     def get_model_identifier(self) -> str:
         """Return a string identifying this model for tracing and logging."""

{crewplus-0.2.34 → crewplus-0.2.37}/crewplus/services/init_services.py RENAMED Viewed

@@ -1,15 +1,27 @@
 import os
+import logging
+from typing import Optional
 from .model_load_balancer import ModelLoadBalancer
 model_balancer = None
-def init_load_balancer(config_path: str = None):
+def init_load_balancer(
+    config_path: Optional[str] = None,
+    logger: Optional[logging.Logger] = None
+):
     """
     Initializes the global ModelLoadBalancer instance.
     This function is idempotent. If the balancer is already initialized,
     it does nothing. It follows a safe initialization pattern where the
     global instance is only assigned after successful configuration loading.
+    Args:
+        config_path (Optional[str]): The path to the model configuration file.
+            If not provided, it's determined by the `MODEL_CONFIG_PATH`
+            environment variable, or defaults to "config/models_config.json".
+        logger (Optional[logging.Logger]): An optional logger instance to be
+            used by the model balancer.
     """
     global model_balancer
     if model_balancer is None:
@@ -20,7 +32,10 @@ def init_load_balancer(config_path: str = None):
         )
         try:
             # 1. Create a local instance first.
-            balancer = ModelLoadBalancer(final_config_path)
+            balancer = ModelLoadBalancer(
+                config_path=final_config_path,
+                logger=logger
+            )
             # 2. Attempt to load its configuration.
             balancer.load_config()
             # 3. Only assign to the global variable on full success.

{crewplus-0.2.34 → crewplus-0.2.37}/crewplus/services/model_load_balancer.py RENAMED Viewed

@@ -1,6 +1,7 @@
 import json
 import random
 import logging
+import threading
 from typing import Dict, List, Optional, Union
 from collections import defaultdict
 from langchain_openai import ChatOpenAI, AzureOpenAIEmbeddings
@@ -31,7 +32,7 @@ class ModelLoadBalancer:
         self.config_data = config_data
         self.logger = logger or logging.getLogger(__name__)
         self.models_config: List[Dict] = []
-        self.models: Dict[int, Union[TracedAzureChatOpenAI, ChatOpenAI, AzureOpenAIEmbeddings, GeminiChatModel]] = {}
+        self.thread_local = threading.local()
         self._initialize_state()
         self._config_loaded = False  # Flag to check if config is loaded
@@ -60,15 +61,6 @@ class ModelLoadBalancer:
             self.models_config = config['models']
-            # Instantiate models
-            for model_config in self.models_config:
-                model_id = model_config['id']
-                model_instance = self._instantiate_model(model_config)
-                if model_instance is not None:
-                    self.models[model_id] = model_instance
-                else:
-                    self.logger.warning(f"Model with id {model_id} was not loaded due to instantiation error.")
             self._config_loaded = True
             self.logger.debug("Model balancer: configuration loaded successfully.")
         except (FileNotFoundError, json.JSONDecodeError, ValueError) as e:
@@ -105,8 +97,7 @@ class ModelLoadBalancer:
         if deployment_name:
             for model_config in self.models_config:
                 if model_config.get('deployment_name') == deployment_name:
-                    model_id = model_config['id']
-                    model = self.models[model_id]
+                    model = self._get_or_create_model(model_config)
                     if with_metadata:
                         return model, deployment_name
                     return model
@@ -130,14 +121,33 @@ class ModelLoadBalancer:
                 self.logger.warning(f"Unsupported selection strategy: '{selection_strategy}'. Defaulting to 'random'.")
                 selected_model_config = self._random_selection(candidates)
-            model_id = selected_model_config['id']
-            model = self.models[model_id]
+            model = self._get_or_create_model(selected_model_config)
             if with_metadata:
                 return model, selected_model_config.get('deployment_name')
             return model
         raise ValueError("Either 'deployment_name' or both 'provider' and 'model_type' must be provided.")
+    def _get_thread_local_models_cache(self) -> Dict:
+        """Gets the model cache for the current thread, creating it if it doesn't exist."""
+        if not hasattr(self.thread_local, 'models_cache'):
+            self.thread_local.models_cache = {}
+        return self.thread_local.models_cache
+    def _get_or_create_model(self, model_config: Dict):
+        """
+        Gets a model instance from the thread-local cache. If it doesn't exist,
+        it instantiates, caches, and returns it.
+        """
+        model_id = model_config['id']
+        models_cache = self._get_thread_local_models_cache()
+        if model_id not in models_cache:
+            self.logger.debug(f"Creating new model instance for id {model_id} in thread {threading.get_ident()}")
+            models_cache[model_id] = self._instantiate_model(model_config)
+        return models_cache[model_id]
     def _instantiate_model(self, model_config: Dict):
         """Instantiate and return an LLM object based on the model configuration"""
         provider = model_config['provider']

{crewplus-0.2.34 → crewplus-0.2.37}/pyproject.toml RENAMED Viewed

@@ -6,7 +6,7 @@ build-backend = "pdm.backend"
 [project]
 name = "crewplus"
-version = "0.2.34"
+version = "0.2.37"
 description = "Base services for CrewPlus AI applications"
 authors = [
     { name = "Tim Liu", email = "tim@opsmateai.com" },