PyPI - iatoolkit - Versions diffs - 0.71.4__py3-none-any.whl → 0.91.1__py3-none-any.whl - Mend

iatoolkit 0.71.4-py3-none-any.whl → 0.91.1-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (86)

iatoolkit/__init__.py +15 -5
iatoolkit/base_company.py +4 -58
iatoolkit/cli_commands.py +6 -7
iatoolkit/common/exceptions.py +1 -0
iatoolkit/common/routes.py +12 -28
iatoolkit/common/util.py +7 -1
iatoolkit/company_registry.py +50 -14
iatoolkit/{iatoolkit.py → core.py} +54 -55
iatoolkit/infra/{mail_app.py → brevo_mail_app.py} +15 -37
iatoolkit/infra/llm_client.py +9 -5
iatoolkit/locales/en.yaml +10 -2
iatoolkit/locales/es.yaml +171 -162
iatoolkit/repositories/database_manager.py +59 -14
iatoolkit/repositories/llm_query_repo.py +34 -22
iatoolkit/repositories/models.py +16 -18
iatoolkit/repositories/profile_repo.py +5 -10
iatoolkit/repositories/vs_repo.py +9 -4
iatoolkit/services/auth_service.py +1 -1
iatoolkit/services/branding_service.py +1 -1
iatoolkit/services/company_context_service.py +19 -11
iatoolkit/services/configuration_service.py +219 -46
iatoolkit/services/dispatcher_service.py +31 -225
iatoolkit/services/document_service.py +10 -1
iatoolkit/services/embedding_service.py +9 -6
iatoolkit/services/excel_service.py +50 -2
iatoolkit/services/history_manager_service.py +189 -0
iatoolkit/services/jwt_service.py +1 -1
iatoolkit/services/language_service.py +8 -2
iatoolkit/services/license_service.py +82 -0
iatoolkit/services/mail_service.py +171 -25
iatoolkit/services/profile_service.py +37 -32
iatoolkit/services/{prompt_manager_service.py → prompt_service.py} +110 -1
iatoolkit/services/query_service.py +192 -191
iatoolkit/services/sql_service.py +63 -12
iatoolkit/services/tool_service.py +231 -0
iatoolkit/services/user_feedback_service.py +18 -6
iatoolkit/services/user_session_context_service.py +18 -0
iatoolkit/static/images/iatoolkit_core.png +0 -0
iatoolkit/static/images/iatoolkit_logo.png +0 -0
iatoolkit/static/js/chat_feedback_button.js +1 -1
iatoolkit/static/js/chat_help_content.js +4 -4
iatoolkit/static/js/chat_main.js +17 -5
iatoolkit/static/js/chat_onboarding_button.js +1 -1
iatoolkit/static/styles/chat_iatoolkit.css +1 -1
iatoolkit/static/styles/chat_public.css +28 -0
iatoolkit/static/styles/documents.css +598 -0
iatoolkit/static/styles/landing_page.css +223 -7
iatoolkit/system_prompts/__init__.py +0 -0
iatoolkit/system_prompts/query_main.prompt +2 -1
iatoolkit/system_prompts/sql_rules.prompt +47 -12
iatoolkit/templates/_company_header.html +30 -5
iatoolkit/templates/_login_widget.html +3 -3
iatoolkit/templates/chat.html +1 -1
iatoolkit/templates/forgot_password.html +3 -2
iatoolkit/templates/onboarding_shell.html +1 -1
iatoolkit/templates/signup.html +3 -0
iatoolkit/views/base_login_view.py +1 -1
iatoolkit/views/change_password_view.py +1 -1
iatoolkit/views/forgot_password_view.py +9 -4
iatoolkit/views/history_api_view.py +3 -3
iatoolkit/views/home_view.py +4 -2
iatoolkit/views/init_context_api_view.py +1 -1
iatoolkit/views/llmquery_api_view.py +4 -3
iatoolkit/views/{file_store_api_view.py → load_document_api_view.py} +1 -1
iatoolkit/views/login_view.py +17 -5
iatoolkit/views/logout_api_view.py +10 -2
iatoolkit/views/prompt_api_view.py +1 -1
iatoolkit/views/root_redirect_view.py +22 -0
iatoolkit/views/signup_view.py +12 -4
iatoolkit/views/static_page_view.py +27 -0
iatoolkit/views/verify_user_view.py +1 -1
iatoolkit-0.91.1.dist-info/METADATA +268 -0
iatoolkit-0.91.1.dist-info/RECORD +125 -0
iatoolkit-0.91.1.dist-info/licenses/LICENSE_COMMUNITY.md +15 -0
iatoolkit/services/history_service.py +0 -37
iatoolkit/templates/about.html +0 -13
iatoolkit/templates/index.html +0 -145
iatoolkit/templates/login_simulation.html +0 -45
iatoolkit/views/external_login_view.py +0 -73
iatoolkit/views/index_view.py +0 -14
iatoolkit/views/login_simulation_view.py +0 -93
iatoolkit-0.71.4.dist-info/METADATA +0 -276
iatoolkit-0.71.4.dist-info/RECORD +0 -122
{iatoolkit-0.71.4.dist-info → iatoolkit-0.91.1.dist-info}/WHEEL +0 -0
{iatoolkit-0.71.4.dist-info → iatoolkit-0.91.1.dist-info}/licenses/LICENSE +0 -0
{iatoolkit-0.71.4.dist-info → iatoolkit-0.91.1.dist-info}/top_level.txt +0 -0

iatoolkit/services/query_service.py CHANGED Viewed

@@ -5,19 +5,18 @@
 from iatoolkit.infra.llm_client import llmClient
 from iatoolkit.services.profile_service import ProfileService
-from iatoolkit.repositories.document_repo import DocumentRepo
 from iatoolkit.repositories.profile_repo import ProfileRepo
+from iatoolkit.services.tool_service import ToolService
 from iatoolkit.services.document_service import DocumentService
 from iatoolkit.services.company_context_service import CompanyContextService
 from iatoolkit.services.i18n_service import I18nService
 from iatoolkit.services.configuration_service import ConfigurationService
-from iatoolkit.repositories.llm_query_repo import LLMQueryRepo
 from iatoolkit.repositories.models import Task
 from iatoolkit.services.dispatcher_service import Dispatcher
-from iatoolkit.services.prompt_manager_service import PromptService
+from iatoolkit.services.prompt_service import PromptService
 from iatoolkit.services.user_session_context_service import UserSessionContextService
+from iatoolkit.services.history_manager_service import HistoryManagerService
 from iatoolkit.common.util import Utility
-from iatoolkit.common.exceptions import IAToolkitException
 from injector import inject
 import base64
 import logging
@@ -25,34 +24,40 @@ from typing import Optional
 import json
 import time
 import hashlib
-import os
+from dataclasses import dataclass
-GEMINI_MAX_TOKENS_CONTEXT_HISTORY = 200000
+@dataclass
+class HistoryHandle:
+    """Encapsulates the state needed to manage history for a single turn."""
+    company_short_name: str
+    user_identifier: str
+    type: str
+    request_params: dict = None
 class QueryService:
     @inject
     def __init__(self,
+                 dispatcher: Dispatcher,
+                 tool_service: ToolService,
                  llm_client: llmClient,
                  profile_service: ProfileService,
                  company_context_service: CompanyContextService,
                  document_service: DocumentService,
-                 document_repo: DocumentRepo,
-                 llmquery_repo: LLMQueryRepo,
                  profile_repo: ProfileRepo,
                  prompt_service: PromptService,
                  i18n_service: I18nService,
-                 util: Utility,
-                 dispatcher: Dispatcher,
                  session_context: UserSessionContextService,
-                 configuration_service: ConfigurationService
+                 configuration_service: ConfigurationService,
+                 history_manager: HistoryManagerService,
+                 util: Utility,
                  ):
         self.profile_service = profile_service
         self.company_context_service = company_context_service
         self.document_service = document_service
-        self.document_repo = document_repo
-        self.llmquery_repo = llmquery_repo
         self.profile_repo = profile_repo
+        self.tool_service = tool_service
         self.prompt_service = prompt_service
         self.i18n_service = i18n_service
         self.util = util
@@ -60,35 +65,106 @@ class QueryService:
         self.session_context = session_context
         self.configuration_service = configuration_service
         self.llm_client = llm_client
+        self.history_manager = history_manager
-        # get the model from the environment variable
-        self.default_model = os.getenv("LLM_MODEL", "")
-        if not self.default_model:
-            raise IAToolkitException(IAToolkitException.ErrorType.API_KEY,
-                               "missing ENV variable 'LLM_MODEL' configuration.")
-    def init_context(self, company_short_name: str,
-                     user_identifier: str,
-                     model: str = None) -> dict:
+    def _resolve_model(self, company_short_name: str, model: Optional[str]) -> str:
+        # Priority: 1. Explicit model -> 2. Company config
+        effective_model = model
+        if not effective_model:
+            llm_config = self.configuration_service.get_configuration(company_short_name, 'llm')
+            if llm_config and llm_config.get('model'):
+                effective_model = llm_config['model']
+        return effective_model
+    def _get_history_type(self, model: str) -> str:
+        return HistoryManagerService.TYPE_SERVER_SIDE if self.util.is_openai_model(
+            model) else HistoryManagerService.TYPE_CLIENT_SIDE
+    def _build_user_facing_prompt(self, company, user_identifier: str,
+                                  client_data: dict, files: list,
+                                  prompt_name: Optional[str], question: str) -> str:
+        # get the user profile data from the session context
+        user_profile = self.profile_service.get_profile_by_identifier(company.short_name, user_identifier)
+        # combine client_data with user_profile
+        final_client_data = (user_profile or {}).copy()
+        final_client_data.update(client_data)
+        # Load attached files into the context
+        files_context = self.load_files_for_context(files)
+        # Initialize prompt_content. It will be an empty string for direct questions.
+        main_prompt = ""
+        # We use a local variable for the question to avoid modifying the argument reference if it were mutable,
+        # although strings are immutable, this keeps the logic clean regarding what 'question' means in each context.
+        effective_question = question
+        if prompt_name:
+            question_dict = {'prompt': prompt_name, 'data': final_client_data}
+            effective_question = json.dumps(question_dict)
+            prompt_content = self.prompt_service.get_prompt_content(company, prompt_name)
+            # Render the user requested prompt
+            main_prompt = self.util.render_prompt_from_string(
+                template_string=prompt_content,
+                question=effective_question,
+                client_data=final_client_data,
+                user_identifier=user_identifier,
+                company=company,
+            )
-        # 1. Execute the forced rebuild sequence using the unified identifier.
-        self.session_context.clear_all_context(company_short_name, user_identifier)
-        logging.info(f"Context for {company_short_name}/{user_identifier} has been cleared.")
+        # This is the final user-facing prompt for this specific turn
+        user_turn_prompt = f"{main_prompt}\n{files_context}"
+        if not prompt_name:
+            user_turn_prompt += f"\n### La pregunta que debes responder es: {effective_question}"
+        else:
+            user_turn_prompt += f'\n### Contexto Adicional: El usuario ha aportado este contexto puede ayudar: {effective_question}'
-        # 2. LLM context is clean, now we can load it again
-        self.prepare_context(
-            company_short_name=company_short_name,
-            user_identifier=user_identifier
-        )
+        return user_turn_prompt, effective_question
-        # 3. communicate the new context to the LLM
-        response = self.set_context_for_llm(
-            company_short_name=company_short_name,
+    def _ensure_valid_history(self, company, user_identifier: str,
+                              effective_model: str, user_turn_prompt: str,
+                              ignore_history: bool) -> tuple[Optional[HistoryHandle], Optional[dict]]:
+        """
+            Manages the history strategy and rebuilds context if necessary.
+            Returns: (HistoryHandle, error_response)
+        """
+        history_type = self._get_history_type(effective_model)
+        # Initialize the handle with base context info
+        handle = HistoryHandle(
+            company_short_name=company.short_name,
             user_identifier=user_identifier,
-            model=model
+            type=history_type
         )
-        return response
+        # pass the handle to populate request_params
+        needs_rebuild = self.history_manager.populate_request_params(
+            handle, user_turn_prompt, ignore_history
+        )
+        if needs_rebuild:
+            logging.warning(f"No valid history for {company.short_name}/{user_identifier}. Rebuilding context...")
+            # try to rebuild the context
+            self.prepare_context(company_short_name=company.short_name, user_identifier=user_identifier)
+            self.set_context_for_llm(company_short_name=company.short_name, user_identifier=user_identifier,
+                                     model=effective_model)
+            # Retry populating params with the same handle
+            needs_rebuild = self.history_manager.populate_request_params(
+                handle, user_turn_prompt, ignore_history
+            )
+            if needs_rebuild:
+                error_key = 'errors.services.context_rebuild_failed'
+                error_message = self.i18n_service.t(error_key, company_short_name=company.short_name,
+                                                    user_identifier=user_identifier)
+                return None, {'error': True, "error_message": error_message}
+        return handle, None
     def _build_context_and_profile(self, company_short_name: str, user_identifier: str) -> tuple:
         # this method read the user/company context from the database and renders the system prompt
@@ -106,7 +182,7 @@ class QueryService:
             question=None,
             client_data=user_profile,
             company=company,
-            service_list=self.dispatcher.get_company_services(company)
+            service_list=self.tool_service.get_tools_for_llm(company)
         )
         # get the company context: schemas, database models, .md files
@@ -117,6 +193,31 @@ class QueryService:
         return final_system_context, user_profile
+    def init_context(self, company_short_name: str,
+                     user_identifier: str,
+                     model: str = None) -> dict:
+        # 1. Execute the forced rebuild sequence using the unified identifier.
+        self.session_context.clear_all_context(company_short_name, user_identifier)
+        logging.info(f"Context for {company_short_name}/{user_identifier} has been cleared.")
+        # 2. LLM context is clean, now we can load it again
+        self.prepare_context(
+            company_short_name=company_short_name,
+            user_identifier=user_identifier
+        )
+        # 3. communicate the new context to the LLM
+        response = self.set_context_for_llm(
+            company_short_name=company_short_name,
+            user_identifier=user_identifier,
+            model=model
+        )
+        return response
     def prepare_context(self, company_short_name: str, user_identifier: str) -> dict:
         # prepare the context and decide if it needs to be rebuilt
         # save the generated context in the session context for later use
@@ -134,21 +235,22 @@ class QueryService:
         # calculate the context version
         current_version = self._compute_context_version_from_string(final_system_context)
+        # get the current version from the session cache
         try:
             prev_version = self.session_context.get_context_version(company_short_name, user_identifier)
         except Exception:
             prev_version = None
-        rebuild_is_needed = not (prev_version and prev_version == current_version and
-                                 self._has_valid_cached_context(company_short_name, user_identifier))
-        if rebuild_is_needed:
-            # Guardar el contexto preparado y su versión para que `finalize_context_rebuild` los use.
-            self.session_context.save_prepared_context(company_short_name,
-                                                       user_identifier,
-                                                       final_system_context,
-                                                       current_version)
+        # Determine if we need to persist the prepared context again.
+        # If versions match, we assume the artifact is likely safe, but forcing a save
+        # on version mismatch ensures data consistency.
+        rebuild_is_needed = (prev_version != current_version)
+        # Save the prepared context and its version for `set_context_for_llm` to use.
+        self.session_context.save_prepared_context(company_short_name,
+                                                   user_identifier,
+                                                   final_system_context,
+                                                   current_version)
         return {'rebuild_needed': rebuild_is_needed}
     def set_context_for_llm(self,
@@ -163,14 +265,7 @@ class QueryService:
             return
         # --- Model Resolution ---
-        # Priority: 1. Explicit model -> 2. Company config -> 3. Global default
-        effective_model = model
-        if not effective_model:
-            llm_config = self.configuration_service.get_configuration(company_short_name, 'llm')
-            if llm_config and llm_config.get('model'):
-                effective_model = llm_config['model']
-        effective_model = effective_model or self.default_model
+        effective_model = self._resolve_model(company_short_name, model)
         # blocking logic to avoid multiple requests for the same user/company at the same time
         lock_key = f"lock:context:{company_short_name}/{user_identifier}"
@@ -181,37 +276,29 @@ class QueryService:
         try:
             start_time = time.time()
-            company = self.profile_repo.get_company_by_short_name(company_short_name)
             # get the prepared context and version from the session cache
-            prepared_context, version_to_save = self.session_context.get_and_clear_prepared_context(company_short_name,
-                                                                                                    user_identifier)
+            prepared_context, version_to_save = self.session_context.get_and_clear_prepared_context(company_short_name,                                                                                                    user_identifier)
             if not prepared_context:
                 return
             logging.info(f"sending context to LLM model {effective_model} for: {company_short_name}/{user_identifier}...")
-            # clean only the chat history and the last response ID for this user/company
-            self.session_context.clear_llm_history(company_short_name, user_identifier)
-            response_id = ''
-            if self.util.is_gemini_model(effective_model):
-                context_history = [{"role": "user", "content": prepared_context}]
-                self.session_context.save_context_history(company_short_name, user_identifier, context_history)
-            elif self.util.is_openai_model(effective_model):
-                # Here is the call to the LLM client for settling the company/user context
-                response_id = self.llm_client.set_company_context(
-                    company=company,
-                    company_base_context=prepared_context,
-                    model=effective_model
-                )
-                self.session_context.save_last_response_id(company_short_name, user_identifier, response_id)
+            # --- Use Strategy Pattern for History/Context Initialization ---
+            history_type = self._get_history_type(effective_model)
+            response_data = self.history_manager.initialize_context(
+                company_short_name, user_identifier, history_type, prepared_context, company, effective_model
+            )
             if version_to_save:
                 self.session_context.save_context_version(company_short_name, user_identifier, version_to_save)
             logging.info(
                 f"Context for: {company_short_name}/{user_identifier} settled in {int(time.time() - start_time)} sec.")
+            # Return data (e.g., response_id) if the manager generated any
+            return response_data
         except Exception as e:
             logging.exception(f"Error in finalize_context_rebuild for {company_short_name}: {e}")
             raise e
@@ -219,7 +306,6 @@ class QueryService:
             # release the lock
             self.session_context.release_lock(lock_key)
-        return {'response_id': response_id }
     def llm_query(self,
                   company_short_name: str,
@@ -228,7 +314,7 @@ class QueryService:
                   prompt_name: str = None,
                   question: str = '',
                   client_data: dict = {},
-                  response_id: str = '',
+                  ignore_history: bool = False,
                   files: list = [],
                   model: Optional[str] = None) -> dict:
         try:
@@ -242,86 +328,48 @@ class QueryService:
                         "error_message": self.i18n_service.t('services.start_query')}
             # --- Model Resolution ---
-            # Priority: 1. Explicit model -> 2. Company config -> 3. Global default
-            effective_model = model
-            if not effective_model:
-                llm_config = self.configuration_service.get_configuration(company_short_name, 'llm')
-                if llm_config and llm_config.get('model'):
-                    effective_model = llm_config['model']
-            effective_model = effective_model or self.default_model
-            # get the previous response_id and context history
-            previous_response_id = None
-            context_history = self.session_context.get_context_history(company.short_name, user_identifier) or []
-            if self.util.is_openai_model(effective_model):
-                if response_id:
-                    # context is getting from this response_id
-                    previous_response_id = response_id
-                else:
-                    # use the full user history context
-                    previous_response_id = self.session_context.get_last_response_id(company.short_name, user_identifier)
-                    if not previous_response_id:
-                        return {'error': True,
-                                "error_message": self.i18n_service.t('errors.services.missing_response_id', company_short_name=company.short_name, user_identifier=user_identifier)
-                                }
-            elif self.util.is_gemini_model(effective_model):
-                # check the length of the context_history and remove old messages
-                self._trim_context_history(context_history)
-            # get the user profile data from the session context
-            user_profile = self.profile_service.get_profile_by_identifier(company.short_name, user_identifier)
-            # combine client_data with user_profile
-            final_client_data = (user_profile or {}).copy()
-            final_client_data.update(client_data)
-            # Load attached files into the context
-            files_context = self.load_files_for_context(files)
-            # Initialize prompt_content. It will be an empty string for direct questions.
-            main_prompt = ""
-            if prompt_name:
-                # For task-based queries, wrap data into a JSON string and get the specific prompt template
-                question_dict = {'prompt': prompt_name, 'data': final_client_data }
-                question = json.dumps(question_dict)
-                prompt_content = self.prompt_service.get_prompt_content(company, prompt_name)
-                # Render the main user prompt using the appropriate template (or an empty one)
-                main_prompt = self.util.render_prompt_from_string(
-                    template_string=prompt_content,
-                    question=question,
-                    client_data=final_client_data,
-                    user_identifier=user_identifier,
-                    company=company,
-                )
+            effective_model = self._resolve_model(company_short_name, model)
-            # This is the final user-facing prompt for this specific turn
-            user_turn_prompt = f"{main_prompt}\n{files_context}"
-            if not prompt_name:
-                user_turn_prompt += f"\n### La pregunta que debes responder es: {question}"
-            else:
-                user_turn_prompt += f'\n### Contexto Adicional: El usuario ha aportado este contexto puede ayudar: {question}'
+            # --- Build User-Facing Prompt ---
+            user_turn_prompt, effective_question = self._build_user_facing_prompt(
+                company=company,
+                user_identifier=user_identifier,
+                client_data=client_data,
+                files=files,
+                prompt_name=prompt_name,
+                question=question
+            )
-            # add to the history context
-            if self.util.is_gemini_model(effective_model):
-                context_history.append({"role": "user", "content": user_turn_prompt})
+            # --- History Management (Strategy Pattern) ---
+            history_handle, error_response = self._ensure_valid_history(
+                company=company,
+                user_identifier=user_identifier,
+                effective_model=effective_model,
+                user_turn_prompt=user_turn_prompt,
+                ignore_history=ignore_history
+            )
+            if error_response:
+                return error_response
-            # service list for the function calls
-            tools = self.dispatcher.get_company_services(company)
+            # get the tools availables for this company
+            tools = self.tool_service.get_tools_for_llm(company)
             # openai structured output instructions
             output_schema = {}
+            # Safely extract parameters for invoke using the handle
+            # The handle is guaranteed to have request_params populated if no error returned
+            previous_response_id = history_handle.request_params.get('previous_response_id')
+            context_history = history_handle.request_params.get('context_history')
             # Now send the instructions to the llm
             response = self.llm_client.invoke(
                 company=company,
                 user_identifier=user_identifier,
                 model=effective_model,
                 previous_response_id=previous_response_id,
-                context_history=context_history if self.util.is_gemini_model(effective_model) else None,
-                question=question,
+                context_history=context_history,
+                question=effective_question,
                 context=user_turn_prompt,
                 tools=tools,
                 text=output_schema
@@ -330,11 +378,10 @@ class QueryService:
             if not response.get('valid_response'):
                 response['error'] = True
-            # save last_response_id for the history chain
-            if "response_id" in response:
-                self.session_context.save_last_response_id(company.short_name, user_identifier, response["response_id"])
-            if self.util.is_gemini_model(effective_model):
-                self.session_context.save_context_history(company.short_name, user_identifier, context_history)
+                # save history using the manager passing the handle
+                self.history_manager.update_history(
+                    history_handle, user_turn_prompt, response
+                )
             return response
         except Exception as e:
@@ -348,23 +395,6 @@ class QueryService:
         except Exception:
             return "unknown"
-    def _has_valid_cached_context(self, company_short_name: str, user_identifier: str) -> bool:
-        """
-        Verifica si existe un estado de contexto reutilizable en sesión.
-        - OpenAI: last_response_id presente.
-        - Gemini: context_history con al menos 1 mensaje.
-        """
-        try:
-            if self.util.is_openai_model(self.default_model):
-                prev_id = self.session_context.get_last_response_id(company_short_name, user_identifier)
-                return bool(prev_id)
-            if self.util.is_gemini_model(self.default_model):
-                history = self.session_context.get_context_history(company_short_name, user_identifier) or []
-                return len(history) >= 1
-            return False
-        except Exception as e:
-            logging.warning(f"error verifying context cache: {e}")
-            return False
     def load_files_for_context(self, files: list) -> str:
         """
@@ -381,7 +411,7 @@ class QueryService:
             """
         for document in files:
             # Support both 'file_id' and 'filename' for robustness
-            filename = document.get('file_id') or document.get('filename')
+            filename = document.get('file_id') or document.get('filename') or document.get('name')
             if not filename:
                 context += "\n<error>Documento adjunto sin nombre ignorado.</error>\n"
                 continue
@@ -410,32 +440,3 @@ class QueryService:
         return context
-    def _trim_context_history(self, context_history: list):
-        """
-        Verifica el tamaño del historial de contexto y elimina los mensajes más antiguos
-        si supera un umbral, conservando siempre el mensaje del sistema (índice 0).
-        """
-        if not context_history or len(context_history) <= 1:
-            return  # nothing to remember
-        # calculate total tokens
-        try:
-            total_tokens = sum(self.llm_client.count_tokens(json.dumps(message)) for message in context_history)
-        except Exception as e:
-            logging.error(f"error counting tokens for history: {e}.")
-            return
-        # Si se excede el límite, eliminar mensajes antiguos (empezando por el segundo)
-        while total_tokens > GEMINI_MAX_TOKENS_CONTEXT_HISTORY and len(context_history) > 1:
-            try:
-                # Eliminar el mensaje más antiguo después del prompt del sistema
-                removed_message = context_history.pop(1)
-                removed_tokens = self.llm_client.count_tokens(json.dumps(removed_message))
-                total_tokens -= removed_tokens
-                logging.warning(
-                    f"history tokens ({total_tokens + removed_tokens} tokens) exceed the limit of: {GEMINI_MAX_TOKENS_CONTEXT_HISTORY}. "
-                    f"new context: {total_tokens} tokens."
-                )
-            except IndexError:
-                # Se produce si solo queda el mensaje del sistema, el bucle debería detenerse.
-                break

iatoolkit/services/sql_service.py CHANGED Viewed

@@ -8,6 +8,7 @@ from iatoolkit.common.util import Utility
 from iatoolkit.services.i18n_service import I18nService
 from iatoolkit.common.exceptions import IAToolkitException
 from sqlalchemy import text
+from sqlalchemy.exc import SQLAlchemyError
 from injector import inject, singleton
 import json
 import logging
@@ -30,7 +31,7 @@ class SqlService:
         # Cache for database connections
         self._db_connections: dict[str, DatabaseManager] = {}
-    def register_database(self, db_name: str, db_uri: str):
+    def register_database(self, db_uri: str, db_name: str, schema: str | None = None):
         """
         Creates and caches a DatabaseManager instance for a given database name and URI.
         If a database with the same name is already registered, it does nothing.
@@ -38,10 +39,10 @@ class SqlService:
         if db_name in self._db_connections:
             return
-        logging.debug(f"Registering and creating connection for database: '{db_name}'")
+        logging.info(f"Registering and creating connection for database: '{db_name}' (schema: {schema})")
         # create the database connection and save it on the cache
-        db_manager = DatabaseManager(db_uri, register_pgvector=False)
+        db_manager = DatabaseManager(db_uri, schema=schema, register_pgvector=False)
         self._db_connections[db_name] = db_manager
     def get_database_manager(self, db_name: str) -> DatabaseManager:
@@ -57,23 +58,53 @@ class SqlService:
                 f"Database '{db_name}' is not registered with the SqlService."
             )
-    def exec_sql(self, database: str, query: str) -> str:
+    def exec_sql(self, company_short_name: str,
+                 database: str,
+                 query: str,
+                 format: str = 'json',
+                 commit: bool = False):
         """
-        Executes a raw SQL statement against a registered database and returns the result as a JSON string.
+        Executes a raw SQL statement against a registered database.
+        Args:
+            company_short_name: The company identifier (for logging/context).
+            database: The logical name of the database to query.
+            query: The SQL statement to execute.
+            format: The output format ('json' or 'dict'). Only relevant for SELECT queries.
+            commit: Whether to commit the transaction immediately after execution.
+                    Use True for INSERT/UPDATE/DELETE statements.
+        Returns:
+            - A JSON string or list of dicts for SELECT queries.
+            - A dictionary {'rowcount': N} for non-returning statements (INSERT/UPDATE) if not using RETURNING.
         """
         try:
             # 1. Get the database manager from the cache
             db_manager = self.get_database_manager(database)
+            session = db_manager.get_session()
             # 2. Execute the SQL statement
-            result = db_manager.get_session().execute(text(query))
-            cols = result.keys()
-            rows_context = [dict(zip(cols, row)) for row in result.fetchall()]
+            result = session.execute(text(query))
+            # 3. Handle Commit
+            if commit:
+                session.commit()
+            # 4. Process Results
+            # Check if the query returns rows (e.g., SELECT or INSERT ... RETURNING)
+            if result.returns_rows:
+                cols = result.keys()
+                rows_context = [dict(zip(cols, row)) for row in result.fetchall()]
-            # seialize the result
-            sql_result_json = json.dumps(rows_context, default=self.util.serialize)
+                if format == 'dict':
+                    return rows_context
+                # serialize the result
+                return json.dumps(rows_context, default=self.util.serialize)
+            # For statements that don't return rows (standard UPDATE/DELETE)
+            return {'rowcount': result.rowcount}
-            return sql_result_json
         except IAToolkitException:
             # Re-raise exceptions from get_database_manager to preserve the specific error
             raise
@@ -89,4 +120,24 @@ class SqlService:
             logging.error(f"Error executing SQL statement: {error_message}")
             raise IAToolkitException(IAToolkitException.ErrorType.DATABASE_ERROR,
-                                     error_message) from e
+                                     error_message) from e
+    def commit(self, database: str):
+        """
+        Commits the current transaction for a registered database.
+        Useful when multiple exec_sql calls are part of a single transaction.
+        Args:
+            database: The logical name of the registered database.
+        Raises:
+            IAToolkitException: If an unexpected (non-SQLAlchemy) error occurs while
+                committing. Errors raised by get_database_manager propagate unchanged.
+            SQLAlchemyError: If the commit fails at the database level; the session is
+                rolled back before the original error is re-raised.
+        """
+        # Get the database manager from the cache
+        db_manager = self.get_database_manager(database)
+        session = None
+        try:
+            session = db_manager.get_session()
+            session.commit()
+        except SQLAlchemyError as db_error:
+            # Roll back on the very session that failed so it can be reused afterwards.
+            if session is not None:
+                session.rollback()
+            logging.error(f"Error de base de datos: {str(db_error)}")
+            raise
+        except Exception as e:
+            # Also clean up after unexpected errors; a failing rollback must not
+            # replace the original error reported to the caller.
+            if session is not None:
+                try:
+                    session.rollback()
+                except SQLAlchemyError as rollback_error:
+                    logging.error(f"error while rolling back sql: '{str(rollback_error)}'")
+            logging.error(f"error while commiting sql: '{str(e)}'")
+            # Chain the cause, matching the error handling used by exec_sql.
+            raise IAToolkitException(
+                IAToolkitException.ErrorType.DATABASE_ERROR, str(e)
+            ) from e

iatoolkit 0.71.4__py3-none-any.whl → 0.91.1__py3-none-any.whl

iatoolkit 0.71.4__py3-none-any.whl → 0.91.1__py3-none-any.whl