iatoolkit 0.71.4__py3-none-any.whl → 1.4.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (114)
  1. iatoolkit/__init__.py +19 -7
  2. iatoolkit/base_company.py +1 -71
  3. iatoolkit/cli_commands.py +9 -21
  4. iatoolkit/common/exceptions.py +2 -0
  5. iatoolkit/common/interfaces/__init__.py +0 -0
  6. iatoolkit/common/interfaces/asset_storage.py +34 -0
  7. iatoolkit/common/interfaces/database_provider.py +38 -0
  8. iatoolkit/common/model_registry.py +159 -0
  9. iatoolkit/common/routes.py +53 -32
  10. iatoolkit/common/util.py +17 -12
  11. iatoolkit/company_registry.py +55 -14
  12. iatoolkit/{iatoolkit.py → core.py} +102 -72
  13. iatoolkit/infra/{mail_app.py → brevo_mail_app.py} +15 -37
  14. iatoolkit/infra/llm_providers/__init__.py +0 -0
  15. iatoolkit/infra/llm_providers/deepseek_adapter.py +278 -0
  16. iatoolkit/infra/{gemini_adapter.py → llm_providers/gemini_adapter.py} +11 -17
  17. iatoolkit/infra/{openai_adapter.py → llm_providers/openai_adapter.py} +41 -7
  18. iatoolkit/infra/llm_proxy.py +235 -134
  19. iatoolkit/infra/llm_response.py +5 -0
  20. iatoolkit/locales/en.yaml +134 -4
  21. iatoolkit/locales/es.yaml +293 -162
  22. iatoolkit/repositories/database_manager.py +92 -22
  23. iatoolkit/repositories/document_repo.py +7 -0
  24. iatoolkit/repositories/filesystem_asset_repository.py +36 -0
  25. iatoolkit/repositories/llm_query_repo.py +36 -22
  26. iatoolkit/repositories/models.py +86 -95
  27. iatoolkit/repositories/profile_repo.py +64 -13
  28. iatoolkit/repositories/vs_repo.py +31 -28
  29. iatoolkit/services/auth_service.py +1 -1
  30. iatoolkit/services/branding_service.py +1 -1
  31. iatoolkit/services/company_context_service.py +96 -39
  32. iatoolkit/services/configuration_service.py +329 -67
  33. iatoolkit/services/dispatcher_service.py +51 -227
  34. iatoolkit/services/document_service.py +10 -1
  35. iatoolkit/services/embedding_service.py +9 -6
  36. iatoolkit/services/excel_service.py +50 -2
  37. iatoolkit/services/file_processor_service.py +0 -5
  38. iatoolkit/services/history_manager_service.py +208 -0
  39. iatoolkit/services/jwt_service.py +1 -1
  40. iatoolkit/services/knowledge_base_service.py +412 -0
  41. iatoolkit/services/language_service.py +8 -2
  42. iatoolkit/services/license_service.py +82 -0
  43. iatoolkit/{infra/llm_client.py → services/llm_client_service.py} +42 -29
  44. iatoolkit/services/load_documents_service.py +18 -47
  45. iatoolkit/services/mail_service.py +171 -25
  46. iatoolkit/services/profile_service.py +69 -36
  47. iatoolkit/services/{prompt_manager_service.py → prompt_service.py} +136 -25
  48. iatoolkit/services/query_service.py +229 -203
  49. iatoolkit/services/sql_service.py +116 -34
  50. iatoolkit/services/tool_service.py +246 -0
  51. iatoolkit/services/user_feedback_service.py +18 -6
  52. iatoolkit/services/user_session_context_service.py +121 -51
  53. iatoolkit/static/images/iatoolkit_core.png +0 -0
  54. iatoolkit/static/images/iatoolkit_logo.png +0 -0
  55. iatoolkit/static/js/chat_feedback_button.js +1 -1
  56. iatoolkit/static/js/chat_help_content.js +4 -4
  57. iatoolkit/static/js/chat_main.js +61 -9
  58. iatoolkit/static/js/chat_model_selector.js +227 -0
  59. iatoolkit/static/js/chat_onboarding_button.js +1 -1
  60. iatoolkit/static/js/chat_reload_button.js +4 -1
  61. iatoolkit/static/styles/chat_iatoolkit.css +59 -3
  62. iatoolkit/static/styles/chat_public.css +28 -0
  63. iatoolkit/static/styles/documents.css +598 -0
  64. iatoolkit/static/styles/landing_page.css +223 -7
  65. iatoolkit/static/styles/llm_output.css +34 -1
  66. iatoolkit/system_prompts/__init__.py +0 -0
  67. iatoolkit/system_prompts/query_main.prompt +28 -3
  68. iatoolkit/system_prompts/sql_rules.prompt +47 -12
  69. iatoolkit/templates/_company_header.html +30 -5
  70. iatoolkit/templates/_login_widget.html +3 -3
  71. iatoolkit/templates/base.html +13 -0
  72. iatoolkit/templates/chat.html +45 -3
  73. iatoolkit/templates/forgot_password.html +3 -2
  74. iatoolkit/templates/onboarding_shell.html +1 -2
  75. iatoolkit/templates/signup.html +3 -0
  76. iatoolkit/views/base_login_view.py +8 -3
  77. iatoolkit/views/change_password_view.py +1 -1
  78. iatoolkit/views/chat_view.py +76 -0
  79. iatoolkit/views/forgot_password_view.py +9 -4
  80. iatoolkit/views/history_api_view.py +3 -3
  81. iatoolkit/views/home_view.py +4 -2
  82. iatoolkit/views/init_context_api_view.py +1 -1
  83. iatoolkit/views/llmquery_api_view.py +4 -3
  84. iatoolkit/views/load_company_configuration_api_view.py +49 -0
  85. iatoolkit/views/{file_store_api_view.py → load_document_api_view.py} +15 -11
  86. iatoolkit/views/login_view.py +25 -8
  87. iatoolkit/views/logout_api_view.py +10 -2
  88. iatoolkit/views/prompt_api_view.py +1 -1
  89. iatoolkit/views/rag_api_view.py +216 -0
  90. iatoolkit/views/root_redirect_view.py +22 -0
  91. iatoolkit/views/signup_view.py +12 -4
  92. iatoolkit/views/static_page_view.py +27 -0
  93. iatoolkit/views/users_api_view.py +33 -0
  94. iatoolkit/views/verify_user_view.py +1 -1
  95. iatoolkit-1.4.2.dist-info/METADATA +268 -0
  96. iatoolkit-1.4.2.dist-info/RECORD +133 -0
  97. iatoolkit-1.4.2.dist-info/licenses/LICENSE_COMMUNITY.md +15 -0
  98. iatoolkit/repositories/tasks_repo.py +0 -52
  99. iatoolkit/services/history_service.py +0 -37
  100. iatoolkit/services/search_service.py +0 -55
  101. iatoolkit/services/tasks_service.py +0 -188
  102. iatoolkit/templates/about.html +0 -13
  103. iatoolkit/templates/index.html +0 -145
  104. iatoolkit/templates/login_simulation.html +0 -45
  105. iatoolkit/views/external_login_view.py +0 -73
  106. iatoolkit/views/index_view.py +0 -14
  107. iatoolkit/views/login_simulation_view.py +0 -93
  108. iatoolkit/views/tasks_api_view.py +0 -72
  109. iatoolkit/views/tasks_review_api_view.py +0 -55
  110. iatoolkit-0.71.4.dist-info/METADATA +0 -276
  111. iatoolkit-0.71.4.dist-info/RECORD +0 -122
  112. {iatoolkit-0.71.4.dist-info → iatoolkit-1.4.2.dist-info}/WHEEL +0 -0
  113. {iatoolkit-0.71.4.dist-info → iatoolkit-1.4.2.dist-info}/licenses/LICENSE +0 -0
  114. {iatoolkit-0.71.4.dist-info → iatoolkit-1.4.2.dist-info}/top_level.txt +0 -0
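
Several modules were moved in this release (items 12, 13, 16, 17, 43, 47 and 85 above), so downstream imports need updating. A minimal before/after sketch, assuming the exported names themselves are unchanged (the two new paths below appear verbatim in the diff that follows):

```python
# iatoolkit 0.71.4 (old module paths)
# from iatoolkit.infra.llm_client import llmClient
# from iatoolkit.services.prompt_manager_service import PromptService

# iatoolkit 1.4.2 (new module paths)
from iatoolkit.services.llm_client_service import llmClient
from iatoolkit.services.prompt_service import PromptService
```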
iatoolkit/services/query_service.py
@@ -3,21 +3,20 @@
 #
 # IAToolkit is open source software.
 
-from iatoolkit.infra.llm_client import llmClient
+from iatoolkit.services.llm_client_service import llmClient
 from iatoolkit.services.profile_service import ProfileService
-from iatoolkit.repositories.document_repo import DocumentRepo
 from iatoolkit.repositories.profile_repo import ProfileRepo
+from iatoolkit.services.tool_service import ToolService
 from iatoolkit.services.document_service import DocumentService
 from iatoolkit.services.company_context_service import CompanyContextService
 from iatoolkit.services.i18n_service import I18nService
 from iatoolkit.services.configuration_service import ConfigurationService
-from iatoolkit.repositories.llm_query_repo import LLMQueryRepo
-from iatoolkit.repositories.models import Task
 from iatoolkit.services.dispatcher_service import Dispatcher
-from iatoolkit.services.prompt_manager_service import PromptService
+from iatoolkit.services.prompt_service import PromptService
 from iatoolkit.services.user_session_context_service import UserSessionContextService
+from iatoolkit.services.history_manager_service import HistoryManagerService
+from iatoolkit.common.model_registry import ModelRegistry
 from iatoolkit.common.util import Utility
-from iatoolkit.common.exceptions import IAToolkitException
 from injector import inject
 import base64
 import logging
@@ -25,34 +24,42 @@ from typing import Optional
 import json
 import time
 import hashlib
-import os
+from dataclasses import dataclass
 
 
-GEMINI_MAX_TOKENS_CONTEXT_HISTORY = 200000
+@dataclass
+class HistoryHandle:
+    """Encapsulates the state needed to manage history for a single turn."""
+    company_short_name: str
+    user_identifier: str
+    type: str
+    model: str | None = None
+    request_params: dict = None
+
 
 class QueryService:
     @inject
     def __init__(self,
+                 dispatcher: Dispatcher,
+                 tool_service: ToolService,
                  llm_client: llmClient,
                  profile_service: ProfileService,
                  company_context_service: CompanyContextService,
                  document_service: DocumentService,
-                 document_repo: DocumentRepo,
-                 llmquery_repo: LLMQueryRepo,
                  profile_repo: ProfileRepo,
                  prompt_service: PromptService,
                  i18n_service: I18nService,
-                 util: Utility,
-                 dispatcher: Dispatcher,
                  session_context: UserSessionContextService,
-                 configuration_service: ConfigurationService
+                 configuration_service: ConfigurationService,
+                 history_manager: HistoryManagerService,
+                 util: Utility,
+                 model_registry: ModelRegistry
                  ):
         self.profile_service = profile_service
         self.company_context_service = company_context_service
         self.document_service = document_service
-        self.document_repo = document_repo
-        self.llmquery_repo = llmquery_repo
         self.profile_repo = profile_repo
+        self.tool_service = tool_service
         self.prompt_service = prompt_service
         self.i18n_service = i18n_service
         self.util = util
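
The HistoryHandle dataclass added above carries per-turn history state between QueryService and the new HistoryManagerService. A minimal construction sketch; the field values are hypothetical, and in the real flow request_params is filled in later by populate_request_params:

```python
from dataclasses import dataclass

@dataclass
class HistoryHandle:
    """Per-turn history state (mirrors the definition added in this diff)."""
    company_short_name: str
    user_identifier: str
    type: str                    # client-side vs. server-side history marker
    model: str | None = None
    request_params: dict = None  # populated later by the history manager

# Hypothetical values, for illustration only:
handle = HistoryHandle(
    company_short_name="acme",
    user_identifier="user-42",
    type="client_side",
    model="gemini-1.5-pro",
)
```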
@@ -60,35 +67,114 @@ class QueryService:
         self.session_context = session_context
         self.configuration_service = configuration_service
         self.llm_client = llm_client
+        self.history_manager = history_manager
+        self.model_registry = model_registry
 
-        # get the model from the environment variable
-        self.default_model = os.getenv("LLM_MODEL", "")
-        if not self.default_model:
-            raise IAToolkitException(IAToolkitException.ErrorType.API_KEY,
-                                     "missing ENV variable 'LLM_MODEL' configuration.")
 
-    def init_context(self, company_short_name: str,
-                     user_identifier: str,
-                     model: str = None) -> dict:
+    def _resolve_model(self, company_short_name: str, model: Optional[str]) -> str:
+        # Priority: 1. Explicit model -> 2. Company config
+        effective_model = model
+        if not effective_model:
+            llm_config = self.configuration_service.get_configuration(company_short_name, 'llm')
+            if llm_config and llm_config.get('model'):
+                effective_model = llm_config['model']
+        return effective_model
+
+    def _get_history_type(self, model: str) -> str:
+        history_type_str = self.model_registry.get_history_type(model)
+        if history_type_str == "server_side":
+            return HistoryManagerService.TYPE_SERVER_SIDE
+        else:
+            return HistoryManagerService.TYPE_CLIENT_SIDE
+
+
+    def _build_user_facing_prompt(self, company, user_identifier: str,
+                                  client_data: dict, files: list,
+                                  prompt_name: Optional[str], question: str):
+        # get the user profile data from the session context
+        user_profile = self.profile_service.get_profile_by_identifier(company.short_name, user_identifier)
+
+        # combine client_data with user_profile
+        final_client_data = (user_profile or {}).copy()
+        final_client_data.update(client_data)
+
+        # Load attached files into the context
+        files_context = self.load_files_for_context(files)
+
+        # Initialize prompt_content. It will be an empty string for direct questions.
+        main_prompt = ""
+        # Use a local variable for the question so that what 'question' means
+        # stays unambiguous in each context (strings are immutable anyway).
+        effective_question = question
+
+        if prompt_name:
+            question_dict = {'prompt': prompt_name, 'data': final_client_data}
+            effective_question = json.dumps(question_dict)
+            prompt_content = self.prompt_service.get_prompt_content(company, prompt_name)
+
+            # Render the user-requested prompt
+            main_prompt = self.util.render_prompt_from_string(
+                template_string=prompt_content,
+                question=effective_question,
+                client_data=final_client_data,
+                user_identifier=user_identifier,
+                company=company,
+            )
 
-        # 1. Execute the forced rebuild sequence using the unified identifier.
-        self.session_context.clear_all_context(company_short_name, user_identifier)
-        logging.info(f"Context for {company_short_name}/{user_identifier} has been cleared.")
+        # This is the final user-facing prompt for this specific turn
+        user_turn_prompt = f"{main_prompt}\n{files_context}"
+        if not prompt_name:
+            user_turn_prompt += f"\n### La pregunta que debes responder es: {effective_question}"
+        else:
+            user_turn_prompt += f'\n### Contexto Adicional: El usuario ha aportado este contexto puede ayudar: {effective_question}'
+
+        return user_turn_prompt, effective_question
+
+    def _ensure_valid_history(self, company,
+                              user_identifier: str,
+                              effective_model: str,
+                              user_turn_prompt: str,
+                              ignore_history: bool
+                              ) -> tuple[Optional[HistoryHandle], Optional[dict]]:
+        """
+        Manages the history strategy and rebuilds context if necessary.
+        Returns: (HistoryHandle, error_response)
+        """
+        history_type = self._get_history_type(effective_model)
 
-        # 2. LLM context is clean, now we can load it again
-        self.prepare_context(
-            company_short_name=company_short_name,
-            user_identifier=user_identifier
+        # Initialize the handle with base context info
+        handle = HistoryHandle(
+            company_short_name=company.short_name,
+            user_identifier=user_identifier,
+            type=history_type,
+            model=effective_model
         )
 
-        # 3. communicate the new context to the LLM
-        response = self.set_context_for_llm(
-            company_short_name=company_short_name,
-            user_identifier=user_identifier,
-            model=model
+        # pass the handle to populate request_params
+        needs_rebuild = self.history_manager.populate_request_params(
+            handle, user_turn_prompt, ignore_history
         )
 
-        return response
+        if needs_rebuild:
+            logging.warning(f"No valid history for {company.short_name}/{user_identifier}. Rebuilding context...")
+
+            # try to rebuild the context
+            self.prepare_context(company_short_name=company.short_name, user_identifier=user_identifier)
+            self.set_context_for_llm(company_short_name=company.short_name, user_identifier=user_identifier,
+                                     model=effective_model)
+
+            # Retry populating params with the same handle
+            needs_rebuild = self.history_manager.populate_request_params(
+                handle, user_turn_prompt, ignore_history
+            )
+
+            if needs_rebuild:
+                error_key = 'errors.services.context_rebuild_failed'
+                error_message = self.i18n_service.t(error_key, company_short_name=company.short_name,
+                                                    user_identifier=user_identifier)
+                return None, {'error': True, "error_message": error_message}
+
+        return handle, None
 
     def _build_context_and_profile(self, company_short_name: str, user_identifier: str) -> tuple:
         # this method reads the user/company context from the database and renders the system prompt
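
Note that the extracted _resolve_model helper drops the third fallback that 0.71.4 had (the LLM_MODEL environment variable, whose absence raised an IAToolkitException at startup); resolution is now explicit model first, then company configuration. A standalone sketch of the same precedence rule with a stubbed config lookup (the function and variable names here are illustrative, not part of the package):

```python
from typing import Optional

def resolve_model(explicit_model: Optional[str],
                  company_llm_config: Optional[dict]) -> Optional[str]:
    """Priority: 1. explicit model -> 2. company 'llm' config; may return None."""
    if explicit_model:
        return explicit_model
    if company_llm_config and company_llm_config.get('model'):
        return company_llm_config['model']
    return None

# Hypothetical model names, for illustration:
assert resolve_model("gpt-4o", {"model": "gemini-1.5-pro"}) == "gpt-4o"
assert resolve_model(None, {"model": "gemini-1.5-pro"}) == "gemini-1.5-pro"
assert resolve_model(None, None) is None
```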
@@ -106,7 +192,7 @@ class QueryService:
             question=None,
             client_data=user_profile,
             company=company,
-            service_list=self.dispatcher.get_company_services(company)
+            service_list=self.tool_service.get_tools_for_llm(company)
         )
 
         # get the company context: schemas, database models, .md files
@@ -117,6 +203,44 @@
 
         return final_system_context, user_profile
 
+
+    def init_context(self, company_short_name: str,
+                     user_identifier: str,
+                     model: str = None) -> dict:
+        """
+        Forces a context rebuild for a given user and (optionally) model.
+
+        - Clears LLM-related context for the resolved model.
+        - Regenerates the static company/user context.
+        - Sends the context to the LLM for that model.
+        """
+
+        # 1. Resolve the effective model for this user/company
+        effective_model = self._resolve_model(company_short_name, model)
+
+        # 2. Clear only the LLM-related context for this model
+        self.session_context.clear_all_context(company_short_name, user_identifier, model=effective_model)
+        logging.info(
+            f"Context for {company_short_name}/{user_identifier} "
+            f"(model={effective_model}) has been cleared."
+        )
+
+        # 3. Static LLM context is now clean; prepare it again (model-agnostic)
+        self.prepare_context(
+            company_short_name=company_short_name,
+            user_identifier=user_identifier
+        )
+
+        # 4. Communicate the new context to the specific LLM model
+        response = self.set_context_for_llm(
+            company_short_name=company_short_name,
+            user_identifier=user_identifier,
+            model=effective_model
+        )
+
+        return response
+
+
     def prepare_context(self, company_short_name: str, user_identifier: str) -> dict:
         # prepare the context and decide if it needs to be rebuilt
         # save the generated context in the session context for later use
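
A hedged usage sketch of the reworked init_context; the company and user identifiers are hypothetical, and query_service is assumed to be a fully wired QueryService obtained from the injector:

```python
# Force a context rebuild for one user. Passing model=None lets
# _resolve_model fall back to the company's 'llm' configuration.
response = query_service.init_context(
    company_short_name="acme",
    user_identifier="user-42",
    model=None,
)
```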
@@ -134,46 +258,42 @@
         # calculate the context version
         current_version = self._compute_context_version_from_string(final_system_context)
 
+        # get the current version from the session cache
         try:
            prev_version = self.session_context.get_context_version(company_short_name, user_identifier)
         except Exception:
            prev_version = None
 
-        rebuild_is_needed = not (prev_version and prev_version == current_version and
-                                 self._has_valid_cached_context(company_short_name, user_identifier))
-
-        if rebuild_is_needed:
-            # Save the prepared context and its version for `finalize_context_rebuild` to use.
-            self.session_context.save_prepared_context(company_short_name,
-                                                       user_identifier,
-                                                       final_system_context,
-                                                       current_version)
+        # Determine if we need to persist the prepared context again.
+        # If versions match, we assume the artifact is likely safe, but forcing a save
+        # on version mismatch ensures data consistency.
+        rebuild_is_needed = (prev_version != current_version)
 
+        # Save the prepared context and its version for `set_context_for_llm` to use.
+        self.session_context.save_prepared_context(company_short_name,
+                                                   user_identifier,
+                                                   final_system_context,
+                                                   current_version)
         return {'rebuild_needed': rebuild_is_needed}
 
     def set_context_for_llm(self,
                             company_short_name: str,
                             user_identifier: str,
                             model: str = ''):
-
-        # This service takes a pre-built context and sends it to the LLM
+        """
+        Takes a pre-built static context and sends it to the LLM for the given model.
+        Also initializes the model-specific history through HistoryManagerService.
+        """
         company = self.profile_repo.get_company_by_short_name(company_short_name)
         if not company:
             logging.error(f"Company not found: {company_short_name} in set_context_for_llm")
             return
 
         # --- Model Resolution ---
-        # Priority: 1. Explicit model -> 2. Company config -> 3. Global default
-        effective_model = model
-        if not effective_model:
-            llm_config = self.configuration_service.get_configuration(company_short_name, 'llm')
-            if llm_config and llm_config.get('model'):
-                effective_model = llm_config['model']
+        effective_model = self._resolve_model(company_short_name, model)
 
-        effective_model = effective_model or self.default_model
-
-        # blocking logic to avoid multiple requests for the same user/company at the same time
-        lock_key = f"lock:context:{company_short_name}/{user_identifier}"
+        # Lock per (company, user, model) to avoid concurrent rebuilds for the same model
+        lock_key = f"lock:context:{company_short_name}/{user_identifier}/{effective_model}"
         if not self.session_context.acquire_lock(lock_key, expire_seconds=60):
             logging.warning(
                 f"try to rebuild context for user {user_identifier} while is still in process, ignored.")
@@ -181,37 +301,29 @@
 
         try:
             start_time = time.time()
-            company = self.profile_repo.get_company_by_short_name(company_short_name)
 
             # get the prepared context and version from the session cache
-            prepared_context, version_to_save = self.session_context.get_and_clear_prepared_context(company_short_name,
-                                                                                                    user_identifier)
+            prepared_context, version_to_save = self.session_context.get_and_clear_prepared_context(company_short_name, user_identifier)
             if not prepared_context:
                 return
 
             logging.info(f"sending context to LLM model {effective_model} for: {company_short_name}/{user_identifier}...")
 
-            # clean only the chat history and the last response ID for this user/company
-            self.session_context.clear_llm_history(company_short_name, user_identifier)
-
-            response_id = ''
-            if self.util.is_gemini_model(effective_model):
-                context_history = [{"role": "user", "content": prepared_context}]
-                self.session_context.save_context_history(company_short_name, user_identifier, context_history)
-            elif self.util.is_openai_model(effective_model):
-                # Here is the call to the LLM client for settling the company/user context
-                response_id = self.llm_client.set_company_context(
-                    company=company,
-                    company_base_context=prepared_context,
-                    model=effective_model
-                )
-                self.session_context.save_last_response_id(company_short_name, user_identifier, response_id)
+            # --- Use Strategy Pattern for History/Context Initialization ---
+            history_type = self._get_history_type(effective_model)
+            response_data = self.history_manager.initialize_context(
+                company_short_name, user_identifier, history_type, prepared_context, company, effective_model
+            )
 
             if version_to_save:
                 self.session_context.save_context_version(company_short_name, user_identifier, version_to_save)
 
             logging.info(
                 f"Context for: {company_short_name}/{user_identifier} settled in {int(time.time() - start_time)} sec.")
+
+            # Return data (e.g., response_id) if the manager generated any
+            return response_data
+
         except Exception as e:
             logging.exception(f"Error in finalize_context_rebuild for {company_short_name}: {e}")
             raise e
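
HistoryManagerService.initialize_context replaces the inline provider branching deleted above (Gemini: seed a local context_history; OpenAI: call set_company_context and store the response_id). The manager itself is new in this release (history_manager_service.py, +208 lines) and is not shown in this diff, so the following is only a sketch of the dispatch shape implied by the deleted branches and the call site, not the actual implementation:

```python
# Sketch only: reconstructed from the deleted branches above, under the
# assumption that TYPE_CLIENT_SIDE/TYPE_SERVER_SIDE map onto them.
def initialize_context(self, company_short_name, user_identifier,
                       history_type, prepared_context, company, model):
    if history_type == self.TYPE_CLIENT_SIDE:
        # client-side history (old Gemini branch): seed the conversation locally
        context_history = [{"role": "user", "content": prepared_context}]
        self.session_context.save_context_history(company_short_name, user_identifier, context_history)
        return {'response_id': ''}

    # server-side history (old OpenAI branch): the provider holds the context
    response_id = self.llm_client.set_company_context(
        company=company, company_base_context=prepared_context, model=model)
    self.session_context.save_last_response_id(company_short_name, user_identifier, response_id)
    return {'response_id': response_id}
```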
@@ -219,18 +331,17 @@
             # release the lock
             self.session_context.release_lock(lock_key)
 
-        return {'response_id': response_id}
 
     def llm_query(self,
                   company_short_name: str,
                   user_identifier: str,
-                  task: Optional[Task] = None,
+                  model: Optional[str] = None,
                   prompt_name: str = None,
                   question: str = '',
                   client_data: dict = {},
-                  response_id: str = '',
-                  files: list = [],
-                  model: Optional[str] = None) -> dict:
+                  ignore_history: bool = False,
+                  files: list = []
+                  ) -> dict:
         try:
             company = self.profile_repo.get_company_by_short_name(short_name=company_short_name)
             if not company:
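
Callers of llm_query must adapt to the new signature: the task and response_id parameters are gone, and ignore_history takes their place. A before/after call sketch with hypothetical arguments:

```python
# 0.71.4: history was pinned via an explicit response_id
# result = query_service.llm_query("acme", "user-42",
#                                  question="What is the status of my order?",
#                                  response_id="resp_123")

# 1.4.2: history is managed per model by HistoryManagerService
result = query_service.llm_query(
    "acme", "user-42",
    model=None,            # optional explicit model override
    question="What is the status of my order?",
    ignore_history=False,  # True answers without prior turns
)
```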
@@ -242,86 +353,48 @@
                         "error_message": self.i18n_service.t('services.start_query')}
 
             # --- Model Resolution ---
-            # Priority: 1. Explicit model -> 2. Company config -> 3. Global default
-            effective_model = model
-            if not effective_model:
-                llm_config = self.configuration_service.get_configuration(company_short_name, 'llm')
-                if llm_config and llm_config.get('model'):
-                    effective_model = llm_config['model']
-
-            effective_model = effective_model or self.default_model
-
-            # get the previous response_id and context history
-            previous_response_id = None
-            context_history = self.session_context.get_context_history(company.short_name, user_identifier) or []
-
-            if self.util.is_openai_model(effective_model):
-                if response_id:
-                    # the context comes from this response_id
-                    previous_response_id = response_id
-                else:
-                    # use the full user history context
-                    previous_response_id = self.session_context.get_last_response_id(company.short_name, user_identifier)
-                    if not previous_response_id:
-                        return {'error': True,
-                                "error_message": self.i18n_service.t('errors.services.missing_response_id', company_short_name=company.short_name, user_identifier=user_identifier)
-                                }
-            elif self.util.is_gemini_model(effective_model):
-                # check the length of the context_history and remove old messages
-                self._trim_context_history(context_history)
-
-            # get the user profile data from the session context
-            user_profile = self.profile_service.get_profile_by_identifier(company.short_name, user_identifier)
-
-            # combine client_data with user_profile
-            final_client_data = (user_profile or {}).copy()
-            final_client_data.update(client_data)
-
-            # Load attached files into the context
-            files_context = self.load_files_for_context(files)
-
-            # Initialize prompt_content. It will be an empty string for direct questions.
-            main_prompt = ""
-            if prompt_name:
-                # For task-based queries, wrap data into a JSON string and get the specific prompt template
-                question_dict = {'prompt': prompt_name, 'data': final_client_data}
-                question = json.dumps(question_dict)
-                prompt_content = self.prompt_service.get_prompt_content(company, prompt_name)
-
-                # Render the main user prompt using the appropriate template (or an empty one)
-                main_prompt = self.util.render_prompt_from_string(
-                    template_string=prompt_content,
-                    question=question,
-                    client_data=final_client_data,
-                    user_identifier=user_identifier,
-                    company=company,
-                )
-
-            # This is the final user-facing prompt for this specific turn
-            user_turn_prompt = f"{main_prompt}\n{files_context}"
-            if not prompt_name:
-                user_turn_prompt += f"\n### La pregunta que debes responder es: {question}"
-            else:
-                user_turn_prompt += f'\n### Contexto Adicional: El usuario ha aportado este contexto puede ayudar: {question}'
-
-            # add to the history context
-            if self.util.is_gemini_model(effective_model):
-                context_history.append({"role": "user", "content": user_turn_prompt})
-
-            # service list for the function calls
-            tools = self.dispatcher.get_company_services(company)
+            effective_model = self._resolve_model(company_short_name, model)
+
+            # --- Build User-Facing Prompt ---
+            user_turn_prompt, effective_question = self._build_user_facing_prompt(
+                company=company,
+                user_identifier=user_identifier,
+                client_data=client_data,
+                files=files,
+                prompt_name=prompt_name,
+                question=question
+            )
+
+            # --- History Management (Strategy Pattern) ---
+            history_handle, error_response = self._ensure_valid_history(
+                company=company,
+                user_identifier=user_identifier,
+                effective_model=effective_model,
+                user_turn_prompt=user_turn_prompt,
+                ignore_history=ignore_history
+            )
+            if error_response:
+                return error_response
+
+            # get the tools available for this company
+            tools = self.tool_service.get_tools_for_llm(company)
 
             # openai structured output instructions
             output_schema = {}
 
+            # Safely extract parameters for invoke using the handle.
+            # The handle is guaranteed to have request_params populated if no error was returned.
+            previous_response_id = history_handle.request_params.get('previous_response_id')
+            context_history = history_handle.request_params.get('context_history')
+
 
             # Now send the instructions to the llm
             response = self.llm_client.invoke(
                 company=company,
                 user_identifier=user_identifier,
                 model=effective_model,
                 previous_response_id=previous_response_id,
-                context_history=context_history if self.util.is_gemini_model(effective_model) else None,
-                question=question,
+                context_history=context_history,
+                question=effective_question,
                 context=user_turn_prompt,
                 tools=tools,
                 text=output_schema
330
403
  if not response.get('valid_response'):
331
404
  response['error'] = True
332
405
 
333
- # save last_response_id for the history chain
334
- if "response_id" in response:
335
- self.session_context.save_last_response_id(company.short_name, user_identifier, response["response_id"])
336
- if self.util.is_gemini_model(effective_model):
337
- self.session_context.save_context_history(company.short_name, user_identifier, context_history)
406
+ # save history using the manager passing the handle
407
+ self.history_manager.update_history(
408
+ history_handle, user_turn_prompt, response
409
+ )
338
410
 
339
411
  return response
340
412
  except Exception as e:
@@ -348,23 +420,6 @@
         except Exception:
             return "unknown"
 
-    def _has_valid_cached_context(self, company_short_name: str, user_identifier: str) -> bool:
-        """
-        Checks whether a reusable context state exists in the session.
-        - OpenAI: last_response_id present.
-        - Gemini: context_history with at least 1 message.
-        """
-        try:
-            if self.util.is_openai_model(self.default_model):
-                prev_id = self.session_context.get_last_response_id(company_short_name, user_identifier)
-                return bool(prev_id)
-            if self.util.is_gemini_model(self.default_model):
-                history = self.session_context.get_context_history(company_short_name, user_identifier) or []
-                return len(history) >= 1
-            return False
-        except Exception as e:
-            logging.warning(f"error verifying context cache: {e}")
-            return False
 
     def load_files_for_context(self, files: list) -> str:
         """
@@ -381,7 +436,7 @@
         """
         for document in files:
             # Support both 'file_id' and 'filename' for robustness
-            filename = document.get('file_id') or document.get('filename')
+            filename = document.get('file_id') or document.get('filename') or document.get('name')
             if not filename:
                 context += "\n<error>Documento adjunto sin nombre ignorado.</error>\n"
                 continue
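
The attachment lookup now accepts a third key, name, in addition to file_id and filename. A tiny illustration of the fallback chain (the dicts are hypothetical):

```python
documents = [
    {"file_id": "a1.pdf"},    # matched via 'file_id'
    {"filename": "b2.xlsx"},  # matched via 'filename'
    {"name": "c3.csv"},       # newly matched via 'name' in 1.4.2
    {},                       # no usable key -> flagged and skipped
]
for document in documents:
    filename = document.get('file_id') or document.get('filename') or document.get('name')
    print(filename)  # a1.pdf, b2.xlsx, c3.csv, None
```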
@@ -410,32 +465,3 @@
 
         return context
 
-    def _trim_context_history(self, context_history: list):
-        """
-        Checks the size of the context history and removes the oldest messages
-        if it exceeds a threshold, always preserving the system message (index 0).
-        """
-        if not context_history or len(context_history) <= 1:
-            return  # nothing to trim
-
-        # calculate total tokens
-        try:
-            total_tokens = sum(self.llm_client.count_tokens(json.dumps(message)) for message in context_history)
-        except Exception as e:
-            logging.error(f"error counting tokens for history: {e}.")
-            return
-
-        # If the limit is exceeded, remove old messages (starting with the second one)
-        while total_tokens > GEMINI_MAX_TOKENS_CONTEXT_HISTORY and len(context_history) > 1:
-            try:
-                # Remove the oldest message after the system prompt
-                removed_message = context_history.pop(1)
-                removed_tokens = self.llm_client.count_tokens(json.dumps(removed_message))
-                total_tokens -= removed_tokens
-                logging.warning(
-                    f"history tokens ({total_tokens + removed_tokens} tokens) exceed the limit of: {GEMINI_MAX_TOKENS_CONTEXT_HISTORY}. "
-                    f"new context: {total_tokens} tokens."
-                )
-            except IndexError:
-                # Happens if only the system message remains; the loop should stop.
-                break