PyPI - h2ogpte - Versions diffs - 1.6.42__py3-none-any.whl → 1.6.43rc1__py3-none-any.whl - Mend

h2ogpte 1.6.42__py3-none-any.whl → 1.6.43rc1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (98)

h2ogpte/__init__.py +1 -1
h2ogpte/cli/__init__.py +0 -0
h2ogpte/cli/commands/__init__.py +0 -0
h2ogpte/cli/commands/command_handlers/__init__.py +0 -0
h2ogpte/cli/commands/command_handlers/agent.py +41 -0
h2ogpte/cli/commands/command_handlers/chat.py +37 -0
h2ogpte/cli/commands/command_handlers/clear.py +8 -0
h2ogpte/cli/commands/command_handlers/collection.py +67 -0
h2ogpte/cli/commands/command_handlers/config.py +113 -0
h2ogpte/cli/commands/command_handlers/disconnect.py +36 -0
h2ogpte/cli/commands/command_handlers/exit.py +37 -0
h2ogpte/cli/commands/command_handlers/help.py +8 -0
h2ogpte/cli/commands/command_handlers/history.py +29 -0
h2ogpte/cli/commands/command_handlers/rag.py +146 -0
h2ogpte/cli/commands/command_handlers/research_agent.py +45 -0
h2ogpte/cli/commands/command_handlers/session.py +77 -0
h2ogpte/cli/commands/command_handlers/status.py +33 -0
h2ogpte/cli/commands/dispatcher.py +79 -0
h2ogpte/cli/core/__init__.py +0 -0
h2ogpte/cli/core/app.py +105 -0
h2ogpte/cli/core/config.py +199 -0
h2ogpte/cli/core/encryption.py +104 -0
h2ogpte/cli/core/session.py +171 -0
h2ogpte/cli/integrations/__init__.py +0 -0
h2ogpte/cli/integrations/agent.py +338 -0
h2ogpte/cli/integrations/rag.py +442 -0
h2ogpte/cli/main.py +90 -0
h2ogpte/cli/ui/__init__.py +0 -0
h2ogpte/cli/ui/hbot_prompt.py +435 -0
h2ogpte/cli/ui/prompts.py +129 -0
h2ogpte/cli/ui/status_bar.py +133 -0
h2ogpte/cli/utils/__init__.py +0 -0
h2ogpte/cli/utils/file_manager.py +411 -0
h2ogpte/h2ogpte.py +471 -67
h2ogpte/h2ogpte_async.py +482 -68
h2ogpte/h2ogpte_sync_base.py +8 -1
h2ogpte/rest_async/__init__.py +6 -3
h2ogpte/rest_async/api/chat_api.py +29 -0
h2ogpte/rest_async/api/collections_api.py +293 -0
h2ogpte/rest_async/api/extractors_api.py +2874 -70
h2ogpte/rest_async/api/prompt_templates_api.py +32 -32
h2ogpte/rest_async/api_client.py +1 -1
h2ogpte/rest_async/configuration.py +1 -1
h2ogpte/rest_async/models/__init__.py +5 -2
h2ogpte/rest_async/models/chat_completion.py +4 -2
h2ogpte/rest_async/models/chat_completion_delta.py +5 -3
h2ogpte/rest_async/models/chat_completion_request.py +1 -1
h2ogpte/rest_async/models/chat_session.py +4 -2
h2ogpte/rest_async/models/chat_settings.py +1 -1
h2ogpte/rest_async/models/collection.py +4 -2
h2ogpte/rest_async/models/collection_create_request.py +4 -2
h2ogpte/rest_async/models/create_chat_session_request.py +87 -0
h2ogpte/rest_async/models/extraction_request.py +1 -1
h2ogpte/rest_async/models/extractor.py +4 -2
h2ogpte/rest_async/models/guardrails_settings.py +8 -4
h2ogpte/rest_async/models/guardrails_settings_create_request.py +1 -1
h2ogpte/rest_async/models/process_document_job_request.py +1 -1
h2ogpte/rest_async/models/question_request.py +1 -1
h2ogpte/rest_async/models/{reset_and_share_prompt_template_request.py → reset_and_share_request.py} +6 -6
h2ogpte/{rest_sync/models/reset_and_share_prompt_template_with_groups_request.py → rest_async/models/reset_and_share_with_groups_request.py} +6 -6
h2ogpte/rest_async/models/summarize_request.py +1 -1
h2ogpte/rest_async/models/update_collection_workspace_request.py +87 -0
h2ogpte/rest_async/models/update_extractor_privacy_request.py +87 -0
h2ogpte/rest_sync/__init__.py +6 -3
h2ogpte/rest_sync/api/chat_api.py +29 -0
h2ogpte/rest_sync/api/collections_api.py +293 -0
h2ogpte/rest_sync/api/extractors_api.py +2874 -70
h2ogpte/rest_sync/api/prompt_templates_api.py +32 -32
h2ogpte/rest_sync/api_client.py +1 -1
h2ogpte/rest_sync/configuration.py +1 -1
h2ogpte/rest_sync/models/__init__.py +5 -2
h2ogpte/rest_sync/models/chat_completion.py +4 -2
h2ogpte/rest_sync/models/chat_completion_delta.py +5 -3
h2ogpte/rest_sync/models/chat_completion_request.py +1 -1
h2ogpte/rest_sync/models/chat_session.py +4 -2
h2ogpte/rest_sync/models/chat_settings.py +1 -1
h2ogpte/rest_sync/models/collection.py +4 -2
h2ogpte/rest_sync/models/collection_create_request.py +4 -2
h2ogpte/rest_sync/models/create_chat_session_request.py +87 -0
h2ogpte/rest_sync/models/extraction_request.py +1 -1
h2ogpte/rest_sync/models/extractor.py +4 -2
h2ogpte/rest_sync/models/guardrails_settings.py +8 -4
h2ogpte/rest_sync/models/guardrails_settings_create_request.py +1 -1
h2ogpte/rest_sync/models/process_document_job_request.py +1 -1
h2ogpte/rest_sync/models/question_request.py +1 -1
h2ogpte/rest_sync/models/{reset_and_share_prompt_template_request.py → reset_and_share_request.py} +6 -6
h2ogpte/{rest_async/models/reset_and_share_prompt_template_with_groups_request.py → rest_sync/models/reset_and_share_with_groups_request.py} +6 -6
h2ogpte/rest_sync/models/summarize_request.py +1 -1
h2ogpte/rest_sync/models/update_collection_workspace_request.py +87 -0
h2ogpte/rest_sync/models/update_extractor_privacy_request.py +87 -0
h2ogpte/session.py +3 -2
h2ogpte/session_async.py +22 -6
h2ogpte/types.py +6 -0
{h2ogpte-1.6.42.dist-info → h2ogpte-1.6.43rc1.dist-info}/METADATA +5 -1
{h2ogpte-1.6.42.dist-info → h2ogpte-1.6.43rc1.dist-info}/RECORD +98 -59
h2ogpte-1.6.43rc1.dist-info/entry_points.txt +2 -0
{h2ogpte-1.6.42.dist-info → h2ogpte-1.6.43rc1.dist-info}/WHEEL +0 -0
{h2ogpte-1.6.42.dist-info → h2ogpte-1.6.43rc1.dist-info}/top_level.txt +0 -0

h2ogpte/h2ogpte.py CHANGED

@@ -1,7 +1,7 @@
 # This file was generated from `h2ogpte_async.py` by executing `make generate-sync-mux-py`.
 from pathlib import Path
-from typing import Iterable, Any, Union, List, Dict, Tuple
+from typing import Iterable, Any, Union, List, Dict, Tuple, Callable
 from h2ogpte.types import *
 from h2ogpte.errors import *
 from h2ogpte.connectors import *
@@ -92,19 +92,65 @@ class H2OGPTE(H2OGPTESyncBase):
                 Default value is to use the first model (0th index).
             llm_args:
                 Dictionary of kwargs to pass to the llm. Valid keys:
+                    # Core generation parameters
                     temperature (float, default: 0) — The value used to modulate the next token probabilities. Most deterministic: 0, Most creative: 1
-                    seed (int, default: 0) — The seed for the random number generator, only used if temperature > 0, seed=0 will pick a random number for each call, seed > 0 will be fixed.
-                    top_k (int, default: 1) — The number of highest probability vocabulary tokens to keep for top-k-filtering.
-                    top_p (float, default: 1.0) — If set to float < 1, only the smallest set of most probable tokens with probabilities that add up to top_p or higher are kept for generation.
-                    repetition_penalty (float, default: 1.07) — The parameter for repetition penalty. 1.0 means no penalty.
-                    max_new_tokens (int, default: 1024) — Maximum number of new tokens to generate. This limit applies to each (map+reduce) step during summarization and each (map) step during extraction.
-                    min_max_new_tokens (int, default: 512) — minimum value for max_new_tokens when auto-adjusting for content of prompt, docs, etc.
-                    response_format (str, default: "text") — Output type, one of ["text", "json_object", "json_code"].
-                    guided_json (dict, default: None) — If specified, the output will follow the JSON schema.
-                    guided_regex (str, default: "") — If specified, the output will follow the regex pattern. Only for models that support guided generation: check output of get_llms() for guided_vllm flag.
-                    guided_choice (Optional[List[str]], default: None — If specified, the output will be exactly one of the choices. Only for models that support guided generation: check output of get_llms() for guided_vllm flag.
-                    guided_grammar (str, default: "") — If specified, the output will follow the context free grammar. Only for models that support guided generation: check output of get_llms() for guided_vllm flag.
-                    guided_whitespace_pattern (str, default: "") — If specified, will override the default whitespace pattern for guided json decoding. Only for models that support guided generation: check output of get_llms() for guided_vllm flag.
+                    seed (int, default: 0) — The seed for the random number generator, only used if temperature > 0, seed=0 will pick a random number for each call, seed > 0 will be fixed
+                    top_k (int, default: 1) — The number of highest probability vocabulary tokens to keep for top-k-filtering
+                    top_p (float, default: 1.0) — If set to float < 1, only the smallest set of most probable tokens with probabilities that add up to top_p or higher are kept for generation
+                    repetition_penalty (float, default: 1.07) — The parameter for repetition penalty. 1.0 means no penalty
+                    max_new_tokens (int, default: 1024) — Maximum number of new tokens to generate. This limit applies to each (map+reduce) step during summarization and each (map) step during extraction
+                    min_max_new_tokens (int, default: 512) — Minimum value for max_new_tokens when auto-adjusting for content of prompt, docs, etc.
+                    min_chars_per_yield (int) — Minimum number of characters to yield at a time during streaming
+                    reasoning_effort (int, default: 0) — Level of reasoning effort for the model (higher values = deeper reasoning, e.g., 10000-65000). Use for models that support chain-of-thought reasoning. 0 means no additional reasoning effort
+                    # Output format parameters
+                    response_format (str, default: "text") — Output type, one of ["text", "json_object", "json_code"]
+                    guided_json (dict, default: None) — If specified, the output will follow the JSON schema
+                    guided_regex (str, default: "") — If specified, the output will follow the regex pattern. Only for models that support guided generation: check output of get_llms() for guided_vllm flag
+                    guided_choice (Optional[List[str]], default: None) — If specified, the output will be exactly one of the choices. Only for models that support guided generation
+                    guided_grammar (str, default: "") — If specified, the output will follow the context free grammar. Only for models that support guided generation
+                    guided_whitespace_pattern (str, default: "") — If specified, will override the default whitespace pattern for guided json decoding. Only for models that support guided generation
+                    json_preserve_system_prompt (bool) — Whether to preserve the system prompt when using JSON response format
+                    # Vision and image parameters
+                    images_num_max (int) — Maximum number of images to process
+                    visible_vision_models (list) — List of vision models that can be used
+                    # Agent parameters
+                    use_agent (bool, default: False) — Whether to enable agent functionality for advanced task processing with access to tools
+                    shared_agent (bool, default: False) — Whether to use shared agent instance across multiple requests for efficiency
+                    agent_type (str, default: "auto") — Type of agent to use. Options: ["auto", "agent_analysis", "agent_chat_history_md", "agent_code", "agent_rag"]
+                    selected_tool_type (str, default: "auto") — Type of tools to make available to the agent. Options: ["auto", "all", "any"] or specific tool names
+                    agent_accuracy (str, default: "standard") — Accuracy level for agent operations. Options:
+                        "quick" - Fastest, less verification (max_turns=10, timeout=30s)
+                        "basic" - Best for simple tasks (max_turns=20, timeout=60s)
+                        "standard" - Good for most tasks (max_turns=40, timeout=120s)
+                        "maximum" - Highest accuracy, can take a long time (max_turns=80, timeout=240s)
+                    agent_max_turns (Union[str, int], default: "auto") — Maximum number of back-and-forth turns the agent can take. Either "auto" or an integer
+                    agent_original_files (list) — List of file paths for agent to process and analyze
+                    agent_timeout (int) — Timeout in seconds for each individual agent turn/operation
+                    agent_total_timeout (int, default: 3600) — Total timeout in seconds for all agent operations combined
+                    agent_min_time (int) — Minimum time in seconds to run the agent before allowing completion
+                    agent_tools (Union[str, list], default: "auto") — List of specific tools available to the agent. Options: "auto", "all", "any", or list of tool names
+                    user_persona (str) — User persona description for agent context to customize agent behavior
+                    agent_code_writer_system_message (str) — Custom system message for code writing agent to guide code generation
+                    agent_code_restrictions_level (int) — Level of code execution restrictions for agent (typically 0 for unrestricted)
+                    agent_num_executable_code_blocks_limit (int) — Maximum number of code blocks the agent can execute in a single session
+                    agent_system_site_packages (bool, default: False) — Whether agent can use system site packages when executing code
+                    agent_main_model (str) — Main model to use for agent operations (e.g., specific LLM name)
+                    agent_max_stream_length (int, default: -1) — Maximum length for agent streaming responses, -1 for unlimited
+                    agent_max_memory_usage (int) — Maximum memory usage in bytes for agent operations
+                    agent_main_reasoning_effort (int) — Level of reasoning effort for main agent model (higher values = more reasoning, e.g., 10000)
+                    agent_advanced_reasoning_effort (int) — Level of reasoning effort for advanced agent operations (e.g., 20000)
+                    agent_max_confidence_level (int) — Maximum confidence level for agent decisions (typically 0, 1, or 2)
+                    agent_planning_forced_mode (bool) — Whether to force planning mode for agent (True to always plan first)
+                    agent_too_soon_forced_mode (bool) — Whether to force handling of premature agent decisions
+                    agent_critique_forced_mode (int) — Whether to force critique mode for agent self-evaluation
+                    agent_stream_files (bool, default: True) — Whether to stream files from agent operations for real-time updates
+                    # Other parameters
+                    max_time (int) — Maximum time in seconds for the operation
+                    client_metadata (dict) — Metadata to include with the request
             chat_conversation:
                 List of tuples for (human, bot) conversation that will be pre-appended
                 to an (question, None) case for a query.
@@ -216,18 +262,19 @@ class H2OGPTE(H2OGPTESyncBase):
             llm_args:
                 Dictionary of kwargs to pass to the llm. Valid keys:
                     temperature (float, default: 0) — The value used to modulate the next token probabilities. Most deterministic: 0, Most creative: 1
-                    seed (int, default: 0) — The seed for the random number generator, only used if temperature > 0, seed=0 will pick a random number for each call, seed > 0 will be fixed.
-                    top_k (int, default: 1) — The number of highest probability vocabulary tokens to keep for top-k-filtering.
-                    top_p (float, default: 1.0) — If set to float < 1, only the smallest set of most probable tokens with probabilities that add up to top_p or higher are kept for generation.
-                    repetition_penalty (float, default: 1.07) — The parameter for repetition penalty. 1.0 means no penalty.
-                    max_new_tokens (int, default: 1024) — Maximum number of new tokens to generate. This limit applies to each (map+reduce) step during summarization and each (map) step during extraction.
-                    min_max_new_tokens (int, default: 512) — minimum value for max_new_tokens when auto-adjusting for content of prompt, docs, etc.
-                    response_format (str, default: "text") — Output type, one of ["text", "json_object", "json_code"].
-                    guided_json (dict, default: None) — If specified, the output will follow the JSON schema.
-                    guided_regex (str, default: "") — If specified, the output will follow the regex pattern. Only for models that support guided generation: check output of get_llms() for guided_vllm flag.
-                    guided_choice (Optional[List[str]], default: None — If specified, the output will be exactly one of the choices. Only for models that support guided generation: check output of get_llms() for guided_vllm flag.
-                    guided_grammar (str, default: "") — If specified, the output will follow the context free grammar. Only for models that support guided generation: check output of get_llms() for guided_vllm flag.
-                    guided_whitespace_pattern (str, default: "") — If specified, will override the default whitespace pattern for guided json decoding. Only for models that support guided generation: check output of get_llms() for guided_vllm flag.
+                    seed (int, default: 0) — The seed for the random number generator, only used if temperature > 0, seed=0 will pick a random number for each call, seed > 0 will be fixed
+                    top_k (int, default: 1) — The number of highest probability vocabulary tokens to keep for top-k-filtering
+                    top_p (float, default: 1.0) — If set to float < 1, only the smallest set of most probable tokens with probabilities that add up to top_p or higher are kept for generation
+                    repetition_penalty (float, default: 1.07) — The parameter for repetition penalty. 1.0 means no penalty
+                    max_new_tokens (int, default: 1024) — Maximum number of new tokens to generate. This limit applies to each (map+reduce) step during summarization and each (map) step during extraction
+                    min_max_new_tokens (int, default: 512) — Minimum value for max_new_tokens when auto-adjusting for content of prompt, docs, etc.
+                    reasoning_effort (int, default: 0) — Level of reasoning effort for the model (higher values = deeper reasoning, e.g., 10000-65000). Use for models that support chain-of-thought reasoning. 0 means no additional reasoning effort
+                    response_format (str, default: "text") — Output type, one of ["text", "json_object", "json_code"]
+                    guided_json (dict, default: None) — If specified, the output will follow the JSON schema
+                    guided_regex (str, default: "") — If specified, the output will follow the regex pattern. Only for models that support guided generation
+                    guided_choice (Optional[List[str]], default: None) — If specified, the output will be exactly one of the choices. Only for models that support guided generation
+                    guided_grammar (str, default: "") — If specified, the output will follow the context free grammar. Only for models that support guided generation
+                    guided_whitespace_pattern (str, default: "") — If specified, will override the default whitespace pattern for guided json decoding. Only for models that support guided generation
             guardrails_settings:
                 Guardrails Settings.
             timeout:
@@ -326,18 +373,19 @@ class H2OGPTE(H2OGPTESyncBase):
             llm_args:
                 Dictionary of kwargs to pass to the llm. Valid keys:
                     temperature (float, default: 0) — The value used to modulate the next token probabilities. Most deterministic: 0, Most creative: 1
-                    seed (int, default: 0) — The seed for the random number generator, only used if temperature > 0, seed=0 will pick a random number for each call, seed > 0 will be fixed.
-                    top_k (int, default: 1) — The number of highest probability vocabulary tokens to keep for top-k-filtering.
-                    top_p (float, default: 1.0) — If set to float < 1, only the smallest set of most probable tokens with probabilities that add up to top_p or higher are kept for generation.
-                    repetition_penalty (float, default: 1.07) — The parameter for repetition penalty. 1.0 means no penalty.
-                    max_new_tokens (int, default: 1024) — Maximum number of new tokens to generate. This limit applies to each (map+reduce) step during summarization and each (map) step during extraction.
-                    min_max_new_tokens (int, default: 512) — minimum value for max_new_tokens when auto-adjusting for content of prompt, docs, etc.
-                    response_format (str, default: "text") — Output type, one of ["text", "json_object", "json_code"].
-                    guided_json (dict, default: None) — If specified, the output will follow the JSON schema.
-                    guided_regex (str, default: "") — If specified, the output will follow the regex pattern. Only for models that support guided generation: check output of get_llms() for guided_vllm flag.
-                    guided_choice (Optional[List[str]], default: None — If specified, the output will be exactly one of the choices. Only for models that support guided generation: check output of get_llms() for guided_vllm flag.
-                    guided_grammar (str, default: "") — If specified, the output will follow the context free grammar. Only for models that support guided generation: check output of get_llms() for guided_vllm flag.
-                    guided_whitespace_pattern (str, default: "") — If specified, will override the default whitespace pattern for guided json decoding. Only for models that support guided generation: check output of get_llms() for guided_vllm flag.
+                    seed (int, default: 0) — The seed for the random number generator, only used if temperature > 0, seed=0 will pick a random number for each call, seed > 0 will be fixed
+                    top_k (int, default: 1) — The number of highest probability vocabulary tokens to keep for top-k-filtering
+                    top_p (float, default: 1.0) — If set to float < 1, only the smallest set of most probable tokens with probabilities that add up to top_p or higher are kept for generation
+                    repetition_penalty (float, default: 1.07) — The parameter for repetition penalty. 1.0 means no penalty
+                    max_new_tokens (int, default: 1024) — Maximum number of new tokens to generate. This limit applies to each (map+reduce) step during summarization and each (map) step during extraction
+                    min_max_new_tokens (int, default: 512) — Minimum value for max_new_tokens when auto-adjusting for content of prompt, docs, etc.
+                    reasoning_effort (int, default: 0) — Level of reasoning effort for the model (higher values = deeper reasoning, e.g., 10000-65000). Use for models that support chain-of-thought reasoning. 0 means no additional reasoning effort
+                    response_format (str, default: "text") — Output type, one of ["text", "json_object", "json_code"]
+                    guided_json (dict, default: None) — If specified, the output will follow the JSON schema
+                    guided_regex (str, default: "") — If specified, the output will follow the regex pattern. Only for models that support guided generation
+                    guided_choice (Optional[List[str]], default: None) — If specified, the output will be exactly one of the choices. Only for models that support guided generation
+                    guided_grammar (str, default: "") — If specified, the output will follow the context free grammar. Only for models that support guided generation
+                    guided_whitespace_pattern (str, default: "") — If specified, will override the default whitespace pattern for guided json decoding. Only for models that support guided generation
             guardrails_settings:
                 Guardrails Settings.
             timeout:
@@ -649,13 +697,18 @@ class H2OGPTE(H2OGPTESyncBase):
         )
         return result
-    def create_chat_session(self, collection_id: Optional[str] = None) -> str:
+    def create_chat_session(
+        self, collection_id: Optional[str] = None, workspace: Optional[str] = None
+    ) -> str:
         """Creates a new chat session for asking questions (of documents).
         Args:
             collection_id:
                 String id of the collection to chat with.
                 If None, chat with LLM directly.
+            workspace:
+                String id of the workspace this chat will be associated with.
+                If None, the user's default workspace will be used.
         Returns:
             str: The ID of the newly created chat session.
@@ -664,7 +717,11 @@ class H2OGPTE(H2OGPTESyncBase):
         with self._RESTClient(self) as rest_client:
             response = _rest_to_client_exceptions(
                 lambda: rest_client.chat_api.create_chat_session(
-                    collection_id=collection_id, _headers=header
+                    collection_id=collection_id,
+                    create_chat_session_request=rest.CreateChatSessionRequest(
+                        workspace=workspace,
+                    ),
+                    _headers=header,
                 )
             )
             return response.id
@@ -679,7 +736,8 @@ class H2OGPTE(H2OGPTESyncBase):
         with self._RESTClient(self) as rest_client:
             response = _rest_to_client_exceptions(
                 lambda: rest_client.chat_api.create_chat_session(
-                    collection_id="default", _headers=header
+                    collection_id="default",
+                    _headers=header,
                 )
             )
         return response.id
@@ -766,6 +824,7 @@ class H2OGPTE(H2OGPTESyncBase):
         collection_settings: Union[dict, None] = None,
         thumbnail: Union[Path, None] = None,
         chat_settings: Union[dict, None] = None,
+        workspace: Union[str, None] = None,
     ) -> str:
         r"""Creates a new collection.
@@ -812,8 +871,8 @@ class H2OGPTE(H2OGPTESyncBase):
                     guardrails_labels_to_flag: list of entities to be flagged as safety violations in user prompts. Must be a subset of guardrails_entities, if provided.
                     guardrails_safe_category: (Optional) name of the safe category for guardrails. Must be a key in guardrails_entities, if provided. Otherwise uses system defaults.
                     guardrails_entities: (Optional) dictionary of entities and their descriptions for the guardrails model to classify. The first entry is the "safe" class, the rest are "unsafe" classes.
-                    column_redaction_custom_entities_to_flag: list of entities to redact in tabular data files. Must be a subset of column_redaction_custom_entities, if provided.
-                    column_redaction_custom_entities: (Optional) dictionary of entities and a short description for the LLM to check for and redact columns containing PII in tabular data files.
+                    custom_pii_entities_to_flag: list of entities to redact in tabular data files. Must be a subset of custom_pii_entities, if provided.
+                    custom_pii_entities: (Optional) dictionary of entities and a short description for the LLM to check for and redact columns containing PII in tabular data files.
                     guardrails_llm: LLM to use for guardrails and PII detection. Use "auto" for automatic. Use `H2OGPTE.get_llms()` to see all available options.
                 Example:
                     Note: Call client.get_guardrails_settings() to see all options for guardrails_settings.
@@ -845,10 +904,10 @@ class H2OGPTE(H2OGPTESyncBase):
                                 "Intellectual Property": "Messages that may violate the intellectual property rights of any third party",
                                 "Code Interpreter Abuse": "Messages that seek to abuse code interpreters, including those that enable denial of service attacks, container escapes or privilege escalation exploits",
                             },
-                            column_redaction_custom_entities_to_flag=[
+                            custom_pii_entities_to_flag=[
                                 "Mother's Maiden Name"
                             ],
-                            column_redaction_custom_entities={
+                            custom_pii_entities={
                                 "Mother's Maiden Name": "Mother's maiden name."
                             },
                             guardrails_llm="meta-llama/Llama-3.3-70B-Instruct",
@@ -859,12 +918,14 @@ class H2OGPTE(H2OGPTESyncBase):
             chat_settings:
                 (Optional) Dictionary with key/value pairs to configure the default values for certain chat specific settings
                 The following keys are supported, see the client.session() documentation for more details.
-                llm: str
-                llm_args: dict
-                self_reflection_config: dict
-                rag_config: dict
-                include_chat_history: bool
-                tags: list[str]
+                llm: str — Default LLM to use for chat sessions in this collection
+                llm_args: dict — Default LLM arguments (see answer_question method for full list of valid keys)
+                self_reflection_config: dict — Configuration for self-reflection functionality
+                rag_config: dict — Configuration for RAG (Retrieval-Augmented Generation)
+                include_chat_history: bool — Whether to include chat history in context
+                tags: list[str] — Tags to associate with the collection
+            workspace:
+                (Optional) The workspace id to be associated with this collection. None to use the default workspace.
         Returns:
             str: The ID of the newly created collection.
         """
@@ -878,6 +939,7 @@ class H2OGPTE(H2OGPTESyncBase):
                     collection_settings
                 ),
                 chat_settings=rest.ChatSettings.from_dict(chat_settings),
+                workspace=workspace,
             )
             collection = _rest_to_client_exceptions(
                 lambda: rest_client.collection_api.create_collection(
@@ -1561,20 +1623,21 @@ class H2OGPTE(H2OGPTESyncBase):
             llm_args:
                 Dictionary of kwargs to pass to the llm. Valid keys:
                     temperature (float, default: 0) — The value used to modulate the next token probabilities. Most deterministic: 0, Most creative: 1
-                    top_k (int, default: 1) — The number of highest probability vocabulary tokens to keep for top-k-filtering.
-                    top_p (float, default: 1.0) — If set to float < 1, only the smallest set of most probable tokens with probabilities that add up to top_p or higher are kept for generation.
-                    seed (int, default: 0) — The seed for the random number generator when sampling during generation (if temp>0 or top_k>1 or top_p<1), seed=0 picks a random seed.
-                    repetition_penalty (float, default: 1.07) — The parameter for repetition penalty. 1.0 means no penalty.
-                    max_new_tokens (int, default: 1024) — Maximum number of new tokens to generate. This limit applies to each (map+reduce) step during summarization and each (map) step during extraction.
-                    min_max_new_tokens (int, default: 512) — minimum value for max_new_tokens when auto-adjusting for content of prompt, docs, etc.
-                    response_format (str, default: "text") — Output type, one of ["text", "json_object", "json_code"].
-                    guided_json (dict, default: None) — If specified, the output will follow the JSON schema.
-                    guided_regex (str, default: "") — If specified, the output will follow the regex pattern. Only for models that support guided generation: check output of get_llms() for guided_vllm flag.
-                    guided_choice (Optional[List[str]], default: None — If specified, the output will be exactly one of the choices. Only for models that support guided generation: check output of get_llms() for guided_vllm flag.
-                    guided_grammar (str, default: "") — If specified, the output will follow the context free grammar. Only for models that support guided generation: check output of get_llms() for guided_vllm flag.
-                    guided_whitespace_pattern (str, default: "") — If specified, will override the default whitespace pattern for guided json decoding. Only for models that support guided generation: check output of get_llms() for guided_vllm flag.
-                    enable_vision (str, default: "auto") - Controls vision mode, send images to the LLM in addition to text chunks. Only if have models that support vision, use get_vision_capable_llm_names() to see list. One of ["on", "off", "auto"].
-                    visible_vision_models (List[str], default: ["auto"]) - Controls which vision model to use when processing images. Use get_vision_capable_llm_names() to see list. Must provide exactly one model. ["auto"] for automatic.
+                    top_k (int, default: 1) — The number of highest probability vocabulary tokens to keep for top-k-filtering
+                    top_p (float, default: 1.0) — If set to float < 1, only the smallest set of most probable tokens with probabilities that add up to top_p or higher are kept for generation
+                    seed (int, default: 0) — The seed for the random number generator when sampling during generation (if temp>0 or top_k>1 or top_p<1), seed=0 picks a random seed
+                    repetition_penalty (float, default: 1.07) — The parameter for repetition penalty. 1.0 means no penalty
+                    max_new_tokens (int, default: 1024) — Maximum number of new tokens to generate. This limit applies to each (map+reduce) step during summarization and each (map) step during extraction
+                    reasoning_effort (int, default: 0) — Level of reasoning effort for the model (higher values = deeper reasoning, e.g., 10000-65000). Use for models that support chain-of-thought reasoning. 0 means no additional reasoning effort
+                    min_max_new_tokens (int, default: 512) — Minimum value for max_new_tokens when auto-adjusting for content of prompt, docs, etc.
+                    response_format (str, default: "text") — Output type, one of ["text", "json_object", "json_code"]
+                    guided_json (dict, default: None) — If specified, the output will follow the JSON schema
+                    guided_regex (str, default: "") — If specified, the output will follow the regex pattern. Only for models that support guided generation
+                    guided_choice (Optional[List[str]], default: None) — If specified, the output will be exactly one of the choices. Only for models that support guided generation
+                    guided_grammar (str, default: "") — If specified, the output will follow the context free grammar. Only for models that support guided generation
+                    guided_whitespace_pattern (str, default: "") — If specified, will override the default whitespace pattern for guided json decoding. Only for models that support guided generation
+                    enable_vision (str, default: "auto") — Controls vision mode: send images to the LLM in addition to text chunks. Only applies if vision-capable models are available; use get_vision_capable_llm_names() to see the list. One of ["on", "off", "auto"]
+                    visible_vision_models (List[str], default: ["auto"]) — Controls which vision model to use when processing images. Use get_vision_capable_llm_names() to see list. Must provide exactly one model. ["auto"] for automatic
             max_num_chunks:
                 Max limit of chunks to send to the summarizer
             sampling_strategy:
@@ -2531,6 +2594,7 @@ class H2OGPTE(H2OGPTESyncBase):
         metadata: Union[Dict[str, Any], None] = None,
         timeout: Union[float, None] = None,
         ingest_mode: Union[str, None] = None,
+        callback: Optional[Callable[[Job], None]] = None,
     ) -> Job:
         """Add uploaded documents into a specific collection.
@@ -2577,6 +2641,8 @@ class H2OGPTE(H2OGPTESyncBase):
                 "standard" - Files will be ingested for use with RAG
                 "lite" - Files will be ingested for use with RAG, but minimal processing will be done, favoring ingest speed over accuracy
                 "agent_only" - Bypasses standard ingestion. Files can only be used with agents.
+            callback:
+                Function for processing job status info during the upload.
         """
         header = self._get_auth_header()
         with self._RESTClient(self) as rest_client:
@@ -2604,7 +2670,9 @@ class H2OGPTE(H2OGPTESyncBase):
                     _headers=header,
                 )
             )
-        return self._wait_for_completion(response.id, timeout=timeout)
+        return self._wait_for_completion(
+            response.id, timeout=timeout, callback=callback
+        )
     def ingest_website(
         self,
@@ -3723,6 +3791,298 @@ class H2OGPTE(H2OGPTESyncBase):
             )
         return result
+    def list_extractor_permissions(self, extractor_id: str) -> List[SharePermission]:
+        """Returns a list of access permissions for a given extractor.
+        The returned list of permissions denotes who has access to
+        the extractor and their access level.
+        Args:
+            extractor_id:
+                ID of the extractor to inspect.
+        Returns:
+            list of SharePermission: Sharing permissions list for the given extractor.
+        """
+        header = self._get_auth_header()
+        with self._RESTClient(self) as rest_client:
+            response = _rest_to_client_exceptions(
+                lambda: rest_client.extractor_api.get_extractor_permissions(
+                    extractor_id=extractor_id,
+                    _headers=header,
+                )
+            )
+        return [SharePermission(**d.to_dict()) for d in response]
+    def list_extractor_group_permissions(
+        self, extractor_id: str
+    ) -> List[GroupSharePermission]:
+        """Returns a list of group access permissions for a given extractor.
+        The returned list of group permissions denotes which groups have access to
+        the extractor and their access level.
+        Args:
+            extractor_id:
+                ID of the extractor to inspect.
+        Returns:
+            list of GroupSharePermission: Group sharing permissions list for the given extractor.
+        """
+        header = self._get_auth_header()
+        with self._RESTClient(self) as rest_client:
+            response = _rest_to_client_exceptions(
+                lambda: rest_client.extractor_api.get_extractor_group_permissions(
+                    extractor_id=extractor_id,
+                    _headers=header,
+                )
+            )
+        return [GroupSharePermission(**d.to_dict()) for d in response]
+    def share_extractor(
+        self, extractor_id: str, permission: SharePermission
+    ) -> ShareResponseStatus:
+        """Share an extractor to a user.
+        The permission attribute defines the level of access,
+        and who can access the extractor, the extractor_id attribute
+        denotes the extractor to be shared.
+        Args:
+            extractor_id:
+                ID of the extractor to share.
+            permission:
+                Defines the rule for sharing, i.e. permission level.
+        Returns:
+            ShareResponseStatus: Status of share request.
+        """
+        header = self._get_auth_header()
+        with self._RESTClient(self) as rest_client:
+            result = _get_share_permission_status(
+                lambda: _rest_to_client_exceptions(
+                    lambda: rest_client.extractor_api.share_extractor(
+                        extractor_id=extractor_id,
+                        username=permission.username,
+                        _headers=header,
+                    )
+                )
+            )
+        return result
+    def unshare_extractor(
+        self, extractor_id: str, permission: SharePermission
+    ) -> ShareResponseStatus:
+        """Remove sharing of an extractor to a user.
+        The permission attribute defines the level of access,
+        and who can access the extractor, the extractor_id attribute
+        denotes the extractor to be un-shared.
+        In case of un-sharing, the SharePermission's user is sufficient.
+        Args:
+            extractor_id:
+                ID of the extractor to un-share.
+            permission:
+                Defines the user for which extractor access is revoked.
+        Returns:
+            ShareResponseStatus: Status of share request.
+        """
+        header = self._get_auth_header()
+        with self._RESTClient(self) as rest_client:
+            result = _get_share_permission_status(
+                lambda: _rest_to_client_exceptions(
+                    lambda: rest_client.extractor_api.unshare_extractor(
+                        extractor_id=extractor_id,
+                        username=permission.username,
+                        _headers=header,
+                    )
+                )
+            )
+        return result
+    def reset_and_share_extractor(
+        self, extractor_id: str, new_usernames: List[str]
+    ) -> ShareResponseStatus:
+        """Remove all users who have access to an extractor (except for the owner) and share it with the provided list of new users.
+        Args:
+            extractor_id:
+                ID of the extractor to un-share.
+            new_usernames:
+                The list of usernames belonging to the users this extractor will be shared with.
+        Returns:
+            ShareResponseStatus: Status of share request.
+        """
+        header = self._get_auth_header()
+        with self._RESTClient(self) as rest_client:
+            result = _get_share_permission_status(
+                lambda: _rest_to_client_exceptions(
+                    lambda: rest_client.extractor_api.reset_and_share_extractor(
+                        extractor_id=extractor_id,
+                        reset_and_share_request=rest.ResetAndShareRequest(
+                            usernames=new_usernames,
+                        ),
+                        _headers=header,
+                    )
+                )
+            )
+        return result
+    def unshare_extractor_for_all(self, extractor_id: str) -> ShareResponseStatus:
+        """Remove sharing of an extractor to all other users but the original owner.
+        Args:
+            extractor_id:
+                ID of the extractor to un-share.
+        Returns:
+            ShareResponseStatus: Status of share request.
+        """
+        header = self._get_auth_header()
+        with self._RESTClient(self) as rest_client:
+            result = _get_share_permission_status(
+                lambda: _rest_to_client_exceptions(
+                    lambda: rest_client.extractor_api.unshare_extractor_for_all(
+                        extractor_id=extractor_id,
+                        _headers=header,
+                    )
+                )
+            )
+        return result
+    def share_extractor_with_group(
+        self, extractor_id: str, permission: GroupSharePermission
+    ) -> ShareResponseStatus:
+        """Share an extractor to a group.
+        The permission attribute defines which group can access the extractor,
+        the extractor_id attribute denotes the extractor to be shared.
+        Args:
+            extractor_id:
+                ID of the extractor to share.
+            permission:
+                Defines the group for sharing with.
+        Returns:
+            ShareResponseStatus: Status of share request.
+        """
+        header = self._get_auth_header()
+        with self._RESTClient(self) as rest_client:
+            result = _get_share_permission_status(
+                lambda: _rest_to_client_exceptions(
+                    lambda: rest_client.extractor_api.share_extractor_with_group(
+                        extractor_id=extractor_id,
+                        group_id=permission.group_id,
+                        _headers=header,
+                    )
+                )
+            )
+        return result
+    def unshare_extractor_from_group(
+        self, extractor_id: str, permission: GroupSharePermission
+    ) -> ShareResponseStatus:
+        """Remove sharing of an extractor from a group.
+        The permission attribute defines which group to remove access from,
+        the extractor_id attribute denotes the extractor to be unshared.
+        Args:
+            extractor_id:
+                ID of the extractor to un-share.
+            permission:
+                Defines the group for which extractor access is revoked.
+        Returns:
+            ShareResponseStatus: Status of share request.
+        """
+        header = self._get_auth_header()
+        with self._RESTClient(self) as rest_client:
+            result = _get_share_permission_status(
+                lambda: _rest_to_client_exceptions(
+                    lambda: rest_client.extractor_api.unshare_extractor_from_group(
+                        extractor_id=extractor_id,
+                        group_id=permission.group_id,
+                        _headers=header,
+                    )
+                )
+            )
+        return result
+    def reset_and_share_extractor_with_groups(
+        self, extractor_id: str, new_groups: List[str]
+    ) -> ShareResponseStatus:
+        """Remove all groups who have access to an extractor and share it with the provided list of new group ids.
+        Args:
+            extractor_id:
+                ID of the extractor to un-share.
+            new_groups:
+                The list of group ids this extractor will be shared with.
+        Returns:
+            ShareResponseStatus: Status of share request.
+        """
+        header = self._get_auth_header()
+        with self._RESTClient(self) as rest_client:
+            result = _get_share_permission_status(
+                lambda: _rest_to_client_exceptions(
+                    lambda: rest_client.extractor_api.reset_and_share_extractor_with_groups(
+                        extractor_id=extractor_id,
+                        reset_and_share_with_groups_request=rest.ResetAndShareWithGroupsRequest(
+                            groups=new_groups,
+                        ),
+                        _headers=header,
+                    )
+                )
+            )
+        return result
+    def make_extractor_public(self, extractor_id: str):
+        """Make an extractor public
+        Once an extractor is public, it can be seen and used by all users.
+        Args:
+            extractor_id:
+                ID of the extractor to make public.
+        """
+        header = self._get_auth_header()
+        with self._RESTClient(self) as rest_client:
+            _rest_to_client_exceptions(
+                lambda: rest_client.extractor_api.update_extractor_privacy(
+                    extractor_id=extractor_id,
+                    update_extractor_privacy_request=rest.UpdateExtractorPrivacyRequest(
+                        is_public=True
+                    ),
+                    _headers=header,
+                )
+            )
+    def make_extractor_private(self, extractor_id: str):
+        """Make an extractor private
+        Once an extractor is private, other users will no longer
+        be able to see or use it unless it has been shared individually or by group.
+        Args:
+            extractor_id:
+                ID of the extractor to make private.
+        """
+        header = self._get_auth_header()
+        with self._RESTClient(self) as rest_client:
+            _rest_to_client_exceptions(
+                lambda: rest_client.extractor_api.update_extractor_privacy(
+                    extractor_id=extractor_id,
+                    update_extractor_privacy_request=rest.UpdateExtractorPrivacyRequest(
+                        is_public=False
+                    ),
+                    _headers=header,
+                )
+            )
     def list_recent_documents(
         self, offset: int, limit: int, metadata_filter: dict = {}
     ) -> List[DocumentInfo]:
@@ -4149,6 +4509,29 @@ class H2OGPTE(H2OGPTESyncBase):
             )
         return collection_id
+    def update_collection_workspace(self, collection_id: str, workspace: str) -> str:
+        """Update the workspace associated with a collection.
+        Args:
+            collection_id:
+                ID of the collection to update.
+            workspace:
+                The workspace id to associate with the collection.
+        Returns:
+            str: The ID of the updated collection.
+        """
+        header = self._get_auth_header()
+        with self._RESTClient(self) as rest_client:
+            _rest_to_client_exceptions(
+                lambda: rest_client.collection_api.update_collection_workspace(
+                    collection_id=collection_id,
+                    update_collection_workspace_request=rest.UpdateCollectionWorkspaceRequest(
+                        workspace=workspace
+                    ),
+                    _headers=header,
+                )
+            )
+        return collection_id
     def update_document_name(self, document_id: str, name: str) -> str:
         """Update the name metadata for a given document.
@@ -5008,7 +5391,7 @@ class H2OGPTE(H2OGPTESyncBase):
                 lambda: _rest_to_client_exceptions(
                     lambda: rest_client.prompt_template_api.reset_and_share_prompt_template_with_groups(
                         prompt_template_id=prompt_id,
-                        reset_and_share_prompt_template_with_groups_request=rest.ResetAndSharePromptTemplateWithGroupsRequest(
+                        reset_and_share_with_groups_request=rest.ResetAndShareWithGroupsRequest(
                             groups=new_groups,
                         ),
                         _headers=header,
@@ -5056,7 +5439,7 @@ class H2OGPTE(H2OGPTESyncBase):
                 lambda: _rest_to_client_exceptions(
                     lambda: rest_client.prompt_template_api.reset_and_share_prompt_template(
                         prompt_template_id=prompt_id,
-                        reset_and_share_prompt_template_request=rest.ResetAndSharePromptTemplateRequest(
+                        reset_and_share_request=rest.ResetAndShareRequest(
                             usernames=new_usernames,
                         ),
                         _headers=header,
@@ -5329,6 +5712,27 @@ class H2OGPTE(H2OGPTESyncBase):
         return self.get_prompt_template(rest_session.prompt_template_id)
+    def get_chat_session_workspace(self, chat_session_id: str) -> str:
+        """Get the workspace associated with the chat session.
+        Args:
+            chat_session_id:
+                String id of the chat session to search for.
+        Returns:
+            str: The identifier of the workspace
+        """
+        header = self._get_auth_header()
+        with self._RESTClient(self) as rest_client:
+            response = _rest_to_client_exceptions(
+                lambda: rest_client.chat_api.get_chat_session(
+                    session_id=chat_session_id,
+                    _headers=header,
+                )
+            )
+        return response.workspace
     def set_chat_session_collection(
         self, chat_session_id: str, collection_id: Union[str, None]
     ) -> str:

h2ogpte 1.6.42__py3-none-any.whl → 1.6.43rc1__py3-none-any.whl

h2ogpte 1.6.42__py3-none-any.whl → 1.6.43rc1__py3-none-any.whl