hamtaa-texttools 1.0.6-py3-none-any.whl → 1.0.8-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {hamtaa_texttools-1.0.6.dist-info → hamtaa_texttools-1.0.8.dist-info}/METADATA +13 -22
- hamtaa_texttools-1.0.8.dist-info/RECORD +30 -0
- texttools/tools/async_the_tool.py +246 -140
- texttools/tools/internals/async_operator.py +81 -212
- texttools/tools/internals/base_operator.py +85 -0
- texttools/tools/internals/formatters.py +24 -0
- texttools/tools/internals/operator.py +32 -150
- texttools/tools/internals/prompt_loader.py +3 -12
- texttools/tools/the_tool.py +163 -283
- hamtaa_texttools-1.0.6.dist-info/RECORD +0 -30
- texttools/formatters/base_formatter.py +0 -33
- texttools/formatters/user_merge_formatter.py +0 -30
- {hamtaa_texttools-1.0.6.dist-info → hamtaa_texttools-1.0.8.dist-info}/WHEEL +0 -0
- {hamtaa_texttools-1.0.6.dist-info → hamtaa_texttools-1.0.8.dist-info}/licenses/LICENSE +0 -0
- {hamtaa_texttools-1.0.6.dist-info → hamtaa_texttools-1.0.8.dist-info}/top_level.txt +0 -0
- /texttools/prompts/{ner_extractor.yaml → extract_entities.yaml} +0 -0
- /texttools/prompts/{keyword_extractor.yaml → extract_keywords.yaml} +0 -0
- /texttools/prompts/{question_merger.yaml → merge_questions.yaml} +0 -0
- /texttools/prompts/{rewriter.yaml → rewrite.yaml} +0 -0
- /texttools/prompts/{summarizer.yaml → summarize.yaml} +0 -0
- /texttools/prompts/{translator.yaml → translate.yaml} +0 -0
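The headline API change in this release shows up in the `texttools/tools/the_tool.py` diff below: `TheTool.__init__` drops its constructor-level defaults (`model="google/gemma-3n-e4b-it"`, `user_prompt`, `output_lang`, `with_analysis`, `temperature`, `logprobs`, `top_logprobs`) in favor of a required `model` plus per-method arguments. A minimal migration sketch, assuming the import path implied by the file layout; the client setup and model name are illustrative placeholders, not from the package:

    from openai import OpenAI
    from texttools.tools.the_tool import TheTool  # module path assumed from the file list above

    client = OpenAI(api_key="...")  # illustrative client setup

    # 1.0.6: generation defaults were set once on the constructor
    # tool = TheTool(client, model="google/gemma-3n-e4b-it", temperature=0.0)

    # 1.0.8: the constructor takes only the client and a required model;
    # options such as with_analysis/temperature/logprobs move to each call
    tool = TheTool(client, model="model-name")
    result = tool.categorize("text ...", with_analysis=True)
    print(result["result"])        # the category string
    print(result.get("analysis"))  # present only when with_analysis=True, per the docstrings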
texttools/tools/the_tool.py
CHANGED
@@ -8,466 +8,350 @@ import texttools.tools.internals.output_models as OutputModels
 
 class TheTool:
     """
-    High-level interface exposing specialized text tools for.
-
     Each method configures the operator with a specific YAML prompt,
     output schema, and flags, then delegates execution to `operator.run()`.
 
-
-    - categorize: assign a text to one of several Islamic categories.
-    - extract_keywords: produce a keyword list from text.
-    - extract_entities: simple NER (name/type pairs).
-    - is_question: binary check whether input is a question.
-    - text_to_question: produce a new question from a text.
-    - merge_questions: combine multiple questions (default/reason modes).
-    - rewrite: rephrase questions (same meaning/different wording, or vice versa).
-    - subject_to_question: generate multiple questions given a subject.
-    - summarize: produce a concise summary of a subject.
-    - translate: translate text between languages.
-
-    Usage pattern:
+    Usage:
         client = OpenAI(...)
-        tool = TheTool(client, model="
-        result = tool.categorize("
+        tool = TheTool(client, model="model-name")
+        result = tool.categorize("text ...", with_analysis=True)
     """
 
     def __init__(
         self,
         client: OpenAI,
-
-        model: str = "google/gemma-3n-e4b-it",
-        user_prompt: str | None = None,
-        output_lang: str | None = None,
-        with_analysis: bool = False,
-        temperature: float = 0.0,
-        logprobs: bool = False,
-        top_logprobs: int = 3,
+        model: str,
     ):
-
-        self.operator = Operator(client=client)
-
-        # Initialize default values
-        self.model = model
-        self.user_prompt = user_prompt
-        self.output_lang = output_lang
-        self.with_analysis = with_analysis
-        self.temperature = temperature
-        self.logprobs = logprobs
-        self.top_logprobs = top_logprobs
+        self.operator = Operator(client=client, model=model)
 
     def categorize(
         self,
         text: str,
-
+        with_analysis: bool = False,
         user_prompt: str | None = None,
-
-
-        temperature: float | None = None,
-        logprobs: bool | None = None,
+        temperature: float | None = 0.0,
+        logprobs: bool = False,
         top_logprobs: int | None = None,
     ) -> dict[str, str]:
         """
         Categorize a text into a single Islamic studies domain category.
 
-        Args:
-            text: Input string to categorize.
-            with_analysis: If True, first runs an LLM "analysis" step and
-                conditions the main prompt on that analysis.
-
         Returns:
-            {"result": <category string>}
-            Example: {"result": "باورهای دینی"}
+            {"result": <category string>} + ("logprobs" and "analysis" if enabled)
         """
         return self.operator.run(
+            # User parameters
+            text=text,
+            with_analysis=with_analysis,
+            user_prompt=user_prompt,
+            temperature=temperature,
+            logprobs=logprobs,
+            top_logprobs=top_logprobs,
             # Internal parameters
             prompt_file="categorizer.yaml",
             output_model=OutputModels.CategorizerOutput,
             resp_format="parse",
-
-
-            model=self.model if model is None else model,
-            user_prompt=self.user_prompt if user_prompt is None else user_prompt,
-            output_lang=self.output_lang if output_lang is None else output_lang,
-            with_analysis=self.with_analysis
-            if with_analysis is None
-            else with_analysis,
-            temperature=self.temperature if temperature is None else temperature,
-            logprobs=self.logprobs if logprobs is None else logprobs,
-            top_logprobs=self.top_logprobs if top_logprobs is None else top_logprobs,
+            mode=None,
+            output_lang=None,
         )
 
     def extract_keywords(
         self,
         text: str,
-
-        user_prompt: str | None = None,
+        with_analysis: bool = False,
         output_lang: str | None = None,
-
-        temperature: float | None = None,
-        logprobs: bool | None = None,
+        user_prompt: str | None = None,
+        temperature: float | None = 0.0,
+        logprobs: bool = False,
         top_logprobs: int | None = None,
     ) -> dict[str, list[str]]:
         """
         Extract salient keywords from text.
 
-        Args:
-            text: Input string to analyze.
-            with_analysis: Whether to run an extra LLM reasoning step.
-
         Returns:
-            {"result": [<keyword1>, <keyword2>, ...]}
+            {"result": [<keyword1>, <keyword2>, ...]} + ("logprobs" and "analysis" if enabled)
         """
         return self.operator.run(
+            # User parameters
+            text=text,
+            with_analysis=with_analysis,
+            output_lang=output_lang,
+            user_prompt=user_prompt,
+            temperature=temperature,
+            logprobs=logprobs,
+            top_logprobs=top_logprobs,
             # Internal parameters
-            prompt_file="keyword_extractor.yaml",
+            prompt_file="extract_keywords.yaml",
             output_model=OutputModels.ListStrOutput,
             resp_format="parse",
-
-            text=text,
-            model=self.model if model is None else model,
-            user_prompt=self.user_prompt if user_prompt is None else user_prompt,
-            output_lang=self.output_lang if output_lang is None else output_lang,
-            with_analysis=self.with_analysis
-            if with_analysis is None
-            else with_analysis,
-            temperature=self.temperature if temperature is None else temperature,
-            logprobs=self.logprobs if logprobs is None else logprobs,
-            top_logprobs=self.top_logprobs if top_logprobs is None else top_logprobs,
+            mode=None,
        )
 
     def extract_entities(
         self,
         text: str,
-
-        user_prompt: str | None = None,
+        with_analysis: bool = False,
         output_lang: str | None = None,
-
-        temperature: float | None = None,
-        logprobs: bool | None = None,
+        user_prompt: str | None = None,
+        temperature: float | None = 0.0,
+        logprobs: bool = False,
         top_logprobs: int | None = None,
     ) -> dict[str, list[dict[str, str]]]:
         """
         Perform Named Entity Recognition (NER) over the input text.
 
-        Args:
-            text: Input string.
-            with_analysis: Whether to run an extra LLM reasoning step.
-
         Returns:
-            {"result": [{"text": <entity>, "type": <entity_type>}, ...]}
+            {"result": [{"text": <entity>, "type": <entity_type>}, ...]} + ("logprobs" and "analysis" if enabled)
         """
         return self.operator.run(
+            # User parameters
+            text=text,
+            with_analysis=with_analysis,
+            output_lang=output_lang,
+            user_prompt=user_prompt,
+            temperature=temperature,
+            logprobs=logprobs,
+            top_logprobs=top_logprobs,
             # Internal parameters
-            prompt_file="ner_extractor.yaml",
+            prompt_file="extract_entities.yaml",
             output_model=OutputModels.ListDictStrStrOutput,
             resp_format="parse",
-
-            text=text,
-            model=self.model if model is None else model,
-            user_prompt=self.user_prompt if user_prompt is None else user_prompt,
-            output_lang=self.output_lang if output_lang is None else output_lang,
-            with_analysis=self.with_analysis
-            if with_analysis is None
-            else with_analysis,
-            temperature=self.temperature if temperature is None else temperature,
-            logprobs=self.logprobs if logprobs is None else logprobs,
-            top_logprobs=self.top_logprobs if top_logprobs is None else top_logprobs,
+            mode=None,
        )
 
     def is_question(
         self,
         text: str,
-
+        with_analysis: bool = False,
         user_prompt: str | None = None,
-
-
-        logprobs: bool | None = None,
+        temperature: float | None = 0.0,
+        logprobs: bool = False,
         top_logprobs: int | None = None,
     ) -> dict[str, bool]:
         """
         Detect if the input is phrased as a question.
 
-        Args:
-            question: Input string to evaluate.
-            with_analysis: Whether to include an analysis step.
-
         Returns:
-            {"result":
+            {"result": True} or {"result": False} + ("logprobs" and "analysis" if enabled)
         """
         return self.operator.run(
+            # User parameters
+            text=text,
+            with_analysis=with_analysis,
+            user_prompt=user_prompt,
+            temperature=temperature,
+            logprobs=logprobs,
+            top_logprobs=top_logprobs,
             # Internal parameters
             prompt_file="is_question.yaml",
             output_model=OutputModels.BoolOutput,
             resp_format="parse",
-
-
-            text=text,
-            model=self.model if model is None else model,
-            user_prompt=self.user_prompt if user_prompt is None else user_prompt,
-            with_analysis=self.with_analysis
-            if with_analysis is None
-            else with_analysis,
-            temperature=self.temperature if temperature is None else temperature,
-            logprobs=self.logprobs if logprobs is None else logprobs,
-            top_logprobs=self.top_logprobs if top_logprobs is None else top_logprobs,
+            mode=None,
+            output_lang=None,
        )
 
     def text_to_question(
         self,
         text: str,
-
-        user_prompt: str | None = None,
+        with_analysis: bool = False,
         output_lang: str | None = None,
-
-        temperature: float | None = None,
-        logprobs: bool | None = None,
+        user_prompt: str | None = None,
+        temperature: float | None = 0.0,
+        logprobs: bool = False,
         top_logprobs: int | None = None,
     ) -> dict[str, str]:
         """
         Generate a single question from the given text.
 
-        Args:
-            text: Source text to derive a question from.
-            with_analysis: Whether to use analysis before generation.
-
         Returns:
-            {"result": <generated_question>}
+            {"result": <generated_question>} + ("logprobs" and "analysis" if enabled)
         """
         return self.operator.run(
+            # User parameters
+            text=text,
+            with_analysis=with_analysis,
+            output_lang=output_lang,
+            user_prompt=user_prompt,
+            temperature=temperature,
+            logprobs=logprobs,
+            top_logprobs=top_logprobs,
             # Internal parameters
             prompt_file="text_to_question.yaml",
             output_model=OutputModels.StrOutput,
             resp_format="parse",
-
-            text=text,
-            model=self.model if model is None else model,
-            user_prompt=self.user_prompt if user_prompt is None else user_prompt,
-            output_lang=self.output_lang if output_lang is None else output_lang,
-            with_analysis=self.with_analysis
-            if with_analysis is None
-            else with_analysis,
-            temperature=self.temperature if temperature is None else temperature,
-            logprobs=self.logprobs if logprobs is None else logprobs,
-            top_logprobs=self.top_logprobs if top_logprobs is None else top_logprobs,
+            mode=None,
        )
 
     def merge_questions(
         self,
-
-
-        model: str | None = None,
-        user_prompt: str | None = None,
+        text: list[str],
+        with_analysis: bool = False,
         output_lang: str | None = None,
-
-        temperature: float | None = None,
-        logprobs: bool | None = None,
+        user_prompt: str | None = None,
+        temperature: float | None = 0.0,
+        logprobs: bool = False,
         top_logprobs: int | None = None,
+        mode: Literal["default", "reason"] = "default",
     ) -> dict[str, str]:
         """
         Merge multiple questions into a single unified question.
 
-        Args:
-            questions: List of question strings.
-            mode: Merge strategy:
-                - "default": simple merging.
-                - "reason": merging with reasoning explanation.
-            with_analysis: Whether to use an analysis step.
-
         Returns:
-            {"result": <merged_question>}
+            {"result": <merged_question>} + ("logprobs" and "analysis" if enabled)
         """
-        text = ", ".join(
+        text = ", ".join(text)
         return self.operator.run(
+            # User parameters
+            text=text,
+            with_analysis=with_analysis,
+            output_lang=output_lang,
+            user_prompt=user_prompt,
+            temperature=temperature,
+            logprobs=logprobs,
+            top_logprobs=top_logprobs,
             # Internal parameters
-            prompt_file="question_merger.yaml",
+            prompt_file="merge_questions.yaml",
             output_model=OutputModels.StrOutput,
             resp_format="parse",
-            # User parameters
-            text=text,
             mode=mode,
-            model=self.model if model is None else model,
-            user_prompt=self.user_prompt if user_prompt is None else user_prompt,
-            output_lang=self.output_lang if output_lang is None else output_lang,
-            with_analysis=self.with_analysis
-            if with_analysis is None
-            else with_analysis,
-            temperature=self.temperature if temperature is None else temperature,
-            logprobs=self.logprobs if logprobs is None else logprobs,
-            top_logprobs=self.top_logprobs if top_logprobs is None else top_logprobs,
        )
 
     def rewrite(
         self,
         text: str,
-
-        model: str | None = None,
-        user_prompt: str | None = None,
+        with_analysis: bool = False,
         output_lang: str | None = None,
-
-        temperature: float | None = None,
-        logprobs: bool | None = None,
+        user_prompt: str | None = None,
+        temperature: float | None = 0.0,
+        logprobs: bool = False,
         top_logprobs: int | None = None,
+        mode: Literal["positive", "negative", "hard_negative"] = "positive",
     ) -> dict[str, str]:
         """
-        Rewrite a
-
-        Args:
-            question: Input question to rewrite.
-            mode: Rewrite strategy:
-                - "positive": keep meaning, change words.
-                - "negative": alter meaning, preserve wording style.
-            with_analysis: Whether to include an analysis step.
+        Rewrite a text with different modes.
 
         Returns:
-            {"result": <
+            {"result": <rewritten_text>} + ("logprobs" and "analysis" if enabled)
         """
         return self.operator.run(
+            # User parameters
+            text=text,
+            with_analysis=with_analysis,
+            output_lang=output_lang,
+            user_prompt=user_prompt,
+            temperature=temperature,
+            logprobs=logprobs,
+            top_logprobs=top_logprobs,
             # Internal parameters
-            prompt_file="rewriter.yaml",
+            prompt_file="rewrite.yaml",
             output_model=OutputModels.StrOutput,
             resp_format="parse",
-            # User parameters
-            text=text,
             mode=mode,
-            model=self.model if model is None else model,
-            user_prompt=self.user_prompt if user_prompt is None else user_prompt,
-            output_lang=self.output_lang if output_lang is None else output_lang,
-            with_analysis=self.with_analysis
-            if with_analysis is None
-            else with_analysis,
-            temperature=self.temperature if temperature is None else temperature,
-            logprobs=self.logprobs if logprobs is None else logprobs,
-            top_logprobs=self.top_logprobs if top_logprobs is None else top_logprobs,
        )
 
     def subject_to_question(
         self,
         text: str,
         number_of_questions: int,
-
-        user_prompt: str | None = None,
+        with_analysis: bool = False,
        output_lang: str | None = None,
-
-        temperature: float | None = None,
-        logprobs: bool | None = None,
+        user_prompt: str | None = None,
+        temperature: float | None = 0.0,
+        logprobs: bool = False,
         top_logprobs: int | None = None,
     ) -> dict[str, list[str]]:
         """
         Generate a list of questions about a subject.
 
-        Args:
-            subject: Topic of interest.
-            number_of_questions: Number of questions to produce.
-            language: Target language for generated questions.
-            with_analysis: Whether to include an analysis step.
-
         Returns:
-            {"result": [<question1>, <question2>, ...]}
+            {"result": [<question1>, <question2>, ...]} + ("logprobs" and "analysis" if enabled)
         """
         return self.operator.run(
+            # User parameters
+            text=text,
+            number_of_questions=number_of_questions,
+            with_analysis=with_analysis,
+            output_lang=output_lang,
+            user_prompt=user_prompt,
+            temperature=temperature,
+            logprobs=logprobs,
+            top_logprobs=top_logprobs,
             # Internal parameters
             prompt_file="subject_to_question.yaml",
             output_model=OutputModels.ReasonListStrOutput,
             resp_format="parse",
-
-            text=text,
-            number_of_questions=number_of_questions,
-            model=self.model if model is None else model,
-            user_prompt=self.user_prompt if user_prompt is None else user_prompt,
-            output_lang=self.output_lang if output_lang is None else output_lang,
-            with_analysis=self.with_analysis
-            if with_analysis is None
-            else with_analysis,
-            temperature=self.temperature if temperature is None else temperature,
-            logprobs=self.logprobs if logprobs is None else logprobs,
-            top_logprobs=self.top_logprobs if top_logprobs is None else top_logprobs,
+            mode=None,
        )
 
     def summarize(
         self,
         text: str,
-
-        user_prompt: str | None = None,
+        with_analysis: bool = False,
         output_lang: str | None = None,
-
-        temperature: float | None = None,
-        logprobs: bool | None = None,
+        user_prompt: str | None = None,
+        temperature: float | None = 0.0,
+        logprobs: bool = False,
         top_logprobs: int | None = None,
     ) -> dict[str, str]:
         """
         Summarize the given subject text.
 
-        Args:
-            subject: Input text to summarize.
-            with_analysis: Whether to include an analysis step.
-
         Returns:
-            {"result": <summary>}
+            {"result": <summary>} + ("logprobs" and "analysis" if enabled)
         """
         return self.operator.run(
+            # User parameters
+            text=text,
+            with_analysis=with_analysis,
+            output_lang=output_lang,
+            user_prompt=user_prompt,
+            temperature=temperature,
+            logprobs=logprobs,
+            top_logprobs=top_logprobs,
             # Internal parameters
-            prompt_file="summarizer.yaml",
+            prompt_file="summarize.yaml",
             output_model=OutputModels.StrOutput,
             resp_format="parse",
-
-            text=text,
-            model=self.model if model is None else model,
-            user_prompt=self.user_prompt if user_prompt is None else user_prompt,
-            output_lang=self.output_lang if output_lang is None else output_lang,
-            with_analysis=self.with_analysis
-            if with_analysis is None
-            else with_analysis,
-            temperature=self.temperature if temperature is None else temperature,
-            logprobs=self.logprobs if logprobs is None else logprobs,
-            top_logprobs=self.top_logprobs if top_logprobs is None else top_logprobs,
+            mode=None,
        )
 
     def translate(
         self,
         text: str,
         target_language: str,
-
+        with_analysis: bool = False,
         user_prompt: str | None = None,
-
-
-        logprobs: bool | None = None,
+        temperature: float | None = 0.0,
+        logprobs: bool = False,
         top_logprobs: int | None = None,
     ) -> dict[str, str]:
         """
         Translate text between languages.
 
-        Args:
-            text: Input string to translate.
-            target_language: Language code or name to translate into.
-            with_analysis: Whether to include an analysis step.
-
         Returns:
-            {"result": <translated_text>}
+            {"result": <translated_text>} + ("logprobs" and "analysis" if enabled)
         """
         return self.operator.run(
-            # Internal parameters
-            prompt_file="translator.yaml",
-            output_model=OutputModels.StrOutput,
-            resp_format="parse",
-            output_lang=False,
             # User parameters
             text=text,
             target_language=target_language,
-
-            user_prompt=
-
-
-
-
-
-
+            with_analysis=with_analysis,
+            user_prompt=user_prompt,
+            temperature=temperature,
+            logprobs=logprobs,
+            top_logprobs=top_logprobs,
+            # Internal parameters
+            prompt_file="translate.yaml",
+            output_model=OutputModels.StrOutput,
+            resp_format="parse",
+            mode=None,
+            output_lang=None,
        )
 
     def run_custom(
         self,
         prompt: str,
         output_model: Any,
-        model: str | None = None,
         output_lang: str | None = None,
         temperature: float | None = None,
         logprobs: bool | None = None,
@@ -476,26 +360,22 @@ class TheTool:
         """
         Custom tool that can do almost anything!
 
-        Args:
-            prompt: Custom prompt.
-            output_model: Custom BaseModel output model.
-
         Returns:
             {"result": <Any>}
         """
         return self.operator.run(
-            # Internal parameters
-            prompt_file="run_custom.yaml",
-            resp_format="parse",
-            user_prompt=False,
-            with_analysis=False,
             # User paramaeters
             text=prompt,
             output_model=output_model,
             output_model_str=output_model.model_json_schema(),
-
-
-
-
-
+            output_lang=output_lang,
+            temperature=temperature,
+            logprobs=logprobs,
+            top_logprobs=top_logprobs,
+            # Internal parameters
+            prompt_file="run_custom.yaml",
+            resp_format="parse",
+            user_prompt=None,
+            with_analysis=False,
+            mode=None,
        )
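Beyond the constructor, the new per-method signatures above imply straightforward call sites. A short sketch under the same assumptions as the earlier example (`tool` is the `TheTool` instance from before; all strings are illustrative, and `Verdict` is a hypothetical model):

    # merge_questions now takes list[str] plus a mode ("default" or "reason")
    merged = tool.merge_questions(
        ["What is zakat?", "Who must pay zakat?"],
        mode="reason",
    )

    # rewrite gained "positive" / "negative" / "hard_negative" modes
    paraphrase = tool.rewrite("Why is fasting obligatory?", mode="positive")

    # translate keeps its explicit target_language argument
    english = tool.translate("سلام دنیا", target_language="English")

    # run_custom accepts any Pydantic output model (its schema is forwarded
    # via output_model.model_json_schema(), per the diff)
    from pydantic import BaseModel

    class Verdict(BaseModel):
        result: str

    custom = tool.run_custom(prompt="Classify the tone of: ...", output_model=Verdict)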