hamtaa-texttools 0.1.48__py3-none-any.whl → 1.1.7__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of hamtaa-texttools might be problematic. Click here for more details.
- hamtaa_texttools-1.1.7.dist-info/METADATA +228 -0
- hamtaa_texttools-1.1.7.dist-info/RECORD +30 -0
- hamtaa_texttools-1.1.7.dist-info/licenses/LICENSE +21 -0
- texttools/__init__.py +4 -26
- texttools/batch/__init__.py +3 -0
- texttools/{utils/batch_manager → batch}/batch_manager.py +226 -241
- texttools/batch/batch_runner.py +254 -0
- texttools/prompts/README.md +35 -0
- texttools/prompts/categorizer.yaml +28 -0
- texttools/prompts/extract_entities.yaml +20 -0
- texttools/prompts/extract_keywords.yaml +18 -0
- texttools/prompts/is_question.yaml +14 -0
- texttools/prompts/merge_questions.yaml +46 -0
- texttools/prompts/rewrite.yaml +111 -0
- texttools/prompts/run_custom.yaml +7 -0
- texttools/prompts/subject_to_question.yaml +22 -0
- texttools/prompts/summarize.yaml +14 -0
- texttools/prompts/text_to_question.yaml +20 -0
- texttools/prompts/translate.yaml +15 -0
- texttools/tools/__init__.py +4 -33
- texttools/tools/async_the_tool.py +435 -0
- texttools/tools/internals/async_operator.py +242 -0
- texttools/tools/internals/base_operator.py +100 -0
- texttools/tools/internals/formatters.py +24 -0
- texttools/tools/internals/operator.py +242 -0
- texttools/tools/internals/output_models.py +62 -0
- texttools/tools/internals/prompt_loader.py +60 -0
- texttools/tools/the_tool.py +433 -0
- hamtaa_texttools-0.1.48.dist-info/METADATA +0 -60
- hamtaa_texttools-0.1.48.dist-info/RECORD +0 -61
- texttools/base/__init__.py +0 -3
- texttools/base/base_categorizer.py +0 -40
- texttools/base/base_keyword_extractor.py +0 -35
- texttools/base/base_ner_extractor.py +0 -61
- texttools/base/base_question_detector.py +0 -35
- texttools/base/base_question_generator.py +0 -99
- texttools/base/base_question_merger.py +0 -59
- texttools/base/base_question_rewriter.py +0 -61
- texttools/base/base_router.py +0 -33
- texttools/base/base_summarizer.py +0 -55
- texttools/base/base_task_performer.py +0 -53
- texttools/base/base_translator.py +0 -38
- texttools/formatter/__init__.py +0 -1
- texttools/formatter/base.py +0 -26
- texttools/formatter/gemma3_formatter.py +0 -54
- texttools/handlers/__init__.py +0 -6
- texttools/handlers/categorizer/__init__.py +0 -6
- texttools/handlers/categorizer/categorizer.py +0 -61
- texttools/handlers/handlers.py +0 -88
- texttools/tools/categorizer/__init__.py +0 -2
- texttools/tools/categorizer/encoder_model/__init__.py +0 -1
- texttools/tools/categorizer/encoder_model/encoder_vectorizer.py +0 -51
- texttools/tools/categorizer/llm/__init__.py +0 -2
- texttools/tools/categorizer/llm/gemma_categorizer.py +0 -169
- texttools/tools/categorizer/llm/openai_categorizer.py +0 -80
- texttools/tools/keyword_extractor/__init__.py +0 -1
- texttools/tools/keyword_extractor/gemma_extractor.py +0 -138
- texttools/tools/merger/__init__.py +0 -2
- texttools/tools/merger/gemma_question_merger.py +0 -214
- texttools/tools/ner/__init__.py +0 -1
- texttools/tools/ner/gemma_ner_extractor.py +0 -157
- texttools/tools/question_detector/__init__.py +0 -2
- texttools/tools/question_detector/gemma_detector.py +0 -114
- texttools/tools/question_detector/llm_detector.py +0 -112
- texttools/tools/question_generator/__init__.py +0 -1
- texttools/tools/question_generator/gemma_question_generator.py +0 -198
- texttools/tools/reranker/__init__.py +0 -3
- texttools/tools/reranker/reranker.py +0 -137
- texttools/tools/reranker/scorer.py +0 -216
- texttools/tools/reranker/sorter.py +0 -278
- texttools/tools/rewriter/__init__.py +0 -2
- texttools/tools/rewriter/gemma_question_rewriter.py +0 -213
- texttools/tools/router/__init__.py +0 -0
- texttools/tools/router/gemma_router.py +0 -169
- texttools/tools/subject_to_question/__init__.py +0 -1
- texttools/tools/subject_to_question/gemma_question_generator.py +0 -224
- texttools/tools/summarizer/__init__.py +0 -2
- texttools/tools/summarizer/gemma_summarizer.py +0 -140
- texttools/tools/summarizer/llm_summerizer.py +0 -108
- texttools/tools/translator/__init__.py +0 -1
- texttools/tools/translator/gemma_translator.py +0 -189
- texttools/utils/batch_manager/__init__.py +0 -2
- texttools/utils/batch_manager/batch_runner.py +0 -207
- texttools/utils/flex_processor.py +0 -78
- {hamtaa_texttools-0.1.48.dist-info → hamtaa_texttools-1.1.7.dist-info}/WHEEL +0 -0
- {hamtaa_texttools-0.1.48.dist-info → hamtaa_texttools-1.1.7.dist-info}/top_level.txt +0 -0
|
@@ -0,0 +1,433 @@
|
|
|
1
|
+
from typing import Literal, Any, Callable
|
|
2
|
+
|
|
3
|
+
from openai import OpenAI
|
|
4
|
+
|
|
5
|
+
from texttools.tools.internals.operator import Operator
|
|
6
|
+
import texttools.tools.internals.output_models as OutputModels
|
|
7
|
+
|
|
8
|
+
|
|
9
|
+
class TheTool:
    """
    High-level facade over synchronous LLM text operations.

    Each method configures the operator with a specific YAML prompt,
    output schema, and flags, then delegates execution to `operator.run()`.

    Parameters shared by most methods:
        text: Input text to process.
        with_analysis: When True, the prompt also requests a reasoning
            analysis, returned in `ToolOutput.analysis`.
        output_lang: Desired language of the result. Methods without this
            parameter always pass None internally.
        user_prompt: Optional extra instructions forwarded to the prompt.
        temperature: Sampling temperature; defaults to 0.0 (deterministic).
        logprobs: When True, token probability data is requested.
        top_logprobs: Number of top alternatives per token (with logprobs).
        validator: Optional callable applied to the parsed result; should
            return True when the result is acceptable.

    Usage:
        client = OpenAI(...)
        tool = TheTool(client, model="model-name")
        result = tool.categorize("text ...", with_analysis=True)
    """

    def __init__(
        self,
        client: OpenAI,
        model: str,
    ):
        # A single Operator instance is shared by all tool methods.
        self.operator = Operator(client=client, model=model)

    def categorize(
        self,
        text: str,
        with_analysis: bool = False,
        user_prompt: str | None = None,
        temperature: float | None = 0.0,
        logprobs: bool = False,
        top_logprobs: int | None = None,
        validator: Callable[[Any], bool] | None = None,
    ) -> OutputModels.ToolOutput:
        """
        Categorize a text into a single Islamic studies domain category.

        Returns:
            ToolOutput: Object containing:
                - result (str): The assigned Islamic studies category
                - logprobs (list | None): Probability data if logprobs enabled
                - analysis (str | None): Detailed reasoning if with_analysis enabled
        """
        return self.operator.run(
            # User parameters
            text=text,
            with_analysis=with_analysis,
            user_prompt=user_prompt,
            temperature=temperature,
            logprobs=logprobs,
            top_logprobs=top_logprobs,
            validator=validator,
            # Internal parameters
            prompt_file="categorizer.yaml",
            output_model=OutputModels.CategorizerOutput,
            resp_format="parse",
            mode=None,
            output_lang=None,
        )

    def extract_keywords(
        self,
        text: str,
        with_analysis: bool = False,
        output_lang: str | None = None,
        user_prompt: str | None = None,
        temperature: float | None = 0.0,
        logprobs: bool = False,
        top_logprobs: int | None = None,
        validator: Callable[[Any], bool] | None = None,
    ) -> OutputModels.ToolOutput:
        """
        Extract salient keywords from text.

        Returns:
            ToolOutput: Object containing:
                - result (list[str]): List of extracted keywords
                - logprobs (list | None): Probability data if logprobs enabled
                - analysis (str | None): Detailed reasoning if with_analysis enabled
        """
        return self.operator.run(
            # User parameters
            text=text,
            with_analysis=with_analysis,
            output_lang=output_lang,
            user_prompt=user_prompt,
            temperature=temperature,
            logprobs=logprobs,
            top_logprobs=top_logprobs,
            validator=validator,
            # Internal parameters
            prompt_file="extract_keywords.yaml",
            output_model=OutputModels.ListStrOutput,
            resp_format="parse",
            mode=None,
        )

    def extract_entities(
        self,
        text: str,
        with_analysis: bool = False,
        output_lang: str | None = None,
        user_prompt: str | None = None,
        temperature: float | None = 0.0,
        logprobs: bool = False,
        top_logprobs: int | None = None,
        validator: Callable[[Any], bool] | None = None,
    ) -> OutputModels.ToolOutput:
        """
        Perform Named Entity Recognition (NER) over the input text.

        Returns:
            ToolOutput: Object containing:
                - result (list[dict]): List of entities with 'text' and 'type' keys
                - logprobs (list | None): Probability data if logprobs enabled
                - analysis (str | None): Detailed reasoning if with_analysis enabled
        """
        return self.operator.run(
            # User parameters
            text=text,
            with_analysis=with_analysis,
            output_lang=output_lang,
            user_prompt=user_prompt,
            temperature=temperature,
            logprobs=logprobs,
            top_logprobs=top_logprobs,
            validator=validator,
            # Internal parameters
            prompt_file="extract_entities.yaml",
            output_model=OutputModels.ListDictStrStrOutput,
            resp_format="parse",
            mode=None,
        )

    def is_question(
        self,
        text: str,
        with_analysis: bool = False,
        user_prompt: str | None = None,
        temperature: float | None = 0.0,
        logprobs: bool = False,
        top_logprobs: int | None = None,
        validator: Callable[[Any], bool] | None = None,
    ) -> OutputModels.ToolOutput:
        """
        Detect if the input is phrased as a question.

        Returns:
            ToolOutput: Object containing:
                - result (bool): True if text is a question, False otherwise
                - logprobs (list | None): Probability data if logprobs enabled
                - analysis (str | None): Detailed reasoning if with_analysis enabled
        """
        return self.operator.run(
            # User parameters
            text=text,
            with_analysis=with_analysis,
            user_prompt=user_prompt,
            temperature=temperature,
            logprobs=logprobs,
            top_logprobs=top_logprobs,
            validator=validator,
            # Internal parameters
            prompt_file="is_question.yaml",
            output_model=OutputModels.BoolOutput,
            resp_format="parse",
            mode=None,
            output_lang=None,
        )

    def text_to_question(
        self,
        text: str,
        with_analysis: bool = False,
        output_lang: str | None = None,
        user_prompt: str | None = None,
        temperature: float | None = 0.0,
        logprobs: bool = False,
        top_logprobs: int | None = None,
        validator: Callable[[Any], bool] | None = None,
    ) -> OutputModels.ToolOutput:
        """
        Generate a single question from the given text.

        Returns:
            ToolOutput: Object containing:
                - result (str): The generated question
                - logprobs (list | None): Probability data if logprobs enabled
                - analysis (str | None): Detailed reasoning if with_analysis enabled
        """
        return self.operator.run(
            # User parameters
            text=text,
            with_analysis=with_analysis,
            output_lang=output_lang,
            user_prompt=user_prompt,
            temperature=temperature,
            logprobs=logprobs,
            top_logprobs=top_logprobs,
            validator=validator,
            # Internal parameters
            prompt_file="text_to_question.yaml",
            output_model=OutputModels.StrOutput,
            resp_format="parse",
            mode=None,
        )

    def merge_questions(
        self,
        text: list[str],
        with_analysis: bool = False,
        output_lang: str | None = None,
        user_prompt: str | None = None,
        temperature: float | None = 0.0,
        logprobs: bool = False,
        top_logprobs: int | None = None,
        mode: Literal["default", "reason"] = "default",
        validator: Callable[[Any], bool] | None = None,
    ) -> OutputModels.ToolOutput:
        """
        Merge multiple questions into a single unified question.

        Args:
            text: The list of questions to merge; joined with ", " before
                being sent to the model.

        Returns:
            ToolOutput: Object containing:
                - result (str): The merged question
                - logprobs (list | None): Probability data if logprobs enabled
                - analysis (str | None): Detailed reasoning if with_analysis enabled
        """
        # Join into one string without rebinding the list parameter,
        # keeping `text`'s declared type intact.
        joined_text = ", ".join(text)
        return self.operator.run(
            # User parameters
            text=joined_text,
            with_analysis=with_analysis,
            output_lang=output_lang,
            user_prompt=user_prompt,
            temperature=temperature,
            logprobs=logprobs,
            top_logprobs=top_logprobs,
            validator=validator,
            # Internal parameters
            prompt_file="merge_questions.yaml",
            output_model=OutputModels.StrOutput,
            resp_format="parse",
            mode=mode,
        )

    def rewrite(
        self,
        text: str,
        with_analysis: bool = False,
        output_lang: str | None = None,
        user_prompt: str | None = None,
        temperature: float | None = 0.0,
        logprobs: bool = False,
        top_logprobs: int | None = None,
        mode: Literal["positive", "negative", "hard_negative"] = "positive",
        validator: Callable[[Any], bool] | None = None,
    ) -> OutputModels.ToolOutput:
        """
        Rewrite a text with different modes.

        Args:
            mode: Rewrite strategy selected in the prompt
                ("positive", "negative", or "hard_negative").

        Returns:
            ToolOutput: Object containing:
                - result (str): The rewritten text
                - logprobs (list | None): Probability data if logprobs enabled
                - analysis (str | None): Detailed reasoning if with_analysis enabled
        """
        return self.operator.run(
            # User parameters
            text=text,
            with_analysis=with_analysis,
            output_lang=output_lang,
            user_prompt=user_prompt,
            temperature=temperature,
            logprobs=logprobs,
            top_logprobs=top_logprobs,
            validator=validator,
            # Internal parameters
            prompt_file="rewrite.yaml",
            output_model=OutputModels.StrOutput,
            resp_format="parse",
            mode=mode,
        )

    def subject_to_question(
        self,
        text: str,
        number_of_questions: int,
        with_analysis: bool = False,
        output_lang: str | None = None,
        user_prompt: str | None = None,
        temperature: float | None = 0.0,
        logprobs: bool = False,
        top_logprobs: int | None = None,
        validator: Callable[[Any], bool] | None = None,
    ) -> OutputModels.ToolOutput:
        """
        Generate a list of questions about a subject.

        Args:
            number_of_questions: How many questions to generate.

        Returns:
            ToolOutput: Object containing:
                - result (list[str]): List of generated questions
                - logprobs (list | None): Probability data if logprobs enabled
                - analysis (str | None): Detailed reasoning if with_analysis enabled
        """
        return self.operator.run(
            # User parameters
            text=text,
            number_of_questions=number_of_questions,
            with_analysis=with_analysis,
            output_lang=output_lang,
            user_prompt=user_prompt,
            temperature=temperature,
            logprobs=logprobs,
            top_logprobs=top_logprobs,
            validator=validator,
            # Internal parameters
            prompt_file="subject_to_question.yaml",
            output_model=OutputModels.ReasonListStrOutput,
            resp_format="parse",
            mode=None,
        )

    def summarize(
        self,
        text: str,
        with_analysis: bool = False,
        output_lang: str | None = None,
        user_prompt: str | None = None,
        temperature: float | None = 0.0,
        logprobs: bool = False,
        top_logprobs: int | None = None,
        validator: Callable[[Any], bool] | None = None,
    ) -> OutputModels.ToolOutput:
        """
        Summarize the given subject text.

        Returns:
            ToolOutput: Object containing:
                - result (str): The summary text
                - logprobs (list | None): Probability data if logprobs enabled
                - analysis (str | None): Detailed reasoning if with_analysis enabled
        """
        return self.operator.run(
            # User parameters
            text=text,
            with_analysis=with_analysis,
            output_lang=output_lang,
            user_prompt=user_prompt,
            temperature=temperature,
            logprobs=logprobs,
            top_logprobs=top_logprobs,
            validator=validator,
            # Internal parameters
            prompt_file="summarize.yaml",
            output_model=OutputModels.StrOutput,
            resp_format="parse",
            mode=None,
        )

    def translate(
        self,
        text: str,
        target_language: str,
        with_analysis: bool = False,
        user_prompt: str | None = None,
        temperature: float | None = 0.0,
        logprobs: bool = False,
        top_logprobs: int | None = None,
        validator: Callable[[Any], bool] | None = None,
    ) -> OutputModels.ToolOutput:
        """
        Translate text between languages.

        Args:
            target_language: The language to translate the text into.

        Returns:
            ToolOutput: Object containing:
                - result (str): The translated text
                - logprobs (list | None): Probability data if logprobs enabled
                - analysis (str | None): Detailed reasoning if with_analysis enabled
        """
        return self.operator.run(
            # User parameters
            text=text,
            target_language=target_language,
            with_analysis=with_analysis,
            user_prompt=user_prompt,
            temperature=temperature,
            logprobs=logprobs,
            top_logprobs=top_logprobs,
            validator=validator,
            # Internal parameters
            prompt_file="translate.yaml",
            output_model=OutputModels.StrOutput,
            resp_format="parse",
            mode=None,
            output_lang=None,
        )

    def run_custom(
        self,
        prompt: str,
        output_model: Any,
        output_lang: str | None = None,
        temperature: float | None = None,
        logprobs: bool | None = None,
        top_logprobs: int | None = None,
    ) -> OutputModels.ToolOutput:
        """
        Custom tool that can do almost anything!

        Args:
            prompt: Free-form instruction sent as the input text.
            output_model: A Pydantic model class describing the expected
                structured output; its JSON schema is embedded in the prompt.

        Returns:
            ToolOutput: Object with fields:
                - result (str): The output result
        """
        return self.operator.run(
            # User parameters
            text=prompt,
            output_model=output_model,
            output_model_str=output_model.model_json_schema(),
            output_lang=output_lang,
            temperature=temperature,
            logprobs=logprobs,
            top_logprobs=top_logprobs,
            # Internal parameters
            prompt_file="run_custom.yaml",
            resp_format="parse",
            user_prompt=None,
            with_analysis=False,
            mode=None,
            validator=None,
        )
|
|
@@ -1,60 +0,0 @@
|
|
|
1
|
-
Metadata-Version: 2.4
|
|
2
|
-
Name: hamtaa-texttools
|
|
3
|
-
Version: 0.1.48
|
|
4
|
-
Summary: A set of high-level NLP tools
|
|
5
|
-
Author: Tohidi, Montazer, Givechi, Mousavinezhad
|
|
6
|
-
Requires-Python: >=3.8
|
|
7
|
-
Description-Content-Type: text/markdown
|
|
8
|
-
Requires-Dist: openai==1.97.1
|
|
9
|
-
Requires-Dist: numpy==1.26.4
|
|
10
|
-
|
|
11
|
-
# Text Tools
|
|
12
|
-
|
|
13
|
-
<p align="center">
|
|
14
|
-
<img src="https://img.shields.io/badge/TextTools-Python%20Text%20Processing-black?style=for-the-badge&logo=python&logoColor=white">
|
|
15
|
-
</p>
|
|
16
|
-
|
|
17
|
-
|
|
18
|
-
<p align="center">
|
|
19
|
-
<img src="docs/logo.png" alt="Preview" width="300" height="300">
|
|
20
|
-
</p>
|
|
21
|
-
|
|
22
|
-
|
|
23
|
-
## How to Install
|
|
24
|
-
|
|
25
|
-
Install the package using:
|
|
26
|
-
|
|
27
|
-
```bash
|
|
28
|
-
pip install -U hamtaa-texttools
|
|
29
|
-
```
|
|
30
|
-
|
|
31
|
-
|
|
32
|
-
---
|
|
33
|
-
|
|
34
|
-
## What This Library Is *Not*
|
|
35
|
-
|
|
36
|
-
This is **not** a collection of low-level utilities.
|
|
37
|
-
|
|
38
|
-
To clarify: this library **does not** include things like:
|
|
39
|
-
- A standard `regex`
|
|
40
|
-
- Word normalization utilities
|
|
41
|
-
|
|
42
|
-
---
|
|
43
|
-
|
|
44
|
-
## What This Library *Provides*
|
|
45
|
-
|
|
46
|
-
This is a set of **high-level natural language processing (NLP)** tools.
|
|
47
|
-
|
|
48
|
-
Some of the features include:
|
|
49
|
-
- `question_detector`: Detecting if an incoming text is a question or not
|
|
50
|
-
- `categorizer`: A text categorizer that requires no fine-tuning
|
|
51
|
-
- ... (Tell me what you want!)
|
|
52
|
-
|
|
53
|
-
---
|
|
54
|
-
|
|
55
|
-
## When to Use This Library
|
|
56
|
-
|
|
57
|
-
Use `texttools` when:
|
|
58
|
-
- You need to **process large volumes of data using OpenAI’s GPT models** via the BATCH API.
|
|
59
|
-
- You want to treat an **LLM as a function** in Python that outputs structured JSON or Pydantic models.
|
|
60
|
-
- You need to **categorize large datasets** using vector embeddings, efficiently and at scale.
|
|
@@ -1,61 +0,0 @@
|
|
|
1
|
-
texttools/__init__.py,sha256=UEPcm1wKU7Hiqw1K_E2ojZSnyQrGyNLzN0spQ_ZXjJ4,784
|
|
2
|
-
texttools/base/__init__.py,sha256=KUGm-Oe0BxlrRhPS-Jm2q1NCmwX8MdtZtloia7bcLaM,189
|
|
3
|
-
texttools/base/base_categorizer.py,sha256=ojup94iXLxh92TjiJmrFXeRbsWKlon7PPAqez96B1bs,1130
|
|
4
|
-
texttools/base/base_keyword_extractor.py,sha256=uKpxb3xI-sim-vXWe1R4_36QRhSNsWDR4IuVdpkZMME,868
|
|
5
|
-
texttools/base/base_ner_extractor.py,sha256=D0LRNSyq1uIU9Qtepi7zpCWWzYz-AOxpVNjq97S1oUA,1933
|
|
6
|
-
texttools/base/base_question_detector.py,sha256=FR9yDP0Z8aAfGafZy3kcpSDUUYWLJM7saRKdeVN5TiM,829
|
|
7
|
-
texttools/base/base_question_generator.py,sha256=L_2ZwqyV9GxsKiQynWKRJG15OBFgQqiCic5H0i8R5yk,3238
|
|
8
|
-
texttools/base/base_question_merger.py,sha256=TYhsihKaIdyGCVu4AcjxPZ1_HocHt__voV8WWGMRpMs,1945
|
|
9
|
-
texttools/base/base_question_rewriter.py,sha256=K6ZnAjxi2qw4yLxm92zTI1IStCfX6c_6lCfIuBDSx8w,1973
|
|
10
|
-
texttools/base/base_router.py,sha256=pFDjIXFqAhPiS9Onu5py_GxOq8geDGJDQh6k6IhCkvw,933
|
|
11
|
-
texttools/base/base_summarizer.py,sha256=7NAilhUPs6ZUwkBpTtXAj6n2XxQH1w6SOolf3gQX2gc,1627
|
|
12
|
-
texttools/base/base_task_performer.py,sha256=3-6qshkie50S7pRG4WHRNC_RdUbSmHOPKW56CD92-rM,1852
|
|
13
|
-
texttools/base/base_translator.py,sha256=BoOxqaoPoUs8t1O3m2yL9pQa5iwisl097immTVcGZoE,1020
|
|
14
|
-
texttools/formatter/__init__.py,sha256=KHz2tFZctbit_HVbQNCTMi46JzmKlg-uB6Ost63IpVU,46
|
|
15
|
-
texttools/formatter/base.py,sha256=0fiM6E7NdJevAVpL6yyPaUZVJGKWxE3fr-Ay1oqgJqQ,879
|
|
16
|
-
texttools/formatter/gemma3_formatter.py,sha256=AmdKBYLj6HMsI2DDX4KHNEEVYJmz_VVNUBOv8ScGjsY,1865
|
|
17
|
-
texttools/handlers/__init__.py,sha256=sv0JloipQ57AI0xo-3w9k6cK5rYjZP3ltR2EbBhkHTA,121
|
|
18
|
-
texttools/handlers/handlers.py,sha256=LtC4FBuzRUDy3Jw-Fp21WR-QS1jOcDhsGaMPFQGjfTw,2381
|
|
19
|
-
texttools/handlers/categorizer/__init__.py,sha256=mE05vt_ma6vcP8pQ37BZ85WVQ8jhcjDS0iZV81_LFCY,127
|
|
20
|
-
texttools/handlers/categorizer/categorizer.py,sha256=HBpdhtCGUPl1TJUOxbgSLmVWD7o9xeIjmSWXvYzGrCA,1592
|
|
21
|
-
texttools/tools/__init__.py,sha256=V3ZjSj_ZI9r02sOmxpxxxKBbBbtuYS1MQqtrdGZHC_A,1121
|
|
22
|
-
texttools/tools/categorizer/__init__.py,sha256=VY0SVdik0et0fwLDj7qn-d5LtVqVBIalvlRVci699i4,48
|
|
23
|
-
texttools/tools/categorizer/encoder_model/__init__.py,sha256=7UwoPlQ09VGN0cqfi5fPQRfsZZ8hoZj6fL6cax1BLSU,53
|
|
24
|
-
texttools/tools/categorizer/encoder_model/encoder_vectorizer.py,sha256=MHPVJQJlvNhZ5xLVXk4FtvrORW2yxPSAnjEhjPbkQts,1476
|
|
25
|
-
texttools/tools/categorizer/llm/__init__.py,sha256=0VbxvInITfNUlOF6bJqcUKKaYWlIe9K3vRmIRuvAGcY,95
|
|
26
|
-
texttools/tools/categorizer/llm/gemma_categorizer.py,sha256=tjwKonTjT5cAhxWQaVyvyooRyOlGACHpnn72PNoLk-8,5636
|
|
27
|
-
texttools/tools/categorizer/llm/openai_categorizer.py,sha256=omRk77Z5ZCIAz17h4wPDP_EcBSsscA-PQJpQjtI6--o,2547
|
|
28
|
-
texttools/tools/keyword_extractor/__init__.py,sha256=eTpujS85MmRRbnNwc2ifKUh60W8OG4RQFmWki3Z7C_0,84
|
|
29
|
-
texttools/tools/keyword_extractor/gemma_extractor.py,sha256=TJ4wMPWRuuzRi_Q0hr7UauKhEg8U_5U5j1D_lTFrn4s,4349
|
|
30
|
-
texttools/tools/merger/__init__.py,sha256=bh2RBpqJvDaqEmDrM9y_GcjRqibagifAxiZVu8nEHc0,115
|
|
31
|
-
texttools/tools/merger/gemma_question_merger.py,sha256=JAC-52kBbabIzEWp0MFi9viiu8nZOAMPaJZALHvNMqo,8035
|
|
32
|
-
texttools/tools/ner/__init__.py,sha256=BW84BcItel6Mc2JlaDL6qvAktVMkti67VXceeCnOB1g,70
|
|
33
|
-
texttools/tools/ner/gemma_ner_extractor.py,sha256=YhyIwX_8bdwkFb4gY8g9mZdYHW_r1jCvbmjjNCK9Wfo,5384
|
|
34
|
-
texttools/tools/question_detector/__init__.py,sha256=ulArGttooSoxEe0vUDQSxUQrnsxr7gH9l-LjSER2dVI,162
|
|
35
|
-
texttools/tools/question_detector/gemma_detector.py,sha256=DhlCAA6Hws_OTuYil6UY4sYlbjdQQU6EqHdoTl3a--w,3772
|
|
36
|
-
texttools/tools/question_detector/llm_detector.py,sha256=zo89eh359hqQGGf83-6M22AaiH7q-m0m91SjTyxZaYs,3862
|
|
37
|
-
texttools/tools/question_generator/__init__.py,sha256=EAElpB_YeyMoBqvFNjbW2a_j18SLtiKQ7sRmdS58Fww,61
|
|
38
|
-
texttools/tools/question_generator/gemma_question_generator.py,sha256=V5QcXmHZ5shTvrThOxUrKJ4FqP0P58NIJbsPdyyy5IM,6744
|
|
39
|
-
texttools/tools/reranker/__init__.py,sha256=70jqJ9cjpPzzvnMYgHYGVZ9PrWrN9N97visqD_PVxwU,100
|
|
40
|
-
texttools/tools/reranker/reranker.py,sha256=2SiTMIxempMuHui2n4GJV_2dLGBeoC7WAn_rVVXlMBA,5518
|
|
41
|
-
texttools/tools/reranker/scorer.py,sha256=fQ3Ya8QmNhrcmb-Rf-72hvhweGvVj6gQ4KOlham2eE8,8176
|
|
42
|
-
texttools/tools/reranker/sorter.py,sha256=_ed5zGz7K60skPFFuEQZ1ObBFA71LAfVT6FyWicA-Pw,11419
|
|
43
|
-
texttools/tools/rewriter/__init__.py,sha256=U_qwGeEOqHAcV4p2CHVb0AIvHKFfdvykRzGyWD54aWA,121
|
|
44
|
-
texttools/tools/rewriter/gemma_question_rewriter.py,sha256=jXtRswfBvHn9QmE90JvxEmLvCTbwZqZhD_A5ONWeCzo,7925
|
|
45
|
-
texttools/tools/router/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
46
|
-
texttools/tools/router/gemma_router.py,sha256=VX-kHphZVZNd0_ajugN08hGkWNUeUriwfonpYy2TIS4,5619
|
|
47
|
-
texttools/tools/subject_to_question/__init__.py,sha256=VJpns16Qe5OL_-4WuGDUNShcJsodB2khGWT3Q1Hc-WU,72
|
|
48
|
-
texttools/tools/subject_to_question/gemma_question_generator.py,sha256=VKXHhYHEvhFLUR87iEh0eFpD_4ueX4np8IjF-NkgWrY,7417
|
|
49
|
-
texttools/tools/summarizer/__init__.py,sha256=phrR7qO20CNhO3hjXQBzhTRVumdVdGSufmH4GEYkhj4,140
|
|
50
|
-
texttools/tools/summarizer/gemma_summarizer.py,sha256=ikhsBv7AiZD1dT_d12AyjXxojzSW92e2y5WjchI_3bE,4474
|
|
51
|
-
texttools/tools/summarizer/llm_summerizer.py,sha256=-0rUKbSnl1aDeBfJ5DCSbIlwd2k-9qIaCKgoQJa0hWc,3412
|
|
52
|
-
texttools/tools/translator/__init__.py,sha256=KO1m08J2BZwRqBGO9ICB4l4cnH1jfHLHL5HbgYFUWM8,72
|
|
53
|
-
texttools/tools/translator/gemma_translator.py,sha256=rbP0kgkhOiEPdHWgHQc7Lev7lrAIYqNb6t_OfZLp44E,7180
|
|
54
|
-
texttools/utils/flex_processor.py,sha256=Y44uTracvXUJiUm5hh57Uk0933RU9GTc3dN_1Bo_XQA,3214
|
|
55
|
-
texttools/utils/batch_manager/__init__.py,sha256=3ZkxA395lRD4gNxJ1vp0fNuz_XuBr50GoP51rrwQ0Ks,87
|
|
56
|
-
texttools/utils/batch_manager/batch_manager.py,sha256=jAmKskL3OTYwwsO1mWsWAB3VxMlOF07c2GW1Ev83ZhY,9283
|
|
57
|
-
texttools/utils/batch_manager/batch_runner.py,sha256=kW0IPauI11xpssApMA7b4XI19FePImywym3V7tBaa-o,7404
|
|
58
|
-
hamtaa_texttools-0.1.48.dist-info/METADATA,sha256=cUMn4AfOaYObchCIOQ-xrj0vmF3VTsmHYnob3Xi7R2M,1481
|
|
59
|
-
hamtaa_texttools-0.1.48.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
60
|
-
hamtaa_texttools-0.1.48.dist-info/top_level.txt,sha256=5Mh0jIxxZ5rOXHGJ6Mp-JPKviywwN0MYuH0xk5bEWqE,10
|
|
61
|
-
hamtaa_texttools-0.1.48.dist-info/RECORD,,
|
texttools/base/__init__.py
DELETED
|
@@ -1,40 +0,0 @@
|
|
|
1
|
-
import logging
|
|
2
|
-
from abc import ABC, abstractmethod
|
|
3
|
-
from enum import Enum
|
|
4
|
-
from typing import Optional
|
|
5
|
-
|
|
6
|
-
from texttools.handlers import NoOpResultHandler, ResultHandler
|
|
7
|
-
|
|
8
|
-
|
|
9
|
-
class BaseCategorizer(ABC):
    """Abstract base for categorizers that fan results out to handlers."""

    def __init__(
        self,
        handlers: Optional[list[ResultHandler]] = None,
    ):
        """
        handlers: List of ResultHandler objects that will process results after categorization.
        """
        # An empty/None handler list falls back to a single no-op handler.
        if handlers:
            self.handlers = handlers
        else:
            self.handlers = [NoOpResultHandler()]

    @abstractmethod
    def categorize(self, text: str) -> Enum:
        """
        Categorize the input text.
        Must return one of the Enum members defined in self.categories.
        """
        ...

    def preprocess(self, text: str) -> str:
        """
        Optional: Preprocess text before categorization.
        """
        # Default implementation is the identity transform.
        return text

    def _dispatch(self, results: dict) -> None:
        """Pass *results* to every handler; a failing handler is logged, not raised."""
        for handler in self.handlers:
            try:
                handler.handle(results)
            except Exception:
                # One broken handler must not prevent the rest from running.
                logging.error(
                    f"Handler {handler.__class__.__name__} failed", exc_info=True
                )
|
|
@@ -1,35 +0,0 @@
|
|
|
1
|
-
from abc import ABC, abstractmethod
|
|
2
|
-
from typing import Any, Optional
|
|
3
|
-
|
|
4
|
-
|
|
5
|
-
class BaseKeywordExtractor(ABC):
    """
    Base class for all detectors that output a list of keywords.
    """

    def __init__(
        self,
        handlers: Optional[list[Any]] = None,
    ):
        # None (or an empty list) normalizes to an empty handler list.
        self.handlers = handlers if handlers else []

    @abstractmethod
    def extract_keywords(self, text: str) -> list[str]:
        """
        Extract keywords from the input text.
        Should return a list of strings, where each string is a keyword.
        """
        ...

    def preprocess(self, text: str) -> str:
        """
        Optional text preprocessing step.
        """
        # Default behavior: trim surrounding whitespace only.
        return text.strip()

    def _dispatch(self, result: dict) -> None:
        """
        Dispatch the result to handlers.
        """
        for h in self.handlers:
            h.handle(result)
|