hamtaa-texttools 0.1.50__tar.gz → 0.1.51__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of hamtaa-texttools might be problematic. Click here for more details.
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/PKG-INFO +1 -1
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/hamtaa_texttools.egg-info/PKG-INFO +1 -1
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/pyproject.toml +1 -1
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/translator/gemma_translator.py +14 -6
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/README.md +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/hamtaa_texttools.egg-info/SOURCES.txt +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/hamtaa_texttools.egg-info/dependency_links.txt +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/hamtaa_texttools.egg-info/requires.txt +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/hamtaa_texttools.egg-info/top_level.txt +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/setup.cfg +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/setup.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/tests/test_vllm_output.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/base/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/base/base_categorizer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/base/base_keyword_extractor.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/base/base_ner_extractor.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/base/base_question_detector.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/base/base_question_generator.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/base/base_question_merger.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/base/base_question_rewriter.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/base/base_router.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/base/base_summarizer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/base/base_task_performer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/base/base_translator.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/formatter/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/formatter/base.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/formatter/gemma3_formatter.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/handlers/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/handlers/categorizer/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/handlers/categorizer/categorizer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/handlers/handlers.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/categorizer/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/categorizer/encoder_model/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/categorizer/encoder_model/encoder_vectorizer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/categorizer/llm/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/categorizer/llm/gemma_categorizer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/categorizer/llm/openai_categorizer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/keyword_extractor/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/keyword_extractor/gemma_extractor.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/merger/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/merger/gemma_question_merger.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/ner/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/ner/gemma_ner_extractor.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/question_detector/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/question_detector/gemma_detector.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/question_detector/llm_detector.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/question_generator/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/question_generator/gemma_question_generator.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/reranker/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/reranker/reranker.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/reranker/scorer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/reranker/sorter.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/rewriter/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/rewriter/gemma_question_rewriter.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/router/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/router/gemma_router.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/subject_to_question/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/subject_to_question/gemma_question_generator.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/summarizer/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/summarizer/gemma_summarizer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/summarizer/llm_summerizer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/translator/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/utils/batch_manager/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/utils/batch_manager/batch_manager.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/utils/batch_manager/batch_runner.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/utils/flex_processor.py +0 -0
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/translator/gemma_translator.py
RENAMED
|
@@ -1,7 +1,7 @@
-from typing import Any, Optional
+from typing import Any, List, Optional
 
 from openai import OpenAI
-from pydantic import BaseModel
+from pydantic import BaseModel, Field
 
 from texttools.base.base_translator import BaseTranslator
 from texttools.formatter.gemma3_formatter import Gemma3Formatter
@@ -10,8 +10,16 @@ from texttools.formatter.gemma3_formatter import Gemma3Formatter
 # Pydantic BaseModel to specify the output format of preprocessor
 # Preprocessor's job is to extract proper names
 class PreprocessorOutput(BaseModel):
-
-
+    """
+    A single proper-name entity extracted from the source text.
+    """
+
+    text: str = Field(
+        description="The exact substring from the original text that represents a proper name."
+    )
+    text_type: str = Field(
+        description='Always use the literal value "Proper Name" when this entity is a real persons name.'
+    )
 
 
 class GemmaTranslator(BaseTranslator):
@@ -135,7 +143,7 @@ class GemmaTranslator(BaseTranslator):
         completion = self.client.chat.completions.parse(
             model=self.model,
             messages=restructured,
-            response_format=PreprocessorOutput,
+            response_format=List[PreprocessorOutput],
             temperature=self.temperature,
             extra_body=dict(guided_decoding_backend="auto") ** self.client_kwargs,
         )
@@ -153,7 +161,7 @@ class GemmaTranslator(BaseTranslator):
 
         # Extract proper names to tell the LLM what names not to translate, but to transliterate
         extracted = self.preprocess(text)
-        proper_names = [e
+        proper_names = [e.text for e in extracted]
 
         reason_summary = None
         if self.use_reason:
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/hamtaa_texttools.egg-info/dependency_links.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/base/base_keyword_extractor.py
RENAMED
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/base/base_question_detector.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/base/base_question_generator.py
RENAMED
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/base/base_question_rewriter.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/handlers/categorizer/__init__.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/handlers/categorizer/categorizer.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/categorizer/llm/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/keyword_extractor/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/merger/gemma_question_merger.py
RENAMED
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/ner/gemma_ner_extractor.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/question_detector/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/question_generator/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/subject_to_question/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/summarizer/gemma_summarizer.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/tools/summarizer/llm_summerizer.py
RENAMED
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/utils/batch_manager/__init__.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/utils/batch_manager/batch_manager.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.51}/texttools/utils/batch_manager/batch_runner.py
RENAMED
|
File without changes
|
|
File without changes
|