hamtaa-texttools 0.1.52__tar.gz → 0.1.54__tar.gz
This diff shows the changes between two publicly available versions of this package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.
Potentially problematic release.
This version of hamtaa-texttools might be problematic. Click here for more details.
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/PKG-INFO +1 -1
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/hamtaa_texttools.egg-info/PKG-INFO +1 -1
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/pyproject.toml +1 -1
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/translator/gemma_translator.py +7 -12
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/README.md +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/hamtaa_texttools.egg-info/SOURCES.txt +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/hamtaa_texttools.egg-info/dependency_links.txt +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/hamtaa_texttools.egg-info/requires.txt +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/hamtaa_texttools.egg-info/top_level.txt +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/setup.cfg +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/setup.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/tests/test_vllm_output.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/base/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/base/base_categorizer.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/base/base_keyword_extractor.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/base/base_ner_extractor.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/base/base_question_detector.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/base/base_question_generator.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/base/base_question_merger.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/base/base_question_rewriter.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/base/base_router.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/base/base_summarizer.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/base/base_task_performer.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/base/base_translator.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/formatter/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/formatter/base.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/formatter/gemma3_formatter.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/handlers/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/handlers/categorizer/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/handlers/categorizer/categorizer.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/handlers/handlers.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/categorizer/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/categorizer/encoder_model/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/categorizer/encoder_model/encoder_vectorizer.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/categorizer/llm/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/categorizer/llm/gemma_categorizer.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/categorizer/llm/openai_categorizer.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/keyword_extractor/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/keyword_extractor/gemma_extractor.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/merger/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/merger/gemma_question_merger.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/ner/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/ner/gemma_ner_extractor.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/question_detector/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/question_detector/gemma_detector.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/question_detector/llm_detector.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/question_generator/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/question_generator/gemma_question_generator.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/reranker/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/reranker/reranker.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/reranker/scorer.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/reranker/sorter.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/rewriter/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/rewriter/gemma_question_rewriter.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/router/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/router/gemma_router.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/subject_to_question/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/subject_to_question/gemma_question_generator.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/summarizer/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/summarizer/gemma_summarizer.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/summarizer/llm_summerizer.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/translator/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/utils/batch_manager/__init__.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/utils/batch_manager/batch_manager.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/utils/batch_manager/batch_runner.py +0 -0
- {hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/utils/flex_processor.py +0 -0
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/translator/gemma_translator.py
RENAMED
|
@@ -7,18 +7,13 @@ from texttools.base.base_translator import BaseTranslator
|
|
|
7
7
|
from texttools.formatter.gemma3_formatter import Gemma3Formatter
|
|
8
8
|
|
|
9
9
|
|
|
10
|
-
# Pydantic BaseModel to specify the output format of preprocessor
|
|
11
|
-
# Preprocessor's job is to extract proper names
|
|
12
10
|
class PreprocessorOutput(BaseModel):
|
|
13
11
|
"""
|
|
14
|
-
|
|
12
|
+
List of proper-name strings extracted from the source text.
|
|
15
13
|
"""
|
|
16
14
|
|
|
17
|
-
|
|
18
|
-
description="
|
|
19
|
-
)
|
|
20
|
-
text_type: str = Field(
|
|
21
|
-
description='Always use the literal value "Proper Name" when this entity is a real persons name.'
|
|
15
|
+
entities: List[str] = Field(
|
|
16
|
+
description="All proper names found in the text; return an empty list if none."
|
|
22
17
|
)
|
|
23
18
|
|
|
24
19
|
|
|
@@ -73,7 +68,7 @@ class GemmaTranslator(BaseTranslator):
|
|
|
73
68
|
"""
|
|
74
69
|
messages.append({"role": "user", "content": enforce_prompt})
|
|
75
70
|
|
|
76
|
-
clean_text = text
|
|
71
|
+
clean_text = text
|
|
77
72
|
if reason:
|
|
78
73
|
reason_prompt = f"""
|
|
79
74
|
Based on the analysis conducted, translate the following text {"from" + source_language if source_language else ""} to {target_language}.
|
|
@@ -143,7 +138,7 @@ class GemmaTranslator(BaseTranslator):
|
|
|
143
138
|
completion = self.client.chat.completions.parse(
|
|
144
139
|
model=self.model,
|
|
145
140
|
messages=restructured,
|
|
146
|
-
response_format=
|
|
141
|
+
response_format=PreprocessorOutput,
|
|
147
142
|
temperature=self.temperature,
|
|
148
143
|
extra_body={
|
|
149
144
|
"guided_decoding_backend": "auto",
|
|
@@ -164,11 +159,11 @@ class GemmaTranslator(BaseTranslator):
|
|
|
164
159
|
|
|
165
160
|
# Extract proper names to tell the LLM what names not to translate, but to transliterate
|
|
166
161
|
extracted = self.preprocess(text)
|
|
167
|
-
proper_names =
|
|
162
|
+
proper_names = extracted.entities
|
|
168
163
|
|
|
169
164
|
reason_summary = None
|
|
170
165
|
if self.use_reason:
|
|
171
|
-
reason_summary = self._reason(text, target_language
|
|
166
|
+
reason_summary = self._reason(text, target_language)
|
|
172
167
|
|
|
173
168
|
messages = self._build_messages(
|
|
174
169
|
text, target_language, source_language, reason_summary, proper_names
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/hamtaa_texttools.egg-info/dependency_links.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/base/base_keyword_extractor.py
RENAMED
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/base/base_question_detector.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/base/base_question_generator.py
RENAMED
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/base/base_question_rewriter.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/handlers/categorizer/__init__.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/handlers/categorizer/categorizer.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/categorizer/llm/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/keyword_extractor/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/merger/gemma_question_merger.py
RENAMED
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/ner/gemma_ner_extractor.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/question_detector/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/question_generator/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/subject_to_question/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/summarizer/gemma_summarizer.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/tools/summarizer/llm_summerizer.py
RENAMED
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/utils/batch_manager/__init__.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/utils/batch_manager/batch_manager.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.52 → hamtaa_texttools-0.1.54}/texttools/utils/batch_manager/batch_runner.py
RENAMED
|
File without changes
|
|
File without changes
|