hamtaa-texttools 0.1.50__tar.gz → 0.1.52__tar.gz
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of hamtaa-texttools might be problematic. Click here for more details.
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/PKG-INFO +1 -1
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/hamtaa_texttools.egg-info/PKG-INFO +1 -1
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/pyproject.toml +1 -1
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/translator/gemma_translator.py +18 -7
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/README.md +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/hamtaa_texttools.egg-info/SOURCES.txt +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/hamtaa_texttools.egg-info/dependency_links.txt +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/hamtaa_texttools.egg-info/requires.txt +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/hamtaa_texttools.egg-info/top_level.txt +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/setup.cfg +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/setup.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/tests/test_vllm_output.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/base/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/base/base_categorizer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/base/base_keyword_extractor.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/base/base_ner_extractor.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/base/base_question_detector.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/base/base_question_generator.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/base/base_question_merger.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/base/base_question_rewriter.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/base/base_router.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/base/base_summarizer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/base/base_task_performer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/base/base_translator.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/formatter/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/formatter/base.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/formatter/gemma3_formatter.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/handlers/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/handlers/categorizer/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/handlers/categorizer/categorizer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/handlers/handlers.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/categorizer/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/categorizer/encoder_model/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/categorizer/encoder_model/encoder_vectorizer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/categorizer/llm/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/categorizer/llm/gemma_categorizer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/categorizer/llm/openai_categorizer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/keyword_extractor/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/keyword_extractor/gemma_extractor.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/merger/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/merger/gemma_question_merger.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/ner/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/ner/gemma_ner_extractor.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/question_detector/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/question_detector/gemma_detector.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/question_detector/llm_detector.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/question_generator/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/question_generator/gemma_question_generator.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/reranker/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/reranker/reranker.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/reranker/scorer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/reranker/sorter.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/rewriter/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/rewriter/gemma_question_rewriter.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/router/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/router/gemma_router.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/subject_to_question/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/subject_to_question/gemma_question_generator.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/summarizer/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/summarizer/gemma_summarizer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/summarizer/llm_summerizer.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/translator/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/utils/batch_manager/__init__.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/utils/batch_manager/batch_manager.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/utils/batch_manager/batch_runner.py +0 -0
- {hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/utils/flex_processor.py +0 -0
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/translator/gemma_translator.py
RENAMED
|
@@ -1,7 +1,7 @@
|
|
|
1
|
-
from typing import Any, Optional
|
|
1
|
+
from typing import Any, List, Optional
|
|
2
2
|
|
|
3
3
|
from openai import OpenAI
|
|
4
|
-
from pydantic import BaseModel
|
|
4
|
+
from pydantic import BaseModel, Field
|
|
5
5
|
|
|
6
6
|
from texttools.base.base_translator import BaseTranslator
|
|
7
7
|
from texttools.formatter.gemma3_formatter import Gemma3Formatter
|
|
@@ -10,8 +10,16 @@ from texttools.formatter.gemma3_formatter import Gemma3Formatter
|
|
|
10
10
|
# Pydantic BaseModel to specify the output format of preprocessor
|
|
11
11
|
# Preprocessor's job is to extract proper names
|
|
12
12
|
class PreprocessorOutput(BaseModel):
|
|
13
|
-
|
|
14
|
-
|
|
13
|
+
"""
|
|
14
|
+
A single proper-name entity extracted from the source text.
|
|
15
|
+
"""
|
|
16
|
+
|
|
17
|
+
text: str = Field(
|
|
18
|
+
description="The exact substring from the original text that represents a proper name."
|
|
19
|
+
)
|
|
20
|
+
text_type: str = Field(
|
|
21
|
+
description='Always use the literal value "Proper Name" when this entity is a real persons name.'
|
|
22
|
+
)
|
|
15
23
|
|
|
16
24
|
|
|
17
25
|
class GemmaTranslator(BaseTranslator):
|
|
@@ -135,9 +143,12 @@ class GemmaTranslator(BaseTranslator):
|
|
|
135
143
|
completion = self.client.chat.completions.parse(
|
|
136
144
|
model=self.model,
|
|
137
145
|
messages=restructured,
|
|
138
|
-
response_format=PreprocessorOutput,
|
|
146
|
+
response_format=List[PreprocessorOutput],
|
|
139
147
|
temperature=self.temperature,
|
|
140
|
-
extra_body=
|
|
148
|
+
extra_body={
|
|
149
|
+
"guided_decoding_backend": "auto",
|
|
150
|
+
},
|
|
151
|
+
**self.client_kwargs,
|
|
141
152
|
)
|
|
142
153
|
message = completion.choices[0].message
|
|
143
154
|
|
|
@@ -153,7 +164,7 @@ class GemmaTranslator(BaseTranslator):
|
|
|
153
164
|
|
|
154
165
|
# Extract proper names to tell the LLM what names not to translate, but to transliterate
|
|
155
166
|
extracted = self.preprocess(text)
|
|
156
|
-
proper_names = [e
|
|
167
|
+
proper_names = [e.text for e in extracted]
|
|
157
168
|
|
|
158
169
|
reason_summary = None
|
|
159
170
|
if self.use_reason:
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/hamtaa_texttools.egg-info/dependency_links.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/base/base_keyword_extractor.py
RENAMED
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/base/base_question_detector.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/base/base_question_generator.py
RENAMED
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/base/base_question_rewriter.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/handlers/categorizer/__init__.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/handlers/categorizer/categorizer.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/categorizer/llm/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/keyword_extractor/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/merger/gemma_question_merger.py
RENAMED
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/ner/gemma_ner_extractor.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/question_detector/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/question_generator/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/subject_to_question/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/summarizer/gemma_summarizer.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/tools/summarizer/llm_summerizer.py
RENAMED
|
File without changes
|
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/utils/batch_manager/__init__.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/utils/batch_manager/batch_manager.py
RENAMED
|
File without changes
|
{hamtaa_texttools-0.1.50 → hamtaa_texttools-0.1.52}/texttools/utils/batch_manager/batch_runner.py
RENAMED
|
File without changes
|
|
File without changes
|