PyPI - llm-ie - Versions diffs - 1.0.0__py3-none-any.whl → 1.2.0__py3-none-any.whl - Mend

llm-ie 1.0.0__py3-none-any.whl → 1.2.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

llm_ie/__init__.py +4 -4
llm_ie/asset/prompt_guide/AttributeExtractor_prompt_guide.txt +52 -0
llm_ie/engines.py +497 -250
llm_ie/extractors.py +479 -681
llm_ie/prompt_editor.py +13 -13
{llm_ie-1.0.0.dist-info → llm_ie-1.2.0.dist-info}/METADATA +2 -2
{llm_ie-1.0.0.dist-info → llm_ie-1.2.0.dist-info}/RECORD +8 -7
{llm_ie-1.0.0.dist-info → llm_ie-1.2.0.dist-info}/WHEEL +0 -0

llm_ie/__init__.py CHANGED Viewed

@@ -1,11 +1,11 @@
 from .data_types import LLMInformationExtractionFrame, LLMInformationExtractionDocument
-from .engines import LlamaCppInferenceEngine, OllamaInferenceEngine, HuggingFaceHubInferenceEngine, OpenAIInferenceEngine, AzureOpenAIInferenceEngine, LiteLLMInferenceEngine
-from .extractors import DirectFrameExtractor, ReviewFrameExtractor, BasicFrameExtractor, BasicReviewFrameExtractor, SentenceFrameExtractor, SentenceReviewFrameExtractor, BinaryRelationExtractor, MultiClassRelationExtractor
+from .engines import BasicLLMConfig, Qwen3LLMConfig, OpenAIReasoningLLMConfig, LlamaCppInferenceEngine, OllamaInferenceEngine, HuggingFaceHubInferenceEngine, OpenAIInferenceEngine, AzureOpenAIInferenceEngine, LiteLLMInferenceEngine
+from .extractors import DirectFrameExtractor, ReviewFrameExtractor, BasicFrameExtractor, BasicReviewFrameExtractor, SentenceFrameExtractor, SentenceReviewFrameExtractor, AttributeExtractor, BinaryRelationExtractor, MultiClassRelationExtractor
 from .chunkers import UnitChunker, WholeDocumentUnitChunker, SentenceUnitChunker, TextLineUnitChunker, ContextChunker, NoContextChunker, WholeDocumentContextChunker, SlideWindowContextChunker
 from .prompt_editor import PromptEditor
 __all__ = ["LLMInformationExtractionFrame", "LLMInformationExtractionDocument",
-           "LlamaCppInferenceEngine", "OllamaInferenceEngine", "HuggingFaceHubInferenceEngine", "OpenAIInferenceEngine", "AzureOpenAIInferenceEngine", "LiteLLMInferenceEngine",
-           "DirectFrameExtractor", "ReviewFrameExtractor", "BasicFrameExtractor", "BasicReviewFrameExtractor", "SentenceFrameExtractor", "SentenceReviewFrameExtractor", "BinaryRelationExtractor", "MultiClassRelationExtractor",
+           "BasicLLMConfig", "Qwen3LLMConfig", "OpenAIReasoningLLMConfig", "LlamaCppInferenceEngine", "OllamaInferenceEngine", "HuggingFaceHubInferenceEngine", "OpenAIInferenceEngine", "AzureOpenAIInferenceEngine", "LiteLLMInferenceEngine",
+           "DirectFrameExtractor", "ReviewFrameExtractor", "BasicFrameExtractor", "BasicReviewFrameExtractor", "SentenceFrameExtractor", "SentenceReviewFrameExtractor", "AttributeExtractor", "BinaryRelationExtractor", "MultiClassRelationExtractor",
            "UnitChunker", "WholeDocumentUnitChunker", "SentenceUnitChunker", "TextLineUnitChunker", "ContextChunker", "NoContextChunker", "WholeDocumentContextChunker", "SlideWindowContextChunker",
            "PromptEditor"]

llm_ie/asset/prompt_guide/AttributeExtractor_prompt_guide.txt ADDED Viewed

@@ -0,0 +1,52 @@
+Prompt Template Design:
+1. Task Description:
+   Provide a detailed description of the task, including the background and the type of task (e.g., attribute extraction task).
+2. Schema Definition:
+   List the attributes to extract, and provide clear definitions for each one.
+3. Output Format Definition:
+   The output should be a JSON object (dictionary), where each attribute is a key. The values could be any structure (e.g., str, int, List[str]).
+4. Optional: Hints:
+   Provide itemized hints for the information extractors to guide the extraction process. Remind the prompted agent to be truthful. Emphasize that the prompted agent is supposed to perform the task instead of writing code or instructing other agents to do it.
+5. Optional: Examples:
+   Include examples in the format:
+    Input: ...
+    Output: ...
+6. Entity:
+   The template must include a placeholder {{frame}} for the entity.
+7. Context:
+   The template must include a placeholder {{context}} for the context. Explain to the prompted agent that <Entity> tags are used to mark the entity in the context.
+Example:
+    ### Task description
+    This is an attribute extraction task. Given a diagnosis entity and the context, you need to generate attributes for the entity.
+    ### Schema definition
+        "Date" which is the date when the diagnosis was made in MM/DD/YYYY format,
+        "Status" which is the current status of the diagnosis (e.g. active, resolved, etc.)
+    ### Output format definition
+    Your output should follow the JSON format:
+    {"Date": "<MM/DD/YYYY>", "Status": "<status>"}
+    I am only interested in the content between {}. Do not explain your answer.
+    ### Hints
+    - If the date is not complete, use the first available date in the context. For example, if the date is 01/2023, you should return 01/01/2023.
+    - If the status is not available, you should return "not specified".
+    ### Entity
+    Information about the entity to extract attributes from:
+    {{frame}}
+    ### Context
+    Context for the entity. The <Entity> tags are used to mark the entity in the context.
+    {{context}}

llm-ie 1.0.0__py3-none-any.whl → 1.2.0__py3-none-any.whl

llm-ie 1.0.0__py3-none-any.whl → 1.2.0__py3-none-any.whl