llm-ie 1.1.0__py3-none-any.whl → 1.2.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- llm_ie/__init__.py +2 -2
- llm_ie/asset/prompt_guide/AttributeExtractor_prompt_guide.txt +52 -0
- llm_ie/engines.py +8 -6
- llm_ie/extractors.py +409 -460
- llm_ie/prompt_editor.py +88 -34
- {llm_ie-1.1.0.dist-info → llm_ie-1.2.1.dist-info}/METADATA +1 -1
- {llm_ie-1.1.0.dist-info → llm_ie-1.2.1.dist-info}/RECORD +8 -7
- {llm_ie-1.1.0.dist-info → llm_ie-1.2.1.dist-info}/WHEEL +0 -0
llm_ie/__init__.py
CHANGED
|
@@ -1,11 +1,11 @@
|
|
|
1
1
|
from .data_types import LLMInformationExtractionFrame, LLMInformationExtractionDocument
|
|
2
2
|
from .engines import BasicLLMConfig, Qwen3LLMConfig, OpenAIReasoningLLMConfig, LlamaCppInferenceEngine, OllamaInferenceEngine, HuggingFaceHubInferenceEngine, OpenAIInferenceEngine, AzureOpenAIInferenceEngine, LiteLLMInferenceEngine
|
|
3
|
-
from .extractors import DirectFrameExtractor, ReviewFrameExtractor, BasicFrameExtractor, BasicReviewFrameExtractor, SentenceFrameExtractor, SentenceReviewFrameExtractor, BinaryRelationExtractor, MultiClassRelationExtractor
|
|
3
|
+
from .extractors import DirectFrameExtractor, ReviewFrameExtractor, BasicFrameExtractor, BasicReviewFrameExtractor, SentenceFrameExtractor, SentenceReviewFrameExtractor, AttributeExtractor, BinaryRelationExtractor, MultiClassRelationExtractor
|
|
4
4
|
from .chunkers import UnitChunker, WholeDocumentUnitChunker, SentenceUnitChunker, TextLineUnitChunker, ContextChunker, NoContextChunker, WholeDocumentContextChunker, SlideWindowContextChunker
|
|
5
5
|
from .prompt_editor import PromptEditor
|
|
6
6
|
|
|
7
7
|
__all__ = ["LLMInformationExtractionFrame", "LLMInformationExtractionDocument",
|
|
8
8
|
"BasicLLMConfig", "Qwen3LLMConfig", "OpenAIReasoningLLMConfig", "LlamaCppInferenceEngine", "OllamaInferenceEngine", "HuggingFaceHubInferenceEngine", "OpenAIInferenceEngine", "AzureOpenAIInferenceEngine", "LiteLLMInferenceEngine",
|
|
9
|
-
"DirectFrameExtractor", "ReviewFrameExtractor", "BasicFrameExtractor", "BasicReviewFrameExtractor", "SentenceFrameExtractor", "SentenceReviewFrameExtractor", "BinaryRelationExtractor", "MultiClassRelationExtractor",
|
|
9
|
+
"DirectFrameExtractor", "ReviewFrameExtractor", "BasicFrameExtractor", "BasicReviewFrameExtractor", "SentenceFrameExtractor", "SentenceReviewFrameExtractor", "AttributeExtractor", "BinaryRelationExtractor", "MultiClassRelationExtractor",
|
|
10
10
|
"UnitChunker", "WholeDocumentUnitChunker", "SentenceUnitChunker", "TextLineUnitChunker", "ContextChunker", "NoContextChunker", "WholeDocumentContextChunker", "SlideWindowContextChunker",
|
|
11
11
|
"PromptEditor"]
|
|
@@ -0,0 +1,52 @@
|
|
|
1
|
+
Prompt Template Design:
|
|
2
|
+
|
|
3
|
+
1. Task Description:
|
|
4
|
+
Provide a detailed description of the task, including the background and the type of task (e.g., attribute extraction task).
|
|
5
|
+
|
|
6
|
+
2. Schema Definition:
|
|
7
|
+
List the attributes to extract, and provide clear definitions for each one.
|
|
8
|
+
|
|
9
|
+
3. Output Format Definition:
|
|
10
|
+
The output should be a JSON list, where each attribute is a key. The values could be any structure (e.g., str, int, List[str]).
|
|
11
|
+
|
|
12
|
+
4. Optional: Hints:
|
|
13
|
+
Provide itemized hints for the information extractors to guide the extraction process. Remind the prompted agent to be truthful. Emphasize that the prompted agent is supposed to perform the task itself instead of writing code or instructing other agents to do it.
|
|
14
|
+
|
|
15
|
+
5. Optional: Examples:
|
|
16
|
+
Include examples in the format:
|
|
17
|
+
Input: ...
|
|
18
|
+
Output: ...
|
|
19
|
+
|
|
20
|
+
6. Entity:
|
|
21
|
+
The template must include a placeholder {{frame}} for the entity.
|
|
22
|
+
|
|
23
|
+
7. Context:
|
|
24
|
+
The template must include a placeholder {{context}} for the context. Explain to the prompted agent that <Entity> tags are used to mark the entity in the context.
|
|
25
|
+
|
|
26
|
+
|
|
27
|
+
Example:
|
|
28
|
+
|
|
29
|
+
### Task description
|
|
30
|
+
This is an attribute extraction task. Given a diagnosis entity and the context, you need to generate attributes for the entity.
|
|
31
|
+
|
|
32
|
+
### Schema definition
|
|
33
|
+
"Date" which is the date when the diagnosis was made in MM/DD/YYYY format,
|
|
34
|
+
"Status" which is the current status of the diagnosis (e.g. active, resolved, etc.)
|
|
35
|
+
|
|
36
|
+
### Output format definition
|
|
37
|
+
Your output should follow the JSON format:
|
|
38
|
+
{"Date": "<MM/DD/YYYY>", "Status": "<status>"}
|
|
39
|
+
|
|
40
|
+
I am only interested in the content between []. Do not explain your answer.
|
|
41
|
+
|
|
42
|
+
### Hints
|
|
43
|
+
- If the date is not complete, use the first available date in the context. For example, if the date is 01/2023, you should return 01/01/2023.
|
|
44
|
+
- If the status is not available, you should return "not specified".
|
|
45
|
+
|
|
46
|
+
### Entity
|
|
47
|
+
Information about the entity to extract attributes from:
|
|
48
|
+
{{frame}}
|
|
49
|
+
|
|
50
|
+
### Context
|
|
51
|
+
Context for the entity. The <Entity> tags are used to mark the entity in the context.
|
|
52
|
+
{{context}}
|
llm_ie/engines.py
CHANGED
|
@@ -185,10 +185,11 @@ class Qwen3LLMConfig(LLMConfig):
|
|
|
185
185
|
|
|
186
186
|
|
|
187
187
|
class OpenAIReasoningLLMConfig(LLMConfig):
|
|
188
|
-
def __init__(self, reasoning_effort:str=
|
|
188
|
+
def __init__(self, reasoning_effort:str=None, **kwargs):
|
|
189
189
|
"""
|
|
190
190
|
The OpenAI "o" series configuration.
|
|
191
|
-
1. The reasoning effort
|
|
191
|
+
1. The reasoning effort as one of {"low", "medium", "high"}.
|
|
192
|
+
For models that do not support setting reasoning effort (e.g., o1-mini, o1-preview), set to None.
|
|
192
193
|
2. The temperature parameter is not supported and will be ignored.
|
|
193
194
|
3. The system prompt is not supported and will be concatenated to the next user prompt.
|
|
194
195
|
|
|
@@ -198,11 +199,12 @@ class OpenAIReasoningLLMConfig(LLMConfig):
|
|
|
198
199
|
the reasoning effort. Must be one of {"low", "medium", "high"}. Default is "low".
|
|
199
200
|
"""
|
|
200
201
|
super().__init__(**kwargs)
|
|
201
|
-
if reasoning_effort not
|
|
202
|
-
|
|
202
|
+
if reasoning_effort is not None:
|
|
203
|
+
if reasoning_effort not in ["low", "medium", "high"]:
|
|
204
|
+
raise ValueError("reasoning_effort must be one of {'low', 'medium', 'high'}.")
|
|
203
205
|
|
|
204
|
-
|
|
205
|
-
|
|
206
|
+
self.reasoning_effort = reasoning_effort
|
|
207
|
+
self.params["reasoning_effort"] = self.reasoning_effort
|
|
206
208
|
|
|
207
209
|
if "temperature" in self.params:
|
|
208
210
|
warnings.warn("Reasoning models do not support temperature parameter. Will be ignored.", UserWarning)
|