PyPI - llm-ie - Versions diffs - 0.3.3__py3-none-any.whl → 0.3.4__py3-none-any.whl - Mend

llm-ie 0.3.3__py3-none-any.whl → 0.3.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (4) hide show

llm_ie/extractors.py CHANGED Viewed

@@ -181,19 +181,22 @@ class FrameExtractor(Extractor):
         Returns : Tuple[Tuple[int, int], float]
             a tuple of 2-tuple span and Jaccard score.
         """
+        if not text or not pattern:
+            return None, 0
         text_tokens, text_spans = self._get_word_tokens(text)
         pattern_tokens, _ = self._get_word_tokens(pattern)
         pattern_tokens_set = set(pattern_tokens)
         window_size = len(pattern_tokens)
-        window_size_min = int(window_size * (1 - buffer_size))
-        window_size_max = int(window_size * (1 + buffer_size))
+        window_size_min = max(1, int(window_size * (1 - buffer_size)))
+        window_size_max = int(window_size * (1 + buffer_size)) + 1
         closest_substring_span = None
         best_score = 0
         for i in range(len(text_tokens) - window_size_max):
             for w in range(window_size_min, window_size_max):
                 sub_str_tokens = text_tokens[i:i + w]
-                if sub_str_tokens[0] == pattern_tokens[0]:
+                if len(sub_str_tokens) > 0 and sub_str_tokens[0] == pattern_tokens[0]:
                     score = self._jaccard_score(set(sub_str_tokens), pattern_tokens_set)
                     if score > best_score:
                         best_score = score
@@ -238,7 +241,7 @@ class FrameExtractor(Extractor):
             # Exact match
             match = re.search(re.escape(entity), text)
-            if match:
+            if match and entity:
                 start, end = match.span()
                 entity_spans.append((start, end))
                 # Replace the found entity with spaces to avoid finding the same instance again
@@ -246,7 +249,7 @@ class FrameExtractor(Extractor):
             # Fuzzy match
             elif fuzzy_match:
                 closest_substring_span, best_score = self._get_closest_substring(text, entity, buffer_size=fuzzy_buffer_size)
-                if best_score >= fuzzy_score_cutoff and closest_substring_span:
+                if closest_substring_span and best_score >= fuzzy_score_cutoff:
                     entity_spans.append(closest_substring_span)
                     # Replace the found entity with spaces to avoid finding the same instance again
                     text = text[:closest_substring_span[0]] + ' ' * (closest_substring_span[1] - closest_substring_span[0]) + text[closest_substring_span[1]:]

{llm_ie-0.3.3.dist-info → llm_ie-0.3.4.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: llm-ie
-Version: 0.3.3
+Version: 0.3.4
 Summary: An LLM-powered tool that transforms everyday language into robust information extraction pipelines.
 License: MIT
 Author: Enshuo (David) Hsu

{llm_ie-0.3.3.dist-info → llm_ie-0.3.4.dist-info}/RECORD RENAMED Viewed

@@ -16,8 +16,8 @@ llm_ie/asset/prompt_guide/SentenceFrameExtractor_prompt_guide.txt,sha256=oKH_QeD
 llm_ie/asset/prompt_guide/SentenceReviewFrameExtractor_prompt_guide.txt,sha256=oKH_QeDgpw771ZdHk3L7DYz2Jvfm7OolUoTiJyMJI30,9541
 llm_ie/data_types.py,sha256=hPz3WOeAzfn2QKmb0CxHmRdQWZQ4G9zq8U-RJBVFdYk,14329
 llm_ie/engines.py,sha256=PTYs7s_iCPmI-yFUCVCPY_cMGS77ma2VGoz4rdNkODI,9308
-llm_ie/extractors.py,sha256=yBdIcevjMfwto85Jb0KkRMN-AjIMk92fD5yWB3Qm8MY,64408
+llm_ie/extractors.py,sha256=j9L9USybJBmYZM4RAjGO6DR4StYBgzhqCN6nEFZZQVQ,64523
 llm_ie/prompt_editor.py,sha256=Xc5ZHsEnM8-YYITokIsM6BVsf2Ec_8ajJDaldPf-P8U,8577
-llm_ie-0.3.3.dist-info/METADATA,sha256=CeTsMNtWhEWCvOqHWSXu0KqOgDp3kMwN2WtBF4N-4zE,41266
-llm_ie-0.3.3.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
-llm_ie-0.3.3.dist-info/RECORD,,
+llm_ie-0.3.4.dist-info/METADATA,sha256=-5Tf9TCWczCVOsdMavkBZ-KnYPGnbNrV1rsU-pMHfPA,41266
+llm_ie-0.3.4.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
+llm_ie-0.3.4.dist-info/RECORD,,

{llm_ie-0.3.3.dist-info → llm_ie-0.3.4.dist-info}/WHEEL RENAMED Viewed

File without changes

llm-ie 0.3.3__py3-none-any.whl → 0.3.4__py3-none-any.whl

llm-ie 0.3.3__py3-none-any.whl → 0.3.4__py3-none-any.whl