cocoindex 0.2.14__cp311-abi3-macosx_11_0_arm64.whl → 0.2.15__cp311-abi3-macosx_11_0_arm64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
cocoindex/__init__.py CHANGED
@@ -2,6 +2,7 @@
2
2
  Cocoindex is a framework for building and running indexing pipelines.
3
3
  """
4
4
 
5
+ from . import _engine # type: ignore
5
6
  from . import functions, sources, targets, cli, utils
6
7
 
7
8
  from . import targets as storages # Deprecated: Use targets instead
@@ -42,6 +43,8 @@ from .typing import (
42
43
  Json,
43
44
  )
44
45
 
46
+ _engine.init_pyo3_runtime()
47
+
45
48
  __all__ = [
46
49
  # Submodules
47
50
  "_engine",
cocoindex/_engine.abi3.so CHANGED
Binary file
cocoindex/functions.py CHANGED
@@ -2,13 +2,13 @@
2
2
 
3
3
  import dataclasses
4
4
  import functools
5
- from typing import Annotated, Any, Literal
5
+ from typing import Any, Literal
6
6
 
7
7
  import numpy as np
8
8
  from numpy.typing import NDArray
9
9
 
10
10
  from . import llm, op
11
- from .typing import TypeAttr, Vector
11
+ from .typing import Vector
12
12
 
13
13
 
14
14
  class ParseJson(op.FunctionSpec):
@@ -40,6 +40,24 @@ class SplitRecursively(op.FunctionSpec):
40
40
  custom_languages: list[CustomLanguageSpec] = dataclasses.field(default_factory=list)
41
41
 
42
42
 
43
+ class SplitBySeparators(op.FunctionSpec):
44
+ """
45
+ Split text by specified regex separators only.
46
+ Output schema matches SplitRecursively for drop-in compatibility:
47
+ KTable rows with fields: location (Range), text (Str), start, end.
48
+ Args:
49
+ separators_regex: list[str] # e.g., [r"\\n\\n+"]
50
+ keep_separator: Literal["NONE", "LEFT", "RIGHT"] = "NONE"
51
+ include_empty: bool = False
52
+ trim: bool = True
53
+ """
54
+
55
+ separators_regex: list[str] = dataclasses.field(default_factory=list)
56
+ keep_separator: Literal["NONE", "LEFT", "RIGHT"] = "NONE"
57
+ include_empty: bool = False
58
+ trim: bool = True
59
+
60
+
43
61
  class EmbedText(op.FunctionSpec):
44
62
  """Embed a text into a vector space."""
45
63
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: cocoindex
3
- Version: 0.2.14
3
+ Version: 0.2.15
4
4
  Classifier: Development Status :: 3 - Alpha
5
5
  Classifier: License :: OSI Approved :: Apache Software License
6
6
  Classifier: Operating System :: OS Independent
@@ -1,14 +1,14 @@
1
- cocoindex-0.2.14.dist-info/METADATA,sha256=rohqn4_9s8I4l6dxYLSTqdphN-fogyzjZNFU65w_ZiE,13316
2
- cocoindex-0.2.14.dist-info/WHEEL,sha256=cVaoL47Ex1FxzwnkO_WCjy3a1Wl6mtZbBPTvTiNCHdY,103
3
- cocoindex-0.2.14.dist-info/entry_points.txt,sha256=_NretjYVzBdNTn7dK-zgwr7YfG2afz1u1uSE-5bZXF8,46
4
- cocoindex-0.2.14.dist-info/licenses/THIRD_PARTY_NOTICES.html,sha256=3Rq0MMyXp4exsfuop4rrPxu53e48XPYvzTfvV8EBY-Y,717769
5
- cocoindex/__init__.py,sha256=DP7l1Z05oxOiBl-PmLhqs3Lh2HcGg589DrSv4KCEvio,2563
6
- cocoindex/_engine.abi3.so,sha256=f5BiPkYwefBffPViOoMqs-QNWQ0FghAvuV0nAOkGLPM,67232816
1
+ cocoindex-0.2.15.dist-info/METADATA,sha256=3u9PxzHp4NgjbknLyCtuASJeXskfIpODzlIpSyaBcSI,13316
2
+ cocoindex-0.2.15.dist-info/WHEEL,sha256=cVaoL47Ex1FxzwnkO_WCjy3a1Wl6mtZbBPTvTiNCHdY,103
3
+ cocoindex-0.2.15.dist-info/entry_points.txt,sha256=_NretjYVzBdNTn7dK-zgwr7YfG2afz1u1uSE-5bZXF8,46
4
+ cocoindex-0.2.15.dist-info/licenses/THIRD_PARTY_NOTICES.html,sha256=LV2CtczxHQ5mN6Rj9TgnBa06dAxNPXZLXc0hMbco8tU,717769
5
+ cocoindex/__init__.py,sha256=6qZWVkK4WZ01BIAg3CPh_bRRdA6Clk4d4Q6OnZ2jFa4,2630
6
+ cocoindex/_engine.abi3.so,sha256=fCnSkunJcYsjrtesJqRupKG7o9neU6pQ25vZRHVOjUU,67288912
7
7
  cocoindex/auth_registry.py,sha256=_DOIY42C79joLCY_XczHwP5uebkmSavweoAHc0L3hQY,1334
8
8
  cocoindex/cli.py,sha256=69X30bFTFdM7c0_6lgIHR19CeQ7UEkobEQYihy8IdOQ,21599
9
9
  cocoindex/convert.py,sha256=itkUBCriOk8fdauahHRqJ-L8mnHehNZsBe_FouN0K1Q,28695
10
10
  cocoindex/flow.py,sha256=Vk72dX_svfpinvsolQ11aw6YDqbzaafrAi7xrQHo1i0,39844
11
- cocoindex/functions.py,sha256=09erNt3WbzY9l1KER-akBF2O5-6xEahV2ORBECaL6yk,12260
11
+ cocoindex/functions.py,sha256=V4ljBnCprvA25XlCVvNLwK5ergXiEcKU76jkOGC-X3A,12882
12
12
  cocoindex/index.py,sha256=tz5ilvmOp0BtroGehCQDqWK_pIX9m6ghkhcxsDVU8WE,982
13
13
  cocoindex/lib.py,sha256=0XheDF7fiFdqExpdqzU-VKun_Zll6DwZ5JfTm7u42aY,2284
14
14
  cocoindex/llm.py,sha256=Pv_cdnRngTLtuLU9AUmS8izIHhcKVnuBNolC33f9BDI,851
@@ -34,4 +34,4 @@ cocoindex/typing.py,sha256=jZO3meRVL_RsFdhj8Sx6gWF-Z207VhoPtb1ZmqzAnH0,19974
34
34
  cocoindex/user_app_loader.py,sha256=bc3Af-gYRxJ9GpObtpjegZY855oQBCv5FGkrkWV2yGY,1873
35
35
  cocoindex/utils.py,sha256=hUhX-XV6XGCtJSEIpBOuDv6VvqImwPlgBxztBTw7u0U,598
36
36
  cocoindex/validation.py,sha256=PZnJoby4sLbsmPv9fOjOQXuefjfZ7gmtsiTGU8SH-tc,3090
37
- cocoindex-0.2.14.dist-info/RECORD,,
37
+ cocoindex-0.2.15.dist-info/RECORD,,
@@ -2428,7 +2428,7 @@ Software.
2428
2428
  <h3 id="Apache-2.0">Apache License 2.0</h3>
2429
2429
  <h4>Used by:</h4>
2430
2430
  <ul class="license-used-by">
2431
- <li><a href=" https://crates.io/crates/cocoindex ">cocoindex 0.2.14</a></li>
2431
+ <li><a href=" https://crates.io/crates/cocoindex ">cocoindex 0.2.15</a></li>
2432
2432
  <li><a href=" https://github.com/awesomized/crc-fast-rust ">crc-fast 1.3.0</a></li>
2433
2433
  <li><a href=" https://github.com/qdrant/rust-client ">qdrant-client 1.15.0</a></li>
2434
2434
  </ul>