ragbandit-core 0.1.1__tar.gz → 0.1.2__tar.gz

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (43)
  1. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/PKG-INFO +1 -1
  2. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/pyproject.toml +1 -1
  3. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/chunkers/semantic_chunker.py +3 -3
  4. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit_core.egg-info/PKG-INFO +1 -1
  5. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/LICENSE.md +0 -0
  6. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/README.md +0 -0
  7. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/setup.cfg +0 -0
  8. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/__init__.py +0 -0
  9. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/config/__init__.py +0 -0
  10. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/config/llms.py +0 -0
  11. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/config/pricing.py +0 -0
  12. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/__init__.py +0 -0
  13. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/chunkers/__init__.py +0 -0
  14. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/chunkers/base_chunker.py +0 -0
  15. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/chunkers/fixed_size_chunker.py +0 -0
  16. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/document_pipeline.py +0 -0
  17. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/embedders/__init__.py +0 -0
  18. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/embedders/base_embedder.py +0 -0
  19. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/embedders/mistral_embedder.py +0 -0
  20. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/ocr/__init__.py +0 -0
  21. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/ocr/base_ocr.py +0 -0
  22. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/ocr/mistral_ocr.py +0 -0
  23. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/processors/__init__.py +0 -0
  24. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/processors/base_processor.py +0 -0
  25. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/processors/footnotes_processor.py +0 -0
  26. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/processors/references_processor.py +0 -0
  27. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/utils/__init__.py +0 -0
  28. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/documents/utils/secure_file_handler.py +0 -0
  29. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/prompt_tools/__init__.py +0 -0
  30. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/prompt_tools/footnotes_processor_tools.py +0 -0
  31. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/prompt_tools/prompt_tool.py +0 -0
  32. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/prompt_tools/references_processor_tools.py +0 -0
  33. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/prompt_tools/semantic_chunker_tools.py +0 -0
  34. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/schema.py +0 -0
  35. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/utils/__init__.py +0 -0
  36. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/utils/in_memory_log_handler.py +0 -0
  37. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/utils/llm_utils.py +0 -0
  38. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/utils/mistral_client.py +0 -0
  39. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit/utils/token_usage_tracker.py +0 -0
  40. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit_core.egg-info/SOURCES.txt +0 -0
  41. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit_core.egg-info/dependency_links.txt +0 -0
  42. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit_core.egg-info/requires.txt +0 -0
  43. {ragbandit_core-0.1.1 → ragbandit_core-0.1.2}/src/ragbandit_core.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: ragbandit-core
3
- Version: 0.1.1
3
+ Version: 0.1.2
4
4
  Summary: Core utilities for document processing, RAG configuration, querying, and evaluation.
5
5
  Author-email: Martim Chaves <martim@ragbandit.com>
6
6
  License: MIT
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "ragbandit-core"
7
- version = "0.1.1"
7
+ version = "0.1.2"
8
8
  description = "Core utilities for document processing, RAG configuration, querying, and evaluation."
9
9
  authors = [
10
10
  { name="Martim Chaves", email="martim@ragbandit.com" }
@@ -99,9 +99,9 @@ class SemanticChunker(BaseChunker):
99
99
  ]
100
100
  idx = full_text.find(current_break_lead)
101
101
 
102
- if idx == -1:
103
- # If we still can't find the snippet after
104
- # trying shorter versions,
102
+ if idx == -1 or idx == 0:
103
+ # If we can't find the snippet, or if the break is at
104
+ # the very start (idx == 0 would create an empty chunk),
105
105
  # fallback: chunk everything as is
106
106
  meta = ChunkMetadata(page_index=i, images=[], extra={})
107
107
  chunks.append(Chunk(text=full_text, metadata=meta))
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: ragbandit-core
3
- Version: 0.1.1
3
+ Version: 0.1.2
4
4
  Summary: Core utilities for document processing, RAG configuration, querying, and evaluation.
5
5
  Author-email: Martim Chaves <martim@ragbandit.com>
6
6
  License: MIT
File without changes
File without changes