wizit-context-ingestor 0.3.0b6__tar.gz → 0.3.0b8__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of wizit-context-ingestor might be problematic. Click here for more details.

Files changed (44)
  1. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/PKG-INFO +1 -1
  2. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/pyproject.toml +1 -1
  3. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/data/prompts.py +2 -4
  4. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/infra/rag/semantic_chunks.py +0 -2
  5. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/README.md +0 -0
  6. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/.DS_Store +0 -0
  7. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/__init__.py +0 -0
  8. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/application/__init__.py +0 -0
  9. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/application/context_chunk_service.py +0 -0
  10. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/application/interfaces.py +0 -0
  11. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/application/transcription_service.py +0 -0
  12. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/data/__init__.py +0 -0
  13. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/data/kdb.py +0 -0
  14. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/data/storage.py +0 -0
  15. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/domain/__init__.py +0 -0
  16. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/domain/models.py +0 -0
  17. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/domain/services.py +0 -0
  18. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/infra/__init__.py +0 -0
  19. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/infra/aws_model.py +0 -0
  20. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/infra/persistence/__init__.py +0 -0
  21. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/infra/persistence/local_storage.py +0 -0
  22. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/infra/persistence/s3_storage.py +0 -0
  23. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/infra/rag/chroma_embeddings.py +0 -0
  24. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/infra/rag/pg_embeddings.py +0 -0
  25. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/infra/rag/redis_embeddings.py +0 -0
  26. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/infra/secrets/__init__.py +0 -0
  27. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/infra/secrets/aws_secrets_manager.py +0 -0
  28. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/infra/vertex_model.py +0 -0
  29. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/main.py +0 -0
  30. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/services/.DS_Store +0 -0
  31. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/services/__init__.py +0 -0
  32. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/services/chunks.py +0 -0
  33. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/services/parse_doc.py +0 -0
  34. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/services/pg_embeddings_manager.py +0 -0
  35. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/utils/file_utils.py +0 -0
  36. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/workflows/context_nodes.py +0 -0
  37. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/workflows/context_state.py +0 -0
  38. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/workflows/context_tools.py +0 -0
  39. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/workflows/context_workflow.py +0 -0
  40. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/workflows/transcription_nodes.py +0 -0
  41. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/workflows/transcription_schemas.py +0 -0
  42. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/workflows/transcription_state.py +0 -0
  43. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/workflows/transcription_tools.py +0 -0
  44. {wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/workflows/transcription_workflow.py +0 -0
{wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/PKG-INFO
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: wizit-context-ingestor
3
- Version: 0.3.0b6
3
+ Version: 0.3.0b8
4
4
  Summary: Contextual Rag with Cloud Solutions
5
5
  Requires-Dist: anthropic[vertex]>=0.66.0
6
6
  Requires-Dist: boto3>=1.40.23
{wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/pyproject.toml
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "wizit_context_ingestor"
3
- version = "0.3.0-beta-6"
3
+ version = "0.3.0-beta-8"
4
4
  description = "Contextual Rag with Cloud Solutions"
5
5
  readme = "README.md"
6
6
  requires-python = ">=3.12"
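{wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/data/prompts.py
@@ -227,7 +227,7 @@ Generate the optimized context following these specifications: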
227
227
 
228
228
  WORKFLOW_CONTEXT_CHUNKS_IN_DOCUMENT_SYSTEM_PROMPT = """
229
229
  You are an expert RAG (Retrieval-Augmented Generation) context generator that creates optimized contextual chunks from markdown document content for enhanced search and retrieval performance.
230
- OBJECTIVE: Generate rich, searchable context descriptions that maximize retrieval accuracy and relevance in RAG systems.
230
+ OBJECTIVE: Generate concise, searchable context descriptions that maximize retrieval accuracy and relevance in RAG systems.
231
231
  WORKFLOW:
232
232
  <task_analysis>
233
233
  1. LANGUAGE DETECTION: Identify the primary language used in the document content
@@ -243,10 +243,7 @@ Your generated context must synthesize ALL of these elements into a coherent des
243
243
  - chunk_keywords: Primary and secondary keywords, technical terms, and searchable phrases that would help users find this content
244
244
  - chunk_description: Clear explanation of what the chunk contains, including data types, concepts, and information presented
245
245
  - chunk_function: The chunk's specific purpose and role (e.g., definition, explanation, example, instruction, procedure, list, summary, analysis, conclusion)
246
- - chunk_structure: Format and organizational pattern (paragraph, bulleted list, numbered steps, table, code block, heading, etc.)
247
- - chunk_main_idea: The central concept, message, or takeaway that the chunk communicates
248
246
  - chunk_domain: Subject area or field of knowledge (e.g., technical documentation, legal text, medical information, business process)
249
- - chunk_audience: Intended reader level and background (e.g., beginner, expert, general audience, specific role)
250
247
  </context_elements>
251
248
  CRITICAL RULES:
252
249
  <critical_rules>
@@ -258,6 +255,7 @@ CRITICAL RULES:
258
255
  - Do NOT reproduce or quote the original chunk content verbatim
259
256
  - Ensure context is self-contained and understandable without the original chunk
260
257
  - Use natural language that flows well while incorporating all required elements
258
+ - Do not generate extensive contexts, two sentences or less is required, ensure concise and succinct context.
261
259
  </critical_rules>
262
260
 
263
261
  SEARCH OPTIMIZATION GUIDELINES:
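{wizit_context_ingestor-0.3.0b6 → wizit_context_ingestor-0.3.0b8}/src/wizit_context_ingestor/infra/rag/semantic_chunks.py
@@ -1,5 +1,3 @@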
1
- from posix import fork
2
-
3
1
  # check this documentation
4
2
  # https://python.langchain.com/docs/how_to/semantic-chunker/
5
3
  # https://github.com/FullStackRetrieval-com/RetrievalTutorials/blob/main/tutorials/LevelsOfTextSplitting/5_Levels_Of_Text_Splitting.ipynb