wizit-context-ingestor 0.3.0b4__tar.gz → 0.3.0b5__tar.gz

This diff compares the contents of two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Potentially problematic release.


This version of wizit-context-ingestor might be problematic. Click here for more details.

Files changed (44)
  1. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/PKG-INFO +1 -1
  2. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/pyproject.toml +1 -1
  3. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/application/transcription_service.py +6 -3
  4. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/README.md +0 -0
  5. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/.DS_Store +0 -0
  6. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/__init__.py +0 -0
  7. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/application/__init__.py +0 -0
  8. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/application/context_chunk_service.py +0 -0
  9. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/application/interfaces.py +0 -0
  10. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/data/__init__.py +0 -0
  11. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/data/kdb.py +0 -0
  12. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/data/prompts.py +0 -0
  13. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/data/storage.py +0 -0
  14. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/domain/__init__.py +0 -0
  15. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/domain/models.py +0 -0
  16. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/domain/services.py +0 -0
  17. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/infra/__init__.py +0 -0
  18. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/infra/aws_model.py +0 -0
  19. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/infra/persistence/__init__.py +0 -0
  20. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/infra/persistence/local_storage.py +0 -0
  21. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/infra/persistence/s3_storage.py +0 -0
  22. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/infra/rag/chroma_embeddings.py +0 -0
  23. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/infra/rag/pg_embeddings.py +0 -0
  24. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/infra/rag/redis_embeddings.py +0 -0
  25. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/infra/rag/semantic_chunks.py +0 -0
  26. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/infra/secrets/__init__.py +0 -0
  27. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/infra/secrets/aws_secrets_manager.py +0 -0
  28. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/infra/vertex_model.py +0 -0
  29. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/main.py +0 -0
  30. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/services/.DS_Store +0 -0
  31. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/services/__init__.py +0 -0
  32. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/services/chunks.py +0 -0
  33. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/services/parse_doc.py +0 -0
  34. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/services/pg_embeddings_manager.py +0 -0
  35. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/utils/file_utils.py +0 -0
  36. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/workflows/context_nodes.py +0 -0
  37. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/workflows/context_state.py +0 -0
  38. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/workflows/context_tools.py +0 -0
  39. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/workflows/context_workflow.py +0 -0
  40. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/workflows/transcription_nodes.py +0 -0
  41. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/workflows/transcription_schemas.py +0 -0
  42. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/workflows/transcription_state.py +0 -0
  43. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/workflows/transcription_tools.py +0 -0
  44. {wizit_context_ingestor-0.3.0b4 → wizit_context_ingestor-0.3.0b5}/src/wizit_context_ingestor/workflows/transcription_workflow.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: wizit-context-ingestor
3
- Version: 0.3.0b4
3
+ Version: 0.3.0b5
4
4
  Summary: Contextual Rag with Cloud Solutions
5
5
  Requires-Dist: anthropic[vertex]>=0.66.0
6
6
  Requires-Dist: boto3>=1.40.23
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "wizit_context_ingestor"
3
- version = "0.3.0-beta-4"
3
+ version = "0.3.0-beta-5"
4
4
  description = "Contextual Rag with Cloud Solutions"
5
5
  readme = "README.md"
6
6
  requires-python = ">=3.12"
@@ -112,7 +112,7 @@ class TranscriptionService:
112
112
  # raise
113
113
 
114
114
  async def parse_doc_page_with_workflow(
115
- self, document: ParsedDocPage
115
+ self, document: ParsedDocPage, retries: int = 0
116
116
  ) -> ParsedDocPage:
117
117
  """Transcribe an image to text using an agent.
118
118
  Args:
@@ -120,6 +120,9 @@ class TranscriptionService:
120
120
  Returns:
121
121
  Processed text
122
122
  """
123
+ if retries > 1:
124
+ logger.info("Max retries exceeded")
125
+ return document
123
126
  result = await self.compiled_transcription_workflow.ainvoke(
124
127
  {
125
128
  "messages": [
@@ -150,10 +153,10 @@ class TranscriptionService:
150
153
  }
151
154
  },
152
155
  )
153
- if result["transcription"]:
156
+ if "transcription" in result:
154
157
  document.page_text = result["transcription"]
155
158
  else:
156
- raise ValueError(f"No transcription found: {result} ")
159
+ await self.parse_doc_page_with_workflow(document, retries=retries + 1)
157
160
  return document
158
161
 
159
162
  # def process_document(self, file_key: str) -> Tuple[List[ParsedDocPage], ParsedDoc]: