visual-rag-toolkit 0.1.4__py3-none-any.whl → 0.1.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
demo/__init__.py CHANGED
@@ -7,4 +7,4 @@ A Streamlit-based UI for:
7
7
  - Interactive playground for visual search
8
8
  """
9
9
 
10
- __version__ = "0.1.4"
10
+ __version__ = "0.1.5"
visual_rag/__init__.py CHANGED
@@ -33,7 +33,7 @@ Each component works independently - use only what you need.
33
33
 
34
34
  import logging
35
35
 
36
- __version__ = "0.1.4"
36
+ __version__ = "0.1.5"
37
37
 
38
38
 
39
39
  def setup_logging(level: str = "INFO", format: str = None) -> None:
visual_rag/cli/main.py CHANGED
@@ -288,7 +288,7 @@ def cmd_search(args):
288
288
  )
289
289
 
290
290
  # Search
291
- query_np = query_embedding.detach().cpu().numpy()
291
+ query_np = query_embedding.detach().cpu().float().numpy() # .float() for BFloat16
292
292
  if args.strategy == "single_full":
293
293
  results = single_stage.search(
294
294
  query_embedding=query_np,
@@ -157,9 +157,10 @@ class MultiVectorRetriever:
157
157
  ) -> List[Dict[str, Any]]:
158
158
  q = self.embedder.embed_query(query)
159
159
  if isinstance(q, torch.Tensor):
160
- query_embedding = q.detach().cpu().numpy()
160
+ # .float() converts BFloat16 to Float32 (numpy doesn't support BFloat16)
161
+ query_embedding = q.detach().cpu().float().numpy()
161
162
  else:
162
- query_embedding = np.asarray(q)
163
+ query_embedding = np.asarray(q, dtype=np.float32)
163
164
 
164
165
  return self.search_embedded(
165
166
  query_embedding=query_embedding,
@@ -129,5 +129,5 @@ class SingleStageRetriever:
129
129
  if isinstance(embedding, torch.Tensor):
130
130
  if embedding.dtype == torch.bfloat16:
131
131
  return embedding.cpu().float().numpy()
132
- return embedding.cpu().numpy()
132
+ return embedding.cpu().float().numpy() # .float() for BFloat16 compatibility
133
133
  return np.array(embedding, dtype=np.float32)
@@ -51,7 +51,7 @@ class ThreeStageRetriever:
51
51
  if isinstance(embedding, torch.Tensor):
52
52
  if embedding.dtype == torch.bfloat16:
53
53
  return embedding.cpu().float().numpy()
54
- return embedding.cpu().numpy()
54
+ return embedding.cpu().float().numpy() # .float() for BFloat16 compatibility
55
55
  return np.array(embedding, dtype=np.float32)
56
56
 
57
57
  def _infer_vector_is_multivector(self, vector_name: str) -> bool:
@@ -418,7 +418,7 @@ class TwoStageRetriever:
418
418
  if isinstance(embedding, torch.Tensor):
419
419
  if embedding.dtype == torch.bfloat16:
420
420
  return embedding.cpu().float().numpy()
421
- return embedding.cpu().numpy()
421
+ return embedding.cpu().float().numpy() # .float() for BFloat16 compatibility
422
422
  return np.array(embedding, dtype=np.float32)
423
423
 
424
424
  def build_filter(
@@ -55,14 +55,14 @@ def generate_saliency_map(
55
55
  if hasattr(query_embedding, "numpy"):
56
56
  query_np = query_embedding.numpy()
57
57
  elif hasattr(query_embedding, "cpu"):
58
- query_np = query_embedding.cpu().numpy()
58
+ query_np = query_embedding.cpu().float().numpy() # .float() for BFloat16
59
59
  else:
60
60
  query_np = np.array(query_embedding, dtype=np.float32)
61
61
 
62
62
  if hasattr(doc_embedding, "numpy"):
63
63
  doc_np = doc_embedding.numpy()
64
64
  elif hasattr(doc_embedding, "cpu"):
65
- doc_np = doc_embedding.cpu().numpy()
65
+ doc_np = doc_embedding.cpu().float().numpy() # .float() for BFloat16
66
66
  else:
67
67
  doc_np = np.array(doc_embedding, dtype=np.float32)
68
68
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: visual-rag-toolkit
3
- Version: 0.1.4
3
+ Version: 0.1.5
4
4
  Summary: End-to-end visual document retrieval with ColPali, featuring two-stage pooling for scalable search
5
5
  Project-URL: Homepage, https://github.com/Ara-Yeroyan/visual-rag-toolkit
6
6
  Project-URL: Documentation, https://github.com/Ara-Yeroyan/visual-rag-toolkit#readme
@@ -11,7 +11,7 @@ benchmarks/vidore_tatdqa_test/dataset_loader.py,sha256=gCCneGAKWQm0WlJHLvGjoMrAb
11
11
  benchmarks/vidore_tatdqa_test/metrics.py,sha256=cLdYbRt5VcxInO1cN79ve6ZLP3kaSxRkdzRX3IbPPMs,1112
12
12
  benchmarks/vidore_tatdqa_test/run_qdrant.py,sha256=_PikeqIYpWPim-KEQOwvT-aqwYoAWASjqJVisi8PfQg,28681
13
13
  benchmarks/vidore_tatdqa_test/sweep_eval.py,sha256=d_kbyNTJ1LoFfIVnsZyiRO1nKyMqmRB5jEweZL6kYd4,12688
14
- demo/__init__.py,sha256=QtvjqZ94WpbJ915Xik5ZzYFDtK7APmsQK6m0-Sxe8uw,204
14
+ demo/__init__.py,sha256=zxRkBWe4opMZXfJxNULuktXdZLuYsZFHeaijgxPe07w,204
15
15
  demo/app.py,sha256=nZbCz1mpRK-GZTgOHyz4m4AfgKFgsH-09JwXeL3d3ng,1405
16
16
  demo/commands.py,sha256=qxRE2x610yZvcjwEfSKiR9CyFonX-vRxFqQNJCUKfyA,13690
17
17
  demo/config.py,sha256=BNkV4NSEEMIV9e6Z-cxds2v247uVmTPCgL-M5ItPzMg,757
@@ -27,12 +27,12 @@ demo/ui/header.py,sha256=J2hXr_nNyg1H9rmrd-EGx3WUl7lYo-Ca30ptgzBCfBs,806
27
27
  demo/ui/playground.py,sha256=yRlWWzJgsc596vALn5f0PHhmhtJCMmfv61nYakW75GQ,13672
28
28
  demo/ui/sidebar.py,sha256=k7CZ5V7SxwbPOL9nQTWUct5y9mPY-YnLIeBgha7aIEE,8379
29
29
  demo/ui/upload.py,sha256=NVmd1-xRj_dfgq14x_eqcN6MjDAZ3hbPBD0YRUz8OOY,20508
30
- visual_rag/__init__.py,sha256=O8I4wQdQcQxAs7_SIPxnAzUOmRv5I9ezau8sZx9yqXQ,4384
30
+ visual_rag/__init__.py,sha256=mOcAcA2rkPVA9GQ63CKFb1g3KatGqILsjfWFj4kkpus,4384
31
31
  visual_rag/config.py,sha256=qqSQk2lM5MiRji-6xQNGS2gSiXA4NgyJnCbgGx7uGJQ,7395
32
32
  visual_rag/demo_runner.py,sha256=ahIKYhHQSLOF_kWbj0u_29SLX4qTdyxb3Smt_cMMfzI,2763
33
33
  visual_rag/qdrant_admin.py,sha256=NNczko2S5-K3qATNUxgYn51hNWgWb6boheL7vlCQGpM,7055
34
34
  visual_rag/cli/__init__.py,sha256=WgBRXm0VACfLltvVlLcSs3FTM1uQ7Uuw3CVD4-zWZwc,46
35
- visual_rag/cli/main.py,sha256=QmpnQ0lbC6Q9lwxaSCDh6paEEzI78IPY1jwc3_9y7VI,21083
35
+ visual_rag/cli/main.py,sha256=lw2xS96FtdzFnftModGcqRyJYlxFWA0U3aE3C247mBk,21116
36
36
  visual_rag/embedding/__init__.py,sha256=7QIENmxwRnwnUzsYKRY3VQTyF3HJkRiL1D7Au9XHF0w,682
37
37
  visual_rag/embedding/pooling.py,sha256=x8uY4VHbxEnsJRM2JeOkzPHDiwOkbi5NK4XW21U1hAc,11401
38
38
  visual_rag/embedding/visual_embedder.py,sha256=he9JpVHmo_szOiXCwtJdrCseGmf2y5Gi0UEFjwazzVY,23198
@@ -44,14 +44,14 @@ visual_rag/indexing/qdrant_indexer.py,sha256=E9uDwOL3A1nFJhFhJcI8V3JR8FL7nDahEYi
44
44
  visual_rag/preprocessing/__init__.py,sha256=rCzfBO0jaVKp6MpPRRused_4gasHfobAbG-139Y806E,121
45
45
  visual_rag/preprocessing/crop_empty.py,sha256=iHXITFkRlF40VPJ4k9d432RUAi_89BhAEvK4wOEn96Q,5211
46
46
  visual_rag/retrieval/__init__.py,sha256=J9pnbeB83Fqs9n4g3GcIp1VR9dnuyAlcsIDVsf0lSb8,601
47
- visual_rag/retrieval/multi_vector.py,sha256=KyJg1VAxODr5rY80vXmsjSD9ueRpay4QGCJizPKiiBw,7008
48
- visual_rag/retrieval/single_stage.py,sha256=Ba06V-KRSFSZm0xzbjFR3EBEWaQkDo7U_pWNx25W8H0,4425
49
- visual_rag/retrieval/three_stage.py,sha256=YC0CVEohxTT5zhilcQHI7nYAk08E5jC3zkQ3-rNdLMw,5951
50
- visual_rag/retrieval/two_stage.py,sha256=eUbyvdf0-3f0qIiAdU6Wmlos5hGrGNyXjuvc2-Be41M,16775
47
+ visual_rag/retrieval/multi_vector.py,sha256=oQowl-Yv4cYDj2jroX1nv_uZl8sb0d5VKMmwxL-GlBA,7119
48
+ visual_rag/retrieval/single_stage.py,sha256=-hljRha6kWZAr1IQJVSii4pqiIqk0cHhW68bUyYK41o,4472
49
+ visual_rag/retrieval/three_stage.py,sha256=UDjH92V6ILV_w4bOeN0vCF3SdXYHMml9oN2gl3kfwWk,5998
50
+ visual_rag/retrieval/two_stage.py,sha256=OTTH-MYtwK45RHYMF1esEeciXMTU8h7AQzH68BZVrYE,16822
51
51
  visual_rag/visualization/__init__.py,sha256=SITKNvBEseDp7F3K6UzLPA-6OQFqYfY5azS5nlDdihQ,447
52
- visual_rag/visualization/saliency.py,sha256=F3Plc18Sf3tzWcyncuaruTmENm1IfW5j9NFGEQR93cY,11248
53
- visual_rag_toolkit-0.1.4.dist-info/METADATA,sha256=2nnhqsq3P_OG8GRk48sz569VB1I-aaKcOjKXYl-OvJo,13460
54
- visual_rag_toolkit-0.1.4.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
55
- visual_rag_toolkit-0.1.4.dist-info/entry_points.txt,sha256=6Tob1GPg_ILGELjYTPsAnNMZ1W0NS939nfI7xyW2DIY,102
56
- visual_rag_toolkit-0.1.4.dist-info/licenses/LICENSE,sha256=hEg_weKnHXJakQRR3sw2ygcZ101zCI00zMhBOPb3yfA,1069
57
- visual_rag_toolkit-0.1.4.dist-info/RECORD,,
52
+ visual_rag/visualization/saliency.py,sha256=RuVcF1cPrmzdwfigqhP-e1aqzMr817F64aYucbwT79g,11314
53
+ visual_rag_toolkit-0.1.5.dist-info/METADATA,sha256=66Z99JyOGp5QVb2eJR7U2zjF8Qd6nvRJanhezrbZ-3o,13460
54
+ visual_rag_toolkit-0.1.5.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
55
+ visual_rag_toolkit-0.1.5.dist-info/entry_points.txt,sha256=6Tob1GPg_ILGELjYTPsAnNMZ1W0NS939nfI7xyW2DIY,102
56
+ visual_rag_toolkit-0.1.5.dist-info/licenses/LICENSE,sha256=hEg_weKnHXJakQRR3sw2ygcZ101zCI00zMhBOPb3yfA,1069
57
+ visual_rag_toolkit-0.1.5.dist-info/RECORD,,