visual-rag-toolkit 0.1.4__py3-none-any.whl → 0.1.5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- demo/__init__.py +1 -1
- visual_rag/__init__.py +1 -1
- visual_rag/cli/main.py +1 -1
- visual_rag/retrieval/multi_vector.py +3 -2
- visual_rag/retrieval/single_stage.py +1 -1
- visual_rag/retrieval/three_stage.py +1 -1
- visual_rag/retrieval/two_stage.py +1 -1
- visual_rag/visualization/saliency.py +2 -2
- {visual_rag_toolkit-0.1.4.dist-info → visual_rag_toolkit-0.1.5.dist-info}/METADATA +1 -1
- {visual_rag_toolkit-0.1.4.dist-info → visual_rag_toolkit-0.1.5.dist-info}/RECORD +13 -13
- {visual_rag_toolkit-0.1.4.dist-info → visual_rag_toolkit-0.1.5.dist-info}/WHEEL +0 -0
- {visual_rag_toolkit-0.1.4.dist-info → visual_rag_toolkit-0.1.5.dist-info}/entry_points.txt +0 -0
- {visual_rag_toolkit-0.1.4.dist-info → visual_rag_toolkit-0.1.5.dist-info}/licenses/LICENSE +0 -0
demo/__init__.py
CHANGED
visual_rag/__init__.py
CHANGED
visual_rag/cli/main.py
CHANGED
|
@@ -288,7 +288,7 @@ def cmd_search(args):
|
|
|
288
288
|
)
|
|
289
289
|
|
|
290
290
|
# Search
|
|
291
|
-
query_np = query_embedding.detach().cpu().numpy()
|
|
291
|
+
query_np = query_embedding.detach().cpu().float().numpy() # .float() for BFloat16
|
|
292
292
|
if args.strategy == "single_full":
|
|
293
293
|
results = single_stage.search(
|
|
294
294
|
query_embedding=query_np,
|
|
@@ -157,9 +157,10 @@ class MultiVectorRetriever:
|
|
|
157
157
|
) -> List[Dict[str, Any]]:
|
|
158
158
|
q = self.embedder.embed_query(query)
|
|
159
159
|
if isinstance(q, torch.Tensor):
|
|
160
|
-
|
|
160
|
+
# .float() converts BFloat16 to Float32 (numpy doesn't support BFloat16)
|
|
161
|
+
query_embedding = q.detach().cpu().float().numpy()
|
|
161
162
|
else:
|
|
162
|
-
query_embedding = np.asarray(q)
|
|
163
|
+
query_embedding = np.asarray(q, dtype=np.float32)
|
|
163
164
|
|
|
164
165
|
return self.search_embedded(
|
|
165
166
|
query_embedding=query_embedding,
|
|
@@ -129,5 +129,5 @@ class SingleStageRetriever:
|
|
|
129
129
|
if isinstance(embedding, torch.Tensor):
|
|
130
130
|
if embedding.dtype == torch.bfloat16:
|
|
131
131
|
return embedding.cpu().float().numpy()
|
|
132
|
-
return embedding.cpu().numpy()
|
|
132
|
+
return embedding.cpu().float().numpy() # .float() for BFloat16 compatibility
|
|
133
133
|
return np.array(embedding, dtype=np.float32)
|
|
@@ -51,7 +51,7 @@ class ThreeStageRetriever:
|
|
|
51
51
|
if isinstance(embedding, torch.Tensor):
|
|
52
52
|
if embedding.dtype == torch.bfloat16:
|
|
53
53
|
return embedding.cpu().float().numpy()
|
|
54
|
-
return embedding.cpu().numpy()
|
|
54
|
+
return embedding.cpu().float().numpy() # .float() for BFloat16 compatibility
|
|
55
55
|
return np.array(embedding, dtype=np.float32)
|
|
56
56
|
|
|
57
57
|
def _infer_vector_is_multivector(self, vector_name: str) -> bool:
|
|
@@ -418,7 +418,7 @@ class TwoStageRetriever:
|
|
|
418
418
|
if isinstance(embedding, torch.Tensor):
|
|
419
419
|
if embedding.dtype == torch.bfloat16:
|
|
420
420
|
return embedding.cpu().float().numpy()
|
|
421
|
-
return embedding.cpu().numpy()
|
|
421
|
+
return embedding.cpu().float().numpy() # .float() for BFloat16 compatibility
|
|
422
422
|
return np.array(embedding, dtype=np.float32)
|
|
423
423
|
|
|
424
424
|
def build_filter(
|
|
@@ -55,14 +55,14 @@ def generate_saliency_map(
|
|
|
55
55
|
if hasattr(query_embedding, "numpy"):
|
|
56
56
|
query_np = query_embedding.numpy()
|
|
57
57
|
elif hasattr(query_embedding, "cpu"):
|
|
58
|
-
query_np = query_embedding.cpu().numpy()
|
|
58
|
+
query_np = query_embedding.cpu().float().numpy() # .float() for BFloat16
|
|
59
59
|
else:
|
|
60
60
|
query_np = np.array(query_embedding, dtype=np.float32)
|
|
61
61
|
|
|
62
62
|
if hasattr(doc_embedding, "numpy"):
|
|
63
63
|
doc_np = doc_embedding.numpy()
|
|
64
64
|
elif hasattr(doc_embedding, "cpu"):
|
|
65
|
-
doc_np = doc_embedding.cpu().numpy()
|
|
65
|
+
doc_np = doc_embedding.cpu().float().numpy() # .float() for BFloat16
|
|
66
66
|
else:
|
|
67
67
|
doc_np = np.array(doc_embedding, dtype=np.float32)
|
|
68
68
|
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: visual-rag-toolkit
|
|
3
|
-
Version: 0.1.4
|
|
3
|
+
Version: 0.1.5
|
|
4
4
|
Summary: End-to-end visual document retrieval with ColPali, featuring two-stage pooling for scalable search
|
|
5
5
|
Project-URL: Homepage, https://github.com/Ara-Yeroyan/visual-rag-toolkit
|
|
6
6
|
Project-URL: Documentation, https://github.com/Ara-Yeroyan/visual-rag-toolkit#readme
|
|
@@ -11,7 +11,7 @@ benchmarks/vidore_tatdqa_test/dataset_loader.py,sha256=gCCneGAKWQm0WlJHLvGjoMrAb
|
|
|
11
11
|
benchmarks/vidore_tatdqa_test/metrics.py,sha256=cLdYbRt5VcxInO1cN79ve6ZLP3kaSxRkdzRX3IbPPMs,1112
|
|
12
12
|
benchmarks/vidore_tatdqa_test/run_qdrant.py,sha256=_PikeqIYpWPim-KEQOwvT-aqwYoAWASjqJVisi8PfQg,28681
|
|
13
13
|
benchmarks/vidore_tatdqa_test/sweep_eval.py,sha256=d_kbyNTJ1LoFfIVnsZyiRO1nKyMqmRB5jEweZL6kYd4,12688
|
|
14
|
-
demo/__init__.py,sha256=
|
|
14
|
+
demo/__init__.py,sha256=zxRkBWe4opMZXfJxNULuktXdZLuYsZFHeaijgxPe07w,204
|
|
15
15
|
demo/app.py,sha256=nZbCz1mpRK-GZTgOHyz4m4AfgKFgsH-09JwXeL3d3ng,1405
|
|
16
16
|
demo/commands.py,sha256=qxRE2x610yZvcjwEfSKiR9CyFonX-vRxFqQNJCUKfyA,13690
|
|
17
17
|
demo/config.py,sha256=BNkV4NSEEMIV9e6Z-cxds2v247uVmTPCgL-M5ItPzMg,757
|
|
@@ -27,12 +27,12 @@ demo/ui/header.py,sha256=J2hXr_nNyg1H9rmrd-EGx3WUl7lYo-Ca30ptgzBCfBs,806
|
|
|
27
27
|
demo/ui/playground.py,sha256=yRlWWzJgsc596vALn5f0PHhmhtJCMmfv61nYakW75GQ,13672
|
|
28
28
|
demo/ui/sidebar.py,sha256=k7CZ5V7SxwbPOL9nQTWUct5y9mPY-YnLIeBgha7aIEE,8379
|
|
29
29
|
demo/ui/upload.py,sha256=NVmd1-xRj_dfgq14x_eqcN6MjDAZ3hbPBD0YRUz8OOY,20508
|
|
30
|
-
visual_rag/__init__.py,sha256=
|
|
30
|
+
visual_rag/__init__.py,sha256=mOcAcA2rkPVA9GQ63CKFb1g3KatGqILsjfWFj4kkpus,4384
|
|
31
31
|
visual_rag/config.py,sha256=qqSQk2lM5MiRji-6xQNGS2gSiXA4NgyJnCbgGx7uGJQ,7395
|
|
32
32
|
visual_rag/demo_runner.py,sha256=ahIKYhHQSLOF_kWbj0u_29SLX4qTdyxb3Smt_cMMfzI,2763
|
|
33
33
|
visual_rag/qdrant_admin.py,sha256=NNczko2S5-K3qATNUxgYn51hNWgWb6boheL7vlCQGpM,7055
|
|
34
34
|
visual_rag/cli/__init__.py,sha256=WgBRXm0VACfLltvVlLcSs3FTM1uQ7Uuw3CVD4-zWZwc,46
|
|
35
|
-
visual_rag/cli/main.py,sha256=
|
|
35
|
+
visual_rag/cli/main.py,sha256=lw2xS96FtdzFnftModGcqRyJYlxFWA0U3aE3C247mBk,21116
|
|
36
36
|
visual_rag/embedding/__init__.py,sha256=7QIENmxwRnwnUzsYKRY3VQTyF3HJkRiL1D7Au9XHF0w,682
|
|
37
37
|
visual_rag/embedding/pooling.py,sha256=x8uY4VHbxEnsJRM2JeOkzPHDiwOkbi5NK4XW21U1hAc,11401
|
|
38
38
|
visual_rag/embedding/visual_embedder.py,sha256=he9JpVHmo_szOiXCwtJdrCseGmf2y5Gi0UEFjwazzVY,23198
|
|
@@ -44,14 +44,14 @@ visual_rag/indexing/qdrant_indexer.py,sha256=E9uDwOL3A1nFJhFhJcI8V3JR8FL7nDahEYi
|
|
|
44
44
|
visual_rag/preprocessing/__init__.py,sha256=rCzfBO0jaVKp6MpPRRused_4gasHfobAbG-139Y806E,121
|
|
45
45
|
visual_rag/preprocessing/crop_empty.py,sha256=iHXITFkRlF40VPJ4k9d432RUAi_89BhAEvK4wOEn96Q,5211
|
|
46
46
|
visual_rag/retrieval/__init__.py,sha256=J9pnbeB83Fqs9n4g3GcIp1VR9dnuyAlcsIDVsf0lSb8,601
|
|
47
|
-
visual_rag/retrieval/multi_vector.py,sha256=
|
|
48
|
-
visual_rag/retrieval/single_stage.py,sha256
|
|
49
|
-
visual_rag/retrieval/three_stage.py,sha256=
|
|
50
|
-
visual_rag/retrieval/two_stage.py,sha256=
|
|
47
|
+
visual_rag/retrieval/multi_vector.py,sha256=oQowl-Yv4cYDj2jroX1nv_uZl8sb0d5VKMmwxL-GlBA,7119
|
|
48
|
+
visual_rag/retrieval/single_stage.py,sha256=-hljRha6kWZAr1IQJVSii4pqiIqk0cHhW68bUyYK41o,4472
|
|
49
|
+
visual_rag/retrieval/three_stage.py,sha256=UDjH92V6ILV_w4bOeN0vCF3SdXYHMml9oN2gl3kfwWk,5998
|
|
50
|
+
visual_rag/retrieval/two_stage.py,sha256=OTTH-MYtwK45RHYMF1esEeciXMTU8h7AQzH68BZVrYE,16822
|
|
51
51
|
visual_rag/visualization/__init__.py,sha256=SITKNvBEseDp7F3K6UzLPA-6OQFqYfY5azS5nlDdihQ,447
|
|
52
|
-
visual_rag/visualization/saliency.py,sha256=
|
|
53
|
-
visual_rag_toolkit-0.1.
|
|
54
|
-
visual_rag_toolkit-0.1.4.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
|
|
55
|
-
visual_rag_toolkit-0.1.4.dist-info/entry_points.txt,sha256=6Tob1GPg_ILGELjYTPsAnNMZ1W0NS939nfI7xyW2DIY,102
|
|
56
|
-
visual_rag_toolkit-0.1.4.dist-info/licenses/LICENSE,sha256=hEg_weKnHXJakQRR3sw2ygcZ101zCI00zMhBOPb3yfA,1069
|
|
57
|
-
visual_rag_toolkit-0.1.4.dist-info/RECORD,,
|
|
52
|
+
visual_rag/visualization/saliency.py,sha256=RuVcF1cPrmzdwfigqhP-e1aqzMr817F64aYucbwT79g,11314
|
|
53
|
+
visual_rag_toolkit-0.1.5.dist-info/METADATA,sha256=66Z99JyOGp5QVb2eJR7U2zjF8Qd6nvRJanhezrbZ-3o,13460
|
|
54
|
+
visual_rag_toolkit-0.1.5.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
|
|
55
|
+
visual_rag_toolkit-0.1.5.dist-info/entry_points.txt,sha256=6Tob1GPg_ILGELjYTPsAnNMZ1W0NS939nfI7xyW2DIY,102
|
|
56
|
+
visual_rag_toolkit-0.1.5.dist-info/licenses/LICENSE,sha256=hEg_weKnHXJakQRR3sw2ygcZ101zCI00zMhBOPb3yfA,1069
|
|
57
|
+
visual_rag_toolkit-0.1.5.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|