vectordb-bench 0.0.26__py3-none-any.whl → 0.0.27__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -220,10 +220,12 @@ class DatasetManager(BaseModel):
220
220
  train_files = utils.compose_train_files(file_count, use_shuffled)
221
221
  all_files = train_files
222
222
 
223
- gt_file, test_file = None, None
223
+ test_file = "test.parquet"
224
+ all_files.extend([test_file])
225
+ gt_file = None
224
226
  if self.data.with_gt:
225
- gt_file, test_file = utils.compose_gt_file(filters), "test.parquet"
226
- all_files.extend([gt_file, test_file])
227
+ gt_file = utils.compose_gt_file(filters)
228
+ all_files.extend([gt_file])
227
229
 
228
230
  if not self.data.is_custom:
229
231
  source.reader().read(
@@ -232,8 +234,10 @@ class DatasetManager(BaseModel):
232
234
  local_ds_root=self.data_dir,
233
235
  )
234
236
 
235
- if gt_file is not None and test_file is not None:
237
+ if test_file is not None:
236
238
  self.test_data = self._read_file(test_file)
239
+
240
+ if gt_file is not None:
237
241
  self.gt_data = self._read_file(gt_file)
238
242
 
239
243
  prefix = "shuffle_train" if use_shuffled else "train"
@@ -209,7 +209,8 @@ class SerialSearchRunner:
209
209
  ideal_dcg = get_ideal_dcg(self.k)
210
210
 
211
211
  log.debug(f"test dataset size: {len(test_data)}")
212
- log.debug(f"ground truth size: {ground_truth.columns}, shape: {ground_truth.shape}")
212
+ if ground_truth is not None:
213
+ log.debug(f"ground truth size: {ground_truth.columns}, shape: {ground_truth.shape}")
213
214
 
214
215
  latencies, recalls, ndcgs = [], [], []
215
216
  for idx, emb in enumerate(test_data):
@@ -228,9 +229,13 @@ class SerialSearchRunner:
228
229
 
229
230
  latencies.append(time.perf_counter() - s)
230
231
 
231
- gt = ground_truth["neighbors_id"][idx]
232
- recalls.append(calc_recall(self.k, gt[: self.k], results))
233
- ndcgs.append(calc_ndcg(gt[: self.k], results, ideal_dcg))
232
+ if ground_truth is not None:
233
+ gt = ground_truth["neighbors_id"][idx]
234
+ recalls.append(calc_recall(self.k, gt[: self.k], results))
235
+ ndcgs.append(calc_ndcg(gt[: self.k], results, ideal_dcg))
236
+ else:
237
+ recalls.append(0)
238
+ ndcgs.append(0)
234
239
 
235
240
  if len(latencies) % 100 == 0:
236
241
  log.debug(
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: vectordb-bench
3
- Version: 0.0.26
3
+ Version: 0.0.27
4
4
  Summary: VectorDBBench is not just an offering of benchmark results for mainstream vector databases and cloud services, it's your go-to tool for the ultimate performance and cost-effectiveness comparison. Designed with ease-of-use in mind, VectorDBBench is devised to help users, even non-professionals, reproduce results or test new systems, making the hunt for the optimal choice amongst a plethora of cloud services and open-source vector databases a breeze.
5
5
  Author-email: XuanYang-cn <xuan.yang@zilliz.com>
6
6
  Project-URL: repository, https://github.com/zilliztech/VectorDBBench
@@ -9,7 +9,7 @@ vectordb_bench/backend/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3
9
9
  vectordb_bench/backend/assembler.py,sha256=6GInRT7yBgfTaIPmo-XMkYX4pA8PJQmjMQInynwaunE,2047
10
10
  vectordb_bench/backend/cases.py,sha256=obDdY6g3p9Z2fog7qDwLLDuRMwo3LGQKMHsP66QZd2M,16296
11
11
  vectordb_bench/backend/data_source.py,sha256=bfa_Zg4O9fRP2ENmVZ_2-NISKozoFN-TocyxOlw1JtE,5524
12
- vectordb_bench/backend/dataset.py,sha256=V4OKPt23v0kmdvgJwDr_R2fLJv3lXLZEii992cEM2Q0,8993
12
+ vectordb_bench/backend/dataset.py,sha256=lH2Q01AEJxA-sYfZHzH2BM019mwuy9mB_i0VLhIgDJ8,9020
13
13
  vectordb_bench/backend/result_collector.py,sha256=mpROVdZ-HChKBVyMV5TZ5v7YGRb69bvfT7Gezn5F5sY,819
14
14
  vectordb_bench/backend/task_runner.py,sha256=vlaXB0_25-G9w1Lj-F0SrvJzhXT7ceDWGIb2aKRXukU,11488
15
15
  vectordb_bench/backend/utils.py,sha256=R6THuJdZhiQYSSJTqv0Uegl2B20taV_QjwvFrun2yxE,1949
@@ -83,7 +83,7 @@ vectordb_bench/backend/runner/__init__.py,sha256=mF8YnErTa7MVG37zZb0KFXBSrmMw_af
83
83
  vectordb_bench/backend/runner/mp_runner.py,sha256=AJHrQmUADDWDQZ0eZ4aaAH9HOQtZHiafXJYGU5PNq3Y,9645
84
84
  vectordb_bench/backend/runner/rate_runner.py,sha256=2coO7qalEh6ZbVKUkyFvip4JWjs1yJM-iiExSrjEp9c,4306
85
85
  vectordb_bench/backend/runner/read_write_runner.py,sha256=CXYBXEEkS1S7-NurdzN5Wh6N0Vx-rprM9Qehk1WKwl8,7822
86
- vectordb_bench/backend/runner/serial_runner.py,sha256=URymqOy-9NdVE3kXWBW3e9R0Oh2sG9zF1vJkV7sk48E,10092
86
+ vectordb_bench/backend/runner/serial_runner.py,sha256=Y4Y2mSK8nU3hml7gliiF6BXUaW49sD-Ueci0xn62IL0,10290
87
87
  vectordb_bench/backend/runner/util.py,sha256=tjTFUxth6hNnVrlU82TqkHhfeZo4ymj7WlyK4zFyPTg,522
88
88
  vectordb_bench/cli/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
89
89
  vectordb_bench/cli/cli.py,sha256=cr4BycwIs51YJgNorHplzKP46M474jDTatevPdD-oKE,15434
@@ -142,9 +142,9 @@ vectordb_bench/results/WeaviateCloud/result_20230808_standard_weaviatecloud.json
142
142
  vectordb_bench/results/ZillizCloud/result_20230727_standard_zillizcloud.json,sha256=-Mdm4By65XDRCrmVOCF8yQXjcZtH4Xo4shcjoDoBUKU,18293
143
143
  vectordb_bench/results/ZillizCloud/result_20230808_standard_zillizcloud.json,sha256=77XlHT5zM_K7mG5HfDQKwXZnSCuR37VUbt6-P3J_amI,15737
144
144
  vectordb_bench/results/ZillizCloud/result_20240105_standard_202401_zillizcloud.json,sha256=TualfJ0664Hs-vdIW68bdkqAEYyzotXmu2P0yIN-GHk,42526
145
- vectordb_bench-0.0.26.dist-info/licenses/LICENSE,sha256=HXbxhrb5u5SegVzeLNF_voVgRsJMavcLaOmD1N0lZkM,1067
146
- vectordb_bench-0.0.26.dist-info/METADATA,sha256=lsc4Y28tVwbXr3fUrVHbppegppAtYWoH0rEV3pn820g,38061
147
- vectordb_bench-0.0.26.dist-info/WHEEL,sha256=ck4Vq1_RXyvS4Jt6SI0Vz6fyVs4GWg7AINwpsaGEgPE,91
148
- vectordb_bench-0.0.26.dist-info/entry_points.txt,sha256=Qzw6gVx96ui8esG21H6yHsI6nboEohRmV424TYhQNrA,113
149
- vectordb_bench-0.0.26.dist-info/top_level.txt,sha256=jnhZFZAuKX1J60yt-XOeBZ__ctiZMvoC_s0RFq29lpM,15
150
- vectordb_bench-0.0.26.dist-info/RECORD,,
145
+ vectordb_bench-0.0.27.dist-info/licenses/LICENSE,sha256=HXbxhrb5u5SegVzeLNF_voVgRsJMavcLaOmD1N0lZkM,1067
146
+ vectordb_bench-0.0.27.dist-info/METADATA,sha256=UC8hc6cQKAYshgbSFEBzDPODzeltBiimXbVkrakDLDQ,38061
147
+ vectordb_bench-0.0.27.dist-info/WHEEL,sha256=ooBFpIzZCPdw3uqIQsOo4qqbA4ZRPxHnOH7peeONza0,91
148
+ vectordb_bench-0.0.27.dist-info/entry_points.txt,sha256=Qzw6gVx96ui8esG21H6yHsI6nboEohRmV424TYhQNrA,113
149
+ vectordb_bench-0.0.27.dist-info/top_level.txt,sha256=jnhZFZAuKX1J60yt-XOeBZ__ctiZMvoC_s0RFq29lpM,15
150
+ vectordb_bench-0.0.27.dist-info/RECORD,,
@@ -1,5 +1,5 @@
1
1
  Wheel-Version: 1.0
2
- Generator: setuptools (80.0.0)
2
+ Generator: setuptools (80.0.1)
3
3
  Root-Is-Purelib: true
4
4
  Tag: py3-none-any
5
5