vectordb-bench 0.0.16__tar.gz → 0.0.18__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (162) hide show
  1. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/PKG-INFO +7 -2
  2. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/README.md +2 -1
  3. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/pyproject.toml +1 -0
  4. vectordb_bench-0.0.18/tests/test_rate_runner.py +88 -0
  5. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/__init__.py +1 -1
  6. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/__init__.py +13 -0
  7. vectordb_bench-0.0.18/vectordb_bench/backend/clients/alloydb/alloydb.py +372 -0
  8. vectordb_bench-0.0.18/vectordb_bench/backend/clients/alloydb/cli.py +147 -0
  9. vectordb_bench-0.0.18/vectordb_bench/backend/clients/alloydb/config.py +168 -0
  10. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/api.py +2 -0
  11. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/milvus/milvus.py +2 -1
  12. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/dataset.py +8 -5
  13. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/runner/mp_runner.py +94 -4
  14. vectordb_bench-0.0.18/vectordb_bench/backend/runner/rate_runner.py +79 -0
  15. vectordb_bench-0.0.18/vectordb_bench/backend/runner/read_write_runner.py +112 -0
  16. vectordb_bench-0.0.18/vectordb_bench/backend/runner/util.py +32 -0
  17. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/task_runner.py +5 -5
  18. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/cli/vectordbbench.py +2 -0
  19. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/concurrent/charts.py +25 -9
  20. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/config/dbCaseConfigs.py +166 -0
  21. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/pages/concurrent.py +5 -1
  22. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/metric.py +1 -0
  23. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/models.py +9 -0
  24. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench.egg-info/PKG-INFO +7 -2
  25. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench.egg-info/SOURCES.txt +7 -0
  26. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench.egg-info/requires.txt +5 -0
  27. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/.devcontainer/Dockerfile +0 -0
  28. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/.devcontainer/devcontainer.json +0 -0
  29. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/.env.example +0 -0
  30. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/.github/workflows/publish_package_on_release.yml +0 -0
  31. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/.github/workflows/pull_request.yml +0 -0
  32. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/.gitignore +0 -0
  33. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/.ruff.toml +0 -0
  34. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/Dockerfile +0 -0
  35. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/LICENSE +0 -0
  36. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/Makefile +0 -0
  37. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/OWNERS +0 -0
  38. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/fig/custom_case_run_test.png +0 -0
  39. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/fig/custom_dataset.png +0 -0
  40. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/install/requirements_py3.11.txt +0 -0
  41. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/install.py +0 -0
  42. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/setup.cfg +0 -0
  43. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/tests/conftest.py +0 -0
  44. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/tests/pytest.ini +0 -0
  45. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/tests/test_bench_runner.py +0 -0
  46. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/tests/test_chroma.py +0 -0
  47. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/tests/test_data_source.py +0 -0
  48. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/tests/test_dataset.py +0 -0
  49. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/tests/test_elasticsearch_cloud.py +0 -0
  50. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/tests/test_models.py +0 -0
  51. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/tests/test_redis.py +0 -0
  52. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/tests/test_utils.py +0 -0
  53. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/tests/ut_cases.py +0 -0
  54. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/__main__.py +0 -0
  55. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/__init__.py +0 -0
  56. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/assembler.py +0 -0
  57. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/cases.py +0 -0
  58. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/aws_opensearch/aws_opensearch.py +0 -0
  59. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/aws_opensearch/cli.py +0 -0
  60. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/aws_opensearch/config.py +0 -0
  61. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/aws_opensearch/run.py +0 -0
  62. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/chroma/chroma.py +0 -0
  63. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/chroma/config.py +0 -0
  64. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/elastic_cloud/config.py +0 -0
  65. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/elastic_cloud/elastic_cloud.py +0 -0
  66. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/memorydb/cli.py +0 -0
  67. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/memorydb/config.py +0 -0
  68. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/memorydb/memorydb.py +0 -0
  69. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/milvus/cli.py +0 -0
  70. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/milvus/config.py +0 -0
  71. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/pgdiskann/cli.py +0 -0
  72. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/pgdiskann/config.py +0 -0
  73. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/pgdiskann/pgdiskann.py +0 -0
  74. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/pgvecto_rs/cli.py +0 -0
  75. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/pgvecto_rs/config.py +0 -0
  76. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/pgvecto_rs/pgvecto_rs.py +0 -0
  77. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/pgvector/cli.py +0 -0
  78. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/pgvector/config.py +0 -0
  79. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/pgvector/pgvector.py +0 -0
  80. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/pgvectorscale/cli.py +0 -0
  81. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/pgvectorscale/config.py +0 -0
  82. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/pgvectorscale/pgvectorscale.py +0 -0
  83. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/pinecone/config.py +0 -0
  84. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/pinecone/pinecone.py +0 -0
  85. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/qdrant_cloud/config.py +0 -0
  86. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/qdrant_cloud/qdrant_cloud.py +0 -0
  87. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/redis/cli.py +0 -0
  88. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/redis/config.py +0 -0
  89. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/redis/redis.py +0 -0
  90. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/test/cli.py +0 -0
  91. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/test/config.py +0 -0
  92. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/test/test.py +0 -0
  93. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/weaviate_cloud/cli.py +0 -0
  94. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/weaviate_cloud/config.py +0 -0
  95. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/weaviate_cloud/weaviate_cloud.py +0 -0
  96. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/zilliz_cloud/cli.py +0 -0
  97. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/zilliz_cloud/config.py +0 -0
  98. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/clients/zilliz_cloud/zilliz_cloud.py +0 -0
  99. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/data_source.py +0 -0
  100. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/result_collector.py +0 -0
  101. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/runner/__init__.py +0 -0
  102. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/runner/serial_runner.py +0 -0
  103. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/backend/utils.py +0 -0
  104. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/base.py +0 -0
  105. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/cli/__init__.py +0 -0
  106. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/cli/cli.py +0 -0
  107. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/config-files/sample_config.yml +0 -0
  108. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/custom/custom_case.json +0 -0
  109. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/check_results/charts.py +0 -0
  110. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/check_results/data.py +0 -0
  111. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/check_results/expanderStyle.py +0 -0
  112. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/check_results/filters.py +0 -0
  113. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/check_results/footer.py +0 -0
  114. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/check_results/headerIcon.py +0 -0
  115. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/check_results/nav.py +0 -0
  116. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/check_results/priceTable.py +0 -0
  117. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/check_results/stPageConfig.py +0 -0
  118. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/custom/displayCustomCase.py +0 -0
  119. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/custom/displaypPrams.py +0 -0
  120. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/custom/getCustomConfig.py +0 -0
  121. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/custom/initStyle.py +0 -0
  122. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/get_results/saveAsImage.py +0 -0
  123. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/run_test/autoRefresh.py +0 -0
  124. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/run_test/caseSelector.py +0 -0
  125. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/run_test/dbConfigSetting.py +0 -0
  126. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/run_test/dbSelector.py +0 -0
  127. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/run_test/generateTasks.py +0 -0
  128. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/run_test/hideSidebar.py +0 -0
  129. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/run_test/initStyle.py +0 -0
  130. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/run_test/submitTask.py +0 -0
  131. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/components/tables/data.py +0 -0
  132. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/config/dbPrices.py +0 -0
  133. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/config/styles.py +0 -0
  134. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/pages/custom.py +0 -0
  135. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/pages/quries_per_dollar.py +0 -0
  136. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/pages/run_test.py +0 -0
  137. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/pages/tables.py +0 -0
  138. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/utils.py +0 -0
  139. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/frontend/vdb_benchmark.py +0 -0
  140. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/interface.py +0 -0
  141. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/log_util.py +0 -0
  142. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/ElasticCloud/result_20230727_standard_elasticcloud.json +0 -0
  143. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/ElasticCloud/result_20230808_standard_elasticcloud.json +0 -0
  144. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/Milvus/result_20230727_standard_milvus.json +0 -0
  145. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/Milvus/result_20230808_standard_milvus.json +0 -0
  146. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/PgVector/result_20230727_standard_pgvector.json +0 -0
  147. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/PgVector/result_20230808_standard_pgvector.json +0 -0
  148. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/Pinecone/result_20230727_standard_pinecone.json +0 -0
  149. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/Pinecone/result_20230808_standard_pinecone.json +0 -0
  150. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/QdrantCloud/result_20230727_standard_qdrantcloud.json +0 -0
  151. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/QdrantCloud/result_20230808_standard_qdrantcloud.json +0 -0
  152. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/WeaviateCloud/result_20230727_standard_weaviatecloud.json +0 -0
  153. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/WeaviateCloud/result_20230808_standard_weaviatecloud.json +0 -0
  154. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/ZillizCloud/result_20230727_standard_zillizcloud.json +0 -0
  155. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/ZillizCloud/result_20230808_standard_zillizcloud.json +0 -0
  156. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/ZillizCloud/result_20240105_standard_202401_zillizcloud.json +0 -0
  157. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/dbPrices.json +0 -0
  158. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/getLeaderboardData.py +0 -0
  159. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench/results/leaderboard.json +0 -0
  160. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench.egg-info/dependency_links.txt +0 -0
  161. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench.egg-info/entry_points.txt +0 -0
  162. {vectordb_bench-0.0.16 → vectordb_bench-0.0.18}/vectordb_bench.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: vectordb-bench
3
- Version: 0.0.16
3
+ Version: 0.0.18
4
4
  Summary: VectorDBBench is not just an offering of benchmark results for mainstream vector databases and cloud services, it's your go-to tool for the ultimate performance and cost-effectiveness comparison. Designed with ease-of-use in mind, VectorDBBench is devised to help users, even non-professionals, reproduce results or test new systems, making the hunt for the optimal choice amongst a plethora of cloud services and open-source vector databases a breeze.
5
5
  Author-email: XuanYang-cn <xuan.yang@zilliz.com>
6
6
  Project-URL: repository, https://github.com/zilliztech/VectorDBBench
@@ -64,6 +64,10 @@ Provides-Extra: pgdiskann
64
64
  Requires-Dist: psycopg; extra == "pgdiskann"
65
65
  Requires-Dist: psycopg-binary; extra == "pgdiskann"
66
66
  Requires-Dist: pgvector; extra == "pgdiskann"
67
+ Provides-Extra: alloydb
68
+ Requires-Dist: psycopg; extra == "alloydb"
69
+ Requires-Dist: psycopg-binary; extra == "alloydb"
70
+ Requires-Dist: pgvector; extra == "alloydb"
67
71
  Provides-Extra: pgvecto-rs
68
72
  Requires-Dist: pgvecto_rs[psycopg3]>=0.2.2; extra == "pgvecto-rs"
69
73
  Provides-Extra: redis
@@ -116,11 +120,12 @@ All the database client supported
116
120
  | pgvector | `pip install vectordb-bench[pgvector]` |
117
121
  | pgvecto.rs | `pip install vectordb-bench[pgvecto_rs]` |
118
122
  | pgvectorscale | `pip install vectordb-bench[pgvectorscale]` |
119
- | pgdiskann | `pip install vectordb-bench[pgdiskann]` |
123
+ | pgdiskann | `pip install vectordb-bench[pgdiskann]` |
120
124
  | redis | `pip install vectordb-bench[redis]` |
121
125
  | memorydb | `pip install vectordb-bench[memorydb]` |
122
126
  | chromadb | `pip install vectordb-bench[chromadb]` |
123
127
  | awsopensearch | `pip install vectordb-bench[awsopensearch]` |
128
+ | alloydb | `pip install vectordb-bench[alloydb]` |
124
129
 
125
130
  ### Run
126
131
 
@@ -38,11 +38,12 @@ All the database client supported
38
38
  | pgvector | `pip install vectordb-bench[pgvector]` |
39
39
  | pgvecto.rs | `pip install vectordb-bench[pgvecto_rs]` |
40
40
  | pgvectorscale | `pip install vectordb-bench[pgvectorscale]` |
41
- | pgdiskann | `pip install vectordb-bench[pgdiskann]` |
41
+ | pgdiskann | `pip install vectordb-bench[pgdiskann]` |
42
42
  | redis | `pip install vectordb-bench[redis]` |
43
43
  | memorydb | `pip install vectordb-bench[memorydb]` |
44
44
  | chromadb | `pip install vectordb-bench[chromadb]` |
45
45
  | awsopensearch | `pip install vectordb-bench[awsopensearch]` |
46
+ | alloydb | `pip install vectordb-bench[alloydb]` |
46
47
 
47
48
  ### Run
48
49
 
@@ -73,6 +73,7 @@ elastic = [ "elasticsearch" ]
73
73
  pgvector = [ "psycopg", "psycopg-binary", "pgvector" ]
74
74
  pgvectorscale = [ "psycopg", "psycopg-binary", "pgvector" ]
75
75
  pgdiskann = [ "psycopg", "psycopg-binary", "pgvector" ]
76
+ alloydb = [ "psycopg", "psycopg-binary", "pgvector"]
76
77
  pgvecto_rs = [ "pgvecto_rs[psycopg3]>=0.2.2" ]
77
78
  redis = [ "redis" ]
78
79
  memorydb = [ "memorydb" ]
@@ -0,0 +1,88 @@
1
+ from typing import Iterable
2
+ import argparse
3
+ from vectordb_bench.backend.dataset import Dataset, DatasetSource
4
+ from vectordb_bench.backend.runner.rate_runner import RatedMultiThreadingInsertRunner
5
+ from vectordb_bench.backend.runner.read_write_runner import ReadWriteRunner
6
+ from vectordb_bench.backend.clients import DB, VectorDB
7
+ from vectordb_bench.backend.clients.milvus.config import FLATConfig
8
+ from vectordb_bench.backend.clients.zilliz_cloud.config import AutoIndexConfig
9
+
10
+ import logging
11
+
12
+ log = logging.getLogger("vectordb_bench")
13
+ log.setLevel(logging.DEBUG)
14
+
15
+ def get_rate_runner(db):
16
+ cohere = Dataset.COHERE.manager(100_000)
17
+ prepared = cohere.prepare(DatasetSource.AliyunOSS)
18
+ assert prepared
19
+ runner = RatedMultiThreadingInsertRunner(
20
+ rate = 10,
21
+ db = db,
22
+ dataset = cohere,
23
+ )
24
+
25
+ return runner
26
+
27
+ def test_rate_runner(db, insert_rate):
28
+ runner = get_rate_runner(db)
29
+
30
+ _, t = runner.run_with_rate()
31
+ log.info(f"insert run done, time={t}")
32
+
33
+ def test_read_write_runner(db, insert_rate, conc: list, search_stage: Iterable[float], read_dur_after_write: int, local: bool=False):
34
+ cohere = Dataset.COHERE.manager(1_000_000)
35
+ if local is True:
36
+ source = DatasetSource.AliyunOSS
37
+ else:
38
+ source = DatasetSource.S3
39
+ prepared = cohere.prepare(source)
40
+ assert prepared
41
+
42
+ rw_runner = ReadWriteRunner(
43
+ db=db,
44
+ dataset=cohere,
45
+ insert_rate=insert_rate,
46
+ search_stage=search_stage,
47
+ read_dur_after_write=read_dur_after_write,
48
+ concurrencies=conc
49
+ )
50
+ rw_runner.run_read_write()
51
+
52
+
53
+ def get_db(db: str, config: dict) -> VectorDB:
54
+ if db == DB.Milvus.name:
55
+ return DB.Milvus.init_cls(dim=768, db_config=config, db_case_config=FLATConfig(metric_type="COSINE"), drop_old=True, pre_load=True)
56
+ elif db == DB.ZillizCloud.name:
57
+ return DB.ZillizCloud.init_cls(dim=768, db_config=config, db_case_config=AutoIndexConfig(metric_type="COSINE"), drop_old=True, pre_load=True)
58
+ else:
59
+ raise ValueError(f"unknown db: {db}")
60
+
61
+
62
+ if __name__ == "__main__":
63
+ parser = argparse.ArgumentParser()
64
+ parser.add_argument("-r", "--insert_rate", type=int, default="1000", help="insert entity row count per seconds, cps")
65
+ parser.add_argument("-d", "--db", type=str, default=DB.Milvus.name, help="db name")
66
+ parser.add_argument("-t", "--duration", type=int, default=300, help="stage search duration in seconds")
67
+ parser.add_argument("--use_s3", action='store_true', help="whether to use S3 dataset")
68
+
69
+ flags = parser.parse_args()
70
+
71
+ # TODO read uri, user, password from .env
72
+ config = {
73
+ "uri": "http://localhost:19530",
74
+ "user": "",
75
+ "password": "",
76
+ }
77
+
78
+ conc = (1, 15, 50)
79
+ search_stage = (0.5, 0.6, 0.7, 0.8, 0.9, 1.0)
80
+
81
+ db = get_db(flags.db, config)
82
+ test_read_write_runner(
83
+ db=db,
84
+ insert_rate=flags.insert_rate,
85
+ conc=conc,
86
+ search_stage=search_stage,
87
+ read_dur_after_write=flags.duration,
88
+ local=flags.use_s3)
@@ -17,7 +17,7 @@ class config:
17
17
 
18
18
  DEFAULT_DATASET_URL = env.str("DEFAULT_DATASET_URL", AWS_S3_URL)
19
19
  DATASET_LOCAL_DIR = env.path("DATASET_LOCAL_DIR", "/tmp/vectordb_bench/dataset")
20
- NUM_PER_BATCH = env.int("NUM_PER_BATCH", 5000)
20
+ NUM_PER_BATCH = env.int("NUM_PER_BATCH", 100)
21
21
 
22
22
  DROP_OLD = env.bool("DROP_OLD", True)
23
23
  USE_SHUFFLED_DATA = env.bool("USE_SHUFFLED_DATA", True)
@@ -32,6 +32,7 @@ class DB(Enum):
32
32
  PgVectoRS = "PgVectoRS"
33
33
  PgVectorScale = "PgVectorScale"
34
34
  PgDiskANN = "PgDiskANN"
35
+ AlloyDB = "AlloyDB"
35
36
  Redis = "Redis"
36
37
  MemoryDB = "MemoryDB"
37
38
  Chroma = "Chroma"
@@ -97,6 +98,10 @@ class DB(Enum):
97
98
  if self == DB.AWSOpenSearch:
98
99
  from .aws_opensearch.aws_opensearch import AWSOpenSearch
99
100
  return AWSOpenSearch
101
+
102
+ if self == DB.AlloyDB:
103
+ from .alloydb.alloydb import AlloyDB
104
+ return AlloyDB
100
105
 
101
106
  @property
102
107
  def config_cls(self) -> Type[DBConfig]:
@@ -156,6 +161,10 @@ class DB(Enum):
156
161
  if self == DB.AWSOpenSearch:
157
162
  from .aws_opensearch.config import AWSOpenSearchConfig
158
163
  return AWSOpenSearchConfig
164
+
165
+ if self == DB.AlloyDB:
166
+ from .alloydb.config import AlloyDBConfig
167
+ return AlloyDBConfig
159
168
 
160
169
  def case_config_cls(self, index_type: IndexType | None = None) -> Type[DBCaseConfig]:
161
170
  if self == DB.Milvus:
@@ -197,6 +206,10 @@ class DB(Enum):
197
206
  if self == DB.PgDiskANN:
198
207
  from .pgdiskann.config import _pgdiskann_case_config
199
208
  return _pgdiskann_case_config.get(index_type)
209
+
210
+ if self == DB.AlloyDB:
211
+ from .alloydb.config import _alloydb_case_config
212
+ return _alloydb_case_config.get(index_type)
200
213
 
201
214
  # DB.Pinecone, DB.Chroma, DB.Redis
202
215
  return EmptyDBCaseConfig
@@ -0,0 +1,372 @@
1
+ """Wrapper around the alloydb vector database over VectorDB"""
2
+
3
+ import logging
4
+ import pprint
5
+ from contextlib import contextmanager
6
+ from typing import Any, Generator, Optional, Tuple, Sequence
7
+
8
+ import numpy as np
9
+ import psycopg
10
+ from pgvector.psycopg import register_vector
11
+ from psycopg import Connection, Cursor, sql
12
+
13
+ from ..api import VectorDB
14
+ from .config import AlloyDBConfigDict, AlloyDBIndexConfig, AlloyDBScaNNConfig
15
+
16
+ log = logging.getLogger(__name__)
17
+
18
+
19
+ class AlloyDB(VectorDB):
20
+ """Use psycopg instructions"""
21
+
22
+ conn: psycopg.Connection[Any] | None = None
23
+ cursor: psycopg.Cursor[Any] | None = None
24
+
25
+ _filtered_search: sql.Composed
26
+ _unfiltered_search: sql.Composed
27
+
28
+ def __init__(
29
+ self,
30
+ dim: int,
31
+ db_config: AlloyDBConfigDict,
32
+ db_case_config: AlloyDBIndexConfig,
33
+ collection_name: str = "alloydb_collection",
34
+ drop_old: bool = False,
35
+ **kwargs,
36
+ ):
37
+ self.name = "AlloyDB"
38
+ self.db_config = db_config
39
+ self.case_config = db_case_config
40
+ self.table_name = collection_name
41
+ self.dim = dim
42
+
43
+ self._index_name = "alloydb_index"
44
+ self._primary_field = "id"
45
+ self._vector_field = "embedding"
46
+
47
+ # construct basic units
48
+ self.conn, self.cursor = self._create_connection(**self.db_config)
49
+
50
+ # create vector extension
51
+ self.cursor.execute("CREATE EXTENSION IF NOT EXISTS alloydb_scann CASCADE")
52
+ self.conn.commit()
53
+
54
+ log.info(f"{self.name} config values: {self.db_config}\n{self.case_config}")
55
+ if not any(
56
+ (
57
+ self.case_config.create_index_before_load,
58
+ self.case_config.create_index_after_load,
59
+ )
60
+ ):
61
+ err = f"{self.name} config must create an index using create_index_before_load or create_index_after_load"
62
+ log.error(err)
63
+ raise RuntimeError(
64
+ f"{err}\n{pprint.pformat(self.db_config)}\n{pprint.pformat(self.case_config)}"
65
+ )
66
+
67
+ if drop_old:
68
+ self._drop_index()
69
+ self._drop_table()
70
+ self._create_table(dim)
71
+ if self.case_config.create_index_before_load:
72
+ self._create_index()
73
+
74
+ self.cursor.close()
75
+ self.conn.close()
76
+ self.cursor = None
77
+ self.conn = None
78
+
79
+ @staticmethod
80
+ def _create_connection(**kwargs) -> Tuple[Connection, Cursor]:
81
+ conn = psycopg.connect(**kwargs)
82
+ register_vector(conn)
83
+ conn.autocommit = False
84
+ cursor = conn.cursor()
85
+
86
+ assert conn is not None, "Connection is not initialized"
87
+ assert cursor is not None, "Cursor is not initialized"
88
+ return conn, cursor
89
+
90
+ def _generate_search_query(self, filtered: bool=False) -> sql.Composed:
91
+ search_query = sql.Composed(
92
+ [
93
+ sql.SQL(
94
+ "SELECT id FROM public.{table_name} {where_clause} ORDER BY embedding "
95
+ ).format(
96
+ table_name=sql.Identifier(self.table_name),
97
+ where_clause=sql.SQL("WHERE id >= %s") if filtered else sql.SQL(""),
98
+ ),
99
+ sql.SQL(self.case_config.search_param()["metric_fun_op"]),
100
+ sql.SQL(" %s::vector LIMIT %s::int"),
101
+ ]
102
+ )
103
+ return search_query
104
+
105
+ @contextmanager
106
+ def init(self) -> Generator[None, None, None]:
107
+ """
108
+ Examples:
109
+ >>> with self.init():
110
+ >>> self.insert_embeddings()
111
+ >>> self.search_embedding()
112
+ """
113
+
114
+ self.conn, self.cursor = self._create_connection(**self.db_config)
115
+
116
+ # index configuration may have commands defined that we should set during each client session
117
+ session_options: Sequence[dict[str, Any]] = self.case_config.session_param()["session_options"]
118
+
119
+ if len(session_options) > 0:
120
+ for setting in session_options:
121
+ command = sql.SQL("SET {setting_name} " + "= {val};").format(
122
+ setting_name=sql.Identifier(setting['parameter']['setting_name']),
123
+ val=sql.Identifier(str(setting['parameter']['val'])),
124
+ )
125
+ log.debug(command.as_string(self.cursor))
126
+ self.cursor.execute(command)
127
+ self.conn.commit()
128
+
129
+ self._filtered_search = self._generate_search_query(filtered=True)
130
+ self._unfiltered_search = self._generate_search_query()
131
+
132
+ try:
133
+ yield
134
+ finally:
135
+ self.cursor.close()
136
+ self.conn.close()
137
+ self.cursor = None
138
+ self.conn = None
139
+
140
+ def _drop_table(self):
141
+ assert self.conn is not None, "Connection is not initialized"
142
+ assert self.cursor is not None, "Cursor is not initialized"
143
+ log.info(f"{self.name} client drop table : {self.table_name}")
144
+
145
+ self.cursor.execute(
146
+ sql.SQL("DROP TABLE IF EXISTS public.{table_name}").format(
147
+ table_name=sql.Identifier(self.table_name)
148
+ )
149
+ )
150
+ self.conn.commit()
151
+
152
+ def ready_to_load(self):
153
+ pass
154
+
155
+ def optimize(self):
156
+ self._post_insert()
157
+
158
+ def _post_insert(self):
159
+ log.info(f"{self.name} post insert before optimize")
160
+ if self.case_config.create_index_after_load:
161
+ self._drop_index()
162
+ self._create_index()
163
+
164
+ def _drop_index(self):
165
+ assert self.conn is not None, "Connection is not initialized"
166
+ assert self.cursor is not None, "Cursor is not initialized"
167
+ log.info(f"{self.name} client drop index : {self._index_name}")
168
+
169
+ drop_index_sql = sql.SQL("DROP INDEX IF EXISTS {index_name}").format(
170
+ index_name=sql.Identifier(self._index_name)
171
+ )
172
+ log.debug(drop_index_sql.as_string(self.cursor))
173
+ self.cursor.execute(drop_index_sql)
174
+ self.conn.commit()
175
+
176
def _set_parallel_index_build_param(self):
    """Apply the index-build settings found in ``case_config.index_param()``.

    Each of ``enable_pca``, ``maintenance_work_mem`` and
    ``max_parallel_workers`` is applied only when its value is not ``None``:
    first with ``SET`` on the current session, then with ``ALTER USER`` for
    ``db_config["user"]``, followed by a commit. ``max_parallel_workers``
    also drives ``max_parallel_maintenance_workers`` and the table's
    ``parallel_workers`` storage parameter. Finally the effective values
    are read back with ``SHOW`` and logged.

    Raises:
        AssertionError: if the connection or cursor has not been set.
    """
    assert self.conn is not None, "Connection is not initialized"
    assert self.cursor is not None, "Cursor is not initialized"

    params = self.case_config.index_param()
    run = self.cursor.execute

    pca = params["enable_pca"]
    if pca is not None:
        run(sql.SQL("SET scann.enable_pca TO {};").format(pca))
        run(
            sql.SQL("ALTER USER {} SET scann.enable_pca TO {};").format(
                sql.Identifier(self.db_config["user"]), pca
            )
        )
        self.conn.commit()

    work_mem = params["maintenance_work_mem"]
    if work_mem is not None:
        run(sql.SQL("SET maintenance_work_mem TO {};").format(work_mem))
        run(
            sql.SQL("ALTER USER {} SET maintenance_work_mem TO {};").format(
                sql.Identifier(self.db_config["user"]), work_mem
            )
        )
        self.conn.commit()

    workers = params["max_parallel_workers"]
    if workers is not None:
        # Session-level statement first, then the per-role statement, for
        # each of the two worker settings (same order as before).
        worker_statements = (
            (
                "SET max_parallel_maintenance_workers TO '{}';",
                "ALTER USER {} SET max_parallel_maintenance_workers TO '{}';",
            ),
            (
                "SET max_parallel_workers TO '{}';",
                "ALTER USER {} SET max_parallel_workers TO '{}';",
            ),
        )
        for session_sql, role_sql in worker_statements:
            run(sql.SQL(session_sql).format(workers))
            run(
                sql.SQL(role_sql).format(
                    sql.Identifier(self.db_config["user"]), workers
                )
            )
        run(
            sql.SQL("ALTER TABLE {} SET (parallel_workers = {});").format(
                sql.Identifier(self.table_name), workers
            )
        )
        self.conn.commit()

    # Read the effective values back so they show up in the log.
    results = []
    for show_sql in (
        "SHOW max_parallel_maintenance_workers;",
        "SHOW max_parallel_workers;",
        "SHOW maintenance_work_mem;",
    ):
        results.extend(run(sql.SQL(show_sql)).fetchall())
    log.info(f"{self.name} parallel index creation parameters: {results}")
257
+
258
def _create_index(self):
    """Create the vector index on ``public.<table_name>`` and commit.

    Index type, metric and the optional ``WITH (...)`` storage options come
    from ``case_config.index_param()``. Options whose ``val`` is ``None``
    are left out. The build settings are applied first via
    ``_set_parallel_index_build_param``.

    Raises:
        AssertionError: if the connection or cursor has not been set.
    """
    assert self.conn is not None, "Connection is not initialized"
    assert self.cursor is not None, "Cursor is not initialized"
    log.info(f"{self.name} client create index : {self._index_name}")

    params = self.case_config.index_param()
    self._set_parallel_index_build_param()

    with_options = [
        sql.SQL("{option_name} = {val}").format(
            option_name=sql.Identifier(opt['option_name']),
            val=sql.Identifier(str(opt['val'])),
        )
        for opt in params["index_creation_with_options"]
        if opt['val'] is not None
    ]
    with_clause = (
        sql.SQL("WITH ({});").format(sql.SQL(", ").join(with_options))
        if any(with_options)
        else sql.Composed(())
    )

    create_stmt = sql.SQL(
        """
        CREATE INDEX IF NOT EXISTS {index_name} ON public.{table_name}
        USING {index_type} (embedding {embedding_metric})
        """
    ).format(
        index_name=sql.Identifier(self._index_name),
        table_name=sql.Identifier(self.table_name),
        index_type=sql.Identifier(params["index_type"]),
        embedding_metric=sql.Identifier(params["metric"]),
    )

    # Concatenate the two parts, then join the pieces with a single space.
    full_stmt = (create_stmt + with_clause).join(" ")
    log.debug(full_stmt.as_string(self.cursor))
    self.cursor.execute(full_stmt)
    self.conn.commit()
297
+
298
def _create_table(self, dim: int):
    """Create ``public.<table_name>`` if it does not exist, then commit.

    The table has a ``BIGINT`` primary key ``id`` and an ``embedding``
    column of type ``vector(dim)``.

    Args:
        dim: value placed inside ``vector(...)`` for the embedding column.

    Raises:
        AssertionError: if the connection or cursor has not been set.
        Exception: any failure is logged as a warning and re-raised with
            its exception context suppressed (``from None``).
    """
    assert self.conn is not None, "Connection is not initialized"
    assert self.cursor is not None, "Cursor is not initialized"

    try:
        log.info(f"{self.name} client create table : {self.table_name}")

        create_stmt = sql.SQL(
            "CREATE TABLE IF NOT EXISTS public.{table_name} (id BIGINT PRIMARY KEY, embedding vector({dim}));"
        ).format(table_name=sql.Identifier(self.table_name), dim=dim)
        self.cursor.execute(create_stmt)
        self.conn.commit()
    except Exception as e:
        log.warning(
            f"Failed to create alloydb table: {self.table_name} error: {e}"
        )
        raise e from None
317
+
318
def insert_embeddings(
    self,
    embeddings: list[list[float]],
    metadata: list[int],
    **kwargs: Any,
) -> Tuple[int, Optional[Exception]]:
    """Bulk-load rows into ``public.<table_name>`` with a binary ``COPY``.

    Row ``i`` is written as ``(metadata[i], embeddings[i])`` using the
    column types ``bigint`` and ``vector``. The batch is committed after
    the copy finishes. When ``kwargs["last_batch"]`` is truthy,
    ``_post_insert`` runs afterwards.

    Args:
        embeddings: one vector per row.
        metadata: one id per row, paired with ``embeddings`` by position.
        **kwargs: only ``last_batch`` is read here.

    Returns:
        ``(len(metadata), None)`` on success, ``(0, error)`` on failure.
        Failures are logged and returned instead of raised.

    Raises:
        AssertionError: if the connection or cursor has not been set.
    """
    assert self.conn is not None, "Connection is not initialized"
    assert self.cursor is not None, "Cursor is not initialized"

    try:
        metadata_arr = np.array(metadata)
        embeddings_arr = np.array(embeddings)

        with self.cursor.copy(
            sql.SQL("COPY public.{table_name} FROM STDIN (FORMAT BINARY)").format(
                table_name=sql.Identifier(self.table_name)
            )
        ) as copy:
            copy.set_types(["bigint", "vector"])
            for i, row in enumerate(metadata_arr):
                copy.write_row((row, embeddings_arr[i]))
        self.conn.commit()

        if kwargs.get("last_batch"):
            self._post_insert()

        return len(metadata), None
    except Exception as e:
        log.warning(
            f"Failed to insert data into alloydb table ({self.table_name}), error: {e}"
        )
        # A failed statement leaves the transaction aborted; without a
        # rollback, later statements on this connection would fail too.
        # The rollback is guarded so the (count, error) contract of this
        # method is preserved even when the connection itself is broken.
        try:
            self.conn.rollback()
        except Exception as rollback_error:
            log.warning(
                f"Failed to roll back after insert error on alloydb table ({self.table_name}), error: {rollback_error}"
            )
        return 0, e
350
+
351
+ def search_embedding(
352
+ self,
353
+ query: list[float],
354
+ k: int = 100,
355
+ filters: dict | None = None,
356
+ timeout: int | None = None,
357
+ ) -> list[int]:
358
+ assert self.conn is not None, "Connection is not initialized"
359
+ assert self.cursor is not None, "Cursor is not initialized"
360
+
361
+ q = np.asarray(query)
362
+ if filters:
363
+ gt = filters.get("id")
364
+ result = self.cursor.execute(
365
+ self._filtered_search, (gt, q, k), prepare=True, binary=True
366
+ )
367
+ else:
368
+ result = self.cursor.execute(
369
+ self._unfiltered_search, (q, k), prepare=True, binary=True
370
+ )
371
+
372
+ return [int(i[0]) for i in result.fetchall()]