cmem-plugin-pgvector 0.7.0__tar.gz → 0.7.1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: cmem-plugin-pgvector
3
- Version: 0.7.0
3
+ Version: 0.7.1
4
4
  Summary: Store and search for embedding vectors in a Postgres vector store.
5
5
  License: Apache-2.0
6
6
  Keywords: eccenca Corporate Memory,plugin
@@ -60,23 +60,15 @@ class PGVectorCollection(StringParameterType):
60
60
  password = depend_on_parameter_values[4]
61
61
  password = password if isinstance(password, str) else password.decrypt()
62
62
  result = []
63
- try:
64
- collections = get_collection_names(
65
- host=host, port=port, dbname=dbname, user=user, password=password
66
- )
67
- filtered_models = set()
68
- if query_terms:
69
- for term in query_terms:
70
- for collection in collections:
71
- if term in collection:
72
- filtered_models.add(collection)
73
- else:
74
- filtered_models = set(collections)
75
- result = [Autocompletion(value=f"{_}", label=f"{_}") for _ in filtered_models]
76
- except Exception as error:
77
- raise ValueError(
78
- "Failed to authenticate with OpenAI API, Please check URL and API key."
79
- ) from error
63
+ collections = get_collection_names(
64
+ host=host, port=port, dbname=dbname, user=user, password=password
65
+ )
66
+ filtered_collections = set()
67
+ for term in query_terms:
68
+ for collection in collections:
69
+ if term in collection:
70
+ filtered_collections.add(collection)
71
+ result = [Autocompletion(value=f"{_}", label=f"{_}") for _ in filtered_collections]
80
72
  result.sort(key=lambda x: x.label)
81
73
  return result
82
74
 
@@ -147,15 +147,6 @@ class PGVectorSearchPlugin(WorkflowPlugin):
147
147
  self.report = ExecutionReport()
148
148
  self.report.operation = "search"
149
149
  self.report.operation_desc = "searches"
150
-
151
- self.db = PGVector(
152
- collection_name=self.collection_name,
153
- connection=self.connection_string,
154
- embeddings=DummyEmbeddings(),
155
- use_jsonb=True,
156
- pre_delete_collection=False,
157
- distance_strategy=distance_strategy,
158
- )
159
150
  self._setup_ports()
160
151
 
161
152
  def _setup_ports(self) -> None:
@@ -237,6 +228,14 @@ class PGVectorSearchPlugin(WorkflowPlugin):
237
228
  ) -> Entities:
238
229
  """Run the workflow operator."""
239
230
  self.log.info("Start searching collection.")
231
+ self.db = PGVector(
232
+ collection_name=self.collection_name,
233
+ connection=self.connection_string,
234
+ embeddings=DummyEmbeddings(),
235
+ use_jsonb=True,
236
+ pre_delete_collection=False,
237
+ distance_strategy=self.distance_strategy,
238
+ )
240
239
  self.inputs = inputs
241
240
  self.execution_context = context
242
241
  try:
@@ -137,6 +137,7 @@ class PGVectorStorePlugin(WorkflowPlugin):
137
137
  self.embedding_path = embedding_path
138
138
  self.metadata_paths = metadata_paths
139
139
  self.source_path = source_path
140
+ self.pre_delete_collection = pre_delete_collection
140
141
 
141
142
  self.output_port = None
142
143
  self.input_ports = FixedNumberOfInputs([UnknownSchemaPort()])
@@ -149,14 +150,6 @@ class PGVectorStorePlugin(WorkflowPlugin):
149
150
  self.report.operation = "store"
150
151
  self.report.operation_desc = "vectors stored"
151
152
 
152
- self.db = PGVector(
153
- collection_name=self.collection_name,
154
- connection=self.connection_string,
155
- embeddings=None, # type: ignore # noqa: PGH003
156
- use_jsonb=True,
157
- pre_delete_collection=pre_delete_collection,
158
- )
159
-
160
153
  def _update_report(self, count: int) -> None:
161
154
  self.report.entity_count = count
162
155
  self.execution_context.report.update(self.report)
@@ -228,6 +221,13 @@ class PGVectorStorePlugin(WorkflowPlugin):
228
221
  ) -> None:
229
222
  """Run the workflow operator."""
230
223
  self.log.info("Start storing vectors.")
224
+ self.db = PGVector(
225
+ collection_name=self.collection_name,
226
+ connection=self.connection_string,
227
+ embeddings=None, # type: ignore # noqa: PGH003
228
+ use_jsonb=True,
229
+ pre_delete_collection=self.pre_delete_collection,
230
+ )
231
231
  self.inputs = inputs
232
232
  self.execution_context = context
233
233
  try:
@@ -1,6 +1,6 @@
1
1
  [tool.poetry]
2
2
  name = "cmem-plugin-pgvector"
3
- version = "0.7.0"
3
+ version = "0.7.1"
4
4
  license = "Apache-2.0"
5
5
  description = "Store and search for embedding vectors in a Postgres vector store."
6
6
  authors = ["eccenca GmbH <cmempy-developer@eccenca.com>"]
@@ -40,6 +40,7 @@ pytest-memray = { version = "^1.7.0", markers = "platform_system != 'Windows'"
40
40
  ruff = "^0.12.0"
41
41
  safety = "^1.10.3"
42
42
  aiohttp = "^3.10.11"
43
+ testcontainers = "^4.12.0"
43
44
 
44
45
  [build-system]
45
46
  requires = ["poetry-core>=1.0.0", "poetry-dynamic-versioning"]