diracx-db 0.0.1a45__py3-none-any.whl → 0.0.1a47__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
diracx/db/__main__.py CHANGED
@@ -31,7 +31,6 @@ async def init_sql():
31
31
  from diracx.db.sql.utils import BaseSQLDB
32
32
 
33
33
  for db_name, db_url in BaseSQLDB.available_urls().items():
34
-
35
34
  logger.info("Initialising %s", db_name)
36
35
  db = BaseSQLDB.available_implementations(db_name)[0](db_url)
37
36
  async with db.engine_context():
@@ -9,13 +9,19 @@ class JobParametersDB(BaseOSDB):
9
9
  fields = {
10
10
  "JobID": {"type": "long"},
11
11
  "timestamp": {"type": "date"},
12
+ "PilotAgent": {"type": "keyword"},
13
+ "Pilot_Reference": {"type": "keyword"},
14
+ "JobGroup": {"type": "keyword"},
12
15
  "CPUNormalizationFactor": {"type": "long"},
13
16
  "NormCPUTime(s)": {"type": "long"},
14
- "Memory(kB)": {"type": "long"},
17
+ "Memory(MB)": {"type": "long"},
18
+ "LocalAccount": {"type": "keyword"},
15
19
  "TotalCPUTime(s)": {"type": "long"},
16
- "MemoryUsed(kb)": {"type": "long"},
17
- "HostName": {"type": "keyword"},
20
+ "PayloadPID": {"type": "long"},
21
+ "HostName": {"type": "text"},
18
22
  "GridCE": {"type": "keyword"},
23
+ "CEQueue": {"type": "keyword"},
24
+ "BatchSystem": {"type": "keyword"},
19
25
  "ModelName": {"type": "keyword"},
20
26
  "Status": {"type": "keyword"},
21
27
  "JobType": {"type": "keyword"},
diracx/db/sql/dummy/db.py CHANGED
@@ -1,9 +1,9 @@
1
1
  from __future__ import annotations
2
2
 
3
- from sqlalchemy import func, insert, select
3
+ from sqlalchemy import insert
4
4
  from uuid_utils import UUID
5
5
 
6
- from diracx.db.sql.utils import BaseSQLDB, apply_search_filters
6
+ from diracx.db.sql.utils import BaseSQLDB
7
7
 
8
8
  from .schema import Base as DummyDBBase
9
9
  from .schema import Cars, Owners
@@ -22,18 +22,7 @@ class DummyDB(BaseSQLDB):
22
22
  metadata = DummyDBBase.metadata
23
23
 
24
24
  async def summary(self, group_by, search) -> list[dict[str, str | int]]:
25
- columns = [Cars.__table__.columns[x] for x in group_by]
26
-
27
- stmt = select(*columns, func.count(Cars.license_plate).label("count"))
28
- stmt = apply_search_filters(Cars.__table__.columns.__getitem__, stmt, search)
29
- stmt = stmt.group_by(*columns)
30
-
31
- # Execute the query
32
- return [
33
- dict(row._mapping)
34
- async for row in (await self.conn.stream(stmt))
35
- if row.count > 0 # type: ignore
36
- ]
25
+ return await self._summary(Cars, group_by, search)
37
26
 
38
27
  async def insert_owner(self, name: str) -> int:
39
28
  stmt = insert(Owners).values(name=name)
diracx/db/sql/job/db.py CHANGED
@@ -5,7 +5,7 @@ __all__ = ["JobDB"]
5
5
  from datetime import datetime, timezone
6
6
  from typing import TYPE_CHECKING, Any, Iterable
7
7
 
8
- from sqlalchemy import bindparam, case, delete, func, insert, select, update
8
+ from sqlalchemy import bindparam, case, delete, insert, select, update
9
9
 
10
10
  if TYPE_CHECKING:
11
11
  from sqlalchemy.sql.elements import BindParameter
@@ -13,7 +13,7 @@ if TYPE_CHECKING:
13
13
  from diracx.core.exceptions import InvalidQueryError
14
14
  from diracx.core.models import JobCommand, SearchSpec, SortSpec
15
15
 
16
- from ..utils import BaseSQLDB, apply_search_filters, apply_sort_constraints
16
+ from ..utils import BaseSQLDB, _get_columns
17
17
  from ..utils.functions import utcnow
18
18
  from .schema import (
19
19
  HeartBeatLoggingInfo,
@@ -25,17 +25,6 @@ from .schema import (
25
25
  )
26
26
 
27
27
 
28
- def _get_columns(table, parameters):
29
- columns = [x for x in table.columns]
30
- if parameters:
31
- if unrecognised_parameters := set(parameters) - set(table.columns.keys()):
32
- raise InvalidQueryError(
33
- f"Unrecognised parameters requested {unrecognised_parameters}"
34
- )
35
- columns = [c for c in columns if c.name in parameters]
36
- return columns
37
-
38
-
39
28
  class JobDB(BaseSQLDB):
40
29
  metadata = JobDBBase.metadata
41
30
 
@@ -54,20 +43,11 @@ class JobDB(BaseSQLDB):
54
43
  # to find a way to make it dynamic
55
44
  jdl_2_db_parameters = ["JobName", "JobType", "JobGroup"]
56
45
 
57
- async def summary(self, group_by, search) -> list[dict[str, str | int]]:
46
+ async def summary(
47
+ self, group_by: list[str], search: list[SearchSpec]
48
+ ) -> list[dict[str, str | int]]:
58
49
  """Get a summary of the jobs."""
59
- columns = _get_columns(Jobs.__table__, group_by)
60
-
61
- stmt = select(*columns, func.count(Jobs.job_id).label("count"))
62
- stmt = apply_search_filters(Jobs.__table__.columns.__getitem__, stmt, search)
63
- stmt = stmt.group_by(*columns)
64
-
65
- # Execute the query
66
- return [
67
- dict(row._mapping)
68
- async for row in (await self.conn.stream(stmt))
69
- if row.count > 0 # type: ignore
70
- ]
50
+ return await self._summary(table=Jobs, group_by=group_by, search=search)
71
51
 
72
52
  async def search(
73
53
  self,
@@ -80,34 +60,15 @@ class JobDB(BaseSQLDB):
80
60
  page: int | None = None,
81
61
  ) -> tuple[int, list[dict[Any, Any]]]:
82
62
  """Search for jobs in the database."""
83
- # Find which columns to select
84
- columns = _get_columns(Jobs.__table__, parameters)
85
-
86
- stmt = select(*columns)
87
-
88
- stmt = apply_search_filters(Jobs.__table__.columns.__getitem__, stmt, search)
89
- stmt = apply_sort_constraints(Jobs.__table__.columns.__getitem__, stmt, sorts)
90
-
91
- if distinct:
92
- stmt = stmt.distinct()
93
-
94
- # Calculate total count before applying pagination
95
- total_count_subquery = stmt.alias()
96
- total_count_stmt = select(func.count()).select_from(total_count_subquery)
97
- total = (await self.conn.execute(total_count_stmt)).scalar_one()
98
-
99
- # Apply pagination
100
- if page is not None:
101
- if page < 1:
102
- raise InvalidQueryError("Page must be a positive integer")
103
- if per_page < 1:
104
- raise InvalidQueryError("Per page must be a positive integer")
105
- stmt = stmt.offset((page - 1) * per_page).limit(per_page)
106
-
107
- # Execute the query
108
- return total, [
109
- dict(row._mapping) async for row in (await self.conn.stream(stmt))
110
- ]
63
+ return await self._search(
64
+ table=Jobs,
65
+ parameters=parameters,
66
+ search=search,
67
+ sorts=sorts,
68
+ distinct=distinct,
69
+ per_page=per_page,
70
+ page=page,
71
+ )
111
72
 
112
73
  async def create_job(self, compressed_original_jdl: str):
113
74
  """Used to insert a new job with original JDL. Returns inserted job id."""
@@ -89,7 +89,6 @@ class JobLoggingDB(BaseSQLDB):
89
89
  status_time,
90
90
  status_source,
91
91
  ) in rows:
92
-
93
92
  values[job_id].append(
94
93
  [
95
94
  status,
@@ -20,7 +20,6 @@ class PilotAgentsDB(BaseSQLDB):
20
20
  grid_type: str = "DIRAC",
21
21
  pilot_stamps: dict | None = None,
22
22
  ) -> None:
23
-
24
23
  if pilot_stamps is None:
25
24
  pilot_stamps = {}
26
25
 
@@ -13,6 +13,7 @@ from sqlalchemy import (
13
13
  Table,
14
14
  and_,
15
15
  delete,
16
+ exists,
16
17
  insert,
17
18
  literal,
18
19
  or_,
@@ -236,7 +237,10 @@ class SandboxMetadataDB(BaseSQLDB):
236
237
  """
237
238
  conditions = [
238
239
  # If it has assigned to a job but is no longer mapped it can be removed
239
- # and_(SandBoxes.Assigned, ~exists(SandBoxes.SBId == SBEntityMapping.SBId)),
240
+ and_(
241
+ SandBoxes.Assigned,
242
+ ~exists().where(SBEntityMapping.SBId == SandBoxes.SBId),
243
+ ),
240
244
  # If the sandbox is still unassigned after 15 days, remove it
241
245
  and_(~SandBoxes.Assigned, days_since(SandBoxes.LastAccessTime) >= 15),
242
246
  ]
@@ -3,6 +3,7 @@ from __future__ import annotations
3
3
  from .base import (
4
4
  BaseSQLDB,
5
5
  SQLDBUnavailableError,
6
+ _get_columns,
6
7
  apply_search_filters,
7
8
  apply_sort_constraints,
8
9
  )
@@ -10,6 +11,7 @@ from .functions import hash, substract_date, utcnow
10
11
  from .types import Column, DateNowColumn, EnumBackedBool, EnumColumn, NullColumn
11
12
 
12
13
  __all__ = (
14
+ "_get_columns",
13
15
  "utcnow",
14
16
  "Column",
15
17
  "NullColumn",
@@ -8,16 +8,20 @@ from abc import ABCMeta
8
8
  from collections.abc import AsyncIterator
9
9
  from contextvars import ContextVar
10
10
  from datetime import datetime
11
- from typing import Self, cast
11
+ from typing import Any, Self, cast
12
12
 
13
13
  from pydantic import TypeAdapter
14
- from sqlalchemy import DateTime, MetaData, select
14
+ from sqlalchemy import DateTime, MetaData, func, select
15
15
  from sqlalchemy.exc import OperationalError
16
16
  from sqlalchemy.ext.asyncio import AsyncConnection, AsyncEngine, create_async_engine
17
17
 
18
18
  from diracx.core.exceptions import InvalidQueryError
19
19
  from diracx.core.extensions import select_from_extension
20
- from diracx.core.models import SortDirection
20
+ from diracx.core.models import (
21
+ SearchSpec,
22
+ SortDirection,
23
+ SortSpec,
24
+ )
21
25
  from diracx.core.settings import SqlalchemyDsn
22
26
  from diracx.db.exceptions import DBUnavailableError
23
27
 
@@ -227,6 +231,71 @@ class BaseSQLDB(metaclass=ABCMeta):
227
231
  except OperationalError as e:
228
232
  raise SQLDBUnavailableError("Cannot ping the DB") from e
229
233
 
234
+ async def _search(
235
+ self,
236
+ table: Any,
237
+ parameters: list[str] | None,
238
+ search: list[SearchSpec],
239
+ sorts: list[SortSpec],
240
+ *,
241
+ distinct: bool = False,
242
+ per_page: int = 100,
243
+ page: int | None = None,
244
+ ) -> tuple[int, list[dict[str, Any]]]:
245
+ """Search for elements in a table."""
246
+ # Find which columns to select
247
+ columns = _get_columns(table.__table__, parameters)
248
+
249
+ stmt = select(*columns)
250
+
251
+ stmt = apply_search_filters(table.__table__.columns.__getitem__, stmt, search)
252
+ stmt = apply_sort_constraints(table.__table__.columns.__getitem__, stmt, sorts)
253
+
254
+ if distinct:
255
+ stmt = stmt.distinct()
256
+
257
+ # Calculate total count before applying pagination
258
+ total_count_subquery = stmt.alias()
259
+ total_count_stmt = select(func.count()).select_from(total_count_subquery)
260
+ total = (await self.conn.execute(total_count_stmt)).scalar_one()
261
+
262
+ # Apply pagination
263
+ if page is not None:
264
+ if page < 1:
265
+ raise InvalidQueryError("Page must be a positive integer")
266
+ if per_page < 1:
267
+ raise InvalidQueryError("Per page must be a positive integer")
268
+ stmt = stmt.offset((page - 1) * per_page).limit(per_page)
269
+
270
+ # Execute the query
271
+ return total, [
272
+ dict(row._mapping) async for row in (await self.conn.stream(stmt))
273
+ ]
274
+
275
+ async def _summary(
276
+ self, table: Any, group_by: list[str], search: list[SearchSpec]
277
+ ) -> list[dict[str, str | int]]:
278
+ """Get a summary of the elements of a table."""
279
+ columns = _get_columns(table.__table__, group_by)
280
+
281
+ pk_columns = list(table.__table__.primary_key.columns)
282
+ if not pk_columns:
283
+ raise ValueError(
284
+ "Model has no primary key and no count_column was provided."
285
+ )
286
+ count_col = pk_columns[0]
287
+
288
+ stmt = select(*columns, func.count(count_col).label("count"))
289
+ stmt = apply_search_filters(table.__table__.columns.__getitem__, stmt, search)
290
+ stmt = stmt.group_by(*columns)
291
+
292
+ # Execute the query
293
+ return [
294
+ dict(row._mapping)
295
+ async for row in (await self.conn.stream(stmt))
296
+ if row.count > 0 # type: ignore
297
+ ]
298
+
230
299
 
231
300
  def find_time_resolution(value):
232
301
  if isinstance(value, datetime):
@@ -258,6 +327,17 @@ def find_time_resolution(value):
258
327
  raise InvalidQueryError(f"Cannot parse {value=}")
259
328
 
260
329
 
330
+ def _get_columns(table, parameters):
331
+ columns = [x for x in table.columns]
332
+ if parameters:
333
+ if unrecognised_parameters := set(parameters) - set(table.columns.keys()):
334
+ raise InvalidQueryError(
335
+ f"Unrecognised parameters requested {unrecognised_parameters}"
336
+ )
337
+ columns = [c for c in columns if c.name in parameters]
338
+ return columns
339
+
340
+
261
341
  def apply_search_filters(column_mapping, stmt, search):
262
342
  for query in search:
263
343
  try:
@@ -300,6 +380,15 @@ def apply_search_filters(column_mapping, stmt, search):
300
380
  expr = column.like(query["value"])
301
381
  elif query["operator"] in "ilike":
302
382
  expr = column.ilike(query["value"])
383
+ elif query["operator"] == "not like":
384
+ expr = column.not_like(query["value"])
385
+ elif query["operator"] == "regex":
386
+ # We check the regex validity here
387
+ try:
388
+ re.compile(query["value"])
389
+ except re.error as e:
390
+ raise InvalidQueryError(f"Invalid regex {query['value']}") from e
391
+ expr = column.regexp_match(query["value"])
303
392
  else:
304
393
  raise InvalidQueryError(f"Unknown filter {query=}")
305
394
  stmt = stmt.where(expr)
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: diracx-db
3
- Version: 0.0.1a45
3
+ Version: 0.0.1a47
4
4
  Summary: TODO
5
5
  License: GPL-3.0-only
6
6
  Classifier: Intended Audience :: Science/Research
@@ -1,37 +1,37 @@
1
1
  diracx/db/__init__.py,sha256=2oeUeVwZq53bo_ZOflEYZsBn7tcR5Tzb2AIu0TAWELM,109
2
- diracx/db/__main__.py,sha256=tU4tp3OAClYCiPMxlRj524sZGBx9oy4CoWHd8pMuEEs,1715
2
+ diracx/db/__main__.py,sha256=3yaUP1ig-yaPSQM4wy6CtSXXHivQg-hIz2FeBt7joBc,1714
3
3
  diracx/db/exceptions.py,sha256=1nn-SZLG-nQwkxbvHjZqXhE5ouzWj1f3qhSda2B4ZEg,83
4
4
  diracx/db/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
5
5
  diracx/db/os/__init__.py,sha256=IZr6z6SefrRvuC8sTC4RmB3_wwOyEt1GzpDuwSMH8O4,112
6
- diracx/db/os/job_parameters.py,sha256=loAc-bo3u-RMAp_H1g8VRt8T-rCCsXp_d9aCvg5OS-A,1225
6
+ diracx/db/os/job_parameters.py,sha256=3w_CeA2z-cY5pWwXkGu-Fod27FobbUXuwVKK-jN037U,1479
7
7
  diracx/db/os/utils.py,sha256=V4T-taos64SFNcorfIr7mq5l5y88K6TzyCj1YqWk8VI,11562
8
8
  diracx/db/sql/__init__.py,sha256=JYu0b0IVhoXy3lX2m2r2dmAjsRS7IbECBUMEDvX0Te4,391
9
9
  diracx/db/sql/auth/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
10
10
  diracx/db/sql/auth/db.py,sha256=QJtBqMrhOf97UvMG0WpyjsgIRiu19v04FoDzXAyXtT0,8952
11
11
  diracx/db/sql/auth/schema.py,sha256=x2PEbmM_bNPdZUN5BMGMrdSmX8zkDeJ3P9XfhLBGBTs,3173
12
12
  diracx/db/sql/dummy/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
13
- diracx/db/sql/dummy/db.py,sha256=IW4FzG7ERKbhZvC32KL7Rodu2u-zKAf8BryO4VAdJew,1650
13
+ diracx/db/sql/dummy/db.py,sha256=MKSUSJI1BlRgK08tjCfkCkOz02asvJAeBw60pAdiGV8,1212
14
14
  diracx/db/sql/dummy/schema.py,sha256=9zI53pKlzc6qBezsyjkatOQrNZdGCjwgjQ8Iz_pyAXs,789
15
15
  diracx/db/sql/job/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
16
- diracx/db/sql/job/db.py,sha256=TnEc0fckiuMJAZg2v1_Pbwfn7kDPDam6TXp9ySuiddk,11910
16
+ diracx/db/sql/job/db.py,sha256=TsHbMVUO-87228hVbodGQclTgY2b7fI0XBsbNbCVgc4,10298
17
17
  diracx/db/sql/job/schema.py,sha256=eFgZshe6NEzOM2qI0HI9Y3abrqDMoQIwa9L0vZugHcU,5431
18
18
  diracx/db/sql/job_logging/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
19
- diracx/db/sql/job_logging/db.py,sha256=BYzlPuvdvHR7wdzQEVWMH_V5kL0bLBZtQkcugnSGbjs,5497
19
+ diracx/db/sql/job_logging/db.py,sha256=hyklARuEj3R1sSJ8UaObRprmsRx7RjbKAcbfgT9BwRg,5496
20
20
  diracx/db/sql/job_logging/schema.py,sha256=k6uBw-RHAcJ5GEleNpiWoXEJBhCiNG-y4xAgBKHZjjM,2524
21
21
  diracx/db/sql/pilot_agents/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
22
- diracx/db/sql/pilot_agents/db.py,sha256=7-cuCbh_KhM0jlybsHMWV-W66bHsPHIVBpbuqwjncj0,1232
22
+ diracx/db/sql/pilot_agents/db.py,sha256=6CQ0QGV4NhsGKVCygEtE4kmIjT89xJwrIMuYZTslWFE,1231
23
23
  diracx/db/sql/pilot_agents/schema.py,sha256=KeWnFSpYOTrT3-_rOCFjbjNnPNXKnUZiJVsu4vv5U2U,2149
24
24
  diracx/db/sql/sandbox_metadata/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
25
- diracx/db/sql/sandbox_metadata/db.py,sha256=DAmuk-PDGKq3eLV2EovDGnJI0GDiH5u8C74ARIy8MWo,10171
25
+ diracx/db/sql/sandbox_metadata/db.py,sha256=FtyPx6GAGJAH-lmuw8PQj6_KGHG6t3AC3-E9uWf-JNs,10236
26
26
  diracx/db/sql/sandbox_metadata/schema.py,sha256=V5gV2PHwzTbBz_th9ribLfE7Lqk8YGemDmvqq4jWQJ4,1530
27
27
  diracx/db/sql/task_queue/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
28
28
  diracx/db/sql/task_queue/db.py,sha256=2qul1D2tX2uCI92N591WK5xWHakG0pNibzDwKQ7W-I8,6246
29
29
  diracx/db/sql/task_queue/schema.py,sha256=5efAgvNYRkLlaJ2NzRInRfmVa3tyIzQu2l0oRPy4Kzw,3258
30
- diracx/db/sql/utils/__init__.py,sha256=QkvpqBuIAgkAOywAssYzdxSzUQVZlSUumK7mPxotXfM,547
31
- diracx/db/sql/utils/base.py,sha256=HYQuX16mgg9LAMtAEmbTmJFIN0OSMe1Hcb57dtl7LCc,12367
30
+ diracx/db/sql/utils/__init__.py,sha256=XYbv-AJAPl7bb8dETpjc07olmtXQ0h1MFUbLqjAphQE,585
31
+ diracx/db/sql/utils/base.py,sha256=snZFJmUJV-wweZLpio29MxuPFghfugpVMDC1iE_jM7w,15568
32
32
  diracx/db/sql/utils/functions.py,sha256=_E4tc9Gti6LuSh7QEyoqPJSvCuByVqvRenOXCzxsulE,4014
33
33
  diracx/db/sql/utils/types.py,sha256=yU-tXsu6hFGPsr9ba1n3ZjGPnHQI_06lbpkTeDCWJtg,1287
34
- diracx_db-0.0.1a45.dist-info/METADATA,sha256=ET2Uo-DegfUc6qRqvicSGR7PpWTtc4yXJKqoZQRbXyQ,675
35
- diracx_db-0.0.1a45.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
36
- diracx_db-0.0.1a45.dist-info/entry_points.txt,sha256=UPqhLvb9gui0kOyWeI_edtefcrHToZmQt1p76vIwujo,317
37
- diracx_db-0.0.1a45.dist-info/RECORD,,
34
+ diracx_db-0.0.1a47.dist-info/METADATA,sha256=z9GxhxY4-mwWkwLQ1Ue72mU28cXPAB2W4tr_UU2J6yA,675
35
+ diracx_db-0.0.1a47.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
36
+ diracx_db-0.0.1a47.dist-info/entry_points.txt,sha256=UPqhLvb9gui0kOyWeI_edtefcrHToZmQt1p76vIwujo,317
37
+ diracx_db-0.0.1a47.dist-info/RECORD,,