digitalkin 0.3.2.dev2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (131):
  1. base_server/__init__.py +1 -0
  2. base_server/mock/__init__.py +5 -0
  3. base_server/mock/mock_pb2.py +39 -0
  4. base_server/mock/mock_pb2_grpc.py +102 -0
  5. base_server/server_async_insecure.py +125 -0
  6. base_server/server_async_secure.py +143 -0
  7. base_server/server_sync_insecure.py +103 -0
  8. base_server/server_sync_secure.py +122 -0
  9. digitalkin/__init__.py +8 -0
  10. digitalkin/__version__.py +8 -0
  11. digitalkin/core/__init__.py +1 -0
  12. digitalkin/core/common/__init__.py +9 -0
  13. digitalkin/core/common/factories.py +156 -0
  14. digitalkin/core/job_manager/__init__.py +1 -0
  15. digitalkin/core/job_manager/base_job_manager.py +288 -0
  16. digitalkin/core/job_manager/single_job_manager.py +354 -0
  17. digitalkin/core/job_manager/taskiq_broker.py +311 -0
  18. digitalkin/core/job_manager/taskiq_job_manager.py +541 -0
  19. digitalkin/core/task_manager/__init__.py +1 -0
  20. digitalkin/core/task_manager/base_task_manager.py +539 -0
  21. digitalkin/core/task_manager/local_task_manager.py +108 -0
  22. digitalkin/core/task_manager/remote_task_manager.py +87 -0
  23. digitalkin/core/task_manager/surrealdb_repository.py +266 -0
  24. digitalkin/core/task_manager/task_executor.py +249 -0
  25. digitalkin/core/task_manager/task_session.py +406 -0
  26. digitalkin/grpc_servers/__init__.py +1 -0
  27. digitalkin/grpc_servers/_base_server.py +486 -0
  28. digitalkin/grpc_servers/module_server.py +208 -0
  29. digitalkin/grpc_servers/module_servicer.py +516 -0
  30. digitalkin/grpc_servers/utils/__init__.py +1 -0
  31. digitalkin/grpc_servers/utils/exceptions.py +29 -0
  32. digitalkin/grpc_servers/utils/grpc_client_wrapper.py +88 -0
  33. digitalkin/grpc_servers/utils/grpc_error_handler.py +53 -0
  34. digitalkin/grpc_servers/utils/utility_schema_extender.py +97 -0
  35. digitalkin/logger.py +157 -0
  36. digitalkin/mixins/__init__.py +19 -0
  37. digitalkin/mixins/base_mixin.py +10 -0
  38. digitalkin/mixins/callback_mixin.py +24 -0
  39. digitalkin/mixins/chat_history_mixin.py +110 -0
  40. digitalkin/mixins/cost_mixin.py +76 -0
  41. digitalkin/mixins/file_history_mixin.py +93 -0
  42. digitalkin/mixins/filesystem_mixin.py +46 -0
  43. digitalkin/mixins/logger_mixin.py +51 -0
  44. digitalkin/mixins/storage_mixin.py +79 -0
  45. digitalkin/models/__init__.py +8 -0
  46. digitalkin/models/core/__init__.py +1 -0
  47. digitalkin/models/core/job_manager_models.py +36 -0
  48. digitalkin/models/core/task_monitor.py +70 -0
  49. digitalkin/models/grpc_servers/__init__.py +1 -0
  50. digitalkin/models/grpc_servers/models.py +275 -0
  51. digitalkin/models/grpc_servers/types.py +24 -0
  52. digitalkin/models/module/__init__.py +25 -0
  53. digitalkin/models/module/module.py +40 -0
  54. digitalkin/models/module/module_context.py +149 -0
  55. digitalkin/models/module/module_types.py +393 -0
  56. digitalkin/models/module/utility.py +146 -0
  57. digitalkin/models/services/__init__.py +10 -0
  58. digitalkin/models/services/cost.py +54 -0
  59. digitalkin/models/services/registry.py +42 -0
  60. digitalkin/models/services/storage.py +44 -0
  61. digitalkin/modules/__init__.py +11 -0
  62. digitalkin/modules/_base_module.py +517 -0
  63. digitalkin/modules/archetype_module.py +23 -0
  64. digitalkin/modules/tool_module.py +23 -0
  65. digitalkin/modules/trigger_handler.py +48 -0
  66. digitalkin/modules/triggers/__init__.py +12 -0
  67. digitalkin/modules/triggers/healthcheck_ping_trigger.py +45 -0
  68. digitalkin/modules/triggers/healthcheck_services_trigger.py +63 -0
  69. digitalkin/modules/triggers/healthcheck_status_trigger.py +52 -0
  70. digitalkin/py.typed +0 -0
  71. digitalkin/services/__init__.py +30 -0
  72. digitalkin/services/agent/__init__.py +6 -0
  73. digitalkin/services/agent/agent_strategy.py +19 -0
  74. digitalkin/services/agent/default_agent.py +13 -0
  75. digitalkin/services/base_strategy.py +22 -0
  76. digitalkin/services/communication/__init__.py +7 -0
  77. digitalkin/services/communication/communication_strategy.py +76 -0
  78. digitalkin/services/communication/default_communication.py +101 -0
  79. digitalkin/services/communication/grpc_communication.py +223 -0
  80. digitalkin/services/cost/__init__.py +14 -0
  81. digitalkin/services/cost/cost_strategy.py +100 -0
  82. digitalkin/services/cost/default_cost.py +114 -0
  83. digitalkin/services/cost/grpc_cost.py +138 -0
  84. digitalkin/services/filesystem/__init__.py +7 -0
  85. digitalkin/services/filesystem/default_filesystem.py +417 -0
  86. digitalkin/services/filesystem/filesystem_strategy.py +252 -0
  87. digitalkin/services/filesystem/grpc_filesystem.py +317 -0
  88. digitalkin/services/identity/__init__.py +6 -0
  89. digitalkin/services/identity/default_identity.py +15 -0
  90. digitalkin/services/identity/identity_strategy.py +14 -0
  91. digitalkin/services/registry/__init__.py +27 -0
  92. digitalkin/services/registry/default_registry.py +141 -0
  93. digitalkin/services/registry/exceptions.py +47 -0
  94. digitalkin/services/registry/grpc_registry.py +306 -0
  95. digitalkin/services/registry/registry_models.py +43 -0
  96. digitalkin/services/registry/registry_strategy.py +98 -0
  97. digitalkin/services/services_config.py +200 -0
  98. digitalkin/services/services_models.py +65 -0
  99. digitalkin/services/setup/__init__.py +1 -0
  100. digitalkin/services/setup/default_setup.py +219 -0
  101. digitalkin/services/setup/grpc_setup.py +343 -0
  102. digitalkin/services/setup/setup_strategy.py +145 -0
  103. digitalkin/services/snapshot/__init__.py +6 -0
  104. digitalkin/services/snapshot/default_snapshot.py +39 -0
  105. digitalkin/services/snapshot/snapshot_strategy.py +30 -0
  106. digitalkin/services/storage/__init__.py +7 -0
  107. digitalkin/services/storage/default_storage.py +228 -0
  108. digitalkin/services/storage/grpc_storage.py +214 -0
  109. digitalkin/services/storage/storage_strategy.py +273 -0
  110. digitalkin/services/user_profile/__init__.py +12 -0
  111. digitalkin/services/user_profile/default_user_profile.py +55 -0
  112. digitalkin/services/user_profile/grpc_user_profile.py +69 -0
  113. digitalkin/services/user_profile/user_profile_strategy.py +40 -0
  114. digitalkin/utils/__init__.py +29 -0
  115. digitalkin/utils/arg_parser.py +92 -0
  116. digitalkin/utils/development_mode_action.py +51 -0
  117. digitalkin/utils/dynamic_schema.py +483 -0
  118. digitalkin/utils/llm_ready_schema.py +75 -0
  119. digitalkin/utils/package_discover.py +357 -0
  120. digitalkin-0.3.2.dev2.dist-info/METADATA +602 -0
  121. digitalkin-0.3.2.dev2.dist-info/RECORD +131 -0
  122. digitalkin-0.3.2.dev2.dist-info/WHEEL +5 -0
  123. digitalkin-0.3.2.dev2.dist-info/licenses/LICENSE +430 -0
  124. digitalkin-0.3.2.dev2.dist-info/top_level.txt +4 -0
  125. modules/__init__.py +0 -0
  126. modules/cpu_intensive_module.py +280 -0
  127. modules/dynamic_setup_module.py +338 -0
  128. modules/minimal_llm_module.py +347 -0
  129. modules/text_transform_module.py +203 -0
  130. services/filesystem_module.py +200 -0
  131. services/storage_module.py +206 -0
@@ -0,0 +1,483 @@
1
+ """Dynamic schema utilities for runtime value refresh in Pydantic models.
2
+
3
+ This module provides a clean way to mark fields as dynamic using Annotated metadata,
4
+ allowing their schema values to be refreshed at runtime via sync or async fetchers.
5
+
6
+ Example:
7
+ from typing import Annotated
8
+ from digitalkin.utils import DynamicField
9
+
10
+ class AgentSetup(SetupModel):
11
+ model_name: Annotated[str, DynamicField(enum=fetch_models)] = Field(default="gpt-4")
12
+
13
+ See Also:
14
+ - Documentation: docs/api/dynamic_schema.md
15
+ - Tests: tests/utils/test_dynamic_schema.py
16
+ """
17
+
18
+ from __future__ import annotations
19
+
20
+ import asyncio
21
+ import time
22
+ import traceback
23
+ from collections.abc import Awaitable, Callable
24
+ from dataclasses import dataclass, field
25
+ from itertools import starmap
26
+ from typing import TYPE_CHECKING, Any, TypeVar
27
+
28
+ from digitalkin.logger import logger
29
+
30
+ if TYPE_CHECKING:
31
+ from pydantic.fields import FieldInfo
32
+
33
# Generic placeholder for the value type a fetcher produces.
T = TypeVar("T")

# Fetcher callable type: a function taking no arguments, either sync or async.
# A sync fetcher returns the value directly; an async fetcher returns an
# awaitable that yields the value.
Fetcher = Callable[[], T | Awaitable[T]]

# Default timeout, in seconds, for fetcher resolution (None = no timeout).
# Used as the default for the `timeout` keyword of resolve() and resolve_safe().
DEFAULT_TIMEOUT: float | None = None
40
+
41
+
42
@dataclass
class ResolveResult:
    """Outcome of resolving a set of dynamic fetchers.

    Successful values and captured exceptions are kept side by side, keyed by
    fetcher name, so a caller can act on whatever did resolve even when some
    fetchers failed.

    Attributes:
        values: Resolved values, keyed by fetcher key name.
        errors: Exceptions raised during resolution, keyed by fetcher key name.
    """

    values: dict[str, Any] = field(default_factory=dict)
    errors: dict[str, Exception] = field(default_factory=dict)

    @property
    def success(self) -> bool:
        """Tell whether resolution finished without any error.

        Returns:
            True when no error was recorded, False otherwise.
        """
        return not self.errors

    @property
    def partial(self) -> bool:
        """Tell whether the outcome mixes successes and failures.

        Returns:
            True when at least one value and at least one error are present.
        """
        has_values = bool(self.values)
        has_errors = bool(self.errors)
        return has_values and has_errors

    def get(self, key: str, default: T | None = None) -> T | None:
        """Look up a resolved value by its fetcher key.

        Args:
            key: The fetcher key name.
            default: Value returned when the key has no resolved value
                (never resolved, or its fetcher errored).

        Returns:
            The resolved value for ``key``, or ``default``.
        """
        if key in self.values:
            return self.values[key]  # type: ignore[return-value]
        return default
86
+
87
+
88
class DynamicField:
    """Annotated-metadata marker that attaches runtime fetchers to a field.

    Place an instance inside ``typing.Annotated`` to flag a field whose schema
    values must be resolved at runtime. Each fetcher is a zero-argument
    callable, sync or async, that produces the value for its key.

    Args:
        **fetchers: Fetcher callables keyed by the schema key they populate
            (e.g., ``enum`` for enum values, ``default`` for a default).

    Example:
        from typing import Annotated

        async def fetch_models() -> list[str]:
            return await api.get_models()

        class Setup(SetupModel):
            model: Annotated[str, DynamicField(enum=fetch_models)] = Field(default="gpt-4")
    """

    __slots__ = ("fetchers",)

    def __init__(self, **fetchers: Fetcher[Any]) -> None:
        """Store the fetcher callables passed as keyword arguments."""
        self.fetchers: dict[str, Fetcher[Any]] = fetchers

    def __repr__(self) -> str:
        """Return a representation listing the fetcher keys."""
        names = ", ".join(self.fetchers)
        return f"DynamicField({names})"

    def __eq__(self, other: object) -> bool:
        """Compare two instances by their fetcher mappings.

        Returns:
            True if both hold equal fetchers, False if they differ, and
            NotImplemented when ``other`` is not a DynamicField.
        """
        if isinstance(other, DynamicField):
            return self.fetchers == other.fetchers
        return NotImplemented

    def __hash__(self) -> int:
        """Hash on the fetcher keys only, since the callables may be unhashable.

        Returns:
            Hash of the sorted tuple of fetcher keys.
        """
        ordered_keys = tuple(sorted(self.fetchers))
        return hash(ordered_keys)
137
+
138
+
139
def get_dynamic_metadata(field_info: FieldInfo) -> DynamicField | None:
    """Find the DynamicField marker in a field's metadata list.

    Args:
        field_info: The Pydantic FieldInfo object to inspect.

    Returns:
        The first DynamicField instance found in ``field_info.metadata``,
        or None when the field carries no such marker.
    """
    markers = (entry for entry in field_info.metadata if isinstance(entry, DynamicField))
    return next(markers, None)
152
+
153
+
154
def has_dynamic(field_info: FieldInfo) -> bool:
    """Report whether a field carries DynamicField metadata.

    Args:
        field_info: The Pydantic FieldInfo object to check.

    Returns:
        True when a DynamicField marker is present in the field's metadata,
        False otherwise.
    """
    marker = get_dynamic_metadata(field_info)
    return marker is not None
164
+
165
+
166
def get_fetchers(field_info: FieldInfo) -> dict[str, Fetcher[Any]]:
    """Return the fetchers attached to a field through DynamicField metadata.

    Args:
        field_info: The Pydantic FieldInfo object to extract from.

    Returns:
        The marker's mapping of key names to fetcher callables, or an empty
        dict when the field has no DynamicField metadata.
    """
    marker = get_dynamic_metadata(field_info)
    return {} if marker is None else marker.fetchers
179
+
180
+
181
def _get_fetcher_info(fetcher: Fetcher[Any]) -> str:
    """Build a human-readable label for a fetcher, for use in log records.

    Args:
        fetcher: The fetcher callable.

    Returns:
        ``module.qualname`` when both attributes exist, otherwise the
        callable's ``__name__``, otherwise its ``repr()``.
    """
    fully_qualified = hasattr(fetcher, "__module__") and hasattr(fetcher, "__qualname__")
    if fully_qualified:
        return f"{fetcher.__module__}.{fetcher.__qualname__}"
    if not hasattr(fetcher, "__name__"):
        # Last resort for callables exposing no naming attributes at all.
        return repr(fetcher)
    return fetcher.__name__
195
+
196
+
197
async def _resolve_one(key: str, fetcher: Fetcher[Any]) -> tuple[str, Any]:
    """Resolve a single fetcher and time the call.

    The fetcher is invoked with no arguments. If it returns an awaitable
    (a coroutine, Future, Task, or any object implementing ``__await__``),
    the awaitable is awaited and its result becomes the resolved value;
    otherwise the return value is used as-is.

    Args:
        key: The fetcher key name.
        fetcher: The fetcher callable.

    Returns:
        Tuple of (key, resolved_value).

    Raises:
        Exception: Whatever the fetcher (or its awaitable) raises; the error
            is logged with timing information and then re-raised unchanged.
    """
    fetcher_info = _get_fetcher_info(fetcher)
    logger.debug(
        "Resolving fetcher '%s' using %s",
        key,
        fetcher_info,
        extra={"fetcher_key": key, "fetcher": fetcher_info},
    )

    start_time = time.perf_counter()

    try:
        result = fetcher()
        # The Fetcher alias promises `T | Awaitable[T]`, so every awaitable must
        # be awaited, not only coroutine objects. Checking coroutines alone
        # would hand back an un-awaited Future/Task as the "resolved" value.
        is_async = asyncio.iscoroutine(result) or isinstance(result, Awaitable)

        if is_async:
            logger.debug(
                "Fetcher '%s' returned coroutine, awaiting...",
                key,
                extra={"fetcher_key": key, "is_async": True},
            )
            result = await result

    except Exception as e:
        elapsed_ms = (time.perf_counter() - start_time) * 1000
        logger.error(
            "Fetcher '%s' (%s) failed after %.2fms: %s: %s",
            key,
            fetcher_info,
            elapsed_ms,
            type(e).__name__,
            str(e) or "(no message)",
            extra={
                "fetcher_key": key,
                "fetcher": fetcher_info,
                "elapsed_ms": elapsed_ms,
                "error_type": type(e).__name__,
                "error_message": str(e),
                "traceback": traceback.format_exc(),
            },
        )
        raise

    elapsed_ms = (time.perf_counter() - start_time) * 1000

    logger.debug(
        "Fetcher '%s' resolved successfully in %.2fms, result type: %s",
        key,
        elapsed_ms,
        type(result).__name__,
        extra={
            "fetcher_key": key,
            "elapsed_ms": elapsed_ms,
            "result_type": type(result).__name__,
        },
    )

    return key, result
267
+
268
+
269
async def resolve(
    fetchers: dict[str, Fetcher[Any]],
    *,
    timeout: float | None = DEFAULT_TIMEOUT,
) -> dict[str, Any]:
    """Resolve all dynamic fetchers to their actual values in parallel.

    Fetchers are executed concurrently using asyncio.gather() for better
    performance when multiple async fetchers are involved.

    Args:
        fetchers: Dict mapping key names to fetcher callables.
        timeout: Optional timeout in seconds for all fetchers combined.
            If None (default), no timeout is applied.

    Returns:
        Dict mapping key names to resolved values, in the order of ``fetchers``.

    Raises:
        asyncio.TimeoutError: If timeout is exceeded.
        Exception: If any fetcher raises an exception, it is propagated.

    Example:
        fetchers = {"enum": fetch_models, "default": get_default}
        resolved = await resolve(fetchers, timeout=5.0)
        # resolved = {"enum": ["gpt-4", "gpt-3.5"], "default": "gpt-4"}
    """
    if not fetchers:
        logger.debug("resolve() called with empty fetchers, returning {}")
        return {}

    fetcher_keys = list(fetchers)
    fetcher_infos = {k: _get_fetcher_info(f) for k, f in fetchers.items()}

    logger.info(
        "resolve() starting parallel resolution of %d fetcher(s): %s",
        len(fetchers),
        fetcher_keys,
        extra={
            "fetcher_count": len(fetchers),
            "fetcher_keys": fetcher_keys,
            "fetcher_infos": fetcher_infos,
            "timeout": timeout,
        },
    )

    start_time = time.perf_counter()

    # One coroutine per fetcher; gather() runs them concurrently and returns
    # their (key, value) pairs in the same order.
    pending = [_resolve_one(key, fetcher) for key, fetcher in fetchers.items()]

    try:
        # wait_for() with timeout=None simply awaits, so a single call covers
        # both the bounded and the unbounded case.
        results = await asyncio.wait_for(asyncio.gather(*pending), timeout=timeout)
    except asyncio.TimeoutError:
        elapsed_ms = (time.perf_counter() - start_time) * 1000
        # A fetcher may itself raise TimeoutError while no overall timeout is
        # configured; formatting None with %.2f would break the log call, so
        # the timeout is rendered up front.
        timeout_text = "None" if timeout is None else f"{timeout:.2f}s"
        logger.error(
            "resolve() timed out after %.2fms (timeout=%s)",
            elapsed_ms,
            timeout_text,
            extra={"elapsed_ms": elapsed_ms, "timeout": timeout},
        )
        raise

    elapsed_ms = (time.perf_counter() - start_time) * 1000
    logger.info(
        "resolve() completed successfully in %.2fms, resolved %d fetcher(s)",
        elapsed_ms,
        len(results),
        extra={"elapsed_ms": elapsed_ms, "resolved_count": len(results)},
    )

    return dict(results)
345
+
346
+
347
async def resolve_safe(
    fetchers: dict[str, Fetcher[Any]],
    *,
    timeout: float | None = DEFAULT_TIMEOUT,
) -> ResolveResult:
    """Resolve fetchers concurrently, collecting failures instead of raising.

    Where `resolve()` propagates the first error, this function records each
    fetcher's exception in the returned result so that the values of the
    fetchers that did succeed remain available.

    Args:
        fetchers: Dict mapping key names to fetcher callables.
        timeout: Optional timeout in seconds for all fetchers combined.
            If None (default), no timeout is applied. The timeout bounds the
            whole operation, not each fetcher individually.

    Returns:
        ResolveResult holding the resolved values and any captured errors.
        On timeout, every key that had not finished is given the timeout
        exception as its error.

    Example:
        result = await resolve_safe(fetchers, timeout=5.0)
        if result.success:
            print("All resolved:", result.values)
        elif result.partial:
            print("Partial success:", result.values)
            print("Errors:", result.errors)
        else:
            print("All failed:", result.errors)
    """
    if not fetchers:
        logger.debug("resolve_safe() called with empty fetchers, returning empty ResolveResult")
        return ResolveResult()

    names = list(fetchers)
    descriptions = {name: _get_fetcher_info(fn) for name, fn in fetchers.items()}

    logger.info(
        "resolve_safe() starting parallel resolution of %d fetcher(s): %s",
        len(fetchers),
        names,
        extra={
            "fetcher_count": len(fetchers),
            "fetcher_keys": names,
            "fetcher_infos": descriptions,
            "timeout": timeout,
        },
    )

    started = time.perf_counter()
    outcome = ResolveResult()

    async def capture(name: str, fn: Fetcher[Any]) -> None:
        """Run one fetcher and file its value or its exception under ``name``."""
        try:
            _, resolved = await _resolve_one(name, fn)
            outcome.values[name] = resolved
        except Exception as exc:
            # _resolve_one has already logged the failure; only record it here.
            outcome.errors[name] = exc

    # One coroutine per fetcher, run concurrently through gather().
    batch = asyncio.gather(*[capture(name, fn) for name, fn in fetchers.items()])

    try:
        if timeout is None:
            await batch
        else:
            await asyncio.wait_for(batch, timeout=timeout)
    except asyncio.TimeoutError as exc:
        elapsed_ms = (time.perf_counter() - started) * 1000
        # Any key with neither a value nor an error was still running when
        # the deadline hit: attribute the timeout to it.
        finished = set(outcome.values) | set(outcome.errors)
        timed_out_keys = [name for name in fetchers if name not in finished]
        outcome.errors.update(dict.fromkeys(timed_out_keys, exc))

        logger.error(
            "resolve_safe() timed out after %.2fms (timeout=%.2fs), %d succeeded, %d failed, %d timed out",
            elapsed_ms,
            timeout,
            len(outcome.values),
            len(outcome.errors) - len(timed_out_keys),
            len(timed_out_keys),
            extra={
                "elapsed_ms": elapsed_ms,
                "timeout": timeout,
                "succeeded_keys": list(outcome.values),
                "failed_keys": [name for name in outcome.errors if name not in timed_out_keys],
                "timed_out_keys": timed_out_keys,
            },
        )

    elapsed_ms = (time.perf_counter() - started) * 1000
    value_count = len(outcome.values)
    error_count = len(outcome.errors)

    # Summary record: info on full success, warning on a mix, error otherwise.
    if outcome.success:
        logger.info(
            "resolve_safe() completed successfully in %.2fms, all %d fetcher(s) resolved",
            elapsed_ms,
            value_count,
            extra={
                "elapsed_ms": elapsed_ms,
                "success": True,
                "resolved_count": value_count,
            },
        )
    elif outcome.partial:
        logger.warning(
            "resolve_safe() completed with partial success in %.2fms: %d succeeded, %d failed",
            elapsed_ms,
            value_count,
            error_count,
            extra={
                "elapsed_ms": elapsed_ms,
                "success": False,
                "partial": True,
                "resolved_count": value_count,
                "error_count": error_count,
                "succeeded_keys": list(outcome.values),
                "failed_keys": list(outcome.errors),
            },
        )
    else:
        logger.error(
            "resolve_safe() completed with all failures in %.2fms: %d failed",
            elapsed_ms,
            error_count,
            extra={
                "elapsed_ms": elapsed_ms,
                "success": False,
                "partial": False,
                "error_count": error_count,
                "failed_keys": list(outcome.errors),
            },
        )

    return outcome
@@ -0,0 +1,75 @@
1
+ """LLM format schema for Pydantic models.
2
+
3
+ This module provides functionality to generate JSON schemas for Pydantic models ready for LLMs.
4
+ """
5
+
6
+ import copy
7
+ from typing import Any
8
+
9
+ from pydantic import BaseModel
10
+ from pydantic.json_schema import GenerateJsonSchema, JsonSchemaValue
11
+
12
+
13
class CustomOrderSchema(GenerateJsonSchema):
    """Schema generator that emits a fixed set of keys ahead of all others."""

    def sort(self, value: JsonSchemaValue, parent_key: str | None = None) -> JsonSchemaValue:  # noqa: ARG002
        """Reorder schema keys so the preferred ones come first, recursively.

        Dicts are rebuilt with ``title``, ``description``, ``type``,
        ``examples`` and ``properties`` first (when present), followed by the
        remaining keys in their existing order. Lists are processed element
        by element; any other value is returned untouched.

        Args:
            value: The schema value to sort.
            parent_key: The parent key of the schema value (not used here).

        Returns:
            The reordered schema value.
        """
        if isinstance(value, list):
            return [self.sort(item) for item in value]
        if not isinstance(value, dict):
            return value

        leading = ["title", "description", "type", "examples", "properties"]
        # Preferred keys that exist, then everything else as originally ordered.
        ordered = [name for name in leading if name in value]
        ordered.extend(name for name in value if name not in leading)
        return {name: self.sort(value[name], name) for name in ordered}
36
+
37
+
38
def inline_refs(schema: dict) -> dict:
    """Recursively resolve and inline the local ``$ref`` entries of a schema.

    Every ``{"$ref": "#/$defs/<name>"}`` is replaced by the (itself inlined)
    definition it points to, and the top-level ``$defs`` section is dropped.
    The input schema is never mutated.

    Special cases:
        - Keys sitting next to ``$ref`` (e.g. a field-level ``description``
          or ``default``) are kept and take precedence over the same keys of
          the inlined definition.
        - A reference that points back into a definition currently being
          inlined (a self-referential model) cannot be expanded; it is left
          as a ``$ref`` and the definitions it needs are retained under
          ``$defs`` in the result.
        - A ``$ref`` that is not a string, does not start with ``#/$defs/``,
          or names an unknown definition is left unchanged.

    Args:
        schema: The JSON schema to inline.

    Returns:
        The inlined JSON schema.
    """
    schema = copy.deepcopy(schema)
    defs = schema.pop("$defs", {})
    prefix = "#/$defs/"
    # Names of definitions that are referenced recursively and therefore must
    # survive in the output's `$defs`.
    recursive: set[str] = set()

    def _resolve(obj: Any, active: tuple[str, ...]) -> Any:  # noqa: ANN401
        """Inline refs in ``obj``; ``active`` holds the defs being expanded."""
        if isinstance(obj, list):
            return [_resolve(item, active) for item in obj]
        if not isinstance(obj, dict):
            return obj

        ref = obj.get("$ref")
        # The isinstance guard matters: inside "properties" a field may be
        # literally named "$ref", in which case the value is a sub-schema dict.
        if isinstance(ref, str) and ref.startswith(prefix):
            key = ref[len(prefix) :]
            if key in active:
                # Expanding again would never terminate; keep the reference.
                recursive.add(key)
            elif key in defs:
                target = _resolve(defs[key], (*active, key))
                if not isinstance(target, dict):
                    return target
                siblings = {k: _resolve(v, active) for k, v in obj.items() if k != "$ref"}
                return {**target, **siblings}
        return {k: _resolve(v, active) for k, v in obj.items()}

    resolved = _resolve(schema, ())

    # Inline the retained definitions too; doing so may uncover further
    # recursive definitions, so repeat until none are missing.
    kept: dict[str, Any] = {}
    missing = sorted(recursive.difference(kept))
    while missing:
        for key in missing:
            kept[key] = _resolve(defs[key], (key,))
        missing = sorted(recursive.difference(kept))

    if kept and isinstance(resolved, dict):
        resolved["$defs"] = kept
    return resolved
63
+
64
+
65
def llm_ready_schema(model: type[BaseModel]) -> dict:
    """Produce an LLM-ready JSON schema for a Pydantic model.

    The schema is generated with `CustomOrderSchema` and then passed through
    `inline_refs`.

    Args:
        model: The Pydantic model to convert.

    Returns:
        The JSON schema as a dictionary.
    """
    return inline_refs(model.model_json_schema(schema_generator=CustomOrderSchema))