pyoco 0.5.0__tar.gz → 0.6.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (56) hide show
  1. {pyoco-0.5.0 → pyoco-0.6.0}/PKG-INFO +16 -9
  2. {pyoco-0.5.0 → pyoco-0.6.0}/README.md +15 -8
  3. {pyoco-0.5.0 → pyoco-0.6.0}/pyproject.toml +1 -1
  4. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/__init__.py +2 -1
  5. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/cli/main.py +133 -5
  6. pyoco-0.6.0/src/pyoco/core/exceptions.py +51 -0
  7. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/core/models.py +44 -3
  8. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/discovery/loader.py +46 -61
  9. pyoco-0.6.0/src/pyoco/discovery/plugins.py +210 -0
  10. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/schemas/config.py +10 -13
  11. pyoco-0.6.0/src/pyoco/support/__init__.py +21 -0
  12. pyoco-0.6.0/src/pyoco/support/collector.py +56 -0
  13. pyoco-0.6.0/src/pyoco/support/filters.py +56 -0
  14. pyoco-0.6.0/src/pyoco/support/renderer.py +188 -0
  15. pyoco-0.6.0/src/pyoco/support/service.py +42 -0
  16. pyoco-0.6.0/src/pyoco/support/writer.py +15 -0
  17. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco.egg-info/PKG-INFO +16 -9
  18. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco.egg-info/SOURCES.txt +7 -0
  19. {pyoco-0.5.0 → pyoco-0.6.0}/tests/test_e2e_socketless.py +0 -1
  20. pyoco-0.6.0/tests/test_e2e_support_info.py +77 -0
  21. {pyoco-0.5.0 → pyoco-0.6.0}/tests/test_integration_v030.py +0 -1
  22. {pyoco-0.5.0 → pyoco-0.6.0}/tests/test_socketless_basic.py +0 -1
  23. pyoco-0.5.0/src/pyoco/core/exceptions.py +0 -15
  24. pyoco-0.5.0/src/pyoco/discovery/plugins.py +0 -92
  25. {pyoco-0.5.0 → pyoco-0.6.0}/setup.cfg +0 -0
  26. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/cli/entry.py +0 -0
  27. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/client.py +0 -0
  28. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/core/base_task.py +0 -0
  29. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/core/context.py +0 -0
  30. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/core/engine.py +0 -0
  31. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/dsl/__init__.py +0 -0
  32. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/dsl/expressions.py +0 -0
  33. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/dsl/nodes.py +0 -0
  34. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/dsl/syntax.py +0 -0
  35. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/dsl/validator.py +0 -0
  36. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/server/__init__.py +0 -0
  37. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/server/api.py +0 -0
  38. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/server/metrics.py +0 -0
  39. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/server/models.py +0 -0
  40. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/server/store.py +0 -0
  41. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/server/webhook.py +0 -0
  42. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/socketless_reset.py +0 -0
  43. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/trace/backend.py +0 -0
  44. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/trace/console.py +0 -0
  45. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/worker/__init__.py +0 -0
  46. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/worker/client.py +0 -0
  47. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco/worker/runner.py +0 -0
  48. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco.egg-info/dependency_links.txt +0 -0
  49. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco.egg-info/requires.txt +0 -0
  50. {pyoco-0.5.0 → pyoco-0.6.0}/src/pyoco.egg-info/top_level.txt +0 -0
  51. {pyoco-0.5.0 → pyoco-0.6.0}/tests/test_cancellation.py +0 -0
  52. {pyoco-0.5.0 → pyoco-0.6.0}/tests/test_cli_cancellation.py +0 -0
  53. {pyoco-0.5.0 → pyoco-0.6.0}/tests/test_dsl.py +0 -0
  54. {pyoco-0.5.0 → pyoco-0.6.0}/tests/test_engine.py +0 -0
  55. {pyoco-0.5.0 → pyoco-0.6.0}/tests/test_engine_state.py +0 -0
  56. {pyoco-0.5.0 → pyoco-0.6.0}/tests/test_state_models.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: pyoco
3
- Version: 0.5.0
3
+ Version: 0.6.0
4
4
  Summary: A workflow engine with sugar syntax
5
5
  Requires-Python: >=3.10
6
6
  Description-Content-Type: text/markdown
@@ -133,22 +133,29 @@ Or via CLI flag:
133
133
  pyoco run --non-cute ...
134
134
  ```
135
135
 
136
- ## 🔭 Observability Bridge (v0.5)
136
+ ## 🔭 Observability / Server (Archived)
137
137
 
138
- - `/metrics` exposes Prometheus counters (`pyoco_runs_total`, `pyoco_runs_in_progress`) and histograms (`pyoco_task_duration_seconds`, `pyoco_run_duration_seconds`). Point Grafana/Prometheus at it to watch pipelines without opening sockets.
139
- - `/runs` now accepts `status`, `flow`, `limit` query params; `/runs/{id}/logs?tail=100` fetches only the latest snippets for dashboards.
140
- - Webhook notifications fire when runs COMPLETE/FAIL—configure via `PYOCO_WEBHOOK_*` env vars and forward to Slack or your alerting stack.
141
- - Import `docs/grafana_pyoco_cute.json` for a lavender/orange starter dashboard (3 panels: in-progress count, completion trend, per-flow latency).
142
- - 詳細な手順は [docs/observability.md](docs/observability.md) を参照してください。
138
+ Observability and server-related docs are archived and out of scope for the current requirements.
139
+ See `docs/archive/observability.md` and `docs/archive/roadmap.md`.
143
140
 
144
141
  ## 🧩 Plug-ins
145
142
 
146
- Need to share domain-specific tasks? Publish an entry point under `pyoco.tasks` and pyoco will auto-load it. See [docs/plugins.md](docs/plugins.md) for the `PluginRegistry` decorator, example `pyproject.toml`, and `pyoco plugins list` CLI helper.
143
+ Need to share domain-specific tasks? Publish an entry point under `pyoco.tasks` and pyoco will auto-load it. We recommend **Task subclasses first** (callables still work with warnings). See [docs/plugins.md](docs/plugins.md) for examples, quickstart, and `pyoco plugins list` / `pyoco plugins lint`.
144
+
145
+ **Big data note:** pass handles, not copies. For large tensors/images, stash paths or handles in `ctx.artifacts`/`ctx.scratch` and let downstream tasks materialize only when needed. For lazy pipelines (e.g., DataPipe), log the pipeline when you actually iterate (typically the training task) instead of materializing upstream.
146
+
147
+ ## 🧭 Task Discovery (Security)
148
+
149
+ Pyoco does not allow configuring discovery scope in `flow.yaml` (the `discovery:` key is rejected) to reduce the risk of importing unexpected code.
150
+
151
+ - **Entry point plug-ins**: auto-loaded from `importlib.metadata.entry_points(group="pyoco.tasks")`
152
+ - **Extra imports (ops-controlled)**: set `PYOCO_DISCOVERY_MODULES` (comma/space-separated module names), e.g. `PYOCO_DISCOVERY_MODULES=tasks,myapp.extra_tasks`
153
+ - **Explicit tasks**: prefer `tasks.<name>.callable` in `flow.yaml` (see tutorials)
147
154
 
148
155
  ## 📚 Documentation
149
156
 
150
157
  - [Tutorials](docs/tutorial/index.md)
151
- - [Roadmap](docs/roadmap.md)
158
+ - [Roadmap (Archived)](docs/archive/roadmap.md)
152
159
 
153
160
  ## 💖 Contributing
154
161
 
@@ -121,22 +121,29 @@ Or via CLI flag:
121
121
  pyoco run --non-cute ...
122
122
  ```
123
123
 
124
- ## 🔭 Observability Bridge (v0.5)
124
+ ## 🔭 Observability / Server (Archived)
125
125
 
126
- - `/metrics` exposes Prometheus counters (`pyoco_runs_total`, `pyoco_runs_in_progress`) and histograms (`pyoco_task_duration_seconds`, `pyoco_run_duration_seconds`). Point Grafana/Prometheus at it to watch pipelines without opening sockets.
127
- - `/runs` now accepts `status`, `flow`, `limit` query params; `/runs/{id}/logs?tail=100` fetches only the latest snippets for dashboards.
128
- - Webhook notifications fire when runs COMPLETE/FAIL—configure via `PYOCO_WEBHOOK_*` env vars and forward to Slack or your alerting stack.
129
- - Import `docs/grafana_pyoco_cute.json` for a lavender/orange starter dashboard (3 panels: in-progress count, completion trend, per-flow latency).
130
- - 詳細な手順は [docs/observability.md](docs/observability.md) を参照してください。
126
+ Observability and server-related docs are archived and out of scope for the current requirements.
127
+ See `docs/archive/observability.md` and `docs/archive/roadmap.md`.
131
128
 
132
129
  ## 🧩 Plug-ins
133
130
 
134
- Need to share domain-specific tasks? Publish an entry point under `pyoco.tasks` and pyoco will auto-load it. See [docs/plugins.md](docs/plugins.md) for the `PluginRegistry` decorator, example `pyproject.toml`, and `pyoco plugins list` CLI helper.
131
+ Need to share domain-specific tasks? Publish an entry point under `pyoco.tasks` and pyoco will auto-load it. We recommend **Task subclasses first** (callables still work with warnings). See [docs/plugins.md](docs/plugins.md) for examples, quickstart, and `pyoco plugins list` / `pyoco plugins lint`.
132
+
133
+ **Big data note:** pass handles, not copies. For large tensors/images, stash paths or handles in `ctx.artifacts`/`ctx.scratch` and let downstream tasks materialize only when needed. For lazy pipelines (e.g., DataPipe), log the pipeline when you actually iterate (typically the training task) instead of materializing upstream.
134
+
135
+ ## 🧭 Task Discovery (Security)
136
+
137
+ Pyoco does not allow configuring discovery scope in `flow.yaml` (the `discovery:` key is rejected) to reduce the risk of importing unexpected code.
138
+
139
+ - **Entry point plug-ins**: auto-loaded from `importlib.metadata.entry_points(group="pyoco.tasks")`
140
+ - **Extra imports (ops-controlled)**: set `PYOCO_DISCOVERY_MODULES` (comma/space-separated module names), e.g. `PYOCO_DISCOVERY_MODULES=tasks,myapp.extra_tasks`
141
+ - **Explicit tasks**: prefer `tasks.<name>.callable` in `flow.yaml` (see tutorials)
135
142
 
136
143
  ## 📚 Documentation
137
144
 
138
145
  - [Tutorials](docs/tutorial/index.md)
139
- - [Roadmap](docs/roadmap.md)
146
+ - [Roadmap (Archived)](docs/archive/roadmap.md)
140
147
 
141
148
  ## 💖 Contributing
142
149
 
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "pyoco"
3
- version = "0.5.0"
3
+ version = "0.6.0"
4
4
  description = "A workflow engine with sugar syntax"
5
5
  readme = "README.md"
6
6
  requires-python = ">=3.10"
@@ -2,10 +2,11 @@ from .core.models import Flow, Task
2
2
  from .core.engine import Engine
3
3
  from .dsl.syntax import task
4
4
  from .trace.console import ConsoleTraceBackend
5
+ from . import support
5
6
 
6
7
  def run(flow: Flow, params: dict = None, trace: bool = True, cute: bool = True):
7
8
  backend = ConsoleTraceBackend(style="cute" if cute else "plain")
8
9
  engine = Engine(trace_backend=backend)
9
10
  return engine.run(flow, params)
10
11
 
11
- __all__ = ["task", "Flow", "run"]
12
+ __all__ = ["task", "Flow", "run", "support"]
@@ -4,13 +4,22 @@ import sys
4
4
  import os
5
5
  import signal
6
6
  import time
7
+ from types import SimpleNamespace
7
8
  from ..schemas.config import PyocoConfig
8
9
  from ..discovery.loader import TaskLoader
9
10
  from ..core.models import Flow
10
11
  from ..core.engine import Engine
11
12
  from ..trace.console import ConsoleTraceBackend
12
13
  from ..client import Client
13
- from ..discovery.plugins import list_available_plugins
14
+ from ..support.service import SupportInfoService
15
+ from ..core.exceptions import (
16
+ SupportInfoError,
17
+ InvalidFormatError,
18
+ TaskNotFoundError,
19
+ InvalidFilterError,
20
+ OutputWriteError,
21
+ MissingTaskMetadataError,
22
+ )
14
23
 
15
24
  def main():
16
25
  parser = argparse.ArgumentParser(description="Pyoco Workflow Engine")
@@ -88,6 +97,32 @@ def main():
88
97
  plugins_sub = plugins_parser.add_subparsers(dest="plugins_command")
89
98
  plugins_list = plugins_sub.add_parser("list", help="List discovered plug-ins")
90
99
  plugins_list.add_argument("--json", action="store_true", help="Output JSON payload")
100
+ plugins_lint = plugins_sub.add_parser("lint", help="Validate plug-ins for upcoming requirements")
101
+ plugins_lint.add_argument("--json", action="store_true", help="Output JSON payload")
102
+
103
+ support_parser = subparsers.add_parser("support", help="Generate support info")
104
+ support_subparsers = support_parser.add_subparsers(dest="support_command")
105
+
106
+ support_tasks = support_subparsers.add_parser("tasks", help="List tasks for LLM support")
107
+ support_tasks.add_argument("--config", required=True, help="Path to flow.yaml")
108
+ support_tasks.add_argument("--format", default="prompt", choices=["prompt", "json", "md"])
109
+ support_tasks.add_argument("--output", help="Write output to file")
110
+ support_tasks.add_argument("--name", action="append", help="Filter by task name (repeatable)")
111
+ support_tasks.add_argument("--origin", action="append", help="Filter by origin (repeatable)")
112
+ support_tasks.add_argument("--tag", action="append", help="Filter by tag (repeatable)")
113
+
114
+ support_task = support_subparsers.add_parser("task", help="Show task detail for LLM support")
115
+ support_task.add_argument("--config", required=True, help="Path to flow.yaml")
116
+ support_task.add_argument("--name", required=True, help="Task name")
117
+ support_task.add_argument("--format", default="prompt", choices=["prompt", "json", "md"])
118
+ support_task.add_argument("--output", help="Write output to file")
119
+ support_task.add_argument("--origin", action="append", help="Filter by origin (repeatable)")
120
+ support_task.add_argument("--tag", action="append", help="Filter by tag (repeatable)")
121
+
122
+ support_guide = support_subparsers.add_parser("guide", help="Show flow.yaml guide for LLM support")
123
+ support_guide.add_argument("--config", required=True, help="Path to flow.yaml")
124
+ support_guide.add_argument("--format", default="prompt", choices=["prompt", "json", "md"])
125
+ support_guide.add_argument("--output", help="Write output to file")
91
126
 
92
127
  args = parser.parse_args()
93
128
 
@@ -120,18 +155,72 @@ def main():
120
155
  return
121
156
 
122
157
  if args.command == "plugins":
123
- infos = list_available_plugins()
158
+ reports = _collect_plugin_reports()
124
159
  if args.plugins_command == "list":
125
160
  if getattr(args, "json", False):
126
- print(json.dumps(infos, indent=2))
161
+ print(json.dumps(reports, indent=2))
127
162
  else:
128
- if not infos:
163
+ if not reports:
129
164
  print("No plug-ins registered under group 'pyoco.tasks'.")
130
165
  else:
131
166
  print("Discovered plug-ins:")
132
- for info in infos:
167
+ for info in reports:
133
168
  mod = info.get("module") or info.get("value")
134
169
  print(f" - {info.get('name')} ({mod})")
170
+ if info.get("error"):
171
+ print(f" ⚠️ error: {info['error']}")
172
+ continue
173
+ for task in info.get("tasks", []):
174
+ warn_msg = "; ".join(task.get("warnings", [])) or "ok"
175
+ print(f" • {task['name']} [{task['origin']}] ({warn_msg})")
176
+ for warn in info.get("warnings", []):
177
+ print(f" ⚠️ {warn}")
178
+ elif args.plugins_command == "lint":
179
+ issues = []
180
+ for info in reports:
181
+ prefix = info["name"]
182
+ if info.get("error"):
183
+ issues.append(f"{prefix}: {info['error']}")
184
+ continue
185
+ for warn in info.get("warnings", []):
186
+ issues.append(f"{prefix}: {warn}")
187
+ for task in info.get("tasks", []):
188
+ for warn in task.get("warnings", []):
189
+ issues.append(f"{prefix}.{task['name']}: {warn}")
190
+ payload = {"issues": issues, "reports": reports}
191
+ if getattr(args, "json", False):
192
+ print(json.dumps(payload, indent=2))
193
+ else:
194
+ if not issues:
195
+ print("✅ All plug-ins look good.")
196
+ else:
197
+ print("⚠️ Plug-in issues found:")
198
+ for issue in issues:
199
+ print(f" - {issue}")
200
+ if issues:
201
+ sys.exit(1)
202
+ else:
203
+ plugins_parser.print_help()
204
+ return
205
+
206
+ if args.command == "support":
207
+ if not args.support_command:
208
+ support_parser.print_help()
209
+ sys.exit(1)
210
+ filters = _build_support_filters(args)
211
+ try:
212
+ content = SupportInfoService().build(
213
+ kind=args.support_command,
214
+ config_path=args.config,
215
+ format=args.format,
216
+ filters=filters or None,
217
+ output_path=args.output,
218
+ )
219
+ except SupportInfoError as exc:
220
+ _print_support_error(exc)
221
+ sys.exit(1)
222
+ if not args.output:
223
+ print(content)
135
224
  return
136
225
 
137
226
  if args.command == "server":
@@ -368,6 +457,45 @@ def main():
368
457
  sys.exit(2 if args.dry_run else 1)
369
458
  return
370
459
 
460
+ def _collect_plugin_reports():
461
+ dummy = SimpleNamespace(tasks={})
462
+ loader = TaskLoader(dummy)
463
+ loader.load()
464
+ return loader.plugin_reports
465
+
466
+
467
+ def _build_support_filters(args):
468
+ filters = {}
469
+ if getattr(args, "name", None):
470
+ value = args.name
471
+ filters["name"] = value if isinstance(value, list) else [value]
472
+ if getattr(args, "origin", None):
473
+ filters["origin"] = args.origin
474
+ if getattr(args, "tag", None):
475
+ filters["tag"] = args.tag
476
+ return filters
477
+
478
+
479
+ def _print_support_error(exc: SupportInfoError) -> None:
480
+ if isinstance(exc, InvalidFormatError):
481
+ print(f"Invalid format: {exc.format}")
482
+ return
483
+ if isinstance(exc, TaskNotFoundError):
484
+ print(f"Task not found: {exc.name}")
485
+ return
486
+ if isinstance(exc, OutputWriteError):
487
+ print(f"Failed to write output: {exc.path}")
488
+ return
489
+ if isinstance(exc, InvalidFilterError):
490
+ print(f"Invalid filter: {exc.filter_value}")
491
+ return
492
+ if isinstance(exc, MissingTaskMetadataError):
493
+ fields = ",".join(exc.fields)
494
+ print(f"Missing task metadata: {exc.name} fields={fields}")
495
+ return
496
+ print(f"Error: {exc}")
497
+
498
+
371
499
  def _stream_logs(client, args):
372
500
  seen_seq = -1
373
501
  follow = args.follow
@@ -0,0 +1,51 @@
1
+ class ControlFlowError(Exception):
2
+ """Base error for control flow execution issues."""
3
+
4
+
5
+ class UntilMaxIterationsExceeded(ControlFlowError):
6
+ def __init__(self, expression: str, max_iter: int):
7
+ super().__init__(f"Until condition '{expression}' exceeded max_iter={max_iter}")
8
+ self.expression = expression
9
+ self.max_iter = max_iter
10
+
11
+
12
+ class SwitchNoMatch(ControlFlowError):
13
+ def __init__(self, expression: str):
14
+ super().__init__(f"Switch expression '{expression}' did not match any case.")
15
+ self.expression = expression
16
+
17
+
18
+ class SupportInfoError(Exception):
19
+ """Base error for support info generation."""
20
+
21
+
22
+ class InvalidFormatError(SupportInfoError):
23
+ def __init__(self, format: str):
24
+ self.format = format
25
+ super().__init__(f"Invalid format: {format}")
26
+
27
+
28
+ class TaskNotFoundError(SupportInfoError):
29
+ def __init__(self, name: str):
30
+ self.name = name
31
+ super().__init__(f"Task not found: {name}")
32
+
33
+
34
+ class InvalidFilterError(SupportInfoError):
35
+ def __init__(self, filter_value: str):
36
+ self.filter_value = filter_value
37
+ super().__init__(f"Invalid filter: {filter_value}")
38
+
39
+
40
+ class OutputWriteError(SupportInfoError):
41
+ def __init__(self, path: str):
42
+ self.path = path
43
+ super().__init__(f"Failed to write output: {path}")
44
+
45
+
46
+ class MissingTaskMetadataError(SupportInfoError):
47
+ def __init__(self, name: str, fields: list[str]):
48
+ self.name = name
49
+ self.fields = fields
50
+ field_list = ",".join(fields)
51
+ super().__init__(f"Missing task metadata: {name} fields={field_list}")
@@ -238,11 +238,10 @@ class Flow:
238
238
  # So `flow >> (A | B)` just adds A and B.
239
239
  # Then `(A | B) >> C` is handled by Branch.
240
240
  pass
241
-
242
- # Update tail
241
+
243
242
  if new_tasks:
244
243
  self._tail = set(new_tasks)
245
-
244
+
246
245
  return self
247
246
 
248
247
  def add_task(self, task: Task):
@@ -284,3 +283,45 @@ class Flow:
284
283
  tail_task.dependents.add(task)
285
284
  task.dependencies.add(tail_task)
286
285
  self._tail = {task}
286
+
287
+
288
+ @dataclass
289
+ class TaskIO:
290
+ name: str
291
+ type: str
292
+ required: bool
293
+ constraints: Optional[List[str]] = None
294
+
295
+ @classmethod
296
+ def from_dict(cls, data: Dict[str, Any]) -> "TaskIO":
297
+ return cls(
298
+ name=data.get("name"),
299
+ type=data.get("type"),
300
+ required=data.get("required"),
301
+ constraints=data.get("constraints"),
302
+ )
303
+
304
+
305
+ @dataclass
306
+ class TaskInfo:
307
+ name: str
308
+ summary: str
309
+ inputs: List[TaskIO]
310
+ outputs: List[TaskIO]
311
+ origin: Optional[str] = None
312
+ tags: Optional[List[str]] = None
313
+
314
+
315
+ @dataclass
316
+ class SupportFilters:
317
+ name: Optional[List[str]] = None
318
+ origin: Optional[List[str]] = None
319
+ tag: Optional[List[str]] = None
320
+
321
+
322
+ @dataclass
323
+ class SupportInfo:
324
+ kind: str
325
+ format: str
326
+ content: str
327
+ filters: SupportFilters
@@ -1,6 +1,5 @@
1
1
  import importlib
2
- import pkgutil
3
- import sys
2
+ import os
4
3
  from typing import Dict, List, Any, Set
5
4
  from ..core.models import Task
6
5
  from ..dsl.syntax import TaskWrapper
@@ -11,30 +10,28 @@ class TaskLoader:
11
10
  self.config = config
12
11
  self.strict = strict
13
12
  self.tasks: Dict[str, Task] = {}
13
+ self.task_infos: Dict[str, Any] = {}
14
14
  self._explicit_tasks: Set[str] = set()
15
15
  self.plugin_reports: List[Dict[str, Any]] = []
16
16
 
17
17
  def load(self):
18
18
  # Load explicitly defined tasks in config FIRST (Higher priority)
19
19
  for task_name, task_conf in self.config.tasks.items():
20
- if task_conf.callable:
21
- self._load_explicit_task(task_name, task_conf)
20
+ callable_path = self._conf_get(task_conf, "callable")
21
+ if callable_path:
22
+ self._load_explicit_task(task_name, task_conf, callable_path)
22
23
  self._explicit_tasks.add(task_name)
23
24
 
24
- # Load from packages
25
- for package in self.config.discovery.packages:
26
- self._load_package(package)
27
-
28
- # Load from entry points (simplified)
29
- for ep in self.config.discovery.entry_points:
30
- self._load_module(ep)
31
-
32
- # Load from glob modules
33
- for pattern in self.config.discovery.glob_modules:
34
- self._load_glob_modules(pattern)
25
+ self._load_env_modules()
35
26
 
36
27
  self._load_entry_point_plugins()
37
28
 
29
+ def _load_env_modules(self) -> None:
30
+ raw = os.getenv("PYOCO_DISCOVERY_MODULES", "")
31
+ modules = [item.strip() for item in raw.replace(",", " ").split() if item.strip()]
32
+ for module_name in modules:
33
+ self._load_module(module_name)
34
+
38
35
  def _register_task(self, name: str, task: Task):
39
36
  if name in self.tasks:
40
37
  if name in self._explicit_tasks:
@@ -51,24 +48,27 @@ class TaskLoader:
51
48
  # Apply config overlay if exists
52
49
  if self.config and name in self.config.tasks:
53
50
  conf = self.config.tasks[name]
54
- if not conf.callable:
55
- if conf.inputs:
56
- task.inputs.update(conf.inputs)
57
- if conf.outputs:
58
- task.outputs.extend(conf.outputs)
51
+ if not self._conf_get(conf, "callable"):
52
+ inputs = self._conf_get(conf, "inputs") or {}
53
+ outputs = self._conf_get(conf, "outputs") or []
54
+ if inputs:
55
+ task.inputs.update(inputs)
56
+ if outputs:
57
+ task.outputs.extend(outputs)
59
58
 
60
59
  self.tasks[name] = task
61
60
 
62
- def _load_package(self, package_name: str):
63
- try:
64
- pkg = importlib.import_module(package_name)
65
- if hasattr(pkg, '__path__'):
66
- for _, name, _ in pkgutil.iter_modules(pkg.__path__, pkg.__name__ + "."):
67
- self._load_module(name)
61
+ def _register_task_info(self, info: Any):
62
+ name = getattr(info, "name", None)
63
+ if not name:
64
+ return
65
+ if name in self.task_infos:
66
+ msg = f"Task metadata '{name}' already defined."
67
+ if self.strict:
68
+ raise ValueError(f"{msg} (Strict mode enabled)")
68
69
  else:
69
- self._scan_module(pkg)
70
- except ImportError as e:
71
- print(f"Warning: Could not import package {package_name}: {e}")
70
+ print(f"Warning: {msg} Overwriting.")
71
+ self.task_infos[name] = info
72
72
 
73
73
  def _load_module(self, module_name: str):
74
74
  try:
@@ -76,30 +76,6 @@ class TaskLoader:
76
76
  self._scan_module(mod)
77
77
  except ImportError as e:
78
78
  print(f"Warning: Could not import module {module_name}: {e}")
79
-
80
- def _load_glob_modules(self, pattern: str):
81
- import glob
82
- import os
83
-
84
- # Pattern is likely a file path glob, e.g. "jobs/*.py"
85
- # We need to convert file paths to module paths
86
- files = glob.glob(pattern, recursive=True)
87
- for file_path in files:
88
- if not file_path.endswith(".py"):
89
- continue
90
-
91
- # Convert path to module
92
- # This is tricky without knowing the root.
93
- # Assumption: running from root, and file path is relative to root.
94
- # e.g. "myproject/tasks/foo.py" -> "myproject.tasks.foo"
95
-
96
- rel_path = os.path.relpath(file_path)
97
- if rel_path.startswith(".."):
98
- # Out of tree, skip or warn
99
- continue
100
-
101
- module_name = rel_path.replace(os.sep, ".")[:-3] # strip .py
102
- self._load_module(module_name)
103
79
 
104
80
  def _load_entry_point_plugins(self):
105
81
  entries = iter_entry_points()
@@ -109,6 +85,7 @@ class TaskLoader:
109
85
  "value": ep.value,
110
86
  "module": getattr(ep, "module", ""),
111
87
  "tasks": [],
88
+ "warnings": [],
112
89
  }
113
90
  registry = PluginRegistry(self, ep.name)
114
91
  try:
@@ -116,7 +93,11 @@ class TaskLoader:
116
93
  if not callable(hook):
117
94
  raise TypeError("Entry point must be callable")
118
95
  hook(registry)
119
- info["tasks"] = list(registry.registered_names)
96
+ info["tasks"] = list(registry.records)
97
+ info["task_infos"] = list(registry.task_infos.values())
98
+ info["warnings"] = list(registry.warnings)
99
+ if not registry.records:
100
+ info["warnings"].append("no tasks registered")
120
101
  except Exception as exc:
121
102
  info["error"] = str(exc)
122
103
  if self.strict:
@@ -130,13 +111,17 @@ class TaskLoader:
130
111
  self._register_task(name, obj.task)
131
112
  elif isinstance(obj, Task):
132
113
  self._register_task(name, obj)
133
- elif callable(obj) and getattr(obj, '__pyoco_task__', False):
134
- # Convert to Task if not already
135
- pass
136
114
 
137
- def _load_explicit_task(self, name: str, conf: Any):
115
+ def _conf_get(self, conf: Any, key: str):
116
+ if hasattr(conf, key):
117
+ return getattr(conf, key)
118
+ if isinstance(conf, dict):
119
+ return conf.get(key)
120
+ return None
121
+
122
+ def _load_explicit_task(self, name: str, conf: Any, callable_path: str):
138
123
  # Load callable
139
- module_path, func_name = conf.callable.split(':')
124
+ module_path, func_name = callable_path.split(':')
140
125
  try:
141
126
  mod = importlib.import_module(module_path)
142
127
  obj = getattr(mod, func_name)
@@ -150,8 +135,8 @@ class TaskLoader:
150
135
 
151
136
  # Create a Task wrapper
152
137
  t = Task(func=real_func, name=name)
153
- t.inputs = conf.inputs
154
- t.outputs = conf.outputs
138
+ t.inputs = self._conf_get(conf, "inputs") or {}
139
+ t.outputs = self._conf_get(conf, "outputs") or []
155
140
  self.tasks[name] = t
156
141
  except (ImportError, AttributeError) as e:
157
142
  print(f"Error loading task {name}: {e}")