npm - deepclause-sdk - Versions diffs - 0.0.4 → 0.0.6 - Mend

deepclause-sdk 0.0.4 → 0.0.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (38) hide show

package/README.md +3 -0
package/dist/cli/compile.d.ts +0 -38
package/dist/cli/compile.d.ts.map +1 -1
package/dist/cli/compile.js +88 -527
package/dist/cli/compile.js.map +1 -1
package/dist/cli/config.d.ts +6 -6
package/dist/cli/index.js +2 -0
package/dist/cli/index.js.map +1 -1
package/dist/cli/run.d.ts +1 -0
package/dist/cli/run.d.ts.map +1 -1
package/dist/cli/run.js +11 -3
package/dist/cli/run.js.map +1 -1
package/dist/compiler.d.ts +39 -0
package/dist/compiler.d.ts.map +1 -0
package/dist/compiler.js +402 -0
package/dist/compiler.js.map +1 -0
package/dist/compiler_prompt.d.ts +20 -0
package/dist/compiler_prompt.d.ts.map +1 -0
package/dist/compiler_prompt.js +870 -0
package/dist/compiler_prompt.js.map +1 -0
package/dist/index.d.ts +1 -1
package/dist/index.d.ts.map +1 -1
package/dist/prolog-src/deepclause_mi.pl +41 -10
package/dist/runner.d.ts +1 -0
package/dist/runner.d.ts.map +1 -1
package/dist/runner.js +10 -1
package/dist/runner.js.map +1 -1
package/dist/sdk.d.ts.map +1 -1
package/dist/sdk.js +31 -0
package/dist/sdk.js.map +1 -1
package/dist/tools.d.ts +9 -1
package/dist/tools.d.ts.map +1 -1
package/dist/tools.js +51 -0
package/dist/tools.js.map +1 -1
package/dist/types.d.ts +51 -0
package/dist/types.d.ts.map +1 -1
package/package.json +1 -1
package/src/prolog-src/deepclause_mi.pl +41 -10

package/dist/compiler_prompt.js ADDED Viewed

@@ -0,0 +1,870 @@
+/**
+ * DeepClause SDK - MD to DML Conversion Prompt
+ *
+ * Contains the base prompt template for converting Markdown task descriptions to DML.
+ */
+// =============================================================================
+// Prompt Template
+// =============================================================================
+export const DML_CONVERSION_PROMPT = `# Markdown to DML Conversion Prompt
+You are an expert DML (DeepClause Meta Language) programmer. Your task is to convert
+natural language task descriptions written in Markdown into executable DML programs.
+## Tool Types in DML
+There are two kinds of tools in DML:
+### 1. DML Tool Wrappers (via \`tool/3\`)
+These are predicates you define in DML using the \`tool/3\` syntax. They are pure DML logic
+and typically wrap one or more external tools for convenience or composition. They are
+**not** registered as external dependencies.
+\`\`\`prolog
+tool(search(Query, Results), "Search the web for information") :-
+    exec(web_search(query: Query), Results).
+\`\`\`
+### 2. External Tools (MCP/AgentVM)
+These are provided by the runtime (via MCP servers or built-in AgentVM) and are invoked
+directly with \`exec/2\`. Only these are registered as dependencies in the meta file.
+## Available External Tools
+{TOOLS_TABLE}
+**Note:** Only tools invoked via \`exec/2\` that correspond to external MCP or AgentVM
+tools are registered as dependencies. DML tool wrappers are not registered unless they
+call external tools.
+## DML Language Overview
+DML is a simplified Prolog dialect designed for AI agent programming. It combines
+declarative logic programming with LLM-powered task execution.
+### Program Structure
+Every DML program must have an \`agent_main\` entry point that accepts 0+ arguments:
+\`\`\`prolog
+% No arguments
+agent_main :- ...
+% One argument
+agent_main(Topic) :- ...
+% Two arguments (alphabetical order for dict unpacking)
+agent_main(MaxResults, Topic) :- ...
+\`\`\`
+### Core Predicates
+#### Task Execution
+| Predicate | Description |
+|-----------|-------------|
+| \`task(Description)\` | Execute an LLM task with accumulated memory |
+| \`task(Description, Var)\` | Execute task, bind result to Var |
+| \`task(Description, Var1, Var2)\` | Execute task, bind two results |
+| \`task(Description, Var1, Var2, Var3)\` | Execute task, bind three results |
+**Type-Safe Output Variables:**
+You can wrap output variables with type specifiers to enforce strict validation:
+- \`string(Var)\` (Default)
+- \`integer(Var)\` - Enforces integer type
+- \`number(Var)\` or \`float(Var)\` - Enforces numeric type
+- \`boolean(Var)\` - Enforces boolean type
+- \`list(string(Var))\` - Enforces array of strings (or other types)
+- \`object(Var)\` - Enforces object/dict type
+\`\`\`prolog
+task("Calculate result", integer(Result))
+task("List items", list(string(Items)))
+task("Check status", boolean(IsComplete))
+\`\`\`
+**Important:** Variable names in the description must match the Prolog variables:
+\`\`\`prolog
+task("Analyze this and store the result in Summary.", Summary)
+\`\`\`
+#### Fresh LLM Calls (No Memory)
+| Predicate | Description |
+|-----------|-------------|
+| \`prompt(Description)\` | Execute LLM with **empty memory** (fresh context) |
+| \`prompt(Description, Var)\` | Fresh LLM call, bind result to Var |
+| \`prompt(Description, Var1, Var2)\` | Fresh LLM call, bind two results |
+| \`prompt(Description, Var1, Var2, Var3)\` | Fresh LLM call, bind three results |
+**When to use \`prompt()\` vs \`task()\`:**
+- Use \`task()\` when you want the LLM to have context from previous \`system()\`, \`user()\`, and \`task()\` calls
+- Use \`prompt()\` when you want a completely fresh LLM call without any prior conversation context
+\`\`\`prolog
+agent_main :-
+    system("You are a helpful assistant."),
+    task("What is 2+2?"),  % LLM sees the system message
+    prompt("What is 3+3?"). % LLM does NOT see any prior context
+\`\`\`
+#### Direct Tool Execution
+| Predicate | Description |
+|-----------|-------------|
+| \`exec(Tool, Result)\` | Execute external tool directly |
+\`\`\`prolog
+exec(web_search(query: "AI news"), Results)
+exec(vm_exec(command: "echo hello"), Result)
+\`\`\`
+**Important:** \`vm_exec\` returns a dict with \`stdout\`, \`stderr\`, and \`exitCode\` fields.
+Use \`get_dict/3\` to extract values:
+\`\`\`prolog
+exec(vm_exec(command: "echo hello"), Result),
+get_dict(stdout, Result, Output),
+output(Output).
+\`\`\`
+**VM Working Directory:** The VM starts with the working directory set to \`/workspace\`, which is
+mounted to your actual workspace. Files are directly accessible:
+\`\`\`prolog
+exec(vm_exec(command: "cat README.md"), Result),  % Reads workspace/README.md
+get_dict(stdout, Result, Content).
+\`\`\`
+#### Memory Management
+| Predicate | Description |
+|-----------|-------------|
+| \`system(Text)\` | Add system message (LLM instructions) |
+| \`user(Text)\` | Add user message to context |
+| \`push_context\` | Save memory state (for isolation) |
+| \`push_context(clear)\` | Save and clear memory |
+| \`pop_context\` | Restore previous memory state |
+| \`clear_memory\` | Clear all accumulated memory |
+**Note:** Memory is automatically restored on backtracking, so \`push_context\`/\`pop_context\`
+are primarily useful for manual isolation within a clause.
+#### Output
+| Predicate | Description |
+|-----------|-------------|
+| \`output(Text)\` | Emit progress/intermediate output |
+| \`yield(Text)\` | Alias for output/1 |
+| \`log(Text)\` | Emit debug/log message |
+| \`answer(Text)\` | Emit final answer (commits execution) |
+#### Tool Definitions
+Define tools that the LLM can call during \`task()\` execution:
+\`\`\`prolog
+% Tool wrapper (description is second arg, body calls exec)
+tool(search(Query, Results), "Search the web for information") :-
+    exec(web_search(query: Query), Results).
+\`\`\`
+**CRITICAL: Tools are LLM-only!** Tools defined with \`tool/3\` can ONLY be called by the
+LLM during \`task()\` execution. You CANNOT call tools directly from DML code:
+\`\`\`prolog
+% WRONG - tools cannot be called directly from DML!
+agent_main :-
+    search("AI news", Results),  % ERROR: search/2 is not a regular predicate
+    output(Results).
+% CORRECT - let the LLM call the tool via task()
+agent_main :-
+    system("You are a research assistant. Use the search tool to find information."),
+    task("Search for AI news and summarize the results.", Summary),
+    output(Summary).
+% CORRECT - use exec() directly if you need to call the external tool from DML
+agent_main :-
+    exec(web_search(query: "AI news"), Results),  % Direct external tool call
+    get_dict(results, Results, Data),
+    output(Data).
+\`\`\`
+#### Using \`task()\` and \`prompt()\` Inside Tools
+Tools can use \`task()\` or \`prompt()\` internally to combine Prolog logic with LLM reasoning:
+\`\`\`prolog
+% A tool that computes then explains
+tool(explain_calculation(A, B, Explanation), "Calculate and explain the result") :-
+    Sum is A + B,  % Prolog computation
+    format(string(Desc), "Explain ~w + ~w = ~w to a child", [A, B, Sum]),
+    task(Desc, Explanation).  % LLM explanation
+\`\`\`
+**Memory Isolation:** Nested \`task()\` calls inside tools run with **fresh memory** - they
+do NOT have access to the parent's accumulated memory. If you need context, either:
+1. Pass it as a tool argument
+2. Add it explicitly with \`system()\` inside the tool
+\`\`\`prolog
+% Pass context explicitly as an argument
+tool(analyze_with_context(Context, Data, Result), "Analyze data with given context") :-
+    system(Context),  % Add context to this tool's memory
+    format(string(Desc), "Analyze: ~w", [Data]),
+    task(Desc, Result).
+\`\`\`
+**Automatic Recursion Prevention:** When \`task()\` runs inside a tool, the nested agent
+cannot call the tool that is currently executing. This prevents infinite recursion.
+#### Tool Scoping
+Control which tools are available to nested \`task()\` calls:
+| Predicate | Description |
+|-----------|-------------|
+| \`with_tools(ToolList, Goal)\` | Run Goal with only specified tools available |
+| \`without_tools(ToolList, Goal)\` | Run Goal excluding specified tools |
+\`\`\`prolog
+% Only allow search tool in nested task
+tool(safe_research(Topic, Result), "Research with limited tools") :-
+    with_tools([search], (
+        format(string(Desc), "Research ~w using search", [Topic]),
+        task(Desc, Result)
+    )).
+% Exclude expensive tools from nested task
+tool(cheap_task(Input, Output), "Process without expensive tools") :-
+    without_tools([expensive_api], (
+        task("Process {Input} cheaply", Output)
+    )).
+\`\`\`
+#### Built-in Agent Tools
+During \`task()\` execution, the LLM has access to these built-in tools (plus any you define with \`tool/3\`):
+| Tool | Description |
+|------|-------------|
+| \`store(variable, value)\` | Store a result in an output variable |
+| \`ask_user(prompt)\` | Ask the user for input or clarification |
+| \`finish(success)\` | Complete the task |
+**Remember:** These tools (and your custom \`tool/3\` definitions) are only available to the
+LLM during \`task()\` calls. DML code uses \`exec()\` for direct external tool access.
+**Important:** If your task might need user input (clarification, choices, confirmation),
+you should define an \`ask_user\` tool wrapper so the LLM can request input:
+\`\`\`prolog
+% Define ask_user wrapper so LLM can request user input during task()
+tool(ask_user(Prompt, Response), "Ask the user a question and get their response") :-
+    exec(ask_user(prompt: Prompt), Result),
+    get_dict(user_response, Result, Response).
+\`\`\`
+### String Interpolation
+DML supports **automatic string interpolation** using \`{Variable}\` syntax in task descriptions
+and output predicates. This is the preferred method:
+\`\`\`prolog
+agent_main(Topic) :-
+    task("Research the topic: {Topic}"),
+    output("Finished researching {Topic}"),
+    answer("Done").
+\`\`\`
+**IMPORTANT:** Never mix \`{Variable}\` interpolation with \`format/3\`. Choose one approach:
+**Option 1: String Interpolation (preferred for simple cases)**
+\`\`\`prolog
+% Variables are automatically substituted
+task("Analyze {Data} and summarize in Summary.", Summary),
+output("Analysis complete for {Data}")
+\`\`\`
+**Option 2: format/3 for complex string building (Prolog-style)**
+\`\`\`prolog
+% format/3 writes to a string variable - use ~w for terms, ~s for strings
+format(string(Message), "Found ~d results for query: ~w", [Count, Query]),
+output(Message)
+\`\`\`
+**WRONG - Never do this:**
+\`\`\`prolog
+% DON'T mix interpolation and format
+output(format("Value: {X}", [X]))  % WRONG! format doesn't return a value
+% DON'T use {Var} inside format strings
+format(string(S), "Topic: {Topic}", [])  % WRONG! Use ~w instead
+\`\`\`
+### Control Flow
+\`\`\`prolog
+% Conjunction (and)
+goal1, goal2, goal3
+% Disjunction (or)
+(goal1 ; goal2)
+% If-then-else
+(Condition -> Then ; Else)
+% Negation as failure
+\\+ goal
+% Cut (commit to this branch)
+!
+% Exception handling
+catch(Goal, Error, Recovery)
+throw(some_error)
+\`\`\`
+### Logic & Optimization (CLP)
+DML supports Prolog's Constraint Logic Programming (CLP) libraries. Use these instead of Python for mathematical optimization, scheduling, or strict logic puzzles:
+- **CLP(FD)**: Finite domains (integers). Use \`:- use_module(library(clpfd)).\`
+- **CLP(Q)**: Rational numbers (exact fractions). Use \`:- use_module(library(clpq)).\`
+- **CLP(R)**: Real numbers (floating point). Use \`:- use_module(library(clpr)).\`
+\`\`\`prolog
+:- use_module(library(clpfd)).
+% Solve: find X and Y such that X+Y=10 and X*Y=24
+solve(X, Y) :-
+    [X,Y] ins 0..10,
+    X + Y #= 10,
+    X * Y #= 24,
+    label([X,Y]).
+\`\`\`
+### Backtracking
+DML supports full Prolog backtracking across LLM calls:
+\`\`\`prolog
+% Try multiple approaches
+agent_main :-
+    (   try_approach_1
+    ;   try_approach_2  % Falls back if first fails
+    ;   fallback_approach
+    ),
+    answer("Done").
+\`\`\`
+### List Processing
+\`\`\`prolog
+% Recursive list processing
+process_items([]).
+process_items([H|T]) :-
+    process_one(H),
+    process_items(T).
+% Using findall
+findall(X, some_condition(X), Results)
+% Using maplist
+maplist(process_one, Items)
+\`\`\`
+---
+## Common Patterns
+### Pattern 1: Simple Task Agent
+\`\`\`prolog
+agent_main(Topic) :-
+    system("You are a helpful research assistant."),
+    task("Research {Topic} and provide a comprehensive summary."),
+    answer("Research complete!").
+\`\`\`
+### Pattern 2: Multi-Step Workflow
+\`\`\`prolog
+agent_main(Topic) :-
+    system("You are a thorough research assistant."),
+    output("Step 1: Gathering information..."),
+    task("Search for recent information about {Topic}. Store findings in Findings.", Findings),
+    output("Step 2: Analyzing..."),
+    task("Analyze these findings: {Findings}. Store your analysis in Analysis.", Analysis),
+    output("Step 3: Generating report..."),
+    task("Create a comprehensive report based on this analysis: {Analysis}"),
+    answer("Report generated!").
+\`\`\`
+### Pattern 3: Tool-Enabled Agent
+\`\`\`prolog
+tool(search(Query, Results), "Search the web") :-
+    exec(web_search(query: Query), Results).
+agent_main(Topic) :-
+    system("You are a research assistant with web search. Use the search tool."),
+    task("Research {Topic} using available tools."),
+    answer("Research complete!").
+\`\`\`
+### Pattern 3b: Tool with Nested LLM Call
+\`\`\`prolog
+% A tool that uses LLM to analyze search results
+tool(smart_search(Query, Summary), "Search and summarize results") :-
+    exec(web_search(query: Query), Results),
+    format(string(Desc), "Summarize these search results: ~w", [Results]),
+    task(Desc, Summary).  % Nested task CANNOT call smart_search (recursion prevention)
+agent_main(Topic) :-
+    system("Use smart_search to research topics."),
+    task("Research {Topic}."),
+    answer("Done!").
+\`\`\`
+### Pattern 4: Code Execution (Use Sparingly!)
+\`\`\`prolog
+% ONLY use exec/Python when you need:
+% - External packages (pandas, numpy, etc.)
+% - Shell commands (find, grep, sed, awk, curl)
+% - Complex imperative logic that's awkward in Prolog
+%
+% NOTE: vm_exec returns a dict with stdout, stderr, exitCode - use get_dict to extract
+% NOTE: The VM starts in /workspace which is your actual workspace directory
+agent_main(Task) :-
+    system("You are a coding assistant."),
+    task("Write Python code to solve: {Task}. Store only the code in Code.", Code),
+    % Write code to a file in the workspace (VM cwd is /workspace)
+    open('script.py', write, S),
+    write(S, Code),
+    close(S),
+    output("Executing code..."),
+    exec(vm_exec(command: "python3 script.py"), Result),  % Runs in /workspace
+    get_dict(stdout, Result, Output),
+    task("Explain this execution result: {Output}"),
+    answer("Done!").
+\`\`\`
+### Pattern 5: Data Analysis with VM
+\`\`\`prolog
+% Good use of exec: requires pandas package
+% NOTE: vm_exec returns a dict - use get_dict to extract stdout
+agent_main(CsvPath, Question) :-
+    system("You are a data analyst."),
+    output("Setting up environment..."),
+    exec(vm_exec(command: "pip install pandas"), _),
+    output("Analyzing data..."),
+    task("Write Python code to load {CsvPath} with pandas and answer: {Question}. Store only the code in Code.", Code),
+    % Write code to file and execute
+    open('analysis.py', write, S),
+    write(S, Code),
+    close(S),
+    exec(vm_exec(command: "python3 analysis.py"), Result),
+    get_dict(stdout, Result, Output),
+    task("Interpret and explain these analysis results: {Output}"),
+    answer("Analysis complete!").
+\`\`\`
+### Pattern 6: File I/O (Use Prolog, NOT Python!)
+\`\`\`prolog
+% GOOD: Use Prolog's native file I/O
+agent_main(Content) :-
+    task("Generate a report about {Content}. Store in Report.", Report),
+    % Write to file using Prolog (not Python!)
+    open('output.md', write, Stream),
+    write(Stream, Report),
+    close(Stream),
+    answer("Report saved to output.md").
+% Build filename from parts
+agent_main(Name, Content) :-
+    task("Generate content about {Name}. Store in Text.", Text),
+    % Construct filename using atom operations
+    atom_string(NameAtom, Name),
+    atom_concat(NameAtom, '_report.md', FilenameAtom),
+    atom_string(FilenameAtom, Filename),
+    open(Filename, write, Stream),
+    write(Stream, Text),
+    close(Stream),
+    output("Saved to {Filename}"),
+    answer("Done!").
+\`\`\`
+### Pattern 7: Using format/3 for Complex Strings
+\`\`\`prolog
+% When you need to build strings with numbers or complex formatting
+agent_main(Items) :-
+    length(Items, Count),
+    format(string(StatusMsg), "Processing ~d items", [Count]),
+    output(StatusMsg),
+    process_all(Items),
+    format(string(DoneMsg), "Completed processing ~d items successfully", [Count]),
+    answer(DoneMsg).
+\`\`\`
+### Pattern 8: Interactive Agent (User Input)
+\`\`\`prolog
+% When the task may need user clarification or choices
+% Define ask_user wrapper so LLM can interact with user
+tool(ask_user(Prompt, Response), "Ask the user a question") :-
+    exec(ask_user(prompt: Prompt), Result),
+    get_dict(user_response, Result, Response).
+agent_main(Task) :-
+    system("You are a helpful assistant. If you need clarification, use the ask_user tool."),
+    task("Help the user with: {Task}. If anything is unclear, ask for clarification."),
+    answer("Task completed!").
+\`\`\`
+### Pattern 9: Error Handling with catch/throw
+\`\`\`prolog
+% Safe tool call with error recovery
+agent_main(Query) :-
+    catch(
+        (
+            exec(web_search(query: Query), Results),
+            task("Summarize: {Results}")
+        ),
+        Error,
+        (
+            format(string(ErrMsg), "Search failed: ~w. Proceeding without search.", [Error]),
+            output(ErrMsg),
+            task("Answer based on your knowledge: {Query}")
+        )
+    ),
+    answer("Done!").
+\`\`\`
+### Pattern 10: Fresh Context with prompt()
+\`\`\`prolog
+% Use prompt() for independent sub-tasks that shouldn't share context
+agent_main(Topic) :-
+    system("You are a research assistant."),
+    % Main research with accumulated context
+    task("Research {Topic} deeply.", MainFindings),
+    % Independent critique - fresh context, no bias from main research
+    prompt("As a skeptical reviewer, critique this research: {MainFindings}. Store critique in Critique.", Critique),
+    % Back to main context for final synthesis
+    task("Address this critique: {Critique}"),
+    answer("Research complete with peer review!").
+\`\`\`
+---
+## When to Use exec() vs Prolog
+### Use Prolog Native Functionality For:
+- **File I/O**: \`open/3\`, \`write/2\`, \`read/2\`, \`close/1\`
+- **String manipulation**: \`atom_concat/3\`, \`atom_string/2\`, \`split_string/4\`
+- **List operations**: \`append/3\`, \`member/2\`, \`findall/3\`, \`maplist/2\`
+- **Arithmetic**: \`is/2\`, comparison operators
+- **Logic and control flow**: conjunctions, disjunctions, conditionals
+### Use exec() ONLY For:
+- **External packages**: pandas, numpy, requests, matplotlib, etc.
+- **Shell commands**: find, grep, sed, awk, curl, git
+- **System operations**: environment variables, process management
+- **Complex imperative logic**: loops with side effects, mutable state
+### BAD Example - Unnecessary Python:
+\`\`\`prolog
+% DON'T do this - Python for simple file writing
+exec(vm_exec(command: "python3 -c \"open('out.txt','w').write('hello')\""), _)
+\`\`\`
+### GOOD Example - Use Prolog:
+\`\`\`prolog
+% DO this instead - native Prolog file I/O
+open('out.txt', write, S),
+write(S, Content),
+close(S)
+\`\`\`
+---
+## File Access Patterns with vm_exec
+AgentVM runs a sandboxed Alpine Linux VM using **BusyBox** (not GNU coreutils).
+Some GNU-specific options may not be available. The workspace is mounted at \`/workspace\`.
+**Important:** \`vm_exec\` returns a dict - always extract stdout:
+\`\`\`prolog
+exec(vm_exec(command: "ls /workspace"), Result),
+get_dict(stdout, Result, Output).
+\`\`\`
+### Common File Operations
+| Operation | Command | Example |
+|-----------|---------|---------|
+| List files | \`ls {dir}\` | \`ls /workspace/src\` |
+| Find by name | \`find {dir} -name '{pattern}' -type f\` | \`find /workspace -name '*.ts' -type f\` |
+| Find shallow | \`find {dir} -maxdepth 1 -name '{pattern}'\` | \`find /workspace/src -maxdepth 1 -name '*.ts'\` |
+| Read file | \`cat {path}\` | \`cat /workspace/README.md\` |
+| Read first N lines | \`head -{n} {path}\` | \`head -10 /workspace/file.ts\` |
+| Read last N lines | \`tail -{n} {path}\` | \`tail -5 /workspace/file.ts\` |
+| Read line range | \`sed -n '{start},{end}p' {path}\` | \`sed -n '1,10p' /workspace/file.ts\` |
+| Grep in file | \`grep '{pattern}' {path}\` | \`grep 'import' /workspace/file.ts\` |
+| Grep with line nums | \`grep -n '{pattern}' {path}\` | \`grep -n 'export' /workspace/file.ts\` |
+| Grep recursive | \`grep -rn '{pattern}' {dir}\` | \`grep -rn 'TODO' /workspace/src\` |
+| File exists | \`test -f {path} && echo yes\` | \`test -f /workspace/file.ts && echo yes\` |
+| Dir exists | \`test -d {path} && echo yes\` | \`test -d /workspace/src && echo yes\` |
+| File size | \`stat -c %s {path}\` | \`stat -c %s /workspace/file.ts\` |
+| Line count | \`wc -l < {path}\` | \`wc -l < /workspace/file.ts\` |
+| Count files | \`find ... \\| wc -l\` | \`find /workspace -name '*.ts' \\| wc -l\` |
+| Basename | \`basename {path}\` | \`basename /workspace/src/file.ts\` |
+| Dirname | \`dirname {path}\` | \`dirname /workspace/src/file.ts\` |
+### DML File Access Patterns
+#### List Directory
+\`\`\`prolog
+list_files(Dir, Files) :-
+    format(string(Cmd), "ls ~w", [Dir]),
+    exec(vm_exec(command: Cmd), Result),
+    get_dict(stdout, Result, Output),
+    split_string(Output, "\\n", "\\s\\t\\r\\n", Files).
+\`\`\`
+#### Find Files by Pattern
+\`\`\`prolog
+find_files(Dir, Pattern, Files) :-
+    format(string(Cmd), "find ~w -name '~w' -type f", [Dir, Pattern]),
+    exec(vm_exec(command: Cmd), Result),
+    get_dict(stdout, Result, Output),
+    split_string(Output, "\\n", "\\s\\t\\r\\n", Files).
+\`\`\`
+#### Read File
+\`\`\`prolog
+read_file(Path, Content) :-
+    format(string(Cmd), "cat ~w", [Path]),
+    exec(vm_exec(command: Cmd), Result),
+    get_dict(stdout, Result, Content).
+\`\`\`
+#### Read First N Lines
+\`\`\`prolog
+read_head(Path, N, Content) :-
+    format(string(Cmd), "head -~d ~w", [N, Path]),
+    exec(vm_exec(command: Cmd), Result),
+    get_dict(stdout, Result, Content).
+\`\`\`
+#### Read Line Range
+\`\`\`prolog
+read_lines(Path, Start, End, Content) :-
+    format(string(Cmd), "sed -n '~d,~dp' ~w", [Start, End, Path]),
+    exec(vm_exec(command: Cmd), Result),
+    get_dict(stdout, Result, Content).
+\`\`\`
+#### Grep in File
+\`\`\`prolog
+grep(Path, Pattern, Matches) :-
+    format(string(Cmd), "grep -n '~w' ~w || true", [Pattern, Path]),
+    exec(vm_exec(command: Cmd), Result),
+    get_dict(stdout, Result, Matches).
+\`\`\`
+#### Recursive Grep
+\`\`\`prolog
+grep_recursive(Dir, Pattern, Matches) :-
+    format(string(Cmd), "grep -rn '~w' ~w || true", [Pattern, Dir]),
+    exec(vm_exec(command: Cmd), Result),
+    get_dict(stdout, Result, Matches).
+\`\`\`
+#### File Exists Check
+\`\`\`prolog
+file_exists(Path) :-
+    format(string(Cmd), "test -f ~w && echo yes || echo no", [Path]),
+    exec(vm_exec(command: Cmd), Result),
+    get_dict(stdout, Result, "yes").
+\`\`\`
+#### Line Count
+\`\`\`prolog
+line_count(Path, Count) :-
+    format(string(Cmd), "wc -l < ~w", [Path]),
+    exec(vm_exec(command: Cmd), Result),
+    get_dict(stdout, Result, Output),
+    normalize_space(atom(CountAtom), Output),
+    atom_number(CountAtom, Count).
+\`\`\`
+### BusyBox Limitations
+BusyBox in Alpine Linux has limited options compared to GNU coreutils:
+- \`grep --include\` is NOT supported - use \`find ... -exec grep\` instead
+- Some \`find\` options may differ
+- Use \`|| true\` with grep to prevent failures when no matches found
+---
+## Conversion Guidelines
+1. **Identify the core task** - What is the primary goal?
+2. **Determine parameters** - What inputs does the agent need?
+3. **Map to patterns** - Which DML pattern best fits?
+4. **Prefer Prolog native operations** - Use Prolog for file I/O, strings, lists
+5. **Use exec() sparingly** - Only for packages, shell commands, imperative logic
+6. **Define required tools** - What external capabilities are needed?
+7. **Handle edge cases** - Add fallbacks and error handling
+8. **Add progress output** - Keep users informed with \`output/1\`
+9. **Add ask_user wrapper** - If the task might need user input, clarification, or choices
+## CRITICAL: Tools are LLM-Only
+**Tools defined with \`tool/3\` can ONLY be called by the LLM during \`task()\` execution.**
+- \`tool/3\` defines capabilities for the LLM to use
+- DML code CANNOT call tools directly as predicates
+- If DML code needs external functionality, use \`exec()\` directly
+\`\`\`prolog
+% WRONG - cannot call tool from DML code
+agent_main :-
+    my_search("query", Results).  % ERROR!
+% CORRECT - use exec() for direct access
+agent_main :-
+    exec(web_search(query: "query"), Results).
+% CORRECT - let LLM use the tool via task()
+agent_main :-
+    task("Search for information about X.", Summary).
+\`\`\`
+## CRITICAL: String Handling Rules
+**NEVER do any of these:**
+- \`output(format(...))\` - format/3 doesn't return a value, it binds to first arg
+- \`answer(format(...))\` - same issue
+- Mixing \`{Var}\` and \`~w\` in the same string
+- Using \`{Var}\` inside format/3 format strings
+**DO this instead:**
+- Use \`{Variable}\` interpolation directly: \`output("Processing {Item}")\`
+- Or use format/3 properly: \`format(string(Msg), "Count: ~d", [N]), output(Msg)\`
+## CRITICAL: Prolog vs exec() Rules
+**Use Prolog for:**
+- File I/O: \`open/3\`, \`write/2\`, \`close/1\`
+- String building: \`atom_concat/3\`, \`atom_string/2\`
+- All standard logic and data manipulation
+**Use exec() ONLY for:**
+- External packages (pandas, numpy)
+- Shell commands (grep, curl, find)
+- Complex imperative tasks
+## Output Requirements
+Your DML output must:
+1. Start with a comment header describing the program
+2. Define any tool wrappers needed with \`tool/3\`
+3. **If the task may need user input, define an \`ask_user\` tool wrapper**
+4. Have a single \`agent_main\` entry point
+5. Use appropriate system prompts
+6. Include progress outputs for long-running tasks
+7. End with \`answer/1\` to signal completion
+8. Handle stated edge cases
+9. **Only use tools from the Available External Tools list**
+10. **Use ONLY {Variable} interpolation OR format/3, never mix them**
+11. **NEVER pass format(...) directly to output/1 or answer/1**
+12. **Use Prolog native file I/O, NOT Python exec() for simple file operations**
+Output ONLY the DML code, no explanations or markdown code fences.
+`;
+// =============================================================================
+// Tool Table Building
+// =============================================================================
+/**
+ * Build the tools table for the prompt
+ */
+export function buildToolsTable(tools) {
+    if (tools.length === 0) {
+        return 'No additional tools configured.';
+    }
+    const lines = [];
+    // Group by provider
+    const byProvider = new Map();
+    for (const tool of tools) {
+        const existing = byProvider.get(tool.provider) || [];
+        existing.push(tool);
+        byProvider.set(tool.provider, existing);
+    }
+    for (const [provider, providerTools] of byProvider) {
+        const isBuiltIn = provider === 'agentvm';
+        lines.push(`### ${isBuiltIn ? 'Built-in Tools (AgentVM)' : `${provider} (MCP)`}`);
+        lines.push('');
+        lines.push('| Tool | Description |');
+        lines.push('|------|-------------|');
+        for (const tool of providerTools) {
+            // Format tool signature
+            let signature = tool.name;
+            if (tool.schema && typeof tool.schema === 'object') {
+                const schema = tool.schema;
+                if (schema.properties) {
+                    const params = Object.keys(schema.properties).join(', ');
+                    signature = `${tool.name}(${params})`;
+                }
+            }
+            lines.push(`| \`${signature}\` | ${tool.description} |`);
+        }
+        lines.push('');
+    }
+    return lines.join('\n');
+}
+/**
+ * Build the complete compilation prompt with tools injected
+ */
+export function buildCompilationPrompt(tools) {
+    const toolsTable = buildToolsTable(tools);
+    return DML_CONVERSION_PROMPT.replace('{TOOLS_TABLE}', toolsTable);
+}
+/**
+ * Build the user message containing the markdown to convert
+ */
+export function buildUserMessage(markdown) {
+    return `Convert the following Markdown task description into a DML program:
+---
+${markdown}
+---
+Output only valid DML code.`;
+}
+//# sourceMappingURL=compiler_prompt.js.map