npm - @interf/compiler - Versions diffs - 0.1.12 → 0.2.1 - Mend

@interf/compiler 0.1.12 → 0.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (282) hide show

package/README.md +197 -192
package/dist/commands/benchmark.d.ts.map +1 -1
package/dist/commands/benchmark.js +65 -84
package/dist/commands/benchmark.js.map +1 -1
package/dist/commands/compile.d.ts.map +1 -1
package/dist/commands/compile.js +19 -3
package/dist/commands/compile.js.map +1 -1
package/dist/commands/create.d.ts +3 -0
package/dist/commands/create.d.ts.map +1 -1
package/dist/commands/create.js +39 -14
package/dist/commands/create.js.map +1 -1
package/dist/commands/default.d.ts.map +1 -1
package/dist/commands/default.js +2 -0
package/dist/commands/default.js.map +1 -1
package/dist/commands/init.d.ts.map +1 -1
package/dist/commands/init.js +8 -63
package/dist/commands/init.js.map +1 -1
package/dist/index.d.ts +11 -29
package/dist/index.d.ts.map +1 -1
package/dist/index.js +7 -16
package/dist/index.js.map +1 -1
package/dist/lib/agent-args.d.ts +4 -0
package/dist/lib/agent-args.d.ts.map +1 -0
package/dist/lib/agent-args.js +42 -0
package/dist/lib/agent-args.js.map +1 -0
package/dist/lib/agent-constants.d.ts +6 -0
package/dist/lib/agent-constants.d.ts.map +1 -0
package/dist/lib/agent-constants.js +29 -0
package/dist/lib/agent-constants.js.map +1 -0
package/dist/lib/agent-detection.d.ts +8 -0
package/dist/lib/agent-detection.d.ts.map +1 -0
package/dist/lib/agent-detection.js +66 -0
package/dist/lib/agent-detection.js.map +1 -0
package/dist/lib/agent-execution.d.ts +3 -0
package/dist/lib/agent-execution.d.ts.map +1 -0
package/dist/lib/agent-execution.js +207 -0
package/dist/lib/agent-execution.js.map +1 -0
package/dist/lib/agent-logs.d.ts +3 -0
package/dist/lib/agent-logs.d.ts.map +1 -0
package/dist/lib/agent-logs.js +18 -0
package/dist/lib/agent-logs.js.map +1 -0
package/dist/lib/agent-preflight.d.ts +8 -0
package/dist/lib/agent-preflight.d.ts.map +1 -0
package/dist/lib/agent-preflight.js +77 -0
package/dist/lib/agent-preflight.js.map +1 -0
package/dist/lib/agent-render.d.ts +9 -0
package/dist/lib/agent-render.d.ts.map +1 -0
package/dist/lib/agent-render.js +219 -0
package/dist/lib/agent-render.js.map +1 -0
package/dist/lib/agent-status.d.ts +4 -0
package/dist/lib/agent-status.d.ts.map +1 -0
package/dist/lib/agent-status.js +59 -0
package/dist/lib/agent-status.js.map +1 -0
package/dist/lib/agent-types.d.ts +31 -0
package/dist/lib/agent-types.d.ts.map +1 -0
package/dist/lib/agent-types.js +2 -0
package/dist/lib/agent-types.js.map +1 -0
package/dist/lib/agents.d.ts +7 -49
package/dist/lib/agents.d.ts.map +1 -1
package/dist/lib/agents.js +8 -554
package/dist/lib/agents.js.map +1 -1
package/dist/lib/benchmark-execution.d.ts +9 -0
package/dist/lib/benchmark-execution.d.ts.map +1 -0
package/dist/lib/benchmark-execution.js +488 -0
package/dist/lib/benchmark-execution.js.map +1 -0
package/dist/lib/benchmark-paths.d.ts +11 -0
package/dist/lib/benchmark-paths.d.ts.map +1 -0
package/dist/lib/benchmark-paths.js +38 -0
package/dist/lib/benchmark-paths.js.map +1 -0
package/dist/lib/benchmark-specs.d.ts +8 -0
package/dist/lib/benchmark-specs.d.ts.map +1 -0
package/dist/lib/benchmark-specs.js +115 -0
package/dist/lib/benchmark-specs.js.map +1 -0
package/dist/lib/benchmark-targets.d.ts +5 -0
package/dist/lib/benchmark-targets.d.ts.map +1 -0
package/dist/lib/benchmark-targets.js +72 -0
package/dist/lib/benchmark-targets.js.map +1 -0
package/dist/lib/benchmark-types.d.ts +19 -0
package/dist/lib/benchmark-types.d.ts.map +1 -0
package/dist/lib/benchmark-types.js +2 -0
package/dist/lib/benchmark-types.js.map +1 -0
package/dist/lib/benchmark.d.ts +4 -29
package/dist/lib/benchmark.d.ts.map +1 -1
package/dist/lib/benchmark.js +3 -324
package/dist/lib/benchmark.js.map +1 -1
package/dist/lib/bundled-templates.d.ts +5 -0
package/dist/lib/bundled-templates.d.ts.map +1 -0
package/dist/lib/bundled-templates.js +23 -0
package/dist/lib/bundled-templates.js.map +1 -0
package/dist/lib/config.d.ts +1 -0
package/dist/lib/config.d.ts.map +1 -1
package/dist/lib/config.js +2 -0
package/dist/lib/config.js.map +1 -1
package/dist/lib/eval-packs.d.ts +204 -0
package/dist/lib/eval-packs.d.ts.map +1 -0
package/dist/lib/eval-packs.js +177 -0
package/dist/lib/eval-packs.js.map +1 -0
package/dist/lib/execution-profile.d.ts +18 -0
package/dist/lib/execution-profile.d.ts.map +1 -0
package/dist/lib/execution-profile.js +85 -0
package/dist/lib/execution-profile.js.map +1 -0
package/dist/lib/interf-bootstrap.d.ts +4 -0
package/dist/lib/interf-bootstrap.d.ts.map +1 -1
package/dist/lib/interf-bootstrap.js +71 -68
package/dist/lib/interf-bootstrap.js.map +1 -1
package/dist/lib/interf-compile-plan.d.ts +12 -0
package/dist/lib/interf-compile-plan.d.ts.map +1 -0
package/dist/lib/interf-compile-plan.js +143 -0
package/dist/lib/interf-compile-plan.js.map +1 -0
package/dist/lib/interf-detect.d.ts.map +1 -1
package/dist/lib/interf-detect.js +11 -10
package/dist/lib/interf-detect.js.map +1 -1
package/dist/lib/interf-scaffold.d.ts +1 -10
package/dist/lib/interf-scaffold.d.ts.map +1 -1
package/dist/lib/interf-scaffold.js +25 -362
package/dist/lib/interf-scaffold.js.map +1 -1
package/dist/lib/interf-workflow-package.d.ts +4 -0
package/dist/lib/interf-workflow-package.d.ts.map +1 -0
package/dist/lib/interf-workflow-package.js +131 -0
package/dist/lib/interf-workflow-package.js.map +1 -0
package/dist/lib/interf.d.ts +2 -1
package/dist/lib/interf.d.ts.map +1 -1
package/dist/lib/interf.js +2 -1
package/dist/lib/interf.js.map +1 -1
package/dist/lib/local-workflows.d.ts.map +1 -1
package/dist/lib/local-workflows.js +8 -12
package/dist/lib/local-workflows.js.map +1 -1
package/dist/lib/logger.d.ts +4 -0
package/dist/lib/logger.d.ts.map +1 -0
package/dist/lib/logger.js +11 -0
package/dist/lib/logger.js.map +1 -0
package/dist/lib/obsidian.d.ts.map +1 -1
package/dist/lib/obsidian.js +7 -3
package/dist/lib/obsidian.js.map +1 -1
package/dist/lib/parse.d.ts +2 -2
package/dist/lib/parse.d.ts.map +1 -1
package/dist/lib/parse.js +11 -7
package/dist/lib/parse.js.map +1 -1
package/dist/lib/registry.js +3 -3
package/dist/lib/registry.js.map +1 -1
package/dist/lib/runtime-acceptance.d.ts +4 -0
package/dist/lib/runtime-acceptance.d.ts.map +1 -0
package/dist/lib/runtime-acceptance.js +123 -0
package/dist/lib/runtime-acceptance.js.map +1 -0
package/dist/lib/runtime-contracts.d.ts +4 -0
package/dist/lib/runtime-contracts.d.ts.map +1 -0
package/dist/lib/runtime-contracts.js +63 -0
package/dist/lib/runtime-contracts.js.map +1 -0
package/dist/lib/runtime-paths.d.ts +8 -0
package/dist/lib/runtime-paths.d.ts.map +1 -0
package/dist/lib/runtime-paths.js +28 -0
package/dist/lib/runtime-paths.js.map +1 -0
package/dist/lib/runtime-prompt.d.ts +3 -0
package/dist/lib/runtime-prompt.d.ts.map +1 -0
package/dist/lib/runtime-prompt.js +59 -0
package/dist/lib/runtime-prompt.js.map +1 -0
package/dist/lib/runtime-reconcile.d.ts +6 -0
package/dist/lib/runtime-reconcile.d.ts.map +1 -0
package/dist/lib/runtime-reconcile.js +339 -0
package/dist/lib/runtime-reconcile.js.map +1 -0
package/dist/lib/runtime-runs.d.ts +12 -0
package/dist/lib/runtime-runs.d.ts.map +1 -0
package/dist/lib/runtime-runs.js +337 -0
package/dist/lib/runtime-runs.js.map +1 -0
package/dist/lib/runtime-types.d.ts +42 -0
package/dist/lib/runtime-types.d.ts.map +1 -0
package/dist/lib/runtime-types.js +2 -0
package/dist/lib/runtime-types.js.map +1 -0
package/dist/lib/runtime.d.ts +6 -58
package/dist/lib/runtime.d.ts.map +1 -1
package/dist/lib/runtime.js +5 -614
package/dist/lib/runtime.js.map +1 -1
package/dist/lib/schema.d.ts +156 -13
package/dist/lib/schema.d.ts.map +1 -1
package/dist/lib/schema.js +113 -4
package/dist/lib/schema.js.map +1 -1
package/dist/lib/source-config.d.ts +13 -0
package/dist/lib/source-config.d.ts.map +1 -0
package/dist/lib/source-config.js +75 -0
package/dist/lib/source-config.js.map +1 -0
package/dist/lib/state-artifacts.d.ts +15 -0
package/dist/lib/state-artifacts.d.ts.map +1 -0
package/dist/lib/state-artifacts.js +24 -0
package/dist/lib/state-artifacts.js.map +1 -0
package/dist/lib/state-health.d.ts +9 -0
package/dist/lib/state-health.d.ts.map +1 -0
package/dist/lib/state-health.js +330 -0
package/dist/lib/state-health.js.map +1 -0
package/dist/lib/state-io.d.ts +15 -0
package/dist/lib/state-io.d.ts.map +1 -0
package/dist/lib/state-io.js +219 -0
package/dist/lib/state-io.js.map +1 -0
package/dist/lib/state-paths.d.ts +5 -0
package/dist/lib/state-paths.d.ts.map +1 -0
package/dist/lib/state-paths.js +19 -0
package/dist/lib/state-paths.js.map +1 -0
package/dist/lib/state-view.d.ts +7 -0
package/dist/lib/state-view.d.ts.map +1 -0
package/dist/lib/state-view.js +147 -0
package/dist/lib/state-view.js.map +1 -0
package/dist/lib/state.d.ts +6 -46
package/dist/lib/state.d.ts.map +1 -1
package/dist/lib/state.js +5 -632
package/dist/lib/state.js.map +1 -1
package/dist/lib/summarize-plan.d.ts +1 -0
package/dist/lib/summarize-plan.d.ts.map +1 -1
package/dist/lib/summarize-plan.js +10 -0
package/dist/lib/summarize-plan.js.map +1 -1
package/dist/lib/user-config.js +2 -2
package/dist/lib/user-config.js.map +1 -1
package/dist/lib/validate-helpers.d.ts +21 -0
package/dist/lib/validate-helpers.d.ts.map +1 -0
package/dist/lib/validate-helpers.js +72 -0
package/dist/lib/validate-helpers.js.map +1 -0
package/dist/lib/validate-interface.d.ts +2 -0
package/dist/lib/validate-interface.d.ts.map +1 -1
package/dist/lib/validate-interface.js +103 -53
package/dist/lib/validate-interface.js.map +1 -1
package/dist/lib/validate-kb.d.ts +8 -0
package/dist/lib/validate-kb.d.ts.map +1 -1
package/dist/lib/validate-kb.js +53 -24
package/dist/lib/validate-kb.js.map +1 -1
package/dist/lib/validate.d.ts +1 -1
package/dist/lib/validate.d.ts.map +1 -1
package/dist/lib/validate.js +5 -2
package/dist/lib/validate.js.map +1 -1
package/dist/lib/workflow-definitions.d.ts +1 -1
package/dist/lib/workflow-definitions.d.ts.map +1 -1
package/dist/lib/workflow-definitions.js +90 -166
package/dist/lib/workflow-definitions.js.map +1 -1
package/dist/lib/workflow-helpers.d.ts.map +1 -1
package/dist/lib/workflow-helpers.js +6 -3
package/dist/lib/workflow-helpers.js.map +1 -1
package/dist/lib/workflow-stage-runner.d.ts +41 -0
package/dist/lib/workflow-stage-runner.d.ts.map +1 -0
package/dist/lib/workflow-stage-runner.js +106 -0
package/dist/lib/workflow-stage-runner.js.map +1 -0
package/dist/lib/workflow-starter-docs.d.ts +9 -0
package/dist/lib/workflow-starter-docs.d.ts.map +1 -0
package/dist/lib/workflow-starter-docs.js +18 -0
package/dist/lib/workflow-starter-docs.js.map +1 -0
package/dist/lib/workflows-interface-contracts.d.ts +24 -0
package/dist/lib/workflows-interface-contracts.d.ts.map +1 -0
package/dist/lib/workflows-interface-contracts.js +304 -0
package/dist/lib/workflows-interface-contracts.js.map +1 -0
package/dist/lib/workflows-interface.d.ts +3 -10
package/dist/lib/workflows-interface.d.ts.map +1 -1
package/dist/lib/workflows-interface.js +117 -365
package/dist/lib/workflows-interface.js.map +1 -1
package/dist/lib/workflows-kb.d.ts.map +1 -1
package/dist/lib/workflows-kb.js +79 -55
package/dist/lib/workflows-kb.js.map +1 -1
package/dist/lib/workflows.d.ts.map +1 -1
package/dist/lib/workflows.js +1 -1
package/dist/lib/workflows.js.map +1 -1
package/package.json +15 -4
package/skills/interface/analyze/SKILL.md +79 -28
package/skills/interface/compile/SKILL.md +27 -28
package/skills/interface/create/SKILL.md +53 -230
package/skills/interface/create/references/compile-plan-format.md +31 -31
package/skills/interface/create/references/workflows.md +17 -32
package/skills/interface/query/SKILL.md +15 -1
package/skills/interface/retrieve/SKILL.md +32 -65
package/skills/knowledge-base/compile/SKILL.md +59 -83
package/skills/knowledge-base/compile/references/stage-claims.md +1 -1
package/skills/knowledge-base/compile/references/stage-entities.md +2 -2
package/skills/knowledge-base/query/SKILL.md +13 -1
package/skills/knowledge-base/summarize/SKILL.md +54 -24
package/templates/interface/README.md +13 -12
package/templates/interface/interfaces.md +14 -11
package/templates/knowledge-base/README.md +0 -1
package/templates/knowledge-base/registry.md +15 -15
package/templates/workflow-package/README.md +16 -0
package/templates/workflow-package/create/SKILL.md +8 -0
package/templates/workflow-package/interface-query/SKILL.md +29 -0
package/templates/workflow-package/interface-stage/SKILL.md +13 -0
package/templates/workflow-package/knowledge-base-query/SKILL.md +36 -0
package/templates/workflow-package/knowledge-base-stage/SKILL.md +13 -0
package/templates/workflow-starters/interface/interf/README.md +13 -0
package/templates/workflow-starters/interface/interf/create/SKILL.md +15 -0
package/templates/workflow-starters/knowledge-base/interf/README.md +13 -0
package/templates/workflow-starters/knowledge-base/karpathy/README.md +13 -0

package/README.md CHANGED Viewed

@@ -1,272 +1,277 @@
 # Interf
-The open-source knowledge compiler.
+Interf Knowledge Compiler uses local agents such as Claude Code and Codex to run a data-processing workflow over your files.
-Interf compiles folders into knowledge bases and task-specific interfaces: agent-ready workspaces with proof, structure, and benchmarks.
+It creates a workspace with notes and navigation so the agent can see what is in the folder and what to retrieve.
-- compile any folder into a knowledge base
-- create focused interfaces for specific tasks
-- run evals and benchmarks on your own files
+Then you test that workspace on your evals.
-Most LLM knowledge-base repos optimize for a demo. Interf optimizes for proof. It keeps your files on disk, compiles a visible folder an agent can actually use, and makes workflows compete on your evals instead of on marketing claims.
+- your files stay on your machine
+- you choose the local agent
+- you decide what must be true
-## Why Interf
+Agents start missing things when a task spans PDFs, charts, and several files in one folder. That usually shows up when the job depends on:
-Interf is built around three ideas:
+- reading reports and filings
+- extracting a number from a chart
+- understanding what is inside a folder before doing work
+- pulling context together across several files
+- checking the raw source when the answer has to be exact
-- the product surface is the compiled folder, not a hidden service
-- the workflow should leave proof of work on disk
-- the method should be benchmarkable on your task
+The workspace exists so the agent does not have to rediscover the folder from scratch on every run.
-That gives you a simple loop:
+The point is proof on your data, not generic AI claims.
-1. point Interf at a folder
-2. compile a knowledge base
-3. create an interface for a job
-4. run evals and benchmarks to see what actually works
+The simplest way to use Interf is to compare the same task before and after compilation:
-## Core concepts
+- run the task on the raw folder
+- compile the folder with Interf
+- run the same task again from the workspace
+- if you want a recorded pass/fail result, add evals and run `interf benchmark`
-- **Source folder**: your real files stay where they are
-- **Knowledge base**: `interf/{name}/`, the shared compiled layer over that folder
-- **Interface**: `interf/{name}/interfaces/{interface-name}/`, a task-specific surface on top of one knowledge base
-- **Workflow**: the reusable method package that defines the compile pipeline
-- **Benchmark**: running evals across compiled knowledge bases or interfaces on the same folder
+## Quick Start
-One source folder can host multiple knowledge bases under `interf/` when you want to compare workflows like `interf` vs `karpathy` on the same data.
+Requirements:
-## Interf primitives
+- Node.js 20+
+- a local coding agent: Claude Code or Codex
-Interf gives you a few strong primitives instead of a giant abstraction layer:
+Install and check setup:
-- **workflow package**: `workflow.json` plus local `workflow/` docs define the method
-- **stage contract**: every compile stage gets a deterministic acceptance boundary
-- **declarative acceptance**: workflows can declare extra acceptance rules in `workflow.json`
-- **CLI enforcement**: the CLI checks whether a stage actually complied instead of trusting the agent's summary
-- **benchmark specs**: file-based evals let you compare workflows and interfaces on the same folder
-That is the core product promise:
-- define what the agent should do in plain English
-- give the agent local workspace docs and stage contracts
-- validate the result deterministically
-For workflow authors, the important surface is:
-- `workflow.json`
-- `workflow/create/`
-- `workflow/compile/stages/<stage>/`
-- `workflow/use/query/`
-- [`docs/workflow-spec.md`](./docs/workflow-spec.md)
-## What the agent sees
-The compiled folder is the agent-facing product surface: an agent-ready workspace.
-Important files in a KB or interface:
+```bash
+npm install -g @interf/compiler
+interf doctor
+```
-- `interf.json` = what this workspace is
-- `AGENTS.md` = where to start and how to navigate
-- `workflow/` = the editable local method package
-- `home.md` = entry document
-- `summaries/`, `knowledge/`, and `briefs/` = compiled outputs
+Then run Interf in any folder:
-Manual query/use works like this:
+```bash
+cd ~/my-folder
+interf init
+interf compile
+interf benchmark
+```
-- open the KB or interface folder
-- read `AGENTS.md`
-- follow `workflow/use/query/SKILL.md`
-- for interfaces, use local interface artifacts first, then the parent KB loop, then raw files if needed
+That is the whole first loop:
-Interf does not require globally installed slash skills for workspace behavior. Local `workflow/.../SKILL.md` files are workspace instruction docs routed by `AGENTS.md` and stage contracts.
+- point Interf at a folder you already have
+- compile the workspace
+- ask the agent to use it
+- add evals later when you want to check the result more formally
-## Quick start
+`interf init` chooses your local agent and can attach the current folder right away. It does not move or replace your files.
-Install the published package:
+Fastest sample loop:
 ```bash
-npm install -g @interf/compiler
+cp -r examples/benchmark-demo /tmp/interf-demo
+cd /tmp/interf-demo
+interf init
+interf compile
+interf benchmark
 ```
-Or install from source while contributing:
+If you want a task-specific workspace for one job, add an interface:
 ```bash
-npm install
-npm run build
-npm install -g .
+interf create interface
+interf compile
+interf benchmark
 ```
-Initialize Interf in any folder:
-```bash
-cd ~/my-notes
-interf init
+## Start With One Small Eval
+`interf.config.json` is where you write what must be true.
+Use it for:
+- broad checks on the folder as a whole
+- task-specific checks for one interface
+Example shape:
+```json
+{
+  "knowledge_base": {
+    "name": "uk-office-market-report",
+    "evals": [
+      {
+        "question": "What was Bristol annual take-up in 2018, in millions of square feet?",
+        "answer": "About 0.5 million square feet. Accept answers between 0.3 and 0.6 if they clearly refer to Bristol annual take-up in 2018."
+      }
+    ]
+  },
+  "interfaces": [
+    {
+      "name": "market-briefing",
+      "about": "Prepare a short briefing from the office market report.",
+      "evals": [
+        {
+          "question": "What was Bristol availability in 2018, in millions of square feet?",
+          "answer": "About 0.6 million square feet. Accept answers between 0.5 and 0.7 if they clearly refer to Bristol availability in 2018."
+        },
+        {
+          "question": "Did Bristol annual take-up rise or fall between 2016 and 2018?",
+          "answer": "It fell. The chart shows roughly 0.7 to 0.8 million square feet in 2016 and about 0.5 million square feet in 2018."
+        }
+      ]
+    }
+  ]
+}
 ```
-That flow can:
+Good first evals are small and practical:
-- choose an executor like Claude Code or Codex
-- optionally install global helper skills
-- attach the current folder as a knowledge base
-- compile the knowledge base immediately
+- one exact number from a chart, table, or filing
+- one short statement that should be true or false
+- one simple comparison across years, files, or sections
-Then you can:
+Then run:
 ```bash
-interf create interface
 interf compile
 interf benchmark
 ```
-## Example layout
+If the benchmark does not show an improvement over raw files, keep iterating or move to the experiment loop described below.
-```text
-source-folder/
-  ...your files...
-  interf/
-    workflows/
-    benchmarks/
-    {knowledge-base-name}/
-      interf.json
-      AGENTS.md
-      CLAUDE.md
-      home.md
-      workflow/
-      summaries/
-      knowledge/
-      interfaces/
-        {interface-name}/
-          interf.json
-          compile-plan.md
-          AGENTS.md
-          CLAUDE.md
-          home.md
-          workflow/
-          knowledge/
-          briefs/
-          summaries/
-```
+## Compare Three Things
-## Commands
+Compare:
-- `interf init` = global setup first; if run inside a normal folder, it can also attach and compile a knowledge base there
-- `interf create` = chooser when type is omitted
-- `interf create knowledge-base` = attach current folder
-- `interf create interface` = create an interface for the current folder's knowledge base
-- `interf create workflow` = create a reusable workflow package
-- `interf compile` = compile the current knowledge base or interface
-- `interf benchmark` = compare compiled knowledge bases or interfaces with file-based evals
-- `interf doctor` = preflight local executor setup before a real compile
-- `interf status` = show deterministic health
-- `interf verify <check>` = internal deterministic referee for major workflow steps
-- `interf reset <scope>` = reset generated state while keeping source files
+1. the raw folder
+2. the workspace
+3. an interface for one specific job
-## Workflows
+`interf benchmark` is how you compare those on the same evals.
-A workflow is a package, not just a prompt.
+That gives you three clear questions:
-It has two layers:
+- is the raw folder enough?
+- does the workspace retrieve better?
+- does a dedicated interface do better than both?
-- machine layer: `workflow.json`
-- human/agent layer: `workflow/` docs
+## What `interf compile` Actually Does
-Typical reusable workflow package:
+`interf compile` runs a workflow over your folder.
-```text
-interf/workflows/knowledge-base/<workflow-id>/
-  workflow.json
-  README.md
-  create/
-    SKILL.md
-  compile/
-    stages/
-      <stage-id>/
-        SKILL.md
-  use/
-    query/
-      SKILL.md
-```
+That workflow is the compilation pipeline:
+- read the files
+- write processed notes and navigation files
+- build the workspace your agent can use
+- optionally build an interface for one specific job
+The default workflow is built in. If you want a different method, you can define your own workflow package and benchmark it on the same folder.
+## Experiment Loop
+Interf Knowledge Compiler also supports an experiment loop above compile + benchmark.
-Interf keeps the public command surface stable while letting workflows vary the internal stage pipeline. The engine still owns contract kinds, required artifacts, and state flow.
+It runs controlled experiments against the same folder and the same evals. Each attempt reruns the compilation workflow, reruns the benchmark, and records what changed. It stops when:
-## Benchmarks and evals
+- the evals pass
+- or the experiment budget is exhausted
-Interf is benchmark-first.
+In practice, that means:
-You can:
+- `retry_policy.max_attempts_per_profile` controls how many experiment attempts each compile profile gets
+- stronger diagnostic profiles can be used only after the default ones fail
+- the loop is still judged on the same eval truth from your folder
+- failure summaries can be captured between attempts for diagnosis
-- build multiple knowledge bases over the same folder
-- compare workflows on the same source set
-- compare interfaces for the same business task
-- inspect proofs, outputs, and costs locally
+Today that advanced path is configured through eval packs and explained in the deeper docs. The workflow is the part you change. The experiment loop is the controller that runs those experiments against the same evals with a fixed attempt budget.
-Reusable benchmark specs and saved runs live under:
+Use the simple loop first. Use the experiment loop when you want to test workflow or profile changes against the same evals until one passes or the attempt budget runs out.
+## Use It With Your Agent
+If you already work through Claude Code, Codex, OpenClaw, or Hermes, the agent can run this loop for you.
+Paste something like this into Claude Code, Codex, OpenClaw, or Hermes:
 ```text
-source-folder/
-  interf/
-    benchmarks/
-      knowledge-base/*.json
-      interface/*.json
-      runs/
+Install @interf/compiler, run `interf init` in this folder, and use the local agent executor.
+If `interf.config.json` is missing, draft evals for what must be true for this task and ask me to confirm them.
+Then run `interf compile` and `interf benchmark`.
+Tell me whether the processed workspace beat raw files, and only recommend it if it did.
 ```
-This is the trust loop: don't trust a repo because it says its knowledge base is better. Run the benchmark on your folder.
+That is the basic loop:
-## Builder docs
+- the user or agent defines what must be true
+- Interf prepares processed data for retrieval
+- the benchmark shows whether that helped
-If you want to create your own workflows, start here:
+## What Gets Created
-1. [`docs/workflow-spec.md`](./docs/workflow-spec.md)
-2. [`docs/runtime-contract.md`](./docs/runtime-contract.md)
-3. [`docs/architecture.md`](./docs/architecture.md)
+After compile, Interf writes into `./interf/` beside your source files.
-## Maintainer test loop
+- `interf/<name>/` is the shared workspace over the folder
+- `interf/<name>/interfaces/<interface-name>/` is a task-specific workspace for one job
+- `interf/benchmarks/runs/...` stores saved benchmark runs
-Smoke suite:
+Inside those workspaces you will see things like:
-```bash
-npm test
-```
+- summaries of source files
+- navigation notes and entrypoints for agents
+- task-specific outputs for one interface
+- benchmark artifacts you can inspect later
-Real executor end-to-end:
+In the CLI, the main Interf workspace is called a **knowledge base**. A task-specific workspace inside it is called an **interface**.
-```bash
-npm run test:e2e
-npm run test:e2e:compare
-```
+## When To Create An Interface
-Cached quick real-executor loop:
+Start with one workspace.
-```bash
-npm run test:e2e:quick
-npm run test:full
-```
+Create an interface when your agent needs outputs shaped for one specific job, for example:
+- weekly briefing
+- diligence on a deal room
+- extracting chart values from research PDFs
+- a focused research assistant for one question set
-Underlying acceptance commands:
+If that workspace is enough for the job, you do not need an interface yet.
+## Custom Workflows
+Interf ships with a default workflow.
+If you want to change how compilation happens on your data, this is the part you customize:
 ```bash
-npm run test:acceptance-live
-npm run test:acceptance-compare
-npm run test:acceptance-cache:refresh
-npm run test:acceptance-quick:create-interface
-npm run test:acceptance-quick:query-interface
+interf create workflow
+interf verify workflow --path <path>
 ```
-The cached quick fixture lives under `.interf-test-cache/latest-quick/`.
-`npm test` is the fast smoke/integration suite. When you want a real agent/executor end-to-end run, use `npm run test:e2e` or `npm run test:e2e:quick`.
-`npm run test:full` is the convenient day-to-day command: smoke suite plus cached quick real-executor checks.
+Then benchmark that workflow on the same folder and the same evals.
+Workflow package docs live in [docs/workflow-spec.md](./docs/workflow-spec.md).
+## Core Commands
+- `interf init` = choose your local executor and optionally attach the current folder
+- `interf create knowledge-base` = create the shared processed workspace for this folder
+- `interf create interface` = create a task-specific workspace on top
+- `interf create workflow` = create a reusable local workflow package
+- `interf compile` = build the current workspace
+- `interf benchmark` = compare raw files vs processed workspaces on your evals
+- `interf doctor` = check local executor setup
+- `interf verify <check>` = run deterministic checks on major workflow steps
+- `interf reset <scope>` = remove generated state while keeping source files
-## Design choices
+## More Docs
-- filesystem-first, not service-first
-- workflow packages over hidden orchestration
-- contract-checked stages instead of prompt-only trust
-- benchmarkability as a core product feature
-- local control: your files stay on disk and run in your environment
+- [docs/workflow-spec.md](./docs/workflow-spec.md) for custom workflow packages
+- [docs/runtime-contract.md](./docs/runtime-contract.md) for the exact on-disk contract
+- [docs/architecture.md](./docs/architecture.md) for the deeper system model
+- [docs/eval-loop.md](./docs/eval-loop.md) for the advanced benchmark and experiment loop
-Interf is not trying to win by hiding complexity. It is trying to make the method visible, enforceable, and comparable.
+Maintainers should use [CONTRIBUTING.md](./CONTRIBUTING.md) for test and release gates.
 ## License
-Code is licensed under Apache 2.0. The `Interf` name and branding are reserved; see [`TRADEMARKS.md`](./TRADEMARKS.md).
+Code is licensed under Apache 2.0. The `Interf` name and branding are reserved; see [TRADEMARKS.md](./TRADEMARKS.md).

package/dist/commands/benchmark.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"benchmark.d.ts","sourceRoot":"","sources":["../../src/commands/benchmark.ts"],"names":[],"mappings":"AAuBA,OAAO,KAAK,EAAE,aAAa,EAAE,MAAM,OAAO,CAAC;AAkY3C,eAAO,MAAM,gBAAgB,EAAE,aAmD9B,CAAC"}
1	+ {"version":3,"file":"benchmark.d.ts","sourceRoot":"","sources":["../../src/commands/benchmark.ts"],"names":[],"mappings":"AA0BA,OAAO,KAAK,EAAE,aAAa,EAAE,MAAM,OAAO,CAAC;AA2W3C,eAAO,MAAM,gBAAgB,EAAE,aA8D9B,CAAC"}