PyPI - openkb - Versions diffs - 0.1.4.dev0__tar.gz → 0.3.0__tar.gz - Mend

openkb 0.1.4.dev0.tar.gz → 0.3.0.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (81)

openkb-0.3.0/.claude-plugin/marketplace.json +31 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/.env.example +1 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/.github/workflows/publish.yml +14 -17
{openkb-0.1.4.dev0 → openkb-0.3.0}/.gitignore +1 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/PKG-INFO +126 -21
{openkb-0.1.4.dev0 → openkb-0.3.0}/README.md +123 -19
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/agent/chat.py +89 -5
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/agent/compiler.py +357 -29
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/agent/linter.py +1 -1
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/agent/query.py +44 -2
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/agent/tools.py +50 -6
openkb-0.3.0/openkb/cli.py +1958 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/converter.py +1 -1
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/lint.py +83 -7
openkb-0.3.0/openkb/prompts/__init__.py +21 -0
openkb-0.3.0/openkb/prompts/skill_create.md +214 -0
openkb-0.3.0/openkb/skill/__init__.py +101 -0
openkb-0.3.0/openkb/skill/creator.py +209 -0
openkb-0.3.0/openkb/skill/evaluator.py +490 -0
openkb-0.3.0/openkb/skill/generator.py +81 -0
openkb-0.3.0/openkb/skill/marketplace.py +120 -0
openkb-0.3.0/openkb/skill/tools.py +100 -0
openkb-0.3.0/openkb/skill/validator.py +265 -0
openkb-0.3.0/openkb/skill/workspace.py +197 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/state.py +23 -0
openkb-0.3.0/openkb/url_ingest.py +280 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/pyproject.toml +7 -3
openkb-0.3.0/skills/openkb/SKILL.md +175 -0
openkb-0.3.0/skills/openkb/references/commands.md +69 -0
openkb-0.3.0/skills/openkb/references/wiki-schema.md +119 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_add_command.py +4 -6
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_agent_tools.py +0 -2
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_chat_slash_commands.py +1 -1
openkb-0.3.0/tests/test_cli.py +367 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_compiler.py +10 -10
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_config.py +0 -2
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_converter.py +1 -4
openkb-0.3.0/tests/test_feedback.py +241 -0
openkb-0.3.0/tests/test_generator.py +60 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_images.py +0 -3
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_indexer.py +0 -2
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_lint.py +111 -3
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_linter.py +0 -1
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_list_status.py +19 -1
openkb-0.3.0/tests/test_marketplace.py +187 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_query.py +0 -1
openkb-0.3.0/tests/test_remove.py +1118 -0
openkb-0.3.0/tests/test_skill_chat_slash.py +105 -0
openkb-0.3.0/tests/test_skill_cli.py +396 -0
openkb-0.3.0/tests/test_skill_creator.py +109 -0
openkb-0.3.0/tests/test_skill_evaluator.py +411 -0
openkb-0.3.0/tests/test_skill_name_validation.py +37 -0
openkb-0.3.0/tests/test_skill_tools.py +67 -0
openkb-0.3.0/tests/test_skill_validator.py +410 -0
openkb-0.3.0/tests/test_skill_workspace.py +171 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_state.py +0 -2
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_tree_renderer.py +0 -1
openkb-0.3.0/tests/test_url_ingest.py +621 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_watcher.py +1 -2
openkb-0.3.0/tests/test_write_kb_file.py +79 -0
openkb-0.3.0/uv.lock +3652 -0
openkb-0.1.4.dev0/openkb/cli.py +0 -758
openkb-0.1.4.dev0/tests/test_cli.py +0 -160
{openkb-0.1.4.dev0 → openkb-0.3.0}/LICENSE +0 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/config.yaml.example +0 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/__init__.py +0 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/__main__.py +0 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/agent/__init__.py +0 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/agent/_markdown.py +0 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/agent/chat_session.py +0 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/config.py +0 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/images.py +0 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/indexer.py +0 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/log.py +0 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/schema.py +0 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/tree_renderer.py +0 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/openkb/watcher.py +0 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/conftest.py +0 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_chat_session.py +0 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_lint_cli.py +0 -0
{openkb-0.1.4.dev0 → openkb-0.3.0}/tests/test_markdown_renderer.py +0 -0

openkb-0.3.0/.claude-plugin/marketplace.json ADDED Viewed

@@ -0,0 +1,31 @@
+{
+  "name": "vectify",
+  "owner": {
+    "name": "Ray",
+    "email": "ray@vectify.ai"
+  },
+  "metadata": {
+    "description": "Skills for navigating an OpenKB-compiled knowledge base from agent CLIs (Claude Code, Codex, Gemini CLI).",
+    "version": "0.1.4"
+  },
+  "plugins": [
+    {
+      "name": "openkb",
+      "description": "Navigate an OpenKB-compiled wiki: discover documents and concepts via openkb CLI commands, read concept and summary pages directly, and follow wikilinks across the knowledge graph.",
+      "source": "./",
+      "strict": false,
+      "version": "0.1.4",
+      "author": {
+        "name": "Ray",
+        "email": "ray@vectify.ai"
+      },
+      "homepage": "https://github.com/VectifyAI/OpenKB",
+      "repository": "https://github.com/VectifyAI/OpenKB",
+      "license": "Apache-2.0",
+      "keywords": ["knowledge-base", "wiki", "openkb", "rag", "agent-skill"],
+      "skills": [
+        "./skills/openkb"
+      ]
+    }
+  ]
+}

{openkb-0.1.4.dev0 → openkb-0.3.0}/.env.example RENAMED Viewed

@@ -2,4 +2,5 @@
 # OpenAI:    LLM_API_KEY=sk-...
 # Anthropic: LLM_API_KEY=sk-ant-...
 # Gemini:    LLM_API_KEY=AIza...
+# DeepSeek:  LLM_API_KEY=sk-...
 LLM_API_KEY=your-key-here

{openkb-0.1.4.dev0 → openkb-0.3.0}/.github/workflows/publish.yml RENAMED Viewed

@@ -1,16 +1,20 @@
 name: Publish to PyPI
 # Release flow:
-#   1. Bump `version` in pyproject.toml on main.
-#   2. `git tag -a vX.Y.Z -m "Release X.Y.Z" && git push origin vX.Y.Z`
-#      The tag MUST match pyproject.toml's version exactly (with the `v` prefix).
-#   3. This workflow builds the package, publishes to PyPI via OIDC trusted
-#      publishing, and creates a GitHub Release with auto-generated notes.
+#   1. `git tag -a vX.Y.Z -m "Release X.Y.Z" && git push origin vX.Y.Z`
+#   2. This workflow builds the package (hatch-vcs derives the version from
+#      the tag automatically — pyproject.toml has no static version field),
+#      publishes to PyPI via OIDC trusted publishing, and creates a GitHub
+#      Release with auto-generated notes.
+#
+# Tag must follow PEP 440: `v0.1.4`, `v0.2.0rc1`, `v0.1.4.dev0`. The
+# leading `v` is stripped by hatch-vcs when computing the package version.
 #
 # Do not run `python -m build && twine upload` locally — that bypasses the
-# version check and leaves no GitHub Release. PyPI rejects duplicate
-# version uploads, so if the workflow fails after PyPI publish succeeded,
-# manually create the missing GitHub Release with `gh release create vX.Y.Z`.
+# GitHub Release creation and produces a release without an attached
+# changelog. PyPI rejects duplicate version uploads, so if the workflow
+# fails after PyPI publish succeeded, manually create the missing GitHub
+# Release with `gh release create vX.Y.Z`.
 on:
   push:
@@ -26,20 +30,13 @@ jobs:
       contents: write   # Create GitHub Release
     steps:
       - uses: actions/checkout@692973e3d937129bcbf40652eb9f2f61becf3332  # v4.2.2
+        with:
+          fetch-depth: 0   # hatch-vcs needs full history + tags
       - uses: actions/setup-python@f677139bbe7f9c59b41e40162b753c062f5d49a3  # v5.2.0
         with:
           python-version: "3.12"
-      - name: Verify tag matches pyproject.toml version
-        run: |
-          tag="${GITHUB_REF_NAME#v}"
-          pkg_version=$(python -c "import tomllib,pathlib; print(tomllib.loads(pathlib.Path('pyproject.toml').read_text())['project']['version'])")
-          if [ "$tag" != "$pkg_version" ]; then
-            echo "::error::Tag v$tag does not match pyproject.toml version $pkg_version"
-            exit 1
-          fi
       - name: Install build tools
         run: pip install build

{openkb-0.1.4.dev0 → openkb-0.3.0}/.gitignore RENAMED Viewed

@@ -13,6 +13,7 @@ venv/
 raw/
 wiki/
 .openkb/
+output/
 # Local only
 docs/

{openkb-0.1.4.dev0 → openkb-0.3.0}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: openkb
-Version: 0.1.4.dev0
+Version: 0.3.0
 Summary: OpenKB: Open LLM Knowledge Base, powered by PageIndex
 Project-URL: Repository, https://github.com/VectifyAI/OpenKB
 Project-URL: Homepage, https://github.com/VectifyAI/OpenKB
@@ -22,13 +22,14 @@ Requires-Python: >=3.10
 Requires-Dist: click>=8.0
 Requires-Dist: json-repair
 Requires-Dist: litellm
-Requires-Dist: markitdown[all]
+Requires-Dist: markitdown[docx,pptx,xls,xlsx]>=0.1.5
 Requires-Dist: openai-agents
 Requires-Dist: pageindex==0.3.0.dev1
 Requires-Dist: prompt-toolkit>=3.0
 Requires-Dist: python-dotenv
 Requires-Dist: pyyaml
 Requires-Dist: rich>=13.0
+Requires-Dist: trafilatura>=2.0
 Requires-Dist: watchdog>=3.0
 Provides-Extra: dev
 Requires-Dist: pytest; extra == 'dev'
@@ -59,17 +60,7 @@ The idea is based on a [concept](https://x.com/karpathy/status/20398056595256445
 Traditional RAG rediscovers knowledge from scratch on every query. Nothing accumulates. OpenKB compiles knowledge once into a persistent wiki, then keeps it current. Cross-references already exist. Contradictions are flagged. Synthesis reflects everything consumed.
-### Features
-- **Broad format support** — PDF, Word, Markdown, PowerPoint, HTML, Excel, text, and more via markitdown
-- **Scale to long documents** — Long and complex documents are handled via [PageIndex](https://github.com/VectifyAI/PageIndex) tree indexing, enabling accurate, vectorless long-context retrieval
-- **Native multi-modality** — Retrieves and understands figures, tables, and images, not just text
-- **Compiled Wiki** — LLM manages and compiles your documents into summaries, concept pages, and cross-links, all kept in sync
-- **Query** — Ask questions (one-off) against your wiki. The LLM navigates your compiled knowledge to answer
-- **Interactive Chat** — Multi-turn conversations with persisted sessions you can resume across runs
-- **Lint** — Health checks find contradictions, gaps, orphans, and stale content
-- **Watch mode** — Drop files into `raw/`, wiki updates automatically
-- **Obsidian compatible** — Wiki is plain `.md` files with `[[wikilinks]]`. Open in Obsidian for graph view and browsing
+OpenKB has two layers: a **wiki foundation** that compiles and maintains your knowledge, and **generators** (query / chat / Skill Factory) that turn it into useful output. See [Usage](#️-usage) for the full command list.
 # 🚀 Getting Started
@@ -109,13 +100,17 @@ openkb init
 # 3. Add documents
 openkb add paper.pdf
-openkb add ~/papers/  # Add a whole directory
+openkb add ~/papers/                            # Add a whole directory
+openkb add https://arxiv.org/pdf/2509.11420     # Or fetch from a URL
 # 4. Ask a question
 openkb query "What are the main findings?"
 # 5. Or chat interactively
 openkb chat
+# 6. Or distill your wiki into a redistributable skill
+openkb skill new my-expert "Reason like an expert on <topic-from-your-docs>"
 ```
 ### Set up your LLM
@@ -145,7 +140,7 @@ raw/                              You drop files here
  │                         Wiki Compilation (using LLM)
  │                                     │
  ▼                                     ▼
-wiki/
+wiki/                                  │            ← the foundation
  ├── index.md            Knowledge base overview
  ├── log.md              Operations timeline
  ├── AGENTS.md           Wiki schema (LLM instructions)
@@ -154,6 +149,13 @@ wiki/
  ├── concepts/           Cross-document synthesis ← the good stuff
  ├── explorations/       Saved query results
  └── reports/            Lint reports
+                                       │
+                ┌──────────────────────┼──────────────────────┐
+                ▼                      ▼                      ▼
+            query / chat         Skill Factory          (future)
+          (LLM answers from     openkb skill new       ppt / podcast /
+            the wiki)           → output/skills/        report / …
+                                + marketplace.json
 ```
 ### Short vs. Long Document Handling
@@ -180,26 +182,43 @@ A single source might touch 10-15 wiki pages. Knowledge accumulates: each docume
 # ⚙️ Usage
-### Commands
+OpenKB commands fall into two layers: the **wiki foundation** (compile + manage your knowledge) and **generators** (turn that wiki into useful output).
+## 🧱 Wiki Foundation — compile and maintain
 | Command | Description |
 |---|---|
 | `openkb init` | Initialize a new knowledge base (interactive) |
-| <code>openkb&nbsp;add&nbsp;&lt;file_or_dir&gt;</code> | Add documents and compile to wiki |
-| <code>openkb&nbsp;query&nbsp;"question"</code> | Ask a question over the knowledge base (use `--save` to save the answer to `wiki/explorations/`) |
-| `openkb chat` | Start an interactive multi-turn chat (use `--resume`, `--list`, `--delete` to manage sessions) |
+| <code>openkb&nbsp;add&nbsp;&lt;file_or_dir_or_URL&gt;</code> | Add documents and compile to wiki. URL ingest auto-detects PDF (saved as `.pdf` → PageIndex / markitdown) vs HTML (trafilatura main-content extract → `.md`) |
+| <code>openkb&nbsp;remove&nbsp;&lt;doc&gt;</code> | Remove a document and clean up its wiki pages, images, registry, and PageIndex state (use `--dry-run` to preview, `--keep-raw` / `--keep-empty-concepts` to retain artifacts) |
 | `openkb watch` | Watch `raw/` and auto-compile new files |
 | `openkb lint` | Run structural + knowledge health checks |
 | `openkb list` | List indexed documents and concepts |
 | `openkb status` | Show knowledge base stats |
+| <code>openkb&nbsp;feedback&nbsp;["msg"]</code> | File feedback by opening a prefilled GitHub issue (use `--type bug/feature/question` to tag the issue) |
 <!-- | `openkb lint --fix` | Auto-fix what it can | -->
-### Interactive Chat
+## ✨ Generators — turn the wiki into output
+A "generator" reads from the compiled wiki and produces something usable: an answer, a conversation, a skill folder. The wiki is the substrate; generators are the surfaces.
+| Command | Output |
+|---|---|
+| <code>openkb&nbsp;query&nbsp;"question"</code> | A grounded answer with citations (use `--save` to persist to `wiki/explorations/`) |
+| `openkb chat` | Interactive multi-turn session over the wiki (use `--resume`, `--list`, `--delete` to manage sessions) |
+| <code>openkb&nbsp;skill&nbsp;new&nbsp;&lt;name&gt;&nbsp;"&lt;intent&gt;"</code> | A redistributable Anthropic Skill at `<kb>/output/skills/<name>/` + auto-updated `marketplace.json` |
+| <code>openkb&nbsp;skill&nbsp;validate&nbsp;[name]</code> | Structural lint of compiled skills (frontmatter, file sizes, wikilinks, scripts/ stdlib check with `--strict`). Auto-runs at end of `skill new` |
+| <code>openkb&nbsp;skill&nbsp;eval&nbsp;&lt;name&gt;</code> | Trigger-accuracy evaluation — does the `description:` field actually fire? LLM generates eval prompts; grader LLM scores activation. `--save` persists the eval set |
+| <code>openkb&nbsp;skill&nbsp;history&nbsp;&lt;name&gt;</code> / <code>openkb&nbsp;skill&nbsp;rollback&nbsp;&lt;name&gt;</code> | Iteration workspace — every overwrite saves the previous version to `output/skills/<name>-workspace/iteration-N/` with a structural diff. Rollback restores any iteration |
+### Query & Chat — ask the wiki
-`openkb chat` opens an interactive chat session over your wiki knowledge base. Unlike the one-shot `openkb query`, each turn carries the conversation history, so you can dig into a topic without re-typing context.
+`openkb query "..."` answers a single question. `openkb chat` is interactive — each turn carries history, so you can dig into a topic without re-typing context. Both use the same underlying wiki and the same retrieval primitives (PageIndex for long docs, direct concept reads for short).
 ```bash
+openkb query "What does the literature say about attention scaling?"
 openkb chat                       # start a new session
 openkb chat --resume              # resume the most recent session
 openkb chat --resume 20260411     # resume by id (unique prefix works)
@@ -213,11 +232,70 @@ Inside a chat, type `/` to access slash commands (Tab to complete):
 - `/status` — show knowledge base status
 - `/list` — list all documents
 - `/add <path>` — add a document or directory without leaving the chat
+- `/skill new <name> "<intent>"` — compile a skill from this chat (see below)
 - `/save [name]` — export the transcript to `wiki/explorations/`
 - `/clear` — start a fresh session (the current one stays on disk)
 - `/lint` — run knowledge base lint
 - `/exit` — exit (Ctrl-D also works)
+### 🛠 Skill Factory — *Drop in a book. Out comes a digital expert.*
+The newest generator. `openkb skill new` distills any subset of your wiki into an [Anthropic Skill](https://docs.claude.com/en/docs/build-with-claude/skills) — a portable folder that **Claude Code, Codex CLI, Gemini CLI, and Cursor** all install and load natively. Drop in a book's worth of papers; out comes a specialist that other agents can call on.
+```bash
+openkb skill new karpathy-thinking \
+  "Reason about transformers and attention in Karpathy's style"
+```
+This produces:
+```
+<kb>/output/skills/karpathy-thinking/
+├── SKILL.md                   # YAML frontmatter + when-to-use + approach
+├── references/                # depth material the agent loads on demand
+│   ├── methodology.md
+│   └── key-quotes.md
+└── (scripts/)                 # optional, only if intent implies computation
+```
+…plus an auto-updated `<kb>/.claude-plugin/marketplace.json` so the whole KB is one-line installable.
+**Install locally:**
+```bash
+cp -r output/skills/karpathy-thinking ~/.claude/skills/
+```
+**Share with others** — push your KB to GitHub, then anyone runs:
+```bash
+npx skills@latest add <your-org>/<your-repo>
+```
+**Iterate from chat** — compilation is one-shot, but follow-up edits aren't. Inside `openkb chat`, you can refine without re-running the whole pipeline:
+```
+/skill new karpathy-thinking "Reason about transformers like Karpathy"
+[generation streams]
+> description is too generic, make it about transformer implementations specifically
+[agent edits SKILL.md frontmatter in place]
+```
+**Quality gates** — structural validation, trigger-accuracy + body-coverage evaluation, and full history/rollback:
+```bash
+# Lint structure (auto-runs at end of `skill new`)
+openkb skill validate karpathy-thinking
+openkb skill validate --strict          # treat warnings as failures
+# Does the description actually fire when it should?
+openkb skill eval karpathy-thinking --save
+# History + rollback if a new iteration regresses
+openkb skill history karpathy-thinking
+openkb skill rollback karpathy-thinking --to 2
+```
 ### Configuration
 Settings are initialized by `openkb init`, and stored in `.openkb/config.yaml`:
@@ -272,6 +350,33 @@ OpenKB's wiki is a directory of Markdown files with `[[wikilinks]]`. Obsidian re
 3. Use graph view to see knowledge connections
 4. Use Obsidian Web Clipper to add web articles to `raw/`
+### Using with Claude Code / Codex / Gemini CLI
+OpenKB ships a `SKILL.md` so any agent CLI can read your compiled wiki — no extra runtime, no MCP setup, just install the skill once.
+**Claude Code**:
+```
+/plugin marketplace add VectifyAI/OpenKB
+/plugin install openkb@vectify
+```
+**Gemini CLI**:
+```bash
+gemini skills install https://github.com/VectifyAI/OpenKB.git --path skills/openkb --consent
+```
+**OpenAI Codex CLI** (no marketplace command yet — manual symlink):
+```bash
+git clone https://github.com/VectifyAI/OpenKB.git ~/openkb-src
+mkdir -p ~/.agents/skills
+ln -s ~/openkb-src/skills/openkb ~/.agents/skills/openkb
+```
+The skill is read-only — it won't run `openkb add`, `remove`, or `lint --fix` without you asking. See [`skills/openkb/SKILL.md`](skills/openkb/SKILL.md) for the full instruction set.
 # 🧭 Learn More
 ### Compared to Karpathy's Approach

{openkb-0.1.4.dev0 → openkb-0.3.0}/README.md RENAMED Viewed

@@ -22,17 +22,7 @@ The idea is based on a [concept](https://x.com/karpathy/status/20398056595256445
 Traditional RAG rediscovers knowledge from scratch on every query. Nothing accumulates. OpenKB compiles knowledge once into a persistent wiki, then keeps it current. Cross-references already exist. Contradictions are flagged. Synthesis reflects everything consumed.
-### Features
-- **Broad format support** — PDF, Word, Markdown, PowerPoint, HTML, Excel, text, and more via markitdown
-- **Scale to long documents** — Long and complex documents are handled via [PageIndex](https://github.com/VectifyAI/PageIndex) tree indexing, enabling accurate, vectorless long-context retrieval
-- **Native multi-modality** — Retrieves and understands figures, tables, and images, not just text
-- **Compiled Wiki** — LLM manages and compiles your documents into summaries, concept pages, and cross-links, all kept in sync
-- **Query** — Ask questions (one-off) against your wiki. The LLM navigates your compiled knowledge to answer
-- **Interactive Chat** — Multi-turn conversations with persisted sessions you can resume across runs
-- **Lint** — Health checks find contradictions, gaps, orphans, and stale content
-- **Watch mode** — Drop files into `raw/`, wiki updates automatically
-- **Obsidian compatible** — Wiki is plain `.md` files with `[[wikilinks]]`. Open in Obsidian for graph view and browsing
+OpenKB has two layers: a **wiki foundation** that compiles and maintains your knowledge, and **generators** (query / chat / Skill Factory) that turn it into useful output. See [Usage](#️-usage) for the full command list.
 # 🚀 Getting Started
@@ -72,13 +62,17 @@ openkb init
 # 3. Add documents
 openkb add paper.pdf
-openkb add ~/papers/  # Add a whole directory
+openkb add ~/papers/                            # Add a whole directory
+openkb add https://arxiv.org/pdf/2509.11420     # Or fetch from a URL
 # 4. Ask a question
 openkb query "What are the main findings?"
 # 5. Or chat interactively
 openkb chat
+# 6. Or distill your wiki into a redistributable skill
+openkb skill new my-expert "Reason like an expert on <topic-from-your-docs>"
 ```
 ### Set up your LLM
@@ -108,7 +102,7 @@ raw/                              You drop files here
  │                         Wiki Compilation (using LLM)
  │                                     │
  ▼                                     ▼
-wiki/
+wiki/                                  │            ← the foundation
  ├── index.md            Knowledge base overview
  ├── log.md              Operations timeline
  ├── AGENTS.md           Wiki schema (LLM instructions)
@@ -117,6 +111,13 @@ wiki/
  ├── concepts/           Cross-document synthesis ← the good stuff
  ├── explorations/       Saved query results
  └── reports/            Lint reports
+                                       │
+                ┌──────────────────────┼──────────────────────┐
+                ▼                      ▼                      ▼
+            query / chat         Skill Factory          (future)
+          (LLM answers from     openkb skill new       ppt / podcast /
+            the wiki)           → output/skills/        report / …
+                                + marketplace.json
 ```
 ### Short vs. Long Document Handling
@@ -143,26 +144,43 @@ A single source might touch 10-15 wiki pages. Knowledge accumulates: each docume
 # ⚙️ Usage
-### Commands
+OpenKB commands fall into two layers: the **wiki foundation** (compile + manage your knowledge) and **generators** (turn that wiki into useful output).
+## 🧱 Wiki Foundation — compile and maintain
 | Command | Description |
 |---|---|
 | `openkb init` | Initialize a new knowledge base (interactive) |
-| <code>openkb&nbsp;add&nbsp;&lt;file_or_dir&gt;</code> | Add documents and compile to wiki |
-| <code>openkb&nbsp;query&nbsp;"question"</code> | Ask a question over the knowledge base (use `--save` to save the answer to `wiki/explorations/`) |
-| `openkb chat` | Start an interactive multi-turn chat (use `--resume`, `--list`, `--delete` to manage sessions) |
+| <code>openkb&nbsp;add&nbsp;&lt;file_or_dir_or_URL&gt;</code> | Add documents and compile to wiki. URL ingest auto-detects PDF (saved as `.pdf` → PageIndex / markitdown) vs HTML (trafilatura main-content extract → `.md`) |
+| <code>openkb&nbsp;remove&nbsp;&lt;doc&gt;</code> | Remove a document and clean up its wiki pages, images, registry, and PageIndex state (use `--dry-run` to preview, `--keep-raw` / `--keep-empty-concepts` to retain artifacts) |
 | `openkb watch` | Watch `raw/` and auto-compile new files |
 | `openkb lint` | Run structural + knowledge health checks |
 | `openkb list` | List indexed documents and concepts |
 | `openkb status` | Show knowledge base stats |
+| <code>openkb&nbsp;feedback&nbsp;["msg"]</code> | File feedback by opening a prefilled GitHub issue (use `--type bug/feature/question` to tag the issue) |
 <!-- | `openkb lint --fix` | Auto-fix what it can | -->
-### Interactive Chat
+## ✨ Generators — turn the wiki into output
-`openkb chat` opens an interactive chat session over your wiki knowledge base. Unlike the one-shot `openkb query`, each turn carries the conversation history, so you can dig into a topic without re-typing context.
+A "generator" reads from the compiled wiki and produces something usable: an answer, a conversation, a skill folder. The wiki is the substrate; generators are the surfaces.
+| Command | Output |
+|---|---|
+| <code>openkb&nbsp;query&nbsp;"question"</code> | A grounded answer with citations (use `--save` to persist to `wiki/explorations/`) |
+| `openkb chat` | Interactive multi-turn session over the wiki (use `--resume`, `--list`, `--delete` to manage sessions) |
+| <code>openkb&nbsp;skill&nbsp;new&nbsp;&lt;name&gt;&nbsp;"&lt;intent&gt;"</code> | A redistributable Anthropic Skill at `<kb>/output/skills/<name>/` + auto-updated `marketplace.json` |
+| <code>openkb&nbsp;skill&nbsp;validate&nbsp;[name]</code> | Structural lint of compiled skills (frontmatter, file sizes, wikilinks, scripts/ stdlib check with `--strict`). Auto-runs at end of `skill new` |
+| <code>openkb&nbsp;skill&nbsp;eval&nbsp;&lt;name&gt;</code> | Trigger-accuracy evaluation — does the `description:` field actually fire? LLM generates eval prompts; grader LLM scores activation. `--save` persists the eval set |
+| <code>openkb&nbsp;skill&nbsp;history&nbsp;&lt;name&gt;</code> / <code>openkb&nbsp;skill&nbsp;rollback&nbsp;&lt;name&gt;</code> | Iteration workspace — every overwrite saves the previous version to `output/skills/<name>-workspace/iteration-N/` with a structural diff. Rollback restores any iteration |
+### Query & Chat — ask the wiki
+`openkb query "..."` answers a single question. `openkb chat` is interactive — each turn carries history, so you can dig into a topic without re-typing context. Both use the same underlying wiki and the same retrieval primitives (PageIndex for long docs, direct concept reads for short).
 ```bash
+openkb query "What does the literature say about attention scaling?"
 openkb chat                       # start a new session
 openkb chat --resume              # resume the most recent session
 openkb chat --resume 20260411     # resume by id (unique prefix works)
@@ -176,11 +194,70 @@ Inside a chat, type `/` to access slash commands (Tab to complete):
 - `/status` — show knowledge base status
 - `/list` — list all documents
 - `/add <path>` — add a document or directory without leaving the chat
+- `/skill new <name> "<intent>"` — compile a skill from this chat (see below)
 - `/save [name]` — export the transcript to `wiki/explorations/`
 - `/clear` — start a fresh session (the current one stays on disk)
 - `/lint` — run knowledge base lint
 - `/exit` — exit (Ctrl-D also works)
+### 🛠 Skill Factory — *Drop in a book. Out comes a digital expert.*
+The newest generator. `openkb skill new` distills any subset of your wiki into an [Anthropic Skill](https://docs.claude.com/en/docs/build-with-claude/skills) — a portable folder that **Claude Code, Codex CLI, Gemini CLI, and Cursor** all install and load natively. Drop in a book's worth of papers; out comes a specialist that other agents can call on.
+```bash
+openkb skill new karpathy-thinking \
+  "Reason about transformers and attention in Karpathy's style"
+```
+This produces:
+```
+<kb>/output/skills/karpathy-thinking/
+├── SKILL.md                   # YAML frontmatter + when-to-use + approach
+├── references/                # depth material the agent loads on demand
+│   ├── methodology.md
+│   └── key-quotes.md
+└── (scripts/)                 # optional, only if intent implies computation
+```
+…plus an auto-updated `<kb>/.claude-plugin/marketplace.json` so the whole KB is one-line installable.
+**Install locally:**
+```bash
+cp -r output/skills/karpathy-thinking ~/.claude/skills/
+```
+**Share with others** — push your KB to GitHub, then anyone runs:
+```bash
+npx skills@latest add <your-org>/<your-repo>
+```
+**Iterate from chat** — compilation is one-shot, but follow-up edits aren't. Inside `openkb chat`, you can refine without re-running the whole pipeline:
+```
+/skill new karpathy-thinking "Reason about transformers like Karpathy"
+[generation streams]
+> description is too generic, make it about transformer implementations specifically
+[agent edits SKILL.md frontmatter in place]
+```
+**Quality gates** — structural validation, trigger-accuracy + body-coverage evaluation, and full history/rollback:
+```bash
+# Lint structure (auto-runs at end of `skill new`)
+openkb skill validate karpathy-thinking
+openkb skill validate --strict          # treat warnings as failures
+# Does the description actually fire when it should?
+openkb skill eval karpathy-thinking --save
+# History + rollback if a new iteration regresses
+openkb skill history karpathy-thinking
+openkb skill rollback karpathy-thinking --to 2
+```
 ### Configuration
 Settings are initialized by `openkb init`, and stored in `.openkb/config.yaml`:
@@ -235,6 +312,33 @@ OpenKB's wiki is a directory of Markdown files with `[[wikilinks]]`. Obsidian re
 3. Use graph view to see knowledge connections
 4. Use Obsidian Web Clipper to add web articles to `raw/`
+### Using with Claude Code / Codex / Gemini CLI
+OpenKB ships a `SKILL.md` so any agent CLI can read your compiled wiki — no extra runtime, no MCP setup, just install the skill once.
+**Claude Code**:
+```
+/plugin marketplace add VectifyAI/OpenKB
+/plugin install openkb@vectify
+```
+**Gemini CLI**:
+```bash
+gemini skills install https://github.com/VectifyAI/OpenKB.git --path skills/openkb --consent
+```
+**OpenAI Codex CLI** (no marketplace command yet — manual symlink):
+```bash
+git clone https://github.com/VectifyAI/OpenKB.git ~/openkb-src
+mkdir -p ~/.agents/skills
+ln -s ~/openkb-src/skills/openkb ~/.agents/skills/openkb
+```
+The skill is read-only — it won't run `openkb add`, `remove`, or `lint --fix` without you asking. See [`skills/openkb/SKILL.md`](skills/openkb/SKILL.md) for the full instruction set.
 # 🧭 Learn More
 ### Compared to Karpathy's Approach

openkb 0.1.4.dev0__tar.gz → 0.3.0__tar.gz

openkb 0.1.4.dev0.tar.gz → 0.3.0.tar.gz