kyber-chat 1.0.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- kyber/__init__.py +6 -0
- kyber/__main__.py +8 -0
- kyber/agent/__init__.py +8 -0
- kyber/agent/context.py +224 -0
- kyber/agent/loop.py +687 -0
- kyber/agent/memory.py +109 -0
- kyber/agent/skills.py +244 -0
- kyber/agent/subagent.py +379 -0
- kyber/agent/tools/__init__.py +6 -0
- kyber/agent/tools/base.py +102 -0
- kyber/agent/tools/filesystem.py +191 -0
- kyber/agent/tools/message.py +86 -0
- kyber/agent/tools/registry.py +73 -0
- kyber/agent/tools/shell.py +141 -0
- kyber/agent/tools/spawn.py +65 -0
- kyber/agent/tools/task_status.py +53 -0
- kyber/agent/tools/web.py +163 -0
- kyber/bridge/package.json +26 -0
- kyber/bridge/src/index.ts +50 -0
- kyber/bridge/src/server.ts +104 -0
- kyber/bridge/src/types.d.ts +3 -0
- kyber/bridge/src/whatsapp.ts +185 -0
- kyber/bridge/tsconfig.json +16 -0
- kyber/bus/__init__.py +6 -0
- kyber/bus/events.py +37 -0
- kyber/bus/queue.py +81 -0
- kyber/channels/__init__.py +6 -0
- kyber/channels/base.py +121 -0
- kyber/channels/discord.py +304 -0
- kyber/channels/feishu.py +263 -0
- kyber/channels/manager.py +161 -0
- kyber/channels/telegram.py +302 -0
- kyber/channels/whatsapp.py +141 -0
- kyber/cli/__init__.py +1 -0
- kyber/cli/commands.py +736 -0
- kyber/config/__init__.py +6 -0
- kyber/config/loader.py +95 -0
- kyber/config/schema.py +205 -0
- kyber/cron/__init__.py +6 -0
- kyber/cron/service.py +346 -0
- kyber/cron/types.py +59 -0
- kyber/dashboard/__init__.py +5 -0
- kyber/dashboard/server.py +122 -0
- kyber/dashboard/static/app.js +458 -0
- kyber/dashboard/static/favicon.png +0 -0
- kyber/dashboard/static/index.html +107 -0
- kyber/dashboard/static/kyber_logo.png +0 -0
- kyber/dashboard/static/styles.css +608 -0
- kyber/heartbeat/__init__.py +5 -0
- kyber/heartbeat/service.py +130 -0
- kyber/providers/__init__.py +6 -0
- kyber/providers/base.py +69 -0
- kyber/providers/litellm_provider.py +227 -0
- kyber/providers/transcription.py +65 -0
- kyber/session/__init__.py +5 -0
- kyber/session/manager.py +202 -0
- kyber/skills/README.md +47 -0
- kyber/skills/github/SKILL.md +48 -0
- kyber/skills/skill-creator/SKILL.md +371 -0
- kyber/skills/summarize/SKILL.md +67 -0
- kyber/skills/tmux/SKILL.md +121 -0
- kyber/skills/tmux/scripts/find-sessions.sh +112 -0
- kyber/skills/tmux/scripts/wait-for-text.sh +83 -0
- kyber/skills/weather/SKILL.md +49 -0
- kyber/utils/__init__.py +5 -0
- kyber/utils/helpers.py +91 -0
- kyber_chat-1.0.0.dist-info/METADATA +35 -0
- kyber_chat-1.0.0.dist-info/RECORD +71 -0
- kyber_chat-1.0.0.dist-info/WHEEL +4 -0
- kyber_chat-1.0.0.dist-info/entry_points.txt +2 -0
- kyber_chat-1.0.0.dist-info/licenses/LICENSE +21 -0
kyber/session/manager.py
ADDED
|
@@ -0,0 +1,202 @@
|
|
|
1
|
+
"""Session management for conversation history."""
|
|
2
|
+
|
|
3
|
+
import json
|
|
4
|
+
from pathlib import Path
|
|
5
|
+
from dataclasses import dataclass, field
|
|
6
|
+
from datetime import datetime
|
|
7
|
+
from typing import Any
|
|
8
|
+
|
|
9
|
+
from loguru import logger
|
|
10
|
+
|
|
11
|
+
from kyber.utils.helpers import ensure_dir, safe_filename
|
|
12
|
+
|
|
13
|
+
|
|
14
|
+
@dataclass
|
|
15
|
+
class Session:
|
|
16
|
+
"""
|
|
17
|
+
A conversation session.
|
|
18
|
+
|
|
19
|
+
Stores messages in JSONL format for easy reading and persistence.
|
|
20
|
+
"""
|
|
21
|
+
|
|
22
|
+
key: str # channel:chat_id
|
|
23
|
+
messages: list[dict[str, Any]] = field(default_factory=list)
|
|
24
|
+
created_at: datetime = field(default_factory=datetime.now)
|
|
25
|
+
updated_at: datetime = field(default_factory=datetime.now)
|
|
26
|
+
metadata: dict[str, Any] = field(default_factory=dict)
|
|
27
|
+
|
|
28
|
+
def add_message(self, role: str, content: str, **kwargs: Any) -> None:
|
|
29
|
+
"""Add a message to the session."""
|
|
30
|
+
msg = {
|
|
31
|
+
"role": role,
|
|
32
|
+
"content": content,
|
|
33
|
+
"timestamp": datetime.now().isoformat(),
|
|
34
|
+
**kwargs
|
|
35
|
+
}
|
|
36
|
+
self.messages.append(msg)
|
|
37
|
+
self.updated_at = datetime.now()
|
|
38
|
+
|
|
39
|
+
def get_history(self, max_messages: int = 50) -> list[dict[str, Any]]:
|
|
40
|
+
"""
|
|
41
|
+
Get message history for LLM context.
|
|
42
|
+
|
|
43
|
+
Args:
|
|
44
|
+
max_messages: Maximum messages to return.
|
|
45
|
+
|
|
46
|
+
Returns:
|
|
47
|
+
List of messages in LLM format.
|
|
48
|
+
"""
|
|
49
|
+
# Get recent messages
|
|
50
|
+
recent = self.messages[-max_messages:] if len(self.messages) > max_messages else self.messages
|
|
51
|
+
|
|
52
|
+
# Convert to LLM format (just role and content)
|
|
53
|
+
return [{"role": m["role"], "content": m["content"]} for m in recent]
|
|
54
|
+
|
|
55
|
+
def clear(self) -> None:
|
|
56
|
+
"""Clear all messages in the session."""
|
|
57
|
+
self.messages = []
|
|
58
|
+
self.updated_at = datetime.now()
|
|
59
|
+
|
|
60
|
+
|
|
61
|
+
class SessionManager:
|
|
62
|
+
"""
|
|
63
|
+
Manages conversation sessions.
|
|
64
|
+
|
|
65
|
+
Sessions are stored as JSONL files in the sessions directory.
|
|
66
|
+
"""
|
|
67
|
+
|
|
68
|
+
def __init__(self, workspace: Path):
|
|
69
|
+
self.workspace = workspace
|
|
70
|
+
self.sessions_dir = ensure_dir(Path.home() / ".kyber" / "sessions")
|
|
71
|
+
self._cache: dict[str, Session] = {}
|
|
72
|
+
|
|
73
|
+
def _get_session_path(self, key: str) -> Path:
|
|
74
|
+
"""Get the file path for a session."""
|
|
75
|
+
safe_key = safe_filename(key.replace(":", "_"))
|
|
76
|
+
return self.sessions_dir / f"{safe_key}.jsonl"
|
|
77
|
+
|
|
78
|
+
def get_or_create(self, key: str) -> Session:
|
|
79
|
+
"""
|
|
80
|
+
Get an existing session or create a new one.
|
|
81
|
+
|
|
82
|
+
Args:
|
|
83
|
+
key: Session key (usually channel:chat_id).
|
|
84
|
+
|
|
85
|
+
Returns:
|
|
86
|
+
The session.
|
|
87
|
+
"""
|
|
88
|
+
# Check cache
|
|
89
|
+
if key in self._cache:
|
|
90
|
+
return self._cache[key]
|
|
91
|
+
|
|
92
|
+
# Try to load from disk
|
|
93
|
+
session = self._load(key)
|
|
94
|
+
if session is None:
|
|
95
|
+
session = Session(key=key)
|
|
96
|
+
|
|
97
|
+
self._cache[key] = session
|
|
98
|
+
return session
|
|
99
|
+
|
|
100
|
+
def _load(self, key: str) -> Session | None:
|
|
101
|
+
"""Load a session from disk."""
|
|
102
|
+
path = self._get_session_path(key)
|
|
103
|
+
|
|
104
|
+
if not path.exists():
|
|
105
|
+
return None
|
|
106
|
+
|
|
107
|
+
try:
|
|
108
|
+
messages = []
|
|
109
|
+
metadata = {}
|
|
110
|
+
created_at = None
|
|
111
|
+
|
|
112
|
+
with open(path) as f:
|
|
113
|
+
for line in f:
|
|
114
|
+
line = line.strip()
|
|
115
|
+
if not line:
|
|
116
|
+
continue
|
|
117
|
+
|
|
118
|
+
data = json.loads(line)
|
|
119
|
+
|
|
120
|
+
if data.get("_type") == "metadata":
|
|
121
|
+
metadata = data.get("metadata", {})
|
|
122
|
+
created_at = datetime.fromisoformat(data["created_at"]) if data.get("created_at") else None
|
|
123
|
+
else:
|
|
124
|
+
messages.append(data)
|
|
125
|
+
|
|
126
|
+
return Session(
|
|
127
|
+
key=key,
|
|
128
|
+
messages=messages,
|
|
129
|
+
created_at=created_at or datetime.now(),
|
|
130
|
+
metadata=metadata
|
|
131
|
+
)
|
|
132
|
+
except Exception as e:
|
|
133
|
+
logger.warning(f"Failed to load session {key}: {e}")
|
|
134
|
+
return None
|
|
135
|
+
|
|
136
|
+
def save(self, session: Session) -> None:
|
|
137
|
+
"""Save a session to disk."""
|
|
138
|
+
path = self._get_session_path(session.key)
|
|
139
|
+
|
|
140
|
+
with open(path, "w") as f:
|
|
141
|
+
# Write metadata first
|
|
142
|
+
metadata_line = {
|
|
143
|
+
"_type": "metadata",
|
|
144
|
+
"created_at": session.created_at.isoformat(),
|
|
145
|
+
"updated_at": session.updated_at.isoformat(),
|
|
146
|
+
"metadata": session.metadata
|
|
147
|
+
}
|
|
148
|
+
f.write(json.dumps(metadata_line) + "\n")
|
|
149
|
+
|
|
150
|
+
# Write messages
|
|
151
|
+
for msg in session.messages:
|
|
152
|
+
f.write(json.dumps(msg) + "\n")
|
|
153
|
+
|
|
154
|
+
self._cache[session.key] = session
|
|
155
|
+
|
|
156
|
+
def delete(self, key: str) -> bool:
|
|
157
|
+
"""
|
|
158
|
+
Delete a session.
|
|
159
|
+
|
|
160
|
+
Args:
|
|
161
|
+
key: Session key.
|
|
162
|
+
|
|
163
|
+
Returns:
|
|
164
|
+
True if deleted, False if not found.
|
|
165
|
+
"""
|
|
166
|
+
# Remove from cache
|
|
167
|
+
self._cache.pop(key, None)
|
|
168
|
+
|
|
169
|
+
# Remove file
|
|
170
|
+
path = self._get_session_path(key)
|
|
171
|
+
if path.exists():
|
|
172
|
+
path.unlink()
|
|
173
|
+
return True
|
|
174
|
+
return False
|
|
175
|
+
|
|
176
|
+
def list_sessions(self) -> list[dict[str, Any]]:
|
|
177
|
+
"""
|
|
178
|
+
List all sessions.
|
|
179
|
+
|
|
180
|
+
Returns:
|
|
181
|
+
List of session info dicts.
|
|
182
|
+
"""
|
|
183
|
+
sessions = []
|
|
184
|
+
|
|
185
|
+
for path in self.sessions_dir.glob("*.jsonl"):
|
|
186
|
+
try:
|
|
187
|
+
# Read just the metadata line
|
|
188
|
+
with open(path) as f:
|
|
189
|
+
first_line = f.readline().strip()
|
|
190
|
+
if first_line:
|
|
191
|
+
data = json.loads(first_line)
|
|
192
|
+
if data.get("_type") == "metadata":
|
|
193
|
+
sessions.append({
|
|
194
|
+
"key": path.stem.replace("_", ":"),
|
|
195
|
+
"created_at": data.get("created_at"),
|
|
196
|
+
"updated_at": data.get("updated_at"),
|
|
197
|
+
"path": str(path)
|
|
198
|
+
})
|
|
199
|
+
except Exception:
|
|
200
|
+
continue
|
|
201
|
+
|
|
202
|
+
return sorted(sessions, key=lambda x: x.get("updated_at", ""), reverse=True)
|
kyber/skills/README.md
ADDED
|
@@ -0,0 +1,47 @@
|
|
|
1
|
+
# kyber Skills
|
|
2
|
+
|
|
3
|
+
This directory contains built-in skills that extend kyber's capabilities.
|
|
4
|
+
|
|
5
|
+
## Skill Format (AgentSkills-compatible)
|
|
6
|
+
|
|
7
|
+
Each skill is a directory containing a `SKILL.md` file with:
|
|
8
|
+
- YAML frontmatter (`name`, `description`, optional `metadata`)
|
|
9
|
+
- Markdown instructions for the agent
|
|
10
|
+
|
|
11
|
+
Kyber uses the [AgentSkills](https://opencode.ai/docs/skills/) format, which is also used by OpenClaw. Skills from either ecosystem work in Kyber without modification.
|
|
12
|
+
|
|
13
|
+
## Skill Locations & Precedence
|
|
14
|
+
|
|
15
|
+
Skills are loaded from three places (highest priority first):
|
|
16
|
+
|
|
17
|
+
1. **Workspace skills**: `~/.kyber/workspace/skills/`
|
|
18
|
+
2. **Managed/local skills**: `~/.kyber/skills/`
|
|
19
|
+
3. **Bundled skills**: shipped with kyber (this directory)
|
|
20
|
+
|
|
21
|
+
If the same skill name exists in multiple locations, the higher-priority one wins.
|
|
22
|
+
|
|
23
|
+
## OpenClaw Compatibility
|
|
24
|
+
|
|
25
|
+
Kyber understands both `"kyber"` and `"openclaw"` metadata namespaces in frontmatter. An OpenClaw skill like:
|
|
26
|
+
|
|
27
|
+
```yaml
|
|
28
|
+
metadata: {"openclaw":{"emoji":"♊️","requires":{"bins":["gemini"]}}}
|
|
29
|
+
```
|
|
30
|
+
|
|
31
|
+
works identically to:
|
|
32
|
+
|
|
33
|
+
```yaml
|
|
34
|
+
metadata: {"kyber":{"emoji":"♊️","requires":{"bins":["gemini"]}}}
|
|
35
|
+
```
|
|
36
|
+
|
|
37
|
+
To use an OpenClaw skill, drop its folder into `~/.kyber/skills/` or your workspace `skills/` directory.
|
|
38
|
+
|
|
39
|
+
## Available Built-in Skills
|
|
40
|
+
|
|
41
|
+
| Skill | Description |
|
|
42
|
+
|-------|-------------|
|
|
43
|
+
| `github` | Interact with GitHub using the `gh` CLI |
|
|
44
|
+
| `weather` | Get weather info using wttr.in and Open-Meteo |
|
|
45
|
+
| `summarize` | Summarize URLs, files, and YouTube videos |
|
|
46
|
+
| `tmux` | Remote-control tmux sessions |
|
|
47
|
+
| `skill-creator` | Create new skills |
|
|
@@ -0,0 +1,48 @@
|
|
|
1
|
+
---
|
|
2
|
+
name: github
|
|
3
|
+
description: "Interact with GitHub using the `gh` CLI. Use `gh issue`, `gh pr`, `gh run`, and `gh api` for issues, PRs, CI runs, and advanced queries."
|
|
4
|
+
metadata: {"kyber":{"emoji":"🐙","requires":{"bins":["gh"]},"install":[{"id":"brew","kind":"brew","formula":"gh","bins":["gh"],"label":"Install GitHub CLI (brew)"},{"id":"apt","kind":"apt","package":"gh","bins":["gh"],"label":"Install GitHub CLI (apt)"}]}}
|
|
5
|
+
---
|
|
6
|
+
|
|
7
|
+
# GitHub Skill
|
|
8
|
+
|
|
9
|
+
Use the `gh` CLI to interact with GitHub. Always specify `--repo owner/repo` when not in a git directory, or use URLs directly.
|
|
10
|
+
|
|
11
|
+
## Pull Requests
|
|
12
|
+
|
|
13
|
+
Check CI status on a PR:
|
|
14
|
+
```bash
|
|
15
|
+
gh pr checks 55 --repo owner/repo
|
|
16
|
+
```
|
|
17
|
+
|
|
18
|
+
List recent workflow runs:
|
|
19
|
+
```bash
|
|
20
|
+
gh run list --repo owner/repo --limit 10
|
|
21
|
+
```
|
|
22
|
+
|
|
23
|
+
View a run and see which steps failed:
|
|
24
|
+
```bash
|
|
25
|
+
gh run view <run-id> --repo owner/repo
|
|
26
|
+
```
|
|
27
|
+
|
|
28
|
+
View logs for failed steps only:
|
|
29
|
+
```bash
|
|
30
|
+
gh run view <run-id> --repo owner/repo --log-failed
|
|
31
|
+
```
|
|
32
|
+
|
|
33
|
+
## API for Advanced Queries
|
|
34
|
+
|
|
35
|
+
The `gh api` command is useful for accessing data not available through other subcommands.
|
|
36
|
+
|
|
37
|
+
Get PR with specific fields:
|
|
38
|
+
```bash
|
|
39
|
+
gh api repos/owner/repo/pulls/55 --jq '.title, .state, .user.login'
|
|
40
|
+
```
|
|
41
|
+
|
|
42
|
+
## JSON Output
|
|
43
|
+
|
|
44
|
+
Most commands support `--json` for structured output. You can use `--jq` to filter:
|
|
45
|
+
|
|
46
|
+
```bash
|
|
47
|
+
gh issue list --repo owner/repo --json number,title --jq '.[] | "\(.number): \(.title)"'
|
|
48
|
+
```
|
|
@@ -0,0 +1,371 @@
|
|
|
1
|
+
---
|
|
2
|
+
name: skill-creator
|
|
3
|
+
description: Create or update AgentSkills. Use when designing, structuring, or packaging skills with scripts, references, and assets.
|
|
4
|
+
---
|
|
5
|
+
|
|
6
|
+
# Skill Creator
|
|
7
|
+
|
|
8
|
+
This skill provides guidance for creating effective skills.
|
|
9
|
+
|
|
10
|
+
## About Skills
|
|
11
|
+
|
|
12
|
+
Skills are modular, self-contained packages that extend the agent's capabilities by providing
|
|
13
|
+
specialized knowledge, workflows, and tools. Think of them as "onboarding guides" for specific
|
|
14
|
+
domains or tasks—they transform the agent from a general-purpose agent into a specialized agent
|
|
15
|
+
equipped with procedural knowledge that no model can fully possess.
|
|
16
|
+
|
|
17
|
+
### What Skills Provide
|
|
18
|
+
|
|
19
|
+
1. Specialized workflows - Multi-step procedures for specific domains
|
|
20
|
+
2. Tool integrations - Instructions for working with specific file formats or APIs
|
|
21
|
+
3. Domain expertise - Company-specific knowledge, schemas, business logic
|
|
22
|
+
4. Bundled resources - Scripts, references, and assets for complex and repetitive tasks
|
|
23
|
+
|
|
24
|
+
## Core Principles
|
|
25
|
+
|
|
26
|
+
### Concise is Key
|
|
27
|
+
|
|
28
|
+
The context window is a public good. Skills share the context window with everything else the agent needs: system prompt, conversation history, other Skills' metadata, and the actual user request.
|
|
29
|
+
|
|
30
|
+
**Default assumption: the agent is already very smart.** Only add context the agent doesn't already have. Challenge each piece of information: "Does the agent really need this explanation?" and "Does this paragraph justify its token cost?"
|
|
31
|
+
|
|
32
|
+
Prefer concise examples over verbose explanations.
|
|
33
|
+
|
|
34
|
+
### Set Appropriate Degrees of Freedom
|
|
35
|
+
|
|
36
|
+
Match the level of specificity to the task's fragility and variability:
|
|
37
|
+
|
|
38
|
+
**High freedom (text-based instructions)**: Use when multiple approaches are valid, decisions depend on context, or heuristics guide the approach.
|
|
39
|
+
|
|
40
|
+
**Medium freedom (pseudocode or scripts with parameters)**: Use when a preferred pattern exists, some variation is acceptable, or configuration affects behavior.
|
|
41
|
+
|
|
42
|
+
**Low freedom (specific scripts, few parameters)**: Use when operations are fragile and error-prone, consistency is critical, or a specific sequence must be followed.
|
|
43
|
+
|
|
44
|
+
Think of the agent as exploring a path: a narrow bridge with cliffs needs specific guardrails (low freedom), while an open field allows many routes (high freedom).
|
|
45
|
+
|
|
46
|
+
### Anatomy of a Skill
|
|
47
|
+
|
|
48
|
+
Every skill consists of a required SKILL.md file and optional bundled resources:
|
|
49
|
+
|
|
50
|
+
```
|
|
51
|
+
skill-name/
|
|
52
|
+
├── SKILL.md (required)
|
|
53
|
+
│ ├── YAML frontmatter metadata (required)
|
|
54
|
+
│ │ ├── name: (required)
|
|
55
|
+
│ │ └── description: (required)
|
|
56
|
+
│ └── Markdown instructions (required)
|
|
57
|
+
└── Bundled Resources (optional)
|
|
58
|
+
├── scripts/ - Executable code (Python/Bash/etc.)
|
|
59
|
+
├── references/ - Documentation intended to be loaded into context as needed
|
|
60
|
+
└── assets/ - Files used in output (templates, icons, fonts, etc.)
|
|
61
|
+
```
|
|
62
|
+
|
|
63
|
+
#### SKILL.md (required)
|
|
64
|
+
|
|
65
|
+
Every SKILL.md consists of:
|
|
66
|
+
|
|
67
|
+
- **Frontmatter** (YAML): Contains `name` and `description` fields. These are the only fields that the agent reads to determine when the skill gets used, thus it is very important to be clear and comprehensive in describing what the skill is, and when it should be used.
|
|
68
|
+
- **Body** (Markdown): Instructions and guidance for using the skill. Only loaded AFTER the skill triggers (if at all).
|
|
69
|
+
|
|
70
|
+
#### Bundled Resources (optional)
|
|
71
|
+
|
|
72
|
+
##### Scripts (`scripts/`)
|
|
73
|
+
|
|
74
|
+
Executable code (Python/Bash/etc.) for tasks that require deterministic reliability or are repeatedly rewritten.
|
|
75
|
+
|
|
76
|
+
- **When to include**: When the same code is being rewritten repeatedly or deterministic reliability is needed
|
|
77
|
+
- **Example**: `scripts/rotate_pdf.py` for PDF rotation tasks
|
|
78
|
+
- **Benefits**: Token efficient, deterministic, may be executed without loading into context
|
|
79
|
+
- **Note**: Scripts may still need to be read by the agent for patching or environment-specific adjustments
|
|
80
|
+
|
|
81
|
+
##### References (`references/`)
|
|
82
|
+
|
|
83
|
+
Documentation and reference material intended to be loaded as needed into context to inform the agent's process and thinking.
|
|
84
|
+
|
|
85
|
+
- **When to include**: For documentation that the agent should reference while working
|
|
86
|
+
- **Examples**: `references/finance.md` for financial schemas, `references/mnda.md` for company NDA template, `references/policies.md` for company policies, `references/api_docs.md` for API specifications
|
|
87
|
+
- **Use cases**: Database schemas, API documentation, domain knowledge, company policies, detailed workflow guides
|
|
88
|
+
- **Benefits**: Keeps SKILL.md lean, loaded only when the agent determines it's needed
|
|
89
|
+
- **Best practice**: If files are large (>10k words), include grep search patterns in SKILL.md
|
|
90
|
+
- **Avoid duplication**: Information should live in either SKILL.md or references files, not both. Prefer references files for detailed information unless it's truly core to the skill—this keeps SKILL.md lean while making information discoverable without hogging the context window. Keep only essential procedural instructions and workflow guidance in SKILL.md; move detailed reference material, schemas, and examples to references files.
|
|
91
|
+
|
|
92
|
+
##### Assets (`assets/`)
|
|
93
|
+
|
|
94
|
+
Files not intended to be loaded into context, but rather used within the output the agent produces.
|
|
95
|
+
|
|
96
|
+
- **When to include**: When the skill needs files that will be used in the final output
|
|
97
|
+
- **Examples**: `assets/logo.png` for brand assets, `assets/slides.pptx` for PowerPoint templates, `assets/frontend-template/` for HTML/React boilerplate, `assets/font.ttf` for typography
|
|
98
|
+
- **Use cases**: Templates, images, icons, boilerplate code, fonts, sample documents that get copied or modified
|
|
99
|
+
- **Benefits**: Separates output resources from documentation, enables the agent to use files without loading them into context
|
|
100
|
+
|
|
101
|
+
#### What to Not Include in a Skill
|
|
102
|
+
|
|
103
|
+
A skill should only contain essential files that directly support its functionality. Do NOT create extraneous documentation or auxiliary files, including:
|
|
104
|
+
|
|
105
|
+
- README.md
|
|
106
|
+
- INSTALLATION_GUIDE.md
|
|
107
|
+
- QUICK_REFERENCE.md
|
|
108
|
+
- CHANGELOG.md
|
|
109
|
+
- etc.
|
|
110
|
+
|
|
111
|
+
The skill should only contain the information needed for an AI agent to do the job at hand. It should not contain auxiliary context about the process that went into creating it, setup and testing procedures, user-facing documentation, etc. Creating additional documentation files just adds clutter and confusion.
|
|
112
|
+
|
|
113
|
+
### Progressive Disclosure Design Principle
|
|
114
|
+
|
|
115
|
+
Skills use a three-level loading system to manage context efficiently:
|
|
116
|
+
|
|
117
|
+
1. **Metadata (name + description)** - Always in context (~100 words)
|
|
118
|
+
2. **SKILL.md body** - When skill triggers (<5k words)
|
|
119
|
+
3. **Bundled resources** - As needed by the agent (Unlimited because scripts can be executed without reading into context window)
|
|
120
|
+
|
|
121
|
+
#### Progressive Disclosure Patterns
|
|
122
|
+
|
|
123
|
+
Keep SKILL.md body to the essentials and under 500 lines to minimize context bloat. Split content into separate files when approaching this limit. When splitting out content into other files, it is very important to reference them from SKILL.md and describe clearly when to read them, to ensure the reader of the skill knows they exist and when to use them.
|
|
124
|
+
|
|
125
|
+
**Key principle:** When a skill supports multiple variations, frameworks, or options, keep only the core workflow and selection guidance in SKILL.md. Move variant-specific details (patterns, examples, configuration) into separate reference files.
|
|
126
|
+
|
|
127
|
+
**Pattern 1: High-level guide with references**
|
|
128
|
+
|
|
129
|
+
```markdown
|
|
130
|
+
# PDF Processing
|
|
131
|
+
|
|
132
|
+
## Quick start
|
|
133
|
+
|
|
134
|
+
Extract text with pdfplumber:
|
|
135
|
+
[code example]
|
|
136
|
+
|
|
137
|
+
## Advanced features
|
|
138
|
+
|
|
139
|
+
- **Form filling**: See [FORMS.md](FORMS.md) for complete guide
|
|
140
|
+
- **API reference**: See [REFERENCE.md](REFERENCE.md) for all methods
|
|
141
|
+
- **Examples**: See [EXAMPLES.md](EXAMPLES.md) for common patterns
|
|
142
|
+
```
|
|
143
|
+
|
|
144
|
+
the agent loads FORMS.md, REFERENCE.md, or EXAMPLES.md only when needed.
|
|
145
|
+
|
|
146
|
+
**Pattern 2: Domain-specific organization**
|
|
147
|
+
|
|
148
|
+
For Skills with multiple domains, organize content by domain to avoid loading irrelevant context:
|
|
149
|
+
|
|
150
|
+
```
|
|
151
|
+
bigquery-skill/
|
|
152
|
+
├── SKILL.md (overview and navigation)
|
|
153
|
+
└── reference/
|
|
154
|
+
├── finance.md (revenue, billing metrics)
|
|
155
|
+
├── sales.md (opportunities, pipeline)
|
|
156
|
+
├── product.md (API usage, features)
|
|
157
|
+
└── marketing.md (campaigns, attribution)
|
|
158
|
+
```
|
|
159
|
+
|
|
160
|
+
When a user asks about sales metrics, the agent only reads sales.md.
|
|
161
|
+
|
|
162
|
+
Similarly, for skills supporting multiple frameworks or variants, organize by variant:
|
|
163
|
+
|
|
164
|
+
```
|
|
165
|
+
cloud-deploy/
|
|
166
|
+
├── SKILL.md (workflow + provider selection)
|
|
167
|
+
└── references/
|
|
168
|
+
├── aws.md (AWS deployment patterns)
|
|
169
|
+
├── gcp.md (GCP deployment patterns)
|
|
170
|
+
└── azure.md (Azure deployment patterns)
|
|
171
|
+
```
|
|
172
|
+
|
|
173
|
+
When the user chooses AWS, the agent only reads aws.md.
|
|
174
|
+
|
|
175
|
+
**Pattern 3: Conditional details**
|
|
176
|
+
|
|
177
|
+
Show basic content, link to advanced content:
|
|
178
|
+
|
|
179
|
+
```markdown
|
|
180
|
+
# DOCX Processing
|
|
181
|
+
|
|
182
|
+
## Creating documents
|
|
183
|
+
|
|
184
|
+
Use docx-js for new documents. See [DOCX-JS.md](DOCX-JS.md).
|
|
185
|
+
|
|
186
|
+
## Editing documents
|
|
187
|
+
|
|
188
|
+
For simple edits, modify the XML directly.
|
|
189
|
+
|
|
190
|
+
**For tracked changes**: See [REDLINING.md](REDLINING.md)
|
|
191
|
+
**For OOXML details**: See [OOXML.md](OOXML.md)
|
|
192
|
+
```
|
|
193
|
+
|
|
194
|
+
the agent reads REDLINING.md or OOXML.md only when the user needs those features.
|
|
195
|
+
|
|
196
|
+
**Important guidelines:**
|
|
197
|
+
|
|
198
|
+
- **Avoid deeply nested references** - Keep references one level deep from SKILL.md. All reference files should link directly from SKILL.md.
|
|
199
|
+
- **Structure longer reference files** - For files longer than 100 lines, include a table of contents at the top so the agent can see the full scope when previewing.
|
|
200
|
+
|
|
201
|
+
## Skill Creation Process
|
|
202
|
+
|
|
203
|
+
Skill creation involves these steps:
|
|
204
|
+
|
|
205
|
+
1. Understand the skill with concrete examples
|
|
206
|
+
2. Plan reusable skill contents (scripts, references, assets)
|
|
207
|
+
3. Initialize the skill (run init_skill.py)
|
|
208
|
+
4. Edit the skill (implement resources and write SKILL.md)
|
|
209
|
+
5. Package the skill (run package_skill.py)
|
|
210
|
+
6. Iterate based on real usage
|
|
211
|
+
|
|
212
|
+
Follow these steps in order, skipping only if there is a clear reason why they are not applicable.
|
|
213
|
+
|
|
214
|
+
### Skill Naming
|
|
215
|
+
|
|
216
|
+
- Use lowercase letters, digits, and hyphens only; normalize user-provided titles to hyphen-case (e.g., "Plan Mode" -> `plan-mode`).
|
|
217
|
+
- When generating names, generate a name under 64 characters (letters, digits, hyphens).
|
|
218
|
+
- Prefer short, verb-led phrases that describe the action.
|
|
219
|
+
- Namespace by tool when it improves clarity or triggering (e.g., `gh-address-comments`, `linear-address-issue`).
|
|
220
|
+
- Name the skill folder exactly after the skill name.
|
|
221
|
+
|
|
222
|
+
### Step 1: Understanding the Skill with Concrete Examples
|
|
223
|
+
|
|
224
|
+
Skip this step only when the skill's usage patterns are already clearly understood. It remains valuable even when working with an existing skill.
|
|
225
|
+
|
|
226
|
+
To create an effective skill, clearly understand concrete examples of how the skill will be used. This understanding can come from either direct user examples or generated examples that are validated with user feedback.
|
|
227
|
+
|
|
228
|
+
For example, when building an image-editor skill, relevant questions include:
|
|
229
|
+
|
|
230
|
+
- "What functionality should the image-editor skill support? Editing, rotating, anything else?"
|
|
231
|
+
- "Can you give some examples of how this skill would be used?"
|
|
232
|
+
- "I can imagine users asking for things like 'Remove the red-eye from this image' or 'Rotate this image'. Are there other ways you imagine this skill being used?"
|
|
233
|
+
- "What would a user say that should trigger this skill?"
|
|
234
|
+
|
|
235
|
+
To avoid overwhelming users, avoid asking too many questions in a single message. Start with the most important questions and follow up as needed for better effectiveness.
|
|
236
|
+
|
|
237
|
+
Conclude this step when there is a clear sense of the functionality the skill should support.
|
|
238
|
+
|
|
239
|
+
### Step 2: Planning the Reusable Skill Contents
|
|
240
|
+
|
|
241
|
+
To turn concrete examples into an effective skill, analyze each example by:
|
|
242
|
+
|
|
243
|
+
1. Considering how to execute on the example from scratch
|
|
244
|
+
2. Identifying what scripts, references, and assets would be helpful when executing these workflows repeatedly
|
|
245
|
+
|
|
246
|
+
Example: When building a `pdf-editor` skill to handle queries like "Help me rotate this PDF," the analysis shows:
|
|
247
|
+
|
|
248
|
+
1. Rotating a PDF requires re-writing the same code each time
|
|
249
|
+
2. A `scripts/rotate_pdf.py` script would be helpful to store in the skill
|
|
250
|
+
|
|
251
|
+
Example: When designing a `frontend-webapp-builder` skill for queries like "Build me a todo app" or "Build me a dashboard to track my steps," the analysis shows:
|
|
252
|
+
|
|
253
|
+
1. Writing a frontend webapp requires the same boilerplate HTML/React each time
|
|
254
|
+
2. An `assets/hello-world/` template containing the boilerplate HTML/React project files would be helpful to store in the skill
|
|
255
|
+
|
|
256
|
+
Example: When building a `big-query` skill to handle queries like "How many users have logged in today?" the analysis shows:
|
|
257
|
+
|
|
258
|
+
1. Querying BigQuery requires re-discovering the table schemas and relationships each time
|
|
259
|
+
2. A `references/schema.md` file documenting the table schemas would be helpful to store in the skill
|
|
260
|
+
|
|
261
|
+
To establish the skill's contents, analyze each concrete example to create a list of the reusable resources to include: scripts, references, and assets.
|
|
262
|
+
|
|
263
|
+
### Step 3: Initializing the Skill
|
|
264
|
+
|
|
265
|
+
At this point, it is time to actually create the skill.
|
|
266
|
+
|
|
267
|
+
Skip this step only if the skill being developed already exists, and iteration or packaging is needed. In this case, continue to the next step.
|
|
268
|
+
|
|
269
|
+
When creating a new skill from scratch, always run the `init_skill.py` script. The script conveniently generates a new template skill directory that automatically includes everything a skill requires, making the skill creation process much more efficient and reliable.
|
|
270
|
+
|
|
271
|
+
Usage:
|
|
272
|
+
|
|
273
|
+
```bash
|
|
274
|
+
scripts/init_skill.py <skill-name> --path <output-directory> [--resources scripts,references,assets] [--examples]
|
|
275
|
+
```
|
|
276
|
+
|
|
277
|
+
Examples:
|
|
278
|
+
|
|
279
|
+
```bash
|
|
280
|
+
scripts/init_skill.py my-skill --path skills/public
|
|
281
|
+
scripts/init_skill.py my-skill --path skills/public --resources scripts,references
|
|
282
|
+
scripts/init_skill.py my-skill --path skills/public --resources scripts --examples
|
|
283
|
+
```
|
|
284
|
+
|
|
285
|
+
The script:
|
|
286
|
+
|
|
287
|
+
- Creates the skill directory at the specified path
|
|
288
|
+
- Generates a SKILL.md template with proper frontmatter and TODO placeholders
|
|
289
|
+
- Optionally creates resource directories based on `--resources`
|
|
290
|
+
- Optionally adds example files when `--examples` is set
|
|
291
|
+
|
|
292
|
+
After initialization, customize the SKILL.md and add resources as needed. If you used `--examples`, replace or delete placeholder files.
|
|
293
|
+
|
|
294
|
+
### Step 4: Edit the Skill
|
|
295
|
+
|
|
296
|
+
When editing the (newly-generated or existing) skill, remember that the skill is being created for another instance of the agent to use. Include information that would be beneficial and non-obvious to the agent. Consider what procedural knowledge, domain-specific details, or reusable assets would help another the agent instance execute these tasks more effectively.
|
|
297
|
+
|
|
298
|
+
#### Learn Proven Design Patterns
|
|
299
|
+
|
|
300
|
+
Consult these helpful guides based on your skill's needs:
|
|
301
|
+
|
|
302
|
+
- **Multi-step processes**: See references/workflows.md for sequential workflows and conditional logic
|
|
303
|
+
- **Specific output formats or quality standards**: See references/output-patterns.md for template and example patterns
|
|
304
|
+
|
|
305
|
+
These files contain established best practices for effective skill design.
|
|
306
|
+
|
|
307
|
+
#### Start with Reusable Skill Contents
|
|
308
|
+
|
|
309
|
+
To begin implementation, start with the reusable resources identified above: `scripts/`, `references/`, and `assets/` files. Note that this step may require user input. For example, when implementing a `brand-guidelines` skill, the user may need to provide brand assets or templates to store in `assets/`, or documentation to store in `references/`.
|
|
310
|
+
|
|
311
|
+
Added scripts must be tested by actually running them to ensure there are no bugs and that the output matches what is expected. If there are many similar scripts, only a representative sample needs to be tested to ensure confidence that they all work while balancing time to completion.
|
|
312
|
+
|
|
313
|
+
If you used `--examples`, delete any placeholder files that are not needed for the skill. Only create resource directories that are actually required.
|
|
314
|
+
|
|
315
|
+
#### Update SKILL.md
|
|
316
|
+
|
|
317
|
+
**Writing Guidelines:** Always use imperative/infinitive form.
|
|
318
|
+
|
|
319
|
+
##### Frontmatter
|
|
320
|
+
|
|
321
|
+
Write the YAML frontmatter with `name` and `description`:
|
|
322
|
+
|
|
323
|
+
- `name`: The skill name
|
|
324
|
+
- `description`: This is the primary triggering mechanism for your skill, and helps the agent understand when to use the skill.
|
|
325
|
+
- Include both what the Skill does and specific triggers/contexts for when to use it.
|
|
326
|
+
- Include all "when to use" information here - Not in the body. The body is only loaded after triggering, so "When to Use This Skill" sections in the body are not helpful to the agent.
|
|
327
|
+
- Example description for a `docx` skill: "Comprehensive document creation, editing, and analysis with support for tracked changes, comments, formatting preservation, and text extraction. Use when the agent needs to work with professional documents (.docx files) for: (1) Creating new documents, (2) Modifying or editing content, (3) Working with tracked changes, (4) Adding comments, or any other document tasks"
|
|
328
|
+
|
|
329
|
+
Do not include any other fields in YAML frontmatter.
|
|
330
|
+
|
|
331
|
+
##### Body
|
|
332
|
+
|
|
333
|
+
Write instructions for using the skill and its bundled resources.
|
|
334
|
+
|
|
335
|
+
### Step 5: Packaging a Skill
|
|
336
|
+
|
|
337
|
+
Once development of the skill is complete, it must be packaged into a distributable .skill file that gets shared with the user. The packaging process automatically validates the skill first to ensure it meets all requirements:
|
|
338
|
+
|
|
339
|
+
```bash
|
|
340
|
+
scripts/package_skill.py <path/to/skill-folder>
|
|
341
|
+
```
|
|
342
|
+
|
|
343
|
+
Optional output directory specification:
|
|
344
|
+
|
|
345
|
+
```bash
|
|
346
|
+
scripts/package_skill.py <path/to/skill-folder> ./dist
|
|
347
|
+
```
|
|
348
|
+
|
|
349
|
+
The packaging script will:
|
|
350
|
+
|
|
351
|
+
1. **Validate** the skill automatically, checking:
|
|
352
|
+
|
|
353
|
+
- YAML frontmatter format and required fields
|
|
354
|
+
- Skill naming conventions and directory structure
|
|
355
|
+
- Description completeness and quality
|
|
356
|
+
- File organization and resource references
|
|
357
|
+
|
|
358
|
+
2. **Package** the skill if validation passes, creating a .skill file named after the skill (e.g., `my-skill.skill`) that includes all files and maintains the proper directory structure for distribution. The .skill file is a zip file with a .skill extension.
|
|
359
|
+
|
|
360
|
+
If validation fails, the script will report the errors and exit without creating a package. Fix any validation errors and run the packaging command again.
|
|
361
|
+
|
|
362
|
+
### Step 6: Iterate
|
|
363
|
+
|
|
364
|
+
After testing the skill, users may request improvements. Often this happens right after using the skill, with fresh context of how the skill performed.
|
|
365
|
+
|
|
366
|
+
**Iteration workflow:**
|
|
367
|
+
|
|
368
|
+
1. Use the skill on real tasks
|
|
369
|
+
2. Notice struggles or inefficiencies
|
|
370
|
+
3. Identify how SKILL.md or bundled resources should be updated
|
|
371
|
+
4. Implement changes and test again
|