skyloom 1.5.3 → 1.6.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/core/agent.d.ts +2 -0
- package/dist/core/agent.d.ts.map +1 -1
- package/dist/core/agent.js +24 -5
- package/dist/core/agent.js.map +1 -1
- package/dist/core/learn.d.ts +30 -0
- package/dist/core/learn.d.ts.map +1 -0
- package/dist/core/learn.js +156 -0
- package/dist/core/learn.js.map +1 -0
- package/dist/core/security.d.ts +73 -0
- package/dist/core/security.d.ts.map +1 -0
- package/dist/core/security.js +220 -0
- package/dist/core/security.js.map +1 -0
- package/package.json +1 -1
- package/src/core/agent.ts +15 -5
- package/src/core/learn.ts +146 -0
- package/src/core/security.ts +243 -0
|
@@ -0,0 +1,243 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* 安全与对齐模块 — Security & Alignment
|
|
3
|
+
*
|
|
4
|
+
* Danger level grading, red-line enforcement, audit trail, human-in-the-loop.
|
|
5
|
+
* All security decisions flow through this module before tool execution.
|
|
6
|
+
*/
|
|
7
|
+
|
|
8
|
+
import { getLogger } from "./logger";
|
|
9
|
+
|
|
10
|
+
const log = getLogger("security");
|
|
11
|
+
|
|
12
|
+
/* ── Danger levels ── */
|
|
13
|
+
export enum DangerLevel {
|
|
14
|
+
/** Read-only, no side effects — auto-approved */
|
|
15
|
+
SAFE = 0,
|
|
16
|
+
/** Minor side effects (write single file, git status) — logged */
|
|
17
|
+
LOW = 1,
|
|
18
|
+
/** Significant side effects (overwrite, delete, git push) — notify */
|
|
19
|
+
MEDIUM = 2,
|
|
20
|
+
/** Dangerous (sudo, remote deploy, mass delete) — confirm */
|
|
21
|
+
HIGH = 3,
|
|
22
|
+
/** Red-line — NEVER execute without human-in-the-loop */
|
|
23
|
+
CRITICAL = 4,
|
|
24
|
+
}
|
|
25
|
+
|
|
26
|
+
/* ═══════════════════════════════════════
|
|
27
|
+
Red-line list: operations that are NEVER auto-approved
|
|
28
|
+
═══════════════════════════════════════ */
|
|
29
|
+
const REDLINE_PATTERNS = [
|
|
30
|
+
/rm\s+-rf/, /format\s+\w:/, /dd\s+if=/,
|
|
31
|
+
/>\s*\/dev\/sd/, /mkfs\./, /:(){ :\|:& };:/,
|
|
32
|
+
/sudo\s+rm/, /chmod\s+777\s+\//, /wget.*\|.*sh/,
|
|
33
|
+
/curl.*\|.*bash/, /eval\s+\$/, /exec\s+\$/,
|
|
34
|
+
/subprocess\.call.*rm/, /os\.system.*rm/,
|
|
35
|
+
];
|
|
36
|
+
|
|
37
|
+
const REDLINE_COMMANDS = [
|
|
38
|
+
"shutdown", "reboot", "init 0", "init 6",
|
|
39
|
+
"del /f /s /q C:\\*", "rd /s /q C:\\",
|
|
40
|
+
];
|
|
41
|
+
|
|
42
|
+
/* ═══════════════════════════════════════
|
|
43
|
+
Per-tool danger level mapping
|
|
44
|
+
═══════════════════════════════════════ */
|
|
45
|
+
const TOOL_DANGER_MAP: Record<string, DangerLevel> = {
|
|
46
|
+
read_file: DangerLevel.SAFE,
|
|
47
|
+
list_directory: DangerLevel.SAFE,
|
|
48
|
+
tree: DangerLevel.SAFE,
|
|
49
|
+
file_search: DangerLevel.SAFE,
|
|
50
|
+
code_search: DangerLevel.SAFE,
|
|
51
|
+
grep: DangerLevel.SAFE,
|
|
52
|
+
git_status: DangerLevel.SAFE,
|
|
53
|
+
git_diff: DangerLevel.SAFE,
|
|
54
|
+
git_log: DangerLevel.SAFE,
|
|
55
|
+
system_info: DangerLevel.SAFE,
|
|
56
|
+
system_diagnose: DangerLevel.SAFE,
|
|
57
|
+
list_processes: DangerLevel.SAFE,
|
|
58
|
+
list_installed_apps: DangerLevel.SAFE,
|
|
59
|
+
list_skills: DangerLevel.SAFE,
|
|
60
|
+
recall_facts: DangerLevel.SAFE,
|
|
61
|
+
mcp_list_servers: DangerLevel.SAFE,
|
|
62
|
+
|
|
63
|
+
write_file: DangerLevel.LOW,
|
|
64
|
+
edit_file: DangerLevel.LOW,
|
|
65
|
+
copy_file: DangerLevel.LOW,
|
|
66
|
+
move_file: DangerLevel.LOW,
|
|
67
|
+
http_get: DangerLevel.LOW,
|
|
68
|
+
fetch_page: DangerLevel.LOW,
|
|
69
|
+
web_search: DangerLevel.LOW,
|
|
70
|
+
remember_fact: DangerLevel.LOW,
|
|
71
|
+
use_skill: DangerLevel.LOW,
|
|
72
|
+
task_done: DangerLevel.LOW,
|
|
73
|
+
|
|
74
|
+
delete_file: DangerLevel.MEDIUM,
|
|
75
|
+
git_add: DangerLevel.MEDIUM,
|
|
76
|
+
git_commit: DangerLevel.MEDIUM,
|
|
77
|
+
git_checkout: DangerLevel.MEDIUM,
|
|
78
|
+
http_post: DangerLevel.MEDIUM,
|
|
79
|
+
mcp_add_server: DangerLevel.MEDIUM,
|
|
80
|
+
mcp_remove_server: DangerLevel.MEDIUM,
|
|
81
|
+
launch_app: DangerLevel.MEDIUM,
|
|
82
|
+
open_path: DangerLevel.MEDIUM,
|
|
83
|
+
browser_open: DangerLevel.MEDIUM,
|
|
84
|
+
|
|
85
|
+
run_bash: DangerLevel.HIGH,
|
|
86
|
+
shell_exec: DangerLevel.HIGH,
|
|
87
|
+
kill_process: DangerLevel.HIGH,
|
|
88
|
+
package_manager: DangerLevel.HIGH,
|
|
89
|
+
service_control: DangerLevel.HIGH,
|
|
90
|
+
delegate_to: DangerLevel.HIGH,
|
|
91
|
+
mcp_scaffold_server: DangerLevel.HIGH,
|
|
92
|
+
};
|
|
93
|
+
|
|
94
|
+
/* ═══════════════════════════════════════
|
|
95
|
+
Audit trail entry
|
|
96
|
+
═══════════════════════════════════════ */
|
|
97
|
+
export interface AuditEntry {
|
|
98
|
+
ts: string;
|
|
99
|
+
agent: string;
|
|
100
|
+
tool: string;
|
|
101
|
+
args: Record<string, any>;
|
|
102
|
+
dangerLevel: DangerLevel;
|
|
103
|
+
approved: boolean;
|
|
104
|
+
result: string;
|
|
105
|
+
durationMs: number;
|
|
106
|
+
traceId: string;
|
|
107
|
+
}
|
|
108
|
+
|
|
109
|
+
/* ═══════════════════════════════════════
|
|
110
|
+
Security context — per-session security state
|
|
111
|
+
═══════════════════════════════════════ */
|
|
112
|
+
export class SecurityContext {
|
|
113
|
+
public auditLog: AuditEntry[] = [];
|
|
114
|
+
public deniedCount = 0;
|
|
115
|
+
public autoApprovedCount = 0;
|
|
116
|
+
public manualApprovedCount = 0;
|
|
117
|
+
public approvalMode: "auto" | "interactive" | "strict" = "auto";
|
|
118
|
+
|
|
119
|
+
private approvalCallback: ((tool: string, args: Record<string, any>, level: DangerLevel) => Promise<boolean>) | null = null;
|
|
120
|
+
|
|
121
|
+
constructor(opts?: { mode?: "auto" | "interactive" | "strict"; onApprove?: (tool: string, args: Record<string, any>, level: DangerLevel) => Promise<boolean> }) {
|
|
122
|
+
if (opts?.mode) this.approvalMode = opts.mode;
|
|
123
|
+
if (opts?.onApprove) this.approvalCallback = opts.onApprove;
|
|
124
|
+
}
|
|
125
|
+
|
|
126
|
+
/** Get the danger level for a tool. Defaults to SAFE for unknown tools. */
|
|
127
|
+
getDangerLevel(toolName: string): DangerLevel {
|
|
128
|
+
return TOOL_DANGER_MAP[toolName] ?? DangerLevel.SAFE;
|
|
129
|
+
}
|
|
130
|
+
|
|
131
|
+
/** Check if arguments contain red-line patterns (critical danger). */
|
|
132
|
+
checkRedline(toolName: string, args: Record<string, any>): string | null {
|
|
133
|
+
if (toolName !== "run_bash" && toolName !== "shell_exec") return null;
|
|
134
|
+
const cmd = String(args.command || args.cmd || "").toLowerCase();
|
|
135
|
+
for (const pattern of REDLINE_PATTERNS) {
|
|
136
|
+
if (pattern.test(cmd)) return `Red-line pattern detected: ${pattern.source.slice(0, 40)}`;
|
|
137
|
+
}
|
|
138
|
+
for (const forbidden of REDLINE_COMMANDS) {
|
|
139
|
+
if (cmd.includes(forbidden)) return `Red-line command: ${forbidden}`;
|
|
140
|
+
}
|
|
141
|
+
return null;
|
|
142
|
+
}
|
|
143
|
+
|
|
144
|
+
/** Determine whether a tool call is permitted. Returns [approved, reason]. */
|
|
145
|
+
async checkApproval(toolName: string, args: Record<string, any>, agentName: string): Promise<[boolean, string]> {
|
|
146
|
+
const level = this.getDangerLevel(toolName);
|
|
147
|
+
|
|
148
|
+
// Red-line check
|
|
149
|
+
const redline = this.checkRedline(toolName, args);
|
|
150
|
+
if (redline) {
|
|
151
|
+
log.warn("redline_blocked", { agent: agentName, tool: toolName, reason: redline });
|
|
152
|
+
return [false, redline];
|
|
153
|
+
}
|
|
154
|
+
|
|
155
|
+
// Safe — always allow
|
|
156
|
+
if (level === DangerLevel.SAFE) return [true, "safe"];
|
|
157
|
+
|
|
158
|
+
// Strict mode — deny all non-safe
|
|
159
|
+
if (this.approvalMode === "strict") {
|
|
160
|
+
return [false, `Strict mode: tool '${toolName}' (level ${level}) requires manual approval`];
|
|
161
|
+
}
|
|
162
|
+
|
|
163
|
+
// Auto mode — allow LOW, prompt for MEDIUM+, deny CRITICAL
|
|
164
|
+
if (this.approvalMode === "auto") {
|
|
165
|
+
if (level <= DangerLevel.LOW) return [true, "auto-low"];
|
|
166
|
+
if (level === DangerLevel.CRITICAL) return [false, `CRITICAL tool '${toolName}' requires explicit human approval`];
|
|
167
|
+
// MEDIUM/HIGH with auto mode => need callback
|
|
168
|
+
if (this.approvalCallback) {
|
|
169
|
+
const approved = await this.approvalCallback(toolName, args, level);
|
|
170
|
+
return [approved, approved ? "user-approved" : "user-denied"];
|
|
171
|
+
}
|
|
172
|
+
return [true, "auto-med"]; // no callback → auto-allow but log
|
|
173
|
+
}
|
|
174
|
+
|
|
175
|
+
// Interactive mode — prompt for LOW+
|
|
176
|
+
if (this.approvalCallback) {
|
|
177
|
+
const approved = await this.approvalCallback(toolName, args, level);
|
|
178
|
+
return [approved, approved ? "user-approved" : "user-denied"];
|
|
179
|
+
}
|
|
180
|
+
return [true, "no-callback"];
|
|
181
|
+
}
|
|
182
|
+
|
|
183
|
+
/** Record an audit entry. */
|
|
184
|
+
recordAudit(tool: string, agent: string, args: Record<string, any>, dangerLevel: DangerLevel, approved: boolean, resultPreview: string, durationMs: number, traceId: string): void {
|
|
185
|
+
const entry: AuditEntry = {
|
|
186
|
+
ts: new Date().toISOString(),
|
|
187
|
+
agent, tool, args, dangerLevel, approved,
|
|
188
|
+
result: resultPreview.slice(0, 500),
|
|
189
|
+
durationMs, traceId,
|
|
190
|
+
};
|
|
191
|
+
this.auditLog.push(entry);
|
|
192
|
+
if (this.auditLog.length > 5000) this.auditLog.shift();
|
|
193
|
+
|
|
194
|
+
if (approved) {
|
|
195
|
+
if (dangerLevel >= DangerLevel.HIGH) this.manualApprovedCount++;
|
|
196
|
+
else this.autoApprovedCount++;
|
|
197
|
+
} else {
|
|
198
|
+
this.deniedCount++;
|
|
199
|
+
}
|
|
200
|
+
|
|
201
|
+
log.info(dangerLevel >= DangerLevel.HIGH ? "dangerous_tool_executed" : "tool_executed", {
|
|
202
|
+
tool, agent, level: dangerLevel, approved,
|
|
203
|
+
});
|
|
204
|
+
}
|
|
205
|
+
|
|
206
|
+
/** Get summary statistics. */
|
|
207
|
+
getStats() {
|
|
208
|
+
return {
|
|
209
|
+
total: this.auditLog.length,
|
|
210
|
+
denied: this.deniedCount,
|
|
211
|
+
autoApproved: this.autoApprovedCount,
|
|
212
|
+
manualApproved: this.manualApprovedCount,
|
|
213
|
+
byLevel: {
|
|
214
|
+
safe: this.auditLog.filter(e => e.dangerLevel === DangerLevel.SAFE).length,
|
|
215
|
+
low: this.auditLog.filter(e => e.dangerLevel === DangerLevel.LOW).length,
|
|
216
|
+
medium: this.auditLog.filter(e => e.dangerLevel === DangerLevel.MEDIUM).length,
|
|
217
|
+
high: this.auditLog.filter(e => e.dangerLevel === DangerLevel.HIGH).length,
|
|
218
|
+
critical: this.auditLog.filter(e => e.dangerLevel === DangerLevel.CRITICAL).length,
|
|
219
|
+
},
|
|
220
|
+
lastDenied: this.auditLog.filter(e => !e.approved).slice(-5).map(e => `${e.tool}: ${e.result}`),
|
|
221
|
+
};
|
|
222
|
+
}
|
|
223
|
+
|
|
224
|
+
/** Install approval callback for interactive mode. */
|
|
225
|
+
setApprovalCallback(fn: (tool: string, args: Record<string, any>, level: DangerLevel) => Promise<boolean>) {
|
|
226
|
+
this.approvalCallback = fn;
|
|
227
|
+
}
|
|
228
|
+
}
|
|
229
|
+
|
|
230
|
+
/* ── Global security context ── */
|
|
231
|
+
let globalSecurity: SecurityContext | null = null;
|
|
232
|
+
|
|
233
|
+
export function getSecurity(): SecurityContext {
|
|
234
|
+
if (!globalSecurity) globalSecurity = new SecurityContext();
|
|
235
|
+
return globalSecurity;
|
|
236
|
+
}
|
|
237
|
+
|
|
238
|
+
export function resetSecurity(): void {
|
|
239
|
+
globalSecurity = null;
|
|
240
|
+
}
|
|
241
|
+
|
|
242
|
+
/** Red-line patterns for reference (used by tools to self-check). */
|
|
243
|
+
export { REDLINE_PATTERNS, REDLINE_COMMANDS };
|