@integrity-labs/agt-cli 0.28.104 → 0.28.105
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/bin/agt.js +4 -4
- package/dist/{chunk-DO6ZJ2SC.js → chunk-5EVWGQ5X.js} +3 -3
- package/dist/{chunk-WNN5WT42.js → chunk-GBE523G5.js} +2 -2
- package/dist/{chunk-5DYG42FL.js → chunk-YUTJO6FU.js} +8 -1
- package/dist/chunk-YUTJO6FU.js.map +1 -0
- package/dist/{claude-pair-runtime-JP3TEGDV.js → claude-pair-runtime-WOE2EELU.js} +2 -2
- package/dist/lib/manager-worker.js +46 -15
- package/dist/lib/manager-worker.js.map +1 -1
- package/dist/mcp/augmented-admin.js +21 -0
- package/dist/{persistent-session-6CU3BIHP.js → persistent-session-Q65SZNJ6.js} +3 -3
- package/dist/{responsiveness-probe-GLZZZ2OK.js → responsiveness-probe-FS3JNFI2.js} +3 -3
- package/package.json +1 -1
- package/dist/chunk-5DYG42FL.js.map +0 -1
- /package/dist/{chunk-DO6ZJ2SC.js.map → chunk-5EVWGQ5X.js.map} +0 -0
- /package/dist/{chunk-WNN5WT42.js.map → chunk-GBE523G5.js.map} +0 -0
- /package/dist/{claude-pair-runtime-JP3TEGDV.js.map → claude-pair-runtime-WOE2EELU.js.map} +0 -0
- /package/dist/{persistent-session-6CU3BIHP.js.map → persistent-session-Q65SZNJ6.js.map} +0 -0
- /package/dist/{responsiveness-probe-GLZZZ2OK.js.map → responsiveness-probe-FS3JNFI2.js.map} +0 -0
|
@@ -21131,6 +21131,10 @@ var AdminDebugClient = class _AdminDebugClient {
|
|
|
21131
21131
|
tailLogs(args) {
|
|
21132
21132
|
return this.get("/admin/debug/tail-logs", _AdminDebugClient.cleanQuery(args));
|
|
21133
21133
|
}
|
|
21134
|
+
/** Conversation eval-FAILURE breakdown: why conversations couldn't be scored (ENG-6661). */
|
|
21135
|
+
evalFailures(args) {
|
|
21136
|
+
return this.get("/admin/debug/eval-failures", _AdminDebugClient.cleanQuery(args));
|
|
21137
|
+
}
|
|
21134
21138
|
/** Time-windowed read of ONE allowlisted host log across rotated files (ENG-6515). */
|
|
21135
21139
|
queryLogs(args) {
|
|
21136
21140
|
return this.get("/admin/debug/query-logs", _AdminDebugClient.cleanQuery(args));
|
|
@@ -21298,6 +21302,10 @@ var inspectFlagsSchema = external_exports.object({
|
|
|
21298
21302
|
host: external_exports.string().min(1).max(128).optional().describe("The host id (uuid) or its exact, case-insensitive name. Pass this OR agent_id."),
|
|
21299
21303
|
agent_id: external_exports.string().min(1).max(64).optional().describe("The agent UUID \u2014 flags are inspected on the agent's current host. Pass this OR host.")
|
|
21300
21304
|
});
|
|
21305
|
+
var evalFailuresSchema = external_exports.object({
|
|
21306
|
+
period: external_exports.enum(["24h", "7d", "30d"]).optional().describe("Window to report over (24h | 7d | 30d). Default 7d."),
|
|
21307
|
+
agent_id: external_exports.string().min(1).max(64).optional().describe("Filter to one agent (UUID); omit for a fleet-wide breakdown across your authorized orgs.")
|
|
21308
|
+
});
|
|
21301
21309
|
var alertIdField = external_exports.string().min(1).max(64).describe("The alert id (uuid), from debug_list_alerts.");
|
|
21302
21310
|
var triageReasonField = external_exports.string().max(2e3).optional().describe("Why \u2014 recorded on the cross-org audit trail. Be specific.");
|
|
21303
21311
|
var ackAlertSchema = external_exports.object({
|
|
@@ -21679,6 +21687,19 @@ server.tool(
|
|
|
21679
21687
|
}
|
|
21680
21688
|
}
|
|
21681
21689
|
);
|
|
21690
|
+
server.tool(
|
|
21691
|
+
"debug_eval_failures",
|
|
21692
|
+
'Report WHY conversations could not be scored by the host-side success evaluator: the failure counterpart to the "conversation success" trend, which only ever shows EVALUATED conversations (so an agent whose conversations all fail to reconstruct silently vanishes from it). Use when conversation scores look thin/absent for an agent, or to audit eval coverage fleet-wide. Returns { scope, period, scanned, truncated, report, recent }. `report` is the aggregate: { total, gaveUp (subset that hit the retry cap, will never be scored), byReason[] (org-wide count + gaveUp per reason), perAgent[] (worst-first standing) }. The three reasons are data-shaped: `no_transcript` (the host had no local transcript at all), `not_reconstructable` (transcripts exist but none carry the conversation\'s channel ref), `empty_transcript` (turns reconstructed but rendered to nothing). `recent` is the newest failing conversations (boundary + reason only, NEVER transcript content). NOTE: transient/misconfigured EVAL BACKEND failures are NOT here; those show on the host (hosts.eval_backend_*), check debug_get_host. Pass { period? (24h|7d|30d, default 7d), agent_id? (omit for fleet-wide) }. Org-walled in SQL; every call is audited as a cross-org access.',
|
|
21693
|
+
evalFailuresSchema.shape,
|
|
21694
|
+
async (args) => {
|
|
21695
|
+
try {
|
|
21696
|
+
const result = await client.evalFailures(args);
|
|
21697
|
+
return { content: [{ type: "text", text: JSON.stringify(result, null, 2) }] };
|
|
21698
|
+
} catch (err) {
|
|
21699
|
+
return { content: [{ type: "text", text: formatError2(err) }], isError: true };
|
|
21700
|
+
}
|
|
21701
|
+
}
|
|
21702
|
+
);
|
|
21682
21703
|
server.tool(
|
|
21683
21704
|
"debug_probe_integration",
|
|
21684
21705
|
"Force a FRESH host-side connectivity probe for ONE of an agent's integrations and return the LIVE verdict \u2014 use when a user reports an integration \"isn't working\" but the console shows it connected, or to confirm a fix landed. Unlike the cached status the dashboard shows, this SSH-less SSM-invokes the agent's host to run the probe against its actual wired `.mcp.json` + credentials, so it can't disagree with reality. Returns { agent_id, code_name, slug, host, verdict, message, probed_at, ssm_status }. `verdict` is the live result: `ok` | `degraded` | `transient_error` (retryable) | `down` | `not_probeable` (no probe wired for this kind) \u2014 or a central degrade: `unreachable` (agent has no host), `not_installed` (integration not on this agent), `host_cli_too_old` (the host predates the probe \u2014 update its agt-cli), `probe_error`. Pass { agent_id, slug } where slug is the integration's definition code_name (e.g. `gmail`, `slack`, `here-now`). Fails closed for an unauthorized org; every call is audited as a cross-org host access.",
|
|
@@ -34,8 +34,8 @@ import {
|
|
|
34
34
|
writeDirectChatSessionState,
|
|
35
35
|
writeEgressAllowlist,
|
|
36
36
|
writePersistentClaudeWrapper
|
|
37
|
-
} from "./chunk-WNN5WT42.js";
|
|
38
|
-
import "./chunk-5DYG42FL.js";
|
|
37
|
+
} from "./chunk-GBE523G5.js";
|
|
38
|
+
import "./chunk-YUTJO6FU.js";
|
|
39
39
|
import "./chunk-XWVM4KPK.js";
|
|
40
40
|
export {
|
|
41
41
|
EGRESS_BASELINE_DOMAINS,
|
|
@@ -74,4 +74,4 @@ export {
|
|
|
74
74
|
writeEgressAllowlist,
|
|
75
75
|
writePersistentClaudeWrapper
|
|
76
76
|
};
|
|
77
|
-
//# sourceMappingURL=persistent-session-6CU3BIHP.js.map
|
|
77
|
+
//# sourceMappingURL=persistent-session-Q65SZNJ6.js.map
|
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
import {
|
|
2
2
|
paneLogPath
|
|
3
|
-
} from "./chunk-WNN5WT42.js";
|
|
4
|
-
import "./chunk-5DYG42FL.js";
|
|
3
|
+
} from "./chunk-GBE523G5.js";
|
|
4
|
+
import "./chunk-YUTJO6FU.js";
|
|
5
5
|
import "./chunk-XWVM4KPK.js";
|
|
6
6
|
|
|
7
7
|
// src/lib/responsiveness-probe.ts
|
|
@@ -250,4 +250,4 @@ export {
|
|
|
250
250
|
parkPendingInbound,
|
|
251
251
|
readAndResetChannelDeflections
|
|
252
252
|
};
|
|
253
|
-
//# sourceMappingURL=responsiveness-probe-GLZZZ2OK.js.map
|
|
253
|
+
//# sourceMappingURL=responsiveness-probe-FS3JNFI2.js.map
|