nolo-cli 0.1.13 → 0.1.15
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +9 -2
- package/agent-runtime/hostAdapter.ts +53 -0
- package/agent-runtime/index.ts +28 -0
- package/agent-runtime/localLoop.ts +62 -0
- package/agent-runtime/runtimeDecision.ts +70 -0
- package/agent-runtime/types.ts +87 -0
- package/agentRunCommand.ts +104 -0
- package/agentRuntimeCommands.ts +139 -22
- package/agentRuntimeLocal.ts +7 -0
- package/ai/agent/_executeModel.ts +118 -0
- package/ai/agent/agentSlice.ts +544 -1
- package/ai/agent/appWorkingMemory.ts +126 -0
- package/ai/agent/avatarUtils.ts +24 -0
- package/ai/agent/buildEditingContext.ts +373 -0
- package/ai/agent/buildSystemPrompt.ts +532 -0
- package/ai/agent/cleanAgentMessages.ts +140 -0
- package/ai/agent/cliChatClient.ts +119 -0
- package/ai/agent/contextCompiler.ts +107 -0
- package/ai/agent/contextLayerContract.ts +44 -0
- package/ai/agent/createAgentSchema.ts +234 -0
- package/ai/agent/executeToolCall.ts +58 -0
- package/ai/agent/fetchAgentContexts.ts +42 -0
- package/ai/agent/generatePrompt.ts +3 -0
- package/ai/agent/getFullChatContextKeys.ts +168 -0
- package/ai/agent/hooks/fetchPublicAgents.ts +133 -0
- package/ai/agent/hooks/useAgentConfig.ts +61 -0
- package/ai/agent/hooks/useAgentDialog.ts +35 -0
- package/ai/agent/hooks/useAgentFormValidation.ts +202 -0
- package/ai/agent/hooks/usePublicAgents.ts +473 -0
- package/ai/agent/persistMessageWithFixedId.ts +37 -0
- package/ai/agent/planSlice.ts +259 -0
- package/ai/agent/referenceUtils.ts +229 -0
- package/ai/agent/runAgentBackground.ts +238 -0
- package/ai/agent/runAgentClientLoop.ts +138 -0
- package/ai/agent/runtimeGuidance.ts +97 -0
- package/ai/agent/runtimeServerBase.ts +37 -0
- package/ai/agent/server/fetchPublicAgents.ts +128 -0
- package/ai/agent/startParallelAgentStreams.ts +424 -0
- package/ai/agent/startupProtocol.ts +53 -0
- package/ai/agent/streamAgentChatTurn.ts +1299 -0
- package/ai/agent/streamAgentChatTurnUtils.ts +738 -0
- package/ai/agent/types.ts +71 -0
- package/ai/agent/utils/imageOutput.ts +39 -0
- package/ai/agent/utils/publicImageAgentMode.ts +26 -0
- package/ai/agent/utils/sortUtils.ts +250 -0
- package/ai/agent/web/referencePickerUtils.ts +146 -0
- package/ai/ai.locale.ts +1083 -0
- package/ai/chat/accumulateToolCallChunks.ts +95 -0
- package/ai/chat/fetchUtils.native.ts +276 -0
- package/ai/chat/fetchUtils.ts +153 -0
- package/ai/chat/inlineImageUrlsForCustomProvider.ts +117 -0
- package/ai/chat/parseApiError.ts +64 -0
- package/ai/chat/parseMultilineSSE.ts +95 -0
- package/ai/chat/sendOpenAICompletionsRequest.native.ts +682 -0
- package/ai/chat/sendOpenAICompletionsRequest.ts +712 -0
- package/ai/chat/sendOpenAIResponseRequest.ts +512 -0
- package/ai/chat/shouldUseServerProxy.ts +18 -0
- package/ai/chat/sseClient.native.ts +91 -0
- package/ai/chat/sseClient.ts +67 -0
- package/ai/chat/streamReader.native.ts +31 -0
- package/ai/chat/streamReader.ts +62 -0
- package/ai/chat/updateTotalUsage.ts +72 -0
- package/ai/context/buildReferenceContext.ts +437 -0
- package/ai/context/calculateContextUsage.ts +133 -0
- package/ai/context/retention.ts +165 -0
- package/ai/context/tokenUtils.ts +78 -0
- package/ai/index.ts +1 -1
- package/ai/llm/agentCapabilities.ts +74 -0
- package/ai/llm/calculateGeminiImageTokens.ts +57 -0
- package/ai/llm/deepinfra.ts +28 -0
- package/ai/llm/fireworks.ts +68 -0
- package/ai/llm/generateRequestBody.ts +165 -0
- package/ai/llm/getModelContextWindow.ts +84 -0
- package/ai/llm/getNoloKey.ts +37 -0
- package/ai/llm/getPricing.ts +232 -0
- package/ai/llm/hooks/useModelPricing.ts +75 -0
- package/ai/llm/imagePricing.ts +66 -0
- package/ai/llm/isResponseAPIModel.ts +13 -0
- package/ai/llm/kimi.ts +18 -0
- package/ai/llm/mimo.ts +71 -0
- package/ai/llm/mistral.ts +22 -0
- package/ai/llm/modelAvatar.ts +427 -0
- package/ai/llm/models.ts +45 -0
- package/ai/llm/openrouterModels.ts +141 -0
- package/ai/llm/providers.ts +307 -0
- package/ai/llm/reasoningModels.ts +28 -0
- package/ai/llm/types.ts +59 -0
- package/ai/llm/usageRequestOptions.ts +59 -0
- package/ai/memory/capture.ts +148 -0
- package/ai/memory/consolidate.ts +104 -0
- package/ai/memory/delete.ts +147 -0
- package/ai/memory/overlay.ts +84 -0
- package/ai/memory/query.ts +38 -0
- package/ai/memory/queryShared.ts +160 -0
- package/ai/memory/rank.ts +105 -0
- package/ai/memory/recentRelationshipRecap.ts +247 -0
- package/ai/memory/remember.ts +167 -0
- package/ai/memory/runtime.ts +76 -0
- package/ai/memory/store.ts +20 -0
- package/ai/memory/storeShared.ts +76 -0
- package/ai/memory/types.ts +46 -0
- package/ai/memory/understanding.ts +349 -0
- package/ai/memory/understandingGreeting.ts +264 -0
- package/ai/messages/type.ts +20 -0
- package/ai/policy/personalizationDialog.ts +333 -0
- package/ai/policy/runtimePolicy.ts +440 -0
- package/ai/policy/selfUpdateFields.ts +48 -0
- package/ai/policy/types.ts +64 -0
- package/ai/skills/referenceRuntime.ts +274 -0
- package/ai/skills/skillDiagnostics.ts +251 -0
- package/ai/skills/skillDocBuilder.ts +139 -0
- package/ai/skills/skillDocProtocol.ts +434 -0
- package/ai/skills/skillReferenceSummary.ts +63 -0
- package/ai/skills/skillSummaryMarker.ts +26 -0
- package/ai/token/calculatePrice.ts +546 -0
- package/ai/token/db.ts +98 -0
- package/ai/token/externalToolCost.ts +321 -0
- package/ai/token/hooks/useRecords.ts +65 -0
- package/ai/token/missingUsageEstimate.ts +42 -0
- package/ai/token/modelUsageQuery.ts +252 -0
- package/ai/token/normalizeUsage.ts +84 -0
- package/ai/token/openaiImageGenerationUsage.ts +56 -0
- package/ai/token/prepareTokenUsageData.ts +88 -0
- package/ai/token/query.ts +88 -0
- package/ai/token/queryUserTokens.ts +59 -0
- package/ai/token/resolveBillingTarget.ts +52 -0
- package/ai/token/saveTokenRecord.ts +53 -0
- package/ai/token/serverDialogProjection.ts +78 -0
- package/ai/token/serverTokenWriter.ts +143 -0
- package/ai/token/stats.ts +21 -0
- package/ai/token/tokenThunks.ts +24 -0
- package/ai/token/types.ts +93 -0
- package/ai/tools/agent/agentTools.ts +176 -0
- package/ai/tools/agent/agentUpdateShared.ts +311 -0
- package/ai/tools/agent/callAgentTool.ts +139 -0
- package/ai/tools/agent/createAgentTool.ts +512 -0
- package/ai/tools/agent/createDialogTool.ts +69 -0
- package/ai/tools/agent/createSkillAgentTool.ts +62 -0
- package/ai/tools/agent/parallelBudget.ts +221 -0
- package/ai/tools/agent/presets/appBuilderPreset.ts +147 -0
- package/ai/tools/agent/runLlmTool.ts +96 -0
- package/ai/tools/agent/runStreamingAgentTool.ts +73 -0
- package/ai/tools/agent/skillAgentArgs.ts +106 -0
- package/ai/tools/agent/skillAgentPreset.ts +89 -0
- package/ai/tools/agent/streamParallelAgentsTool.ts +122 -0
- package/ai/tools/agent/updateAgentTool.ts +96 -0
- package/ai/tools/agent/updateSelfTool.ts +113 -0
- package/ai/tools/amazonProductScraperTool.ts +86 -0
- package/ai/tools/apifyActorClient.ts +45 -0
- package/ai/tools/appEditGuard.ts +372 -0
- package/ai/tools/appReadSnapshot.ts +153 -0
- package/ai/tools/appTools.ts +1549 -0
- package/ai/tools/applyEditTool.ts +256 -0
- package/ai/tools/applyLineEditsTool.ts +312 -0
- package/ai/tools/browserTools/click.ts +33 -0
- package/ai/tools/browserTools/closeSession.ts +29 -0
- package/ai/tools/browserTools/common.ts +27 -0
- package/ai/tools/browserTools/openSession.ts +48 -0
- package/ai/tools/browserTools/readContent.ts +38 -0
- package/ai/tools/browserTools/selectOption.ts +46 -0
- package/ai/tools/browserTools/typeText.ts +42 -0
- package/ai/tools/category/createCategoryTool.ts +66 -0
- package/ai/tools/category/queryContentsByCategoryTool.ts +69 -0
- package/ai/tools/category/updateContentCategoryTool.ts +75 -0
- package/ai/tools/cfBrowserTools.ts +319 -0
- package/ai/tools/cfSpeechToTextTool.ts +49 -0
- package/ai/tools/checkEnvTool.ts +65 -0
- package/ai/tools/cloudflareCrawlTool.ts +289 -0
- package/ai/tools/codeSearchTool.ts +111 -0
- package/ai/tools/codeTools.ts +101 -0
- package/ai/tools/createDocTool.ts +132 -0
- package/ai/tools/createPlanTool.ts +999 -0
- package/ai/tools/createSkillDocTool.ts +155 -0
- package/ai/tools/createWorkflowTool.ts +154 -0
- package/ai/tools/deepseekOcrTool.ts +34 -0
- package/ai/tools/delayTool.ts +31 -0
- package/ai/tools/deleteSpacesTool.ts +325 -0
- package/ai/tools/deleteSpacesToolModel.ts +159 -0
- package/ai/tools/devReloadUtils.ts +29 -0
- package/ai/tools/dialogMessageSearch.ts +137 -0
- package/ai/tools/doctorSkillTool.ts +72 -0
- package/ai/tools/ecommerceScraperTool.ts +86 -0
- package/ai/tools/emailTools.ts +549 -0
- package/ai/tools/evalSkillTool.ts +92 -0
- package/ai/tools/exaSearchTool.ts +64 -0
- package/ai/tools/execBashTool.ts +379 -0
- package/ai/tools/executeSqlTool.ts +192 -0
- package/ai/tools/fetchWebpageSupport.ts +309 -0
- package/ai/tools/fetchWebpageTool.ts +84 -0
- package/ai/tools/geminiImagePreviewTool.ts +361 -0
- package/ai/tools/generateDocxTool.ts +215 -0
- package/ai/tools/googleSearchScraperTool.ts +106 -0
- package/ai/tools/importDataTool.ts +133 -0
- package/ai/tools/importSkillTool.ts +162 -0
- package/ai/tools/index.ts +1927 -0
- package/ai/tools/listFilesTool.ts +82 -0
- package/ai/tools/listUserSpacesTool.ts +113 -0
- package/ai/tools/modelUsageTools.ts +199 -0
- package/ai/tools/olmOcrTool.ts +34 -0
- package/ai/tools/openaiImageTool.ts +267 -0
- package/ai/tools/prepareTools.ts +23 -0
- package/ai/tools/readDocTool.ts +84 -0
- package/ai/tools/readFileTool.ts +211 -0
- package/ai/tools/readTool.ts +163 -0
- package/ai/tools/readXPostTool.ts +233 -0
- package/ai/tools/rememberMemoryTool.ts +84 -0
- package/ai/tools/remotionVideoTool.ts +151 -0
- package/ai/tools/searchDialogMessagesTool.ts +222 -0
- package/ai/tools/searchRepoTool.ts +115 -0
- package/ai/tools/searchWorkspaceTool.ts +259 -0
- package/ai/tools/skillFollowup.ts +86 -0
- package/ai/tools/surfWeatherTool.ts +169 -0
- package/ai/tools/table/addTableRowTool.ts +217 -0
- package/ai/tools/table/createTableTool.ts +315 -0
- package/ai/tools/table/rowTools.ts +366 -0
- package/ai/tools/table/schemaTools.ts +244 -0
- package/ai/tools/table/shareTableTool.ts +148 -0
- package/ai/tools/table/toolShared.ts +129 -0
- package/ai/tools/toolApiClient.ts +198 -0
- package/ai/tools/toolNameAliases.ts +57 -0
- package/ai/tools/toolResultError.ts +42 -0
- package/ai/tools/toolRunSlice.ts +303 -0
- package/ai/tools/toolSchemaCompatibility.ts +53 -0
- package/ai/tools/toolVisibility.ts +4 -0
- package/ai/tools/types.ts +20 -0
- package/ai/tools/uiAskChoiceTool.ts +104 -0
- package/ai/tools/updateContentTitleTool.ts +84 -0
- package/ai/tools/updateDocTool.ts +105 -0
- package/ai/tools/updateUserPreferenceProfileTool.ts +145 -0
- package/ai/tools/whisperTool.ts +77 -0
- package/ai/tools/writeFileTool.ts +210 -0
- package/ai/tools/youtubeScraperTool.ts +116 -0
- package/ai/tools/ziweiChartTool.ts +678 -0
- package/ai/types.ts +55 -0
- package/ai/workflow/workflowExecutor.ts +323 -0
- package/ai/workflow/workflowSlice.ts +73 -0
- package/ai/workflow/workflowTypes.ts +106 -0
- package/client/agentRun.test.ts +240 -0
- package/client/agentRun.ts +182 -19
- package/client/compactDialog.test.ts +238 -0
- package/client/localRuntimeAdapter.test.ts +135 -0
- package/client/localRuntimeAdapter.ts +244 -0
- package/client/profileConfig.test.ts +40 -0
- package/client/streamingOutput.test.ts +22 -0
- package/client/streamingOutput.ts +38 -0
- package/commandRegistry.ts +11 -2
- package/connector-experimental/index.ts +5 -0
- package/database/actions/cacheMergedUserData.ts +64 -0
- package/database/actions/common.ts +242 -0
- package/database/actions/deleteFile.ts +40 -0
- package/database/actions/fetchUserData.ts +16 -0
- package/database/actions/fileContent.ts +125 -0
- package/database/actions/patch.ts +155 -0
- package/database/actions/read.ts +337 -0
- package/database/actions/readAndWait.ts +224 -0
- package/database/actions/readRequestManager.ts +120 -0
- package/database/actions/remove.ts +94 -0
- package/database/actions/replication.ts +366 -0
- package/database/actions/upload.ts +174 -0
- package/database/actions/upsert.ts +56 -0
- package/database/actions/write.ts +126 -0
- package/database/client/db.native.ts +73 -0
- package/database/client/db.ts +51 -0
- package/database/client/fetchUserData.ts +61 -0
- package/database/client/handleError.ts +19 -0
- package/database/client/queryRequest.ts +21 -0
- package/database/config.ts +21 -0
- package/database/dbActionThunks.ts +1 -0
- package/database/dbSlice.ts +149 -0
- package/database/email.ts +42 -0
- package/database/fileRing.ts +51 -0
- package/database/fileSharding.ts +70 -0
- package/database/fileStorage.native.ts +92 -0
- package/database/fileStorage.ts +232 -0
- package/database/fileUrl.ts +34 -0
- package/database/hooks/useUserData.ts +489 -0
- package/database/index.ts +1 -0
- package/database/keys.ts +765 -0
- package/database/queryPrefixes.ts +14 -0
- package/database/requests.ts +443 -0
- package/database/runtimeServerContext.ts +35 -0
- package/database/server/MemoryDB.ts +76 -0
- package/database/server/actorAccess.ts +76 -0
- package/database/server/agentDelegation.ts +124 -0
- package/database/server/coreDataOwnership.ts +13 -0
- package/database/server/coreDataProxy.ts +76 -0
- package/database/server/cybotReadonly.ts +18 -0
- package/database/server/dataHandlers.ts +111 -0
- package/database/server/db.ts +118 -0
- package/database/server/dbPath.ts +20 -0
- package/database/server/delete.ts +499 -0
- package/database/server/emailRepository.ts +1480 -0
- package/database/server/ensureDbOpen.ts +12 -0
- package/database/server/fileRead.ts +337 -0
- package/database/server/fileService.ts +436 -0
- package/database/server/handleTransaction.ts +86 -0
- package/database/server/patch.ts +282 -0
- package/database/server/query.ts +138 -0
- package/database/server/read.ts +325 -0
- package/database/server/resourceAccess.ts +211 -0
- package/database/server/routes.ts +110 -0
- package/database/server/spaceMemberAuthority.ts +67 -0
- package/database/server/upload.ts +159 -0
- package/database/server/write.ts +494 -0
- package/database/server/writeAuthority.ts +133 -0
- package/database/sqliteDb.ts +46 -0
- package/database/table/deleteTable.ts +120 -0
- package/database/tenantPlacement.ts +57 -0
- package/database/tombstones.ts +52 -0
- package/database/userDataLoadDecision.ts +17 -0
- package/database/userDataMerge.ts +95 -0
- package/database/userPreferenceRegister.ts +108 -0
- package/database/utils/dbPath.ts +47 -0
- package/database/utils/ulid.native.ts +6 -0
- package/database/utils/ulid.ts +1 -0
- package/index.ts +37 -19
- package/localRuntimeDb.ts +28 -0
- package/package.json +17 -4
- package/runtimeModeArgs.ts +33 -0
- package/tui/readlineWorkspace.ts +1 -0
- package/tui/session.ts +22 -0
|
@@ -0,0 +1,309 @@
|
|
|
1
|
+
/** Matches hostnames that begin with the label `docs.` (case-insensitive), e.g. `docs.example.com`. */
const DOCS_HOST_RE = /^docs\./i;
|
|
2
|
+
|
|
3
|
+
/** One page reference harvested from a documentation site's `llms.txt` or `llms-full.txt` file. */
export interface DocsIndexEntry {
  /** Human-readable title associated with the page in the index file. */
  title: string;
  /** URL of the page, as an absolute URL string. */
  url: string;
  /** Which index file the entry was read from. */
  source: "llms.txt" | "llms-full.txt";
}
|
|
8
|
+
|
|
9
|
+
/** Outcome of trying to map a requested docs URL onto a URL listed in an index file. */
export interface DocsResolution {
  /** The URL that should actually be fetched. */
  resolvedUrl: string;
  /** `"original"` when the requested URL was kept unchanged; otherwise the index file that supplied the URL. */
  source: "original" | "llms.txt" | "llms-full.txt";
}
|
|
13
|
+
|
|
14
|
+
/** Describes why extracted page content was judged unusable. */
export interface ExtractionIssue {
  /** Machine-readable reason: nothing was extracted, or the content looks like an HTML/error shell. */
  code: "EMPTY_EXTRACTION" | "HTML_SHELL";
  /** Human-readable explanation suitable for surfacing as an error message. */
  message: string;
}
|
|
18
|
+
|
|
19
|
+
/**
 * Reduces a URL pathname to a canonical form for comparison.
 *
 * A trailing `/index.md` becomes `/`, a trailing `.md` is dropped, runs of
 * slashes collapse to one, and a single trailing slash is removed. An empty
 * result is reported as the root path `/`.
 */
function normalizePathname(pathname: string) {
  const withoutMarkdownSuffix = pathname
    .replace(/\/index\.md$/i, "/")
    .replace(/\.md$/i, "");
  const collapsed = withoutMarkdownSuffix.replace(/\/+/g, "/");
  const withoutTrailingSlash = collapsed.replace(/\/$/, "");
  return withoutTrailingSlash === "" ? "/" : withoutTrailingSlash;
}
|
|
26
|
+
|
|
27
|
+
/**
 * Splits a string into unique lower-case alphanumeric tokens, in order of first appearance.
 *
 * The tokens `md`, `html`, `htm`, `docs` and `doc` are discarded.
 */
function tokenize(value: string) {
  const ignored = ["md", "html", "htm", "docs", "doc"];
  const unique = new Set<string>();

  for (const piece of value.toLowerCase().split(/[^a-z0-9]+/i)) {
    const token = piece.trim();
    if (token && !ignored.includes(token)) {
      unique.add(token);
    }
  }

  return Array.from(unique);
}
|
|
39
|
+
|
|
40
|
+
/** Normalises a pathname with `normalizePathname` and returns its non-empty, trimmed segments. */
function splitNormalizedSegments(pathname: string) {
  const segments: string[] = [];
  for (const piece of normalizePathname(pathname).split("/")) {
    const segment = piece.trim();
    if (segment) {
      segments.push(segment);
    }
  }
  return segments;
}
|
|
47
|
+
|
|
48
|
+
/**
 * Produces a comparison key for one path segment.
 *
 * The key is the segment's tokens joined with `-`. When tokenising leaves
 * nothing, the trimmed lower-cased segment itself is used.
 */
function segmentSignature(segment: string) {
  const tokens = tokenize(segment);
  return tokens.length > 0 ? tokens.join("-") : segment.trim().toLowerCase();
}
|
|
53
|
+
|
|
54
|
+
/**
 * Decides whether a candidate path can plausibly stand in for the requested path.
 *
 * Paths with at most one segment on either side are always compatible. Otherwise
 * the candidate must not be deeper than the request, and every candidate segment
 * must match the corresponding trailing segment of the request by signature.
 */
function hasCompatiblePathStructure(requestedPath: string, candidatePath: string) {
  const requested = splitNormalizedSegments(requestedPath);
  const candidate = splitNormalizedSegments(candidatePath);

  const tooShallowToCompare = requested.length <= 1 || candidate.length <= 1;
  if (tooShallowToCompare) return true;
  if (candidate.length > requested.length) return false;

  // Align both lists at their tails: candidate[i] pairs with requested[offset + i].
  const offset = requested.length - candidate.length;
  return candidate.every((candidateSegment, position) => {
    const requestedSegment = requested[offset + position];
    if (!requestedSegment || !candidateSegment) return false;
    return segmentSignature(requestedSegment) === segmentSignature(candidateSegment);
  });
}
|
|
77
|
+
|
|
78
|
+
/**
 * Derives the comparison data used for scoring an index entry: tokens from its
 * URL path, tokens from its title, and its normalised path.
 *
 * Throws if `entry.url` is not a parseable absolute URL.
 */
function collectEntryTokens(entry: DocsIndexEntry) {
  const { pathname } = new URL(entry.url);
  const pathTokens = tokenize(pathname);
  const titleTokens = tokenize(entry.title);
  const normalizedPath = normalizePathname(pathname);
  return { pathTokens, titleTokens, normalizedPath };
}
|
|
86
|
+
|
|
87
|
+
/**
 * Resolves `rawUrl` against `baseUrl` and returns the absolute URL string,
 * or `null` when the combination cannot be parsed as a URL.
 */
function normalizeCandidateUrl(rawUrl: string, baseUrl: string) {
  let absolute: string | null;
  try {
    absolute = new URL(rawUrl, baseUrl).toString();
  } catch {
    absolute = null;
  }
  return absolute;
}
|
|
95
|
+
|
|
96
|
+
/**
 * Reports whether `rawUrl` is a parseable absolute URL whose hostname matches
 * `DOCS_HOST_RE`. Unparseable input yields `false`.
 */
export function isDocsHost(rawUrl: string) {
  let hostname: string;
  try {
    hostname = new URL(rawUrl).hostname;
  } catch {
    return false;
  }
  return DOCS_HOST_RE.test(hostname);
}
|
|
104
|
+
|
|
105
|
+
/**
 * Extracts page entries from the text of an `llms.txt` file.
 *
 * Every `- [title](url)` occurrence becomes an entry tagged `"llms.txt"`. URLs
 * are resolved against `baseUrl`; items with an empty title, an empty URL, or
 * an unresolvable URL are skipped.
 */
export function parseLlmsIndex(text: string, baseUrl: string): DocsIndexEntry[] {
  const bulletLinkRe = /-\s+\[([^\]]+)\]\(([^)]+)\)/g;
  const parsed: DocsIndexEntry[] = [];

  for (const [, rawTitle, rawHref] of text.matchAll(bulletLinkRe)) {
    const title = rawTitle?.trim();
    const href = rawHref?.trim();
    if (!title || !href) continue;

    const url = normalizeCandidateUrl(href, baseUrl);
    if (url) {
      parsed.push({ title, url, source: "llms.txt" });
    }
  }

  return parsed;
}
|
|
120
|
+
|
|
121
|
+
/**
 * Extracts page entries from the text of an `llms-full.txt` file.
 *
 * The text is scanned line by line. A line starting with `# ` sets the current
 * title. A line starting with `source:` (any letter case) yields an entry tagged
 * `"llms-full.txt"` that pairs the current title with the URL after the prefix,
 * resolved against `baseUrl`. Source lines seen before any title, or with an
 * unresolvable URL, are skipped.
 */
export function parseLlmsFullSources(text: string, baseUrl: string): DocsIndexEntry[] {
  const sourcePrefix = "source:";
  const parsed: DocsIndexEntry[] = [];
  let heading = "";

  for (const line of text.split(/\r?\n/).map((raw) => raw.trim())) {
    if (line === "") continue;

    if (line.startsWith("# ")) {
      heading = line.slice(2).trim();
      continue;
    }

    if (!line.toLowerCase().startsWith(sourcePrefix)) continue;

    const url = normalizeCandidateUrl(line.slice(sourcePrefix.length).trim(), baseUrl);
    if (url && heading) {
      parsed.push({ title: heading, url, source: "llms-full.txt" });
    }
  }

  return parsed;
}
|
|
145
|
+
|
|
146
|
+
/**
 * Scores how well an index entry matches the requested URL; higher is better.
 *
 * An exact match of normalised paths scores 10_000. Otherwise:
 * - each requested token earns +3 if it is in the entry path and +4 if it is in the title;
 * - the last requested token earns +10 if it is also the entry's last path token, and +4 if it is in the title;
 * - +10 when every requested token appears in the entry's path or title;
 * - minus the absolute difference between the entry's distinct token count and the requested token count.
 */
function scoreDocsEntry(requestedUrl: URL, entry: DocsIndexEntry) {
  const { pathTokens, titleTokens, normalizedPath } = collectEntryTokens(entry);
  if (normalizePathname(requestedUrl.pathname) === normalizedPath) {
    return 10_000;
  }

  const wanted = tokenize(requestedUrl.pathname);
  const known = new Set([...pathTokens, ...titleTokens]);
  let score = 0;

  for (const token of wanted) {
    score += pathTokens.includes(token) ? 3 : 0;
    score += titleTokens.includes(token) ? 4 : 0;
  }

  const tail = wanted[wanted.length - 1];
  if (tail) {
    if (pathTokens[pathTokens.length - 1] === tail) score += 10;
    if (titleTokens.includes(tail)) score += 4;
  }

  const fullyCovered = wanted.length > 0 && wanted.every((token) => known.has(token));
  if (fullyCovered) score += 10;

  return score - Math.abs(known.size - wanted.length);
}
|
|
174
|
+
|
|
175
|
+
/**
 * Picks the index entry that best matches the requested docs URL.
 *
 * Only entries on the same origin as `rawUrl` whose path structure is compatible
 * (see `hasCompatiblePathStructure`) are considered. The highest-scoring entry
 * wins, and on a tie the entry listed first is kept. The requested URL is
 * returned unchanged, with source `"original"`, when there is no candidate or
 * the best score is below the acceptance threshold.
 *
 * @param rawUrl  URL the caller asked for.
 * @param entries Entries parsed from `llms.txt` and/or `llms-full.txt`.
 * @returns The entry URL and the index file it came from, or the original URL.
 */
export function resolveDocsUrlFromEntries(
  rawUrl: string,
  entries: DocsIndexEntry[]
): DocsResolution {
  // Scores below this are treated as "no confident match".
  const minAcceptedScore = 8;
  const unchanged: DocsResolution = { resolvedUrl: rawUrl, source: "original" };

  // An unparseable request cannot be matched against anything. Fall back to the
  // original instead of throwing, as the other helpers in this module do.
  let requestedUrl: URL;
  try {
    requestedUrl = new URL(rawUrl);
  } catch {
    return unchanged;
  }

  let best: { entry: DocsIndexEntry; score: number } | undefined;
  for (const entry of entries) {
    // Parse each entry URL once and reuse it for both the origin and path checks.
    let entryUrl: URL;
    try {
      entryUrl = new URL(entry.url);
    } catch {
      continue;
    }
    if (entryUrl.origin !== requestedUrl.origin) continue;
    if (!hasCompatiblePathStructure(requestedUrl.pathname, entryUrl.pathname)) continue;

    const score = scoreDocsEntry(requestedUrl, entry);
    // Strict comparison keeps the earliest entry on ties.
    if (!best || score > best.score) {
      best = { entry, score };
    }
  }

  if (!best || best.score < minAcceptedScore) {
    return unchanged;
  }

  return {
    resolvedUrl: best.entry.url,
    source: best.entry.source,
  };
}
|
|
210
|
+
|
|
211
|
+
/**
 * Tries to replace a requested docs URL with one listed in the site's index files.
 *
 * URLs that are not on a docs host (see `isDocsHost`) are returned unchanged.
 * Otherwise `/llms.txt` on the same origin is consulted first. `/llms-full.txt`
 * is fetched only if that did not produce a match, and its entries are combined
 * with those already collected.
 *
 * @param rawUrl    URL the caller asked for.
 * @param fetchImpl Fetch implementation to use; defaults to the global `fetch`.
 */
export async function discoverCanonicalDocsUrl(
  rawUrl: string,
  fetchImpl: typeof fetch = fetch
): Promise<DocsResolution> {
  if (!isDocsHost(rawUrl)) {
    return { resolvedUrl: rawUrl, source: "original" };
  }

  const { origin } = new URL(rawUrl);
  const baseUrl = origin + "/";
  const entries: DocsIndexEntry[] = [];

  const indexText = await fetchTextIfOk(new URL("/llms.txt", origin).toString(), fetchImpl);
  if (indexText) {
    entries.push(...parseLlmsIndex(indexText, baseUrl));
  }

  const indexResolution = resolveDocsUrlFromEntries(rawUrl, entries);
  if (indexResolution.source !== "original") {
    return indexResolution;
  }

  const fullText = await fetchTextIfOk(new URL("/llms-full.txt", origin).toString(), fetchImpl);
  if (fullText) {
    entries.push(...parseLlmsFullSources(fullText, baseUrl));
  }

  return resolveDocsUrlFromEntries(rawUrl, entries);
}
|
|
243
|
+
|
|
244
|
+
/**
 * GETs `url` (following redirects) and returns the response body as text.
 *
 * Returns `null` when the response status is not OK or when the request or
 * body read throws. Failures are deliberately swallowed because the caller
 * treats the resource as optional.
 */
async function fetchTextIfOk(url: string, fetchImpl: typeof fetch) {
  const init: RequestInit = {
    method: "GET",
    redirect: "follow",
    headers: { Accept: "text/plain, text/markdown, text/html;q=0.8, */*;q=0.1" },
  };

  try {
    const response = await fetchImpl(url, init);
    return response.ok ? await response.text() : null;
  } catch {
    return null;
  }
}
|
|
257
|
+
|
|
258
|
+
/**
 * Pre-flight check that a docs URL is reachable, using a HEAD request.
 *
 * URLs that are not on a docs host (see `isDocsHost`) are not checked. A
 * response counts as reachable when it is OK or has status 405 or 501, since
 * those statuses are tolerated rather than treated as failures.
 *
 * @param rawUrl      URL about to be fetched.
 * @param fetchImpl   Fetch implementation to use; defaults to the global `fetch`.
 * @param originalUrl URL originally requested; mentioned in the error when it differs from `rawUrl`.
 * @throws Error when the request fails or returns any other status. Both cases
 *         are wrapped in the same message.
 */
export async function assertFetchableDocsUrl(
  rawUrl: string,
  fetchImpl: typeof fetch = fetch,
  originalUrl?: string
): Promise<void> {
  if (!isDocsHost(rawUrl)) return;

  try {
    const response = await fetchImpl(rawUrl, {
      method: "HEAD",
      redirect: "follow",
      headers: { Accept: "text/html,application/xhtml+xml" },
    });

    const tolerated = response.ok || response.status === 405 || response.status === 501;
    if (!tolerated) {
      // Thrown inside the try on purpose so the catch below wraps it like a network error.
      throw new Error(`文档页面返回 ${response.status}`);
    }
  } catch (error) {
    const detail = error instanceof Error ? error.message : String(error);

    let rewriteHint = "";
    if (originalUrl && originalUrl !== rawUrl) {
      rewriteHint = `原始地址 ${originalUrl} 已规范化为 ${rawUrl},但规范化地址不可用。`;
    }

    throw new Error(`访问网页失败:文档地址不可用 (${rawUrl})。${rewriteHint}${detail}`);
  }
}
|
|
286
|
+
|
|
287
|
+
/**
 * Checks extracted page content for obvious failure modes.
 *
 * @param markdown  Content returned by the extraction step.
 * @param sourceUrl URL the content came from; used only in the message.
 * @returns `EMPTY_EXTRACTION` when the content is blank; `HTML_SHELL` when it
 *          starts with an HTML doctype or `<html` tag, or contains
 *          `__next_error__` (all case-insensitive); otherwise `null`.
 */
export function detectExtractionIssue(markdown: string, sourceUrl: string): ExtractionIssue | null {
  const body = markdown.trim();
  if (body.length === 0) {
    return {
      code: "EMPTY_EXTRACTION",
      message: `访问网页失败:${sourceUrl} 未提取到正文内容。`,
    };
  }

  const lowered = body.toLowerCase();
  const looksLikeHtmlShell =
    ["<!doctype html", "<html"].some((prefix) => lowered.startsWith(prefix)) ||
    lowered.includes("__next_error__");

  if (!looksLikeHtmlShell) {
    return null;
  }

  return {
    code: "HTML_SHELL",
    message: `访问网页失败:${sourceUrl} 返回了错误页或 HTML 壳,而不是正文内容。`,
  };
}
|
|
@@ -0,0 +1,84 @@
|
|
|
1
|
+
// /ai/tools/fetchWebpageTool.ts
|
|
2
|
+
// 现在底层走 Cloudflare Browser Rendering,支持 JS 动态渲染
|
|
3
|
+
|
|
4
|
+
import { callToolApi } from "./toolApiClient";
|
|
5
|
+
import {
|
|
6
|
+
assertFetchableDocsUrl,
|
|
7
|
+
detectExtractionIssue,
|
|
8
|
+
discoverCanonicalDocsUrl,
|
|
9
|
+
} from "./fetchWebpageSupport";
|
|
10
|
+
|
|
11
|
+
/**
 * [Schema] Describes the `fetchWebpage` tool so that an LLM can call it.
 *
 * `url` is required. `waitForNetworkIdle` is an optional boolean defaulting to `false`.
 */
export const fetchWebpageFunctionSchema = {
  name: "fetchWebpage",
  description: [
    "访问指定的网页 URL,使用真实浏览器渲染后提取 Markdown 内容,支持 JS 动态渲染页面(SPA/React 等)。",
    "对于 docs.* 文档站,会自动通过 /llms.txt 和 /llms-full.txt 规范化 URL。",
    "适合文章阅读、内容总结、网页数据提取。",
    "如果用户明确给了 URL 并要求据此更新代码/文档,应优先直接抓取这些 URL,并把抓到的字段视为权威来源。",
  ].join(""),
  parameters: {
    type: "object",
    properties: {
      url: {
        type: "string",
        description:
          "要抓取其内容的网页的完整 URL 地址(http/https)。对于 docs.* 文档站,可提供大致推测的页面路径,工具会先尝试规范化到权威文档 URL。",
      },
      waitForNetworkIdle: {
        type: "boolean",
        description: "是否等待网络请求结束再提取(适合 SPA/动态页面),默认 false。",
        default: false,
      },
    },
    required: ["url"],
  },
};
|
|
38
|
+
|
|
39
|
+
/**
 * [Executor] Implementation of the `fetchWebpage` tool.
 *
 * Steps:
 * 1. Validate that `url` is an absolute http(s) URL.
 * 2. Let `discoverCanonicalDocsUrl` swap in a canonical docs URL when one is found.
 * 3. Pre-flight the target with `assertFetchableDocsUrl`.
 * 4. Request the page's Markdown from `/api/cf-markdown` via `callToolApi`
 *    (Cloudflare Browser Rendering, which supports JS-rendered pages).
 * 5. Reject empty or HTML-shell results reported by `detectExtractionIssue`.
 *
 * @param args.url                Page to fetch.
 * @param args.waitForNetworkIdle When true, asks the renderer to wait for `networkidle0`.
 * @param thunkApi                Passed through to `callToolApi`.
 * @returns `rawData` is the Markdown, prefixed with the resolved URL when it was
 *          rewritten; `displayData` is a status summary followed by the Markdown.
 * @throws Error when the URL is invalid, the docs URL is unreachable, or the extraction is unusable.
 */
export async function fetchWebpageFunc(
  args: { url: string; waitForNetworkIdle?: boolean },
  thunkApi: any
): Promise<{ rawData: string; displayData: string }> {
  const { url, waitForNetworkIdle = false } = args;

  // Check the parsed protocol rather than a string prefix: a prefix test accepts
  // schemes such as "httpx://" and rejects valid upper-case schemes such as "HTTPS://".
  let protocol = "";
  if (typeof url === "string") {
    try {
      protocol = new URL(url).protocol;
    } catch {
      // Not an absolute URL; rejected by the protocol check below.
    }
  }
  if (protocol !== "http:" && protocol !== "https:") {
    throw new Error(
      "访问网页失败:必须提供一个有效的、以 http 或 https 开头的 URL。"
    );
  }

  const gotoOptions = waitForNetworkIdle ? { waitUntil: "networkidle0" } : undefined;
  const resolution = await discoverCanonicalDocsUrl(url);
  const targetUrl = resolution.resolvedUrl;

  await assertFetchableDocsUrl(targetUrl, fetch, url);

  const data = await callToolApi<{
    markdown: string;
    success: boolean;
    browserMsUsed?: number;
    source: string;
  }>(thunkApi, "/api/cf-markdown", { url: targetUrl, gotoOptions }, { withAuth: true });

  const markdown = data.markdown ?? "";
  const extractionIssue = detectExtractionIssue(markdown, targetUrl);
  if (extractionIssue) {
    throw new Error(extractionIssue.message);
  }

  // A reported duration of 0 ms is a real value; only a missing one is shown as "?".
  const seconds =
    typeof data.browserMsUsed === "number" ? (data.browserMsUsed / 1000).toFixed(2) : "?";
  const wasRewritten = targetUrl !== url;
  const statusMsg =
    `✅ 已成功获取网页内容 (URL: ${targetUrl})\n` +
    `🌐 渲染引擎: Cloudflare Browser Rendering\n` +
    `⏱ 浏览器耗时: ${seconds}s | 字符数: ${markdown.length}` +
    (wasRewritten ? `\n🧭 文档地址已规范化: ${url} → ${targetUrl}` : "");

  return {
    rawData: wasRewritten ? `[Resolved URL] ${targetUrl}\n\n${markdown}` : markdown,
    displayData: `${statusMsg}\n\n${markdown}`,
  };
}
|