npm - cursor-buddy - Versions diffs - 0.0.0-beta.2 - Mend

cursor-buddy 0.0.0-beta.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (27) hide show

package/LICENSE +21 -0
package/README.md +422 -0
package/dist/client-Ba6rv-du.d.mts +460 -0
package/dist/client-Ba6rv-du.d.mts.map +1 -0
package/dist/client-D-LeEdoH.mjs +2254 -0
package/dist/client-D-LeEdoH.mjs.map +1 -0
package/dist/index.d.mts +3 -0
package/dist/index.mjs +3 -0
package/dist/point-tool-DtHgq6gQ.mjs +54 -0
package/dist/point-tool-DtHgq6gQ.mjs.map +1 -0
package/dist/point-tool-kIviMn1q.d.mts +46 -0
package/dist/point-tool-kIviMn1q.d.mts.map +1 -0
package/dist/react/index.d.mts +142 -0
package/dist/react/index.d.mts.map +1 -0
package/dist/react/index.mjs +574 -0
package/dist/react/index.mjs.map +1 -0
package/dist/server/adapters/next.d.mts +22 -0
package/dist/server/adapters/next.d.mts.map +1 -0
package/dist/server/adapters/next.mjs +24 -0
package/dist/server/adapters/next.mjs.map +1 -0
package/dist/server/index.d.mts +31 -0
package/dist/server/index.d.mts.map +1 -0
package/dist/server/index.mjs +278 -0
package/dist/server/index.mjs.map +1 -0
package/dist/types-COQKMo5C.d.mts +44 -0
package/dist/types-COQKMo5C.d.mts.map +1 -0
package/package.json +108 -0

package/dist/server/adapters/next.d.mts ADDED Viewed

@@ -0,0 +1,22 @@
+import { t as CursorBuddyHandler } from "../../types-COQKMo5C.mjs";
+//#region src/server/adapters/next.d.ts
+/**
+ * Convert a CursorBuddyHandler to Next.js App Router route handlers.
+ *
+ * @param cursorBuddy - Handler object whose `handler` function receives each request.
+ * @returns An object exposing `GET` and `POST` route handlers; each takes a
+ * `Request` and resolves to a `Response`.
+ *
+ * @example
+ * ```ts
+ * // app/api/cursor-buddy/[...path]/route.ts
+ * import { toNextJsHandler } from "cursor-buddy/server/next"
+ * import { cursorBuddy } from "@/lib/cursor-buddy"
+ *
+ * export const { GET, POST } = toNextJsHandler(cursorBuddy)
+ * ```
+ */
+declare function toNextJsHandler(cursorBuddy: CursorBuddyHandler): {
+  GET: (request: Request) => Promise<Response>;
+  POST: (request: Request) => Promise<Response>;
+};
+//#endregion
+export { toNextJsHandler };
+//# sourceMappingURL=next.d.mts.map

package/dist/server/adapters/next.d.mts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"next.d.mts","names":[],"sources":["../../../src/server/adapters/next.ts"],"mappings":";;;;;AAcA;;;;;;;;;;iBAAgB,eAAA,CAAgB,WAAA,EAAa,kBAAA;iBACjB,OAAA,KAAO,OAAA,CAAA,QAAA;kBAAP,OAAA,KAAO,OAAA,CAAA,QAAA;AAAA"}

package/dist/server/adapters/next.mjs ADDED Viewed

@@ -0,0 +1,24 @@
+//#region src/server/adapters/next.ts
+/**
+* Convert a CursorBuddyHandler to Next.js App Router route handlers.
+*
+* GET and POST share one function that forwards the request unchanged to
+* `cursorBuddy.handler`; no method-specific logic is applied here.
+*
+* @param cursorBuddy - Object exposing a `handler(request)` function.
+* @returns `{ GET, POST }`, both referring to the same forwarding function.
+*
+* @example
+* ```ts
+* // app/api/cursor-buddy/[...path]/route.ts
+* import { toNextJsHandler } from "cursor-buddy/server/next"
+* import { cursorBuddy } from "@/lib/cursor-buddy"
+*
+* export const { GET, POST } = toNextJsHandler(cursorBuddy)
+* ```
+*/
+function toNextJsHandler(cursorBuddy) {
+	const handler = (request) => cursorBuddy.handler(request);
+	return {
+		GET: handler,
+		POST: handler
+	};
+}
+//#endregion
+export { toNextJsHandler };
+//# sourceMappingURL=next.mjs.map

package/dist/server/adapters/next.mjs.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"next.mjs","names":[],"sources":["../../../src/server/adapters/next.ts"],"sourcesContent":["import type { CursorBuddyHandler } from \"../types\"\n\n/**\n * Convert a CursorBuddyHandler to Next.js App Router route handlers.\n *\n * @example\n * ```ts\n * // app/api/cursor-buddy/[...path]/route.ts\n * import { toNextJsHandler } from \"cursor-buddy/server/next\"\n * import { cursorBuddy } from \"@/lib/cursor-buddy\"\n *\n * export const { GET, POST } = toNextJsHandler(cursorBuddy)\n * ```\n */\nexport function toNextJsHandler(cursorBuddy: CursorBuddyHandler) {\n const handler = (request: Request) => cursorBuddy.handler(request)\n\n return {\n GET: handler,\n POST: handler,\n }\n}\n"],"mappings":";;;;;;;;;;;;;AAcA,SAAgB,gBAAgB,aAAiC;CAC/D,MAAM,WAAW,YAAqB,YAAY,QAAQ,QAAQ;AAElE,QAAO;EACL,KAAK;EACL,MAAM;EACP"}

package/dist/server/index.d.mts ADDED Viewed

@@ -0,0 +1,31 @@
+import { n as pointTool, t as PointToolInput } from "../point-tool-kIviMn1q.mjs";
+import { n as CursorBuddyHandlerConfig, t as CursorBuddyHandler } from "../types-COQKMo5C.mjs";
+//#region src/server/handler.d.ts
+/**
+ * Create a cursor buddy request handler.
+ *
+ * The handler responds to three routes based on the last path segment:
+ * - /chat - Screenshot + transcript → AI SSE stream
+ * - /transcribe - Audio → text
+ * - /tts - Text → audio
+ *
+ * Any other final path segment receives a 404 JSON response that lists the
+ * available routes.
+ *
+ * @param config - Models, system prompt, extra tools and history limit.
+ * @returns An object with the request `handler` and the `config` it was given.
+ *
+ * @example
+ * ```ts
+ * import { createCursorBuddyHandler } from "cursor-buddy/server"
+ * import { openai } from "@ai-sdk/openai"
+ *
+ * const cursorBuddy = createCursorBuddyHandler({
+ *   model: openai("gpt-4o"),
+ *   speechModel: openai.speech("tts-1"), // optional for browser-only speech
+ *   transcriptionModel: openai.transcription("whisper-1"),
+ * })
+ * ```
+ */
+declare function createCursorBuddyHandler(config: CursorBuddyHandlerConfig): CursorBuddyHandler;
+//#endregion
+//#region src/server/system-prompt.d.ts
+declare const DEFAULT_SYSTEM_PROMPT = "You are a helpful AI assistant that lives inside a web page as a cursor companion.\n\nYou can see the user's current screen and hear what they say. Respond conversationally. Your response will be spoken aloud with text-to-speech, so keep it natural, concise, and easy to follow.\n\n## Core behavior\n\n- Speak like a helpful companion, not a robot\n- Keep most responses to 1-3 short sentences\n- Focus on what is visible right now on the user's screen\n- If something is unclear or not visible, say that plainly\n- Do not mention screenshots, overlays, annotations, or internal helper data\n- Do not mention marker numbers to the user\n\n## The point tool\n\nYou have a `point` tool that can visually indicate something on the user's screen.\n\nUse the `point` tool when the user is asking you to identify, locate, indicate, highlight, or show something visible on screen.\n\nCommon cases where you should use `point`:\n- the user asks where something is\n- the user asks what to click\n- the user says things like \"show me\", \"point to it\", \"where is it\", \"which one\", \"what should I click\", or \"highlight that\"\n\nDo not use the `point` tool when spoken guidance alone is enough and the user is not asking you to identify a specific on-screen target.\n\nExamples where spoken guidance alone may be enough:\n- explaining what a page does\n- answering a general question about what is on screen\n- giving brief next-step advice that does not depend on locating a specific element\n\nIf using the `point` tool:\n- first give the spoken response\n- then call the tool\n- call it at most once per response\n- point only at the most relevant target\n- never replace the tool call with plain text like \"(point here)\" or \"I\u2019m pointing at it now\"\n\n\nIf the user asks where something is on screen, what to click, or asks you to point something out, you should usually use the point tool rather than only describing it in words.\nDo not say 
things like \"I can point to it if you want\" when the user already asked where it is. In that case, answer briefly and use the point tool.\n\n## How to point\n\nPrefer marker-based pointing for interactive elements when a marker is available.\nInteractive elements may include buttons, links, inputs, tabs, menus, toggles, and other clickable controls.\n\nUse:\n- `type: \"marker\"` for interactive elements that have a marker\n- `type: \"coordinates\"` only for visible non-interactive content without a marker\n\nNever use coordinates for an interactive element if a marker is available.\n\nCoordinates must refer to the center of the target area.\n\nWhen calling the point tool, choose exactly one mode:\n\n- Marker mode:\n  - use type \"marker\"\n  - provide markerId\n  - do not provide x or y\n\n- Coordinates mode:\n  - use type \"coordinates\"\n  - provide x and y\n  - do not provide markerId\n\nNever combine markerId with x or y in the same tool call.\n\n## What to say\n\nWhen the user asks you to point something out:\n- briefly answer in a natural spoken way\n- then use the tool if the request is about locating or indicating something on screen\n\nGood spoken style:\n- \"Click this button right here.\"\n- \"The error message is over here.\"\n- \"This is the field you want.\"\n- \"That setting is in this section.\"\n\nAvoid:\n- mentioning marker IDs\n- mentioning internal tools\n- describing internal reasoning\n- saying you are looking at a screenshot\n\n## If the target is not clear\n\nIf you cannot confidently find the requested thing on screen:\n- say you cannot see it clearly or cannot find it\n- do not point at a random or uncertain target\n\n## Priority\n\nYour first priority is being helpful and correct.\nYour second priority is using the `point` tool whenever the user is asking you to visually identify a specific thing on screen.\n";
+//#endregion
+export { type CursorBuddyHandler, type CursorBuddyHandlerConfig, DEFAULT_SYSTEM_PROMPT, type PointToolInput, createCursorBuddyHandler, pointTool };
+//# sourceMappingURL=index.d.mts.map

package/dist/server/index.d.mts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"index.d.mts","names":[],"sources":["../../src/server/handler.ts","../../src/server/system-prompt.ts"],"mappings":";;;;;;;AAyBA;;;;;;;;;;;;ACzBA;;;;;iBDyBgB,wBAAA,CACd,MAAA,EAAQ,wBAAA,GACP,kBAAA;;;cC3BU,qBAAA"}

package/dist/server/index.mjs ADDED Viewed

@@ -0,0 +1,278 @@
+import { t as pointTool } from "../point-tool-DtHgq6gQ.mjs";
+import { experimental_generateSpeech, experimental_transcribe, streamText } from "ai";
+//#region src/server/system-prompt.ts
+/**
+* Built-in system prompt for the chat route. handleChat uses it when
+* `config.system` is unset and passes it as `defaultPrompt` when
+* `config.system` is a function.
+*/
+const DEFAULT_SYSTEM_PROMPT = `You are a helpful AI assistant that lives inside a web page as a cursor companion.
+You can see the user's current screen and hear what they say. Respond conversationally. Your response will be spoken aloud with text-to-speech, so keep it natural, concise, and easy to follow.
+## Core behavior
+- Speak like a helpful companion, not a robot
+- Keep most responses to 1-3 short sentences
+- Focus on what is visible right now on the user's screen
+- If something is unclear or not visible, say that plainly
+- Do not mention screenshots, overlays, annotations, or internal helper data
+- Do not mention marker numbers to the user
+## The point tool
+You have a \`point\` tool that can visually indicate something on the user's screen.
+Use the \`point\` tool when the user is asking you to identify, locate, indicate, highlight, or show something visible on screen.
+Common cases where you should use \`point\`:
+- the user asks where something is
+- the user asks what to click
+- the user says things like "show me", "point to it", "where is it", "which one", "what should I click", or "highlight that"
+Do not use the \`point\` tool when spoken guidance alone is enough and the user is not asking you to identify a specific on-screen target.
+Examples where spoken guidance alone may be enough:
+- explaining what a page does
+- answering a general question about what is on screen
+- giving brief next-step advice that does not depend on locating a specific element
+If using the \`point\` tool:
+- first give the spoken response
+- then call the tool
+- call it at most once per response
+- point only at the most relevant target
+- never replace the tool call with plain text like "(point here)" or "I’m pointing at it now"
+If the user asks where something is on screen, what to click, or asks you to point something out, you should usually use the point tool rather than only describing it in words.
+Do not say things like "I can point to it if you want" when the user already asked where it is. In that case, answer briefly and use the point tool.
+## How to point
+Prefer marker-based pointing for interactive elements when a marker is available.
+Interactive elements may include buttons, links, inputs, tabs, menus, toggles, and other clickable controls.
+Use:
+- \`type: "marker"\` for interactive elements that have a marker
+- \`type: "coordinates"\` only for visible non-interactive content without a marker
+Never use coordinates for an interactive element if a marker is available.
+Coordinates must refer to the center of the target area.
+When calling the point tool, choose exactly one mode:
+- Marker mode:
+  - use type "marker"
+  - provide markerId
+  - do not provide x or y
+- Coordinates mode:
+  - use type "coordinates"
+  - provide x and y
+  - do not provide markerId
+Never combine markerId with x or y in the same tool call.
+## What to say
+When the user asks you to point something out:
+- briefly answer in a natural spoken way
+- then use the tool if the request is about locating or indicating something on screen
+Good spoken style:
+- "Click this button right here."
+- "The error message is over here."
+- "This is the field you want."
+- "That setting is in this section."
+Avoid:
+- mentioning marker IDs
+- mentioning internal tools
+- describing internal reasoning
+- saying you are looking at a screenshot
+## If the target is not clear
+If you cannot confidently find the requested thing on screen:
+- say you cannot see it clearly or cannot find it
+- do not point at a random or uncertain target
+## Priority
+Your first priority is being helpful and correct.
+Your second priority is using the \`point\` tool whenever the user is asking you to visually identify a specific thing on screen.
+`;
+//#endregion
+//#region src/server/routes/chat.ts
+/**
+* Handle chat requests: screenshot + transcript → AI SSE stream
+*/
+async function handleChat(request, config) {
+	const { screenshot, transcript, history, capture, markerContext } = await request.json();
+	const systemPrompt = typeof config.system === "function" ? config.system({ defaultPrompt: DEFAULT_SYSTEM_PROMPT }) : config.system ?? DEFAULT_SYSTEM_PROMPT;
+	const maxMessages = (config.maxHistory ?? 10) * 2;
+	const trimmedHistory = history.slice(-maxMessages);
+	const captureContextParts = [];
+	if (capture) captureContextParts.push(`Screenshot size: ${capture.width}x${capture.height} pixels.`);
+	if (markerContext) captureContextParts.push("", markerContext);
+	const captureContext = captureContextParts.length > 0 ? captureContextParts.join("\n") : null;
+	const messages = [...trimmedHistory.map((msg) => ({
+		role: msg.role,
+		content: msg.content
+	})), {
+		role: "user",
+		content: [
+			...captureContext ? [{
+				type: "text",
+				text: captureContext
+			}] : [],
+			{
+				type: "image",
+				image: screenshot
+			},
+			{
+				type: "text",
+				text: transcript
+			}
+		]
+	}];
+	return streamText({
+		model: config.model,
+		system: systemPrompt,
+		providerOptions: config?.modelProviderMetadata,
+		messages,
+		tools: {
+			point: pointTool,
+			...config.tools
+		},
+		experimental_repairToolCall: async ({ toolCall }) => {
+			if (toolCall.toolName !== "point") return null;
+			let parsed;
+			try {
+				parsed = JSON.parse(toolCall.input);
+			} catch {
+				return null;
+			}
+			if (!parsed || typeof parsed !== "object") return null;
+			const input = parsed;
+			if (input.type === "marker") {
+				const repaired = {
+					type: "marker",
+					markerId: input.markerId,
+					label: input.label
+				};
+				return {
+					...toolCall,
+					input: JSON.stringify(repaired)
+				};
+			}
+			if (input.type === "coordinates") {
+				const repaired = {
+					type: "coordinates",
+					x: input.x,
+					y: input.y,
+					label: input.label
+				};
+				return {
+					...toolCall,
+					input: JSON.stringify(repaired)
+				};
+			}
+			return null;
+		}
+	}).toUIMessageStreamResponse();
+}
+//#endregion
+//#region src/server/routes/transcribe.ts
+/**
+* Handle transcription requests: audio file → text
+*
+* Responds 501 (JSON error) when `config.transcriptionModel` is not set and
+* 400 (JSON error) when the form data has no `audio` entry that is a File.
+* Otherwise the file bytes are passed to `experimental_transcribe` and the
+* resulting text is returned as JSON `{ text }`.
+*
+* @param request - Incoming request carrying form data with an `audio` file.
+* @param config - Handler configuration; `transcriptionModel` is read here.
+* @returns A JSON Response as described above.
+*/
+async function handleTranscribe(request, config) {
+	if (!config.transcriptionModel) return new Response(JSON.stringify({ error: "Server transcription is not configured. Provide a transcriptionModel or use browser transcription only." }), {
+		status: 501,
+		headers: { "Content-Type": "application/json" }
+	});
+	const audioFile = (await request.formData()).get("audio");
+	if (!audioFile || !(audioFile instanceof File)) return new Response(JSON.stringify({ error: "No audio file provided" }), {
+		status: 400,
+		headers: { "Content-Type": "application/json" }
+	});
+	const audioBuffer = await audioFile.arrayBuffer();
+	const response = { text: (await experimental_transcribe({
+		model: config.transcriptionModel,
+		audio: new Uint8Array(audioBuffer)
+	})).text };
+	return new Response(JSON.stringify(response), { headers: { "Content-Type": "application/json" } });
+}
+//#endregion
+//#region src/server/routes/tts.ts
+/**
+* Handle TTS requests: text → audio
+*
+* Responds 501 (JSON error) when `config.speechModel` is not set and 400
+* (JSON error) when the JSON body has no truthy `text`. Otherwise calls
+* `experimental_generateSpeech` with a fixed "wav" output format and returns
+* the audio bytes with Content-Type `audio/wav`.
+*
+* @param request - Incoming request whose JSON body contains `text`.
+* @param config - Handler configuration; `speechModel` is read here.
+* @returns A Response with audio bytes, or a JSON error Response.
+*/
+async function handleTTS(request, config) {
+	if (!config.speechModel) return new Response(JSON.stringify({ error: "Server speech is not configured. Provide a speechModel or use browser speech only." }), {
+		status: 501,
+		headers: { "Content-Type": "application/json" }
+	});
+	const outputFormat = "wav";
+	const { text } = await request.json();
+	if (!text) return new Response(JSON.stringify({ error: "No text provided" }), {
+		status: 400,
+		headers: { "Content-Type": "application/json" }
+	});
+	const result = await experimental_generateSpeech({
+		model: config.speechModel,
+		text,
+		outputFormat
+	});
+	const audioData = new Uint8Array(result.audio.uint8Array);
+	return new Response(audioData, { headers: { "Content-Type": "audio/wav" } });
+}
+//#endregion
+//#region src/server/handler.ts
+/**
+* Create a cursor buddy request handler.
+*
+* The handler responds to three routes based on the last path segment:
+* - /chat - Screenshot + transcript → AI SSE stream
+* - /transcribe - Audio → text
+* - /tts - Text → audio
+*
+* Only the URL path is inspected; the HTTP method is not checked here. Any
+* other last segment gets a 404 JSON response listing the available routes.
+*
+* @param config - Configuration passed through to every route handler.
+* @returns `{ handler, config }`, where `config` is the object passed in.
+*
+* @example
+* ```ts
+* import { createCursorBuddyHandler } from "cursor-buddy/server"
+* import { openai } from "@ai-sdk/openai"
+*
+* const cursorBuddy = createCursorBuddyHandler({
+*   model: openai("gpt-4o"),
+*   speechModel: openai.speech("tts-1"), // optional for browser-only speech
+*   transcriptionModel: openai.transcription("whisper-1"),
+* })
+* ```
+*/
+function createCursorBuddyHandler(config) {
+	const handler = async (request) => {
+		const pathSegments = new URL(request.url).pathname.split("/").filter(Boolean);
+		switch (pathSegments[pathSegments.length - 1]) {
+			case "chat": return handleChat(request, config);
+			case "transcribe": return handleTranscribe(request, config);
+			case "tts": return handleTTS(request, config);
+			default: return new Response(JSON.stringify({
+				error: "Not found",
+				availableRoutes: [
+					"/chat",
+					"/transcribe",
+					"/tts"
+				]
+			}), {
+				status: 404,
+				headers: { "Content-Type": "application/json" }
+			});
+		}
+	};
+	return {
+		handler,
+		config
+	};
+}
+//#endregion
+export { DEFAULT_SYSTEM_PROMPT, createCursorBuddyHandler, pointTool };
+//# sourceMappingURL=index.mjs.map

package/dist/server/index.mjs.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"index.mjs","names":["transcribe","generateSpeech"],"sources":["../../src/server/system-prompt.ts","../../src/server/routes/chat.ts","../../src/server/routes/transcribe.ts","../../src/server/routes/tts.ts","../../src/server/handler.ts"],"sourcesContent":["export const DEFAULT_SYSTEM_PROMPT = `You are a helpful AI assistant that lives inside a web page as a cursor companion.\n\nYou can see the user's current screen and hear what they say. Respond conversationally. Your response will be spoken aloud with text-to-speech, so keep it natural, concise, and easy to follow.\n\n## Core behavior\n\n- Speak like a helpful companion, not a robot\n- Keep most responses to 1-3 short sentences\n- Focus on what is visible right now on the user's screen\n- If something is unclear or not visible, say that plainly\n- Do not mention screenshots, overlays, annotations, or internal helper data\n- Do not mention marker numbers to the user\n\n## The point tool\n\nYou have a \\`point\\` tool that can visually indicate something on the user's screen.\n\nUse the \\`point\\` tool when the user is asking you to identify, locate, indicate, highlight, or show something visible on screen.\n\nCommon cases where you should use \\`point\\`:\n- the user asks where something is\n- the user asks what to click\n- the user says things like \"show me\", \"point to it\", \"where is it\", \"which one\", \"what should I click\", or \"highlight that\"\n\nDo not use the \\`point\\` tool when spoken guidance alone is enough and the user is not asking you to identify a specific on-screen target.\n\nExamples where spoken guidance alone may be enough:\n- explaining what a page does\n- answering a general question about what is on screen\n- giving brief next-step advice that does not depend on locating a specific element\n\nIf using the \\`point\\` tool:\n- first give the spoken response\n- then call the tool\n- call it at most once per response\n- point only at the most relevant target\n- 
never replace the tool call with plain text like \"(point here)\" or \"I’m pointing at it now\"\n\n\nIf the user asks where something is on screen, what to click, or asks you to point something out, you should usually use the point tool rather than only describing it in words.\nDo not say things like \"I can point to it if you want\" when the user already asked where it is. In that case, answer briefly and use the point tool.\n\n## How to point\n\nPrefer marker-based pointing for interactive elements when a marker is available.\nInteractive elements may include buttons, links, inputs, tabs, menus, toggles, and other clickable controls.\n\nUse:\n- \\`type: \"marker\"\\` for interactive elements that have a marker\n- \\`type: \"coordinates\"\\` only for visible non-interactive content without a marker\n\nNever use coordinates for an interactive element if a marker is available.\n\nCoordinates must refer to the center of the target area.\n\nWhen calling the point tool, choose exactly one mode:\n\n- Marker mode:\n - use type \"marker\"\n - provide markerId\n - do not provide x or y\n\n- Coordinates mode:\n - use type \"coordinates\"\n - provide x and y\n - do not provide markerId\n\nNever combine markerId with x or y in the same tool call.\n\n## What to say\n\nWhen the user asks you to point something out:\n- briefly answer in a natural spoken way\n- then use the tool if the request is about locating or indicating something on screen\n\nGood spoken style:\n- \"Click this button right here.\"\n- \"The error message is over here.\"\n- \"This is the field you want.\"\n- \"That setting is in this section.\"\n\nAvoid:\n- mentioning marker IDs\n- mentioning internal tools\n- describing internal reasoning\n- saying you are looking at a screenshot\n\n## If the target is not clear\n\nIf you cannot confidently find the requested thing on screen:\n- say you cannot see it clearly or cannot find it\n- do not point at a random or uncertain target\n\n## Priority\n\nYour first 
priority is being helpful and correct.\nYour second priority is using the \\`point\\` tool whenever the user is asking you to visually identify a specific thing on screen.\n`\n","import { streamText } from \"ai\"\nimport { pointTool } from \"../../shared/point-tool\"\nimport { DEFAULT_SYSTEM_PROMPT } from \"../system-prompt\"\nimport type { ChatRequestBody, CursorBuddyHandlerConfig } from \"../types\"\n\n/**\n * Handle chat requests: screenshot + transcript → AI SSE stream\n */\nexport async function handleChat(\n request: Request,\n config: CursorBuddyHandlerConfig,\n): Promise<Response> {\n const body = (await request.json()) as ChatRequestBody\n const { screenshot, transcript, history, capture, markerContext } = body\n\n // Resolve system prompt (string or function)\n const systemPrompt =\n typeof config.system === \"function\"\n ? config.system({ defaultPrompt: DEFAULT_SYSTEM_PROMPT })\n : (config.system ?? DEFAULT_SYSTEM_PROMPT)\n\n // Trim history to maxHistory (default 10 exchanges = 20 messages)\n const maxMessages = (config.maxHistory ?? 10) * 2\n const trimmedHistory = history.slice(-maxMessages)\n\n // Build capture context with marker information\n const captureContextParts: string[] = []\n\n if (capture) {\n captureContextParts.push(\n `Screenshot size: ${capture.width}x${capture.height} pixels.`,\n )\n }\n\n if (markerContext) {\n captureContextParts.push(\"\", markerContext)\n }\n\n const captureContext =\n captureContextParts.length > 0 ? captureContextParts.join(\"\\n\") : null\n\n // Build messages array with vision content\n const messages = [\n ...trimmedHistory.map((msg) => ({\n role: msg.role as \"user\" | \"assistant\",\n content: msg.content,\n })),\n {\n role: \"user\" as const,\n content: [\n ...(captureContext\n ? 
[\n {\n type: \"text\" as const,\n text: captureContext,\n },\n ]\n : []),\n {\n type: \"image\" as const,\n image: screenshot,\n },\n {\n type: \"text\" as const,\n text: transcript,\n },\n ],\n },\n ]\n\n const result = streamText({\n model: config.model,\n system: systemPrompt,\n providerOptions: config?.modelProviderMetadata,\n messages,\n tools: {\n point: pointTool,\n ...config.tools,\n },\n experimental_repairToolCall: async ({ toolCall }) => {\n if (toolCall.toolName !== \"point\") return null\n\n let parsed: unknown\n try {\n parsed = JSON.parse(toolCall.input)\n } catch {\n return null\n }\n\n if (!parsed || typeof parsed !== \"object\") return null\n\n const input = parsed as Record<string, unknown>\n\n if (input.type === \"marker\") {\n const repaired = {\n type: \"marker\",\n markerId: input.markerId,\n label: input.label,\n }\n\n return {\n ...toolCall,\n input: JSON.stringify(repaired),\n }\n }\n\n if (input.type === \"coordinates\") {\n const repaired = {\n type: \"coordinates\",\n x: input.x,\n y: input.y,\n label: input.label,\n }\n\n return {\n ...toolCall,\n input: JSON.stringify(repaired),\n }\n }\n\n return null\n },\n })\n\n return result.toUIMessageStreamResponse()\n}\n","import { experimental_transcribe as transcribe } from \"ai\"\nimport type { CursorBuddyHandlerConfig, TranscribeResponse } from \"../types\"\n\n/**\n * Handle transcription requests: audio file → text\n */\nexport async function handleTranscribe(\n request: Request,\n config: CursorBuddyHandlerConfig,\n): Promise<Response> {\n if (!config.transcriptionModel) {\n return new Response(\n JSON.stringify({\n error:\n \"Server transcription is not configured. 
Provide a transcriptionModel or use browser transcription only.\",\n }),\n {\n status: 501,\n headers: { \"Content-Type\": \"application/json\" },\n },\n )\n }\n\n const formData = await request.formData()\n const audioFile = formData.get(\"audio\")\n\n if (!audioFile || !(audioFile instanceof File)) {\n return new Response(JSON.stringify({ error: \"No audio file provided\" }), {\n status: 400,\n headers: { \"Content-Type\": \"application/json\" },\n })\n }\n\n const audioBuffer = await audioFile.arrayBuffer()\n\n const result = await transcribe({\n model: config.transcriptionModel,\n audio: new Uint8Array(audioBuffer),\n })\n\n const response: TranscribeResponse = { text: result.text }\n\n return new Response(JSON.stringify(response), {\n headers: { \"Content-Type\": \"application/json\" },\n })\n}\n","import { experimental_generateSpeech as generateSpeech } from \"ai\"\nimport type { CursorBuddyHandlerConfig, TTSRequestBody } from \"../types\"\n\n/**\n * Handle TTS requests: text → audio\n */\nexport async function handleTTS(\n request: Request,\n config: CursorBuddyHandlerConfig,\n): Promise<Response> {\n if (!config.speechModel) {\n return new Response(\n JSON.stringify({\n error:\n \"Server speech is not configured. 
Provide a speechModel or use browser speech only.\",\n }),\n {\n status: 501,\n headers: { \"Content-Type\": \"application/json\" },\n },\n )\n }\n\n const outputFormat = \"wav\"\n const body = (await request.json()) as TTSRequestBody\n const { text } = body\n\n if (!text) {\n return new Response(JSON.stringify({ error: \"No text provided\" }), {\n status: 400,\n headers: { \"Content-Type\": \"application/json\" },\n })\n }\n\n const result = await generateSpeech({\n model: config.speechModel,\n text,\n outputFormat,\n })\n\n // Create a new ArrayBuffer copy to satisfy TypeScript's strict typing\n const audioData = new Uint8Array(result.audio.uint8Array)\n\n return new Response(audioData, {\n headers: {\n \"Content-Type\": \"audio/wav\",\n },\n })\n}\n","import { handleChat } from \"./routes/chat\"\nimport { handleTranscribe } from \"./routes/transcribe\"\nimport { handleTTS } from \"./routes/tts\"\nimport type { CursorBuddyHandler, CursorBuddyHandlerConfig } from \"./types\"\n\n/**\n * Create a cursor buddy request handler.\n *\n * The handler responds to three routes based on the last path segment:\n * - /chat - Screenshot + transcript → AI SSE stream\n * - /transcribe - Audio → text\n * - /tts - Text → audio\n *\n * @example\n * ```ts\n * import { createCursorBuddyHandler } from \"cursor-buddy/server\"\n * import { openai } from \"@ai-sdk/openai\"\n *\n * const cursorBuddy = createCursorBuddyHandler({\n * model: openai(\"gpt-4o\"),\n * speechModel: openai.speech(\"tts-1\"), // optional for browser-only speech\n * transcriptionModel: openai.transcription(\"whisper-1\"),\n * })\n * ```\n */\nexport function createCursorBuddyHandler(\n config: CursorBuddyHandlerConfig,\n): CursorBuddyHandler {\n const handler = async (request: Request): Promise<Response> => {\n const url = new URL(request.url)\n const pathSegments = url.pathname.split(\"/\").filter(Boolean)\n const route = pathSegments[pathSegments.length - 1]\n\n switch (route) {\n case \"chat\":\n return 
handleChat(request, config)\n\n case \"transcribe\":\n return handleTranscribe(request, config)\n\n case \"tts\":\n return handleTTS(request, config)\n\n default:\n return new Response(\n JSON.stringify({\n error: \"Not found\",\n availableRoutes: [\"/chat\", \"/transcribe\", \"/tts\"],\n }),\n {\n status: 404,\n headers: { \"Content-Type\": \"application/json\" },\n },\n )\n }\n }\n\n return { handler, config }\n}\n"],"mappings":";;;AAAA,MAAa,wBAAwB;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;ACQrC,eAAsB,WACpB,SACA,QACmB;CAEnB,MAAM,EAAE,YAAY,YAAY,SAAS,SAAS,kBADpC,MAAM,QAAQ,MAAM;CAIlC,MAAM,eACJ,OAAO,OAAO,WAAW,aACrB,OAAO,OAAO,EAAE,eAAe,uBAAuB,CAAC,GACtD,OAAO,UAAU;CAGxB,MAAM,eAAe,OAAO,cAAc,MAAM;CAChD,MAAM,iBAAiB,QAAQ,MAAM,CAAC,YAAY;CAGlD,MAAM,sBAAgC,EAAE;AAExC,KAAI,QACF,qBAAoB,KAClB,oBAAoB,QAAQ,MAAM,GAAG,QAAQ,OAAO,UACrD;AAGH,KAAI,cACF,qBAAoB,KAAK,IAAI,cAAc;CAG7C,MAAM,iBACJ,oBAAoB,SAAS,IAAI,oBAAoB,KAAK,KAAK,GAAG;CAGpE,MAAM,WAAW,CACf,GAAG,eAAe,KAAK,SAAS;EAC9B,MAAM,IAAI;EACV,SAAS,IAAI;EACd,EAAE,EACH;EACE,MAAM;EACN,SAAS;GACP,GAAI,iBACA,CACE;IACE,MAAM;IACN,MAAM;IACP,CACF,GACD,EAAE;GACN;IACE,MAAM;IACN,OAAO;IACR;GACD;IACE,MAAM;IACN,MAAM;IACP;GACF;EACF,CACF;AAwDD,QAtDe,WAAW;EACxB,OAAO,OAAO;EACd,QAAQ;EACR,iBAAiB,QAAQ;EACzB;EACA,OAAO;GACL,OAAO;GACP,GAAG,OAAO;GACX;EACD,6BAA6B,OAAO,EAAE,eAAe;AACnD,OAAI,SAAS,aAAa,QAAS,QAAO;GAE1C,IAAI;AACJ,OAAI;AACF,aAAS,KAAK,MAAM,SAAS,MAAM;WAC7B;AACN,WAAO;;AAGT,OAAI,CAAC,UAAU,OAAO,WAAW,SAAU,QAAO;GAElD,MAAM,QAAQ;AAEd,OAAI,MAAM,SAAS,UAAU;IAC3B,MAAM,WAAW;KACf,MAAM;KACN,UAAU,MAAM;KAChB,OAAO,MAAM;KACd;AAED,WAAO;KACL,GAAG;KACH,OAAO,KAAK,UAAU,SAAS;KAChC;;AAGH,OAAI,MAAM,SAAS,eAAe;IAChC,MAAM,WAAW;KACf,MAAM;KACN,GAAG,MAAM;KACT,GAAG,MAAM;KACT,OAAO,MAAM;KACd;AAED,WAAO;KACL,GAAG;KACH,OAAO,KAAK,UAAU,SAAS;KAChC;;AAGH,UAAO;;EAEV,CAAC,CAEY,2BAA2B;;;;;;;ACtH3C,eAAsB,iBACpB,SACA,QACmB;AACnB,KAAI,CAAC,OAAO,mBACV,QAAO,IAAI,SACT,KAAK,UAAU,EACb,OACE,2GACH,CAAC,EACF;EACE,QAAQ;EACR,SAAS,EAAE,gBAAgB,oBAAoB;EAChD,CAC
F;CAIH,MAAM,aADW,MAAM,QAAQ,UAAU,EACd,IAAI,QAAQ;AAEvC,KAAI,CAAC,aAAa,EAAE,qBAAqB,MACvC,QAAO,IAAI,SAAS,KAAK,UAAU,EAAE,OAAO,0BAA0B,CAAC,EAAE;EACvE,QAAQ;EACR,SAAS,EAAE,gBAAgB,oBAAoB;EAChD,CAAC;CAGJ,MAAM,cAAc,MAAM,UAAU,aAAa;CAOjD,MAAM,WAA+B,EAAE,OALxB,MAAMA,wBAAW;EAC9B,OAAO,OAAO;EACd,OAAO,IAAI,WAAW,YAAY;EACnC,CAAC,EAEkD,MAAM;AAE1D,QAAO,IAAI,SAAS,KAAK,UAAU,SAAS,EAAE,EAC5C,SAAS,EAAE,gBAAgB,oBAAoB,EAChD,CAAC;;;;;;;ACtCJ,eAAsB,UACpB,SACA,QACmB;AACnB,KAAI,CAAC,OAAO,YACV,QAAO,IAAI,SACT,KAAK,UAAU,EACb,OACE,sFACH,CAAC,EACF;EACE,QAAQ;EACR,SAAS,EAAE,gBAAgB,oBAAoB;EAChD,CACF;CAGH,MAAM,eAAe;CAErB,MAAM,EAAE,SADM,MAAM,QAAQ,MAAM;AAGlC,KAAI,CAAC,KACH,QAAO,IAAI,SAAS,KAAK,UAAU,EAAE,OAAO,oBAAoB,CAAC,EAAE;EACjE,QAAQ;EACR,SAAS,EAAE,gBAAgB,oBAAoB;EAChD,CAAC;CAGJ,MAAM,SAAS,MAAMC,4BAAe;EAClC,OAAO,OAAO;EACd;EACA;EACD,CAAC;CAGF,MAAM,YAAY,IAAI,WAAW,OAAO,MAAM,WAAW;AAEzD,QAAO,IAAI,SAAS,WAAW,EAC7B,SAAS,EACP,gBAAgB,aACjB,EACF,CAAC;;;;;;;;;;;;;;;;;;;;;;;;ACtBJ,SAAgB,yBACd,QACoB;CACpB,MAAM,UAAU,OAAO,YAAwC;EAE7D,MAAM,eADM,IAAI,IAAI,QAAQ,IAAI,CACP,SAAS,MAAM,IAAI,CAAC,OAAO,QAAQ;AAG5D,UAFc,aAAa,aAAa,SAAS,IAEjD;GACE,KAAK,OACH,QAAO,WAAW,SAAS,OAAO;GAEpC,KAAK,aACH,QAAO,iBAAiB,SAAS,OAAO;GAE1C,KAAK,MACH,QAAO,UAAU,SAAS,OAAO;GAEnC,QACE,QAAO,IAAI,SACT,KAAK,UAAU;IACb,OAAO;IACP,iBAAiB;KAAC;KAAS;KAAe;KAAO;IAClD,CAAC,EACF;IACE,QAAQ;IACR,SAAS,EAAE,gBAAgB,oBAAoB;IAChD,CACF;;;AAIP,QAAO;EAAE;EAAS;EAAQ"}

package/dist/types-COQKMo5C.d.mts ADDED Viewed

@@ -0,0 +1,44 @@
+import { LanguageModel, SpeechModel, Tool, TranscriptionModel } from "ai";
+//#region src/server/types.d.ts
+/**
+ * Configuration for createCursorBuddyHandler
+ *
+ * Only `model` is required; every other field is optional.
+ *
+ * NOTE(review): `modelProviderMetadata` carries no description in this
+ * declaration. It is presumably provider-specific metadata/options that
+ * accompany `model` on chat requests — confirm against the chat route
+ * implementation before relying on it.
+ */
+interface CursorBuddyHandlerConfig {
+  /** AI SDK language model for chat (e.g., openai("gpt-4o")) */
+  model: LanguageModel;
+  modelProviderMetadata?: Record<string, any>;
+  /**
+   * AI SDK speech model for TTS (e.g., openai.speech("tts-1")).
+   * Optional when clients use browser-only speech.
+   */
+  speechModel?: SpeechModel;
+  /**
+   * AI SDK transcription model (e.g., openai.transcription("whisper-1")).
+   * Optional when clients use browser-only transcription.
+   */
+  transcriptionModel?: TranscriptionModel;
+  /**
+   * System prompt for the AI. Can be a string or a function that receives
+   * the default prompt and returns a modified version.
+   *
+   * The function form is called with a single context object whose
+   * `defaultPrompt` property holds the default prompt text, and must
+   * return the prompt string to use.
+   */
+  system?: string | ((ctx: {
+    defaultPrompt: string;
+  }) => string);
+  /**
+   * AI SDK tools available to the model, keyed by tool name.
+   */
+  tools?: Record<string, Tool>;
+  /** Maximum conversation history messages to include (default: 10) */
+  maxHistory?: number;
+}
+/**
+ * Return type of createCursorBuddyHandler
+ *
+ * Bundles the request handler together with the configuration it was
+ * created from, so framework adapters can consume both.
+ */
+interface CursorBuddyHandler {
+  /**
+   * The main request handler.
+   *
+   * Accepts a Fetch API `Request` and resolves to a `Response`.
+   * NOTE(review): per the server source embedded in this package's source
+   * map, it dispatches to the chat, transcribe and tts routes and answers
+   * any other route with a 404 JSON body listing the available routes —
+   * confirm against src/server/handler before depending on the details.
+   */
+  handler: (request: Request) => Promise<Response>;
+  /** The resolved configuration */
+  config: CursorBuddyHandlerConfig;
+}
+//#endregion
+export { CursorBuddyHandlerConfig as n, CursorBuddyHandler as t };
+//# sourceMappingURL=types-COQKMo5C.d.mts.map

package/dist/types-COQKMo5C.d.mts.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"types-COQKMo5C.d.mts","names":[],"sources":["../src/server/types.ts"],"mappings":";;;;;AAKA;UAAiB,wBAAA;;EAEf,KAAA,EAAO,aAAA;EACP,qBAAA,GAAwB,MAAA;EAMV;;;;EAAd,WAAA,GAAc,WAAA;EAeA;;;;EATd,kBAAA,GAAqB,kBAAA;EANrB;;;;EAYA,MAAA,cAAoB,GAAA;IAAO,aAAA;EAAA;EAG3B;EAAA,KAAA,GAAQ,MAAA,SAAe,IAAA;EAAA;EAGvB,UAAA;AAAA;;AAMF;;UAAiB,kBAAA;EAEI;EAAnB,OAAA,GAAU,OAAA,EAAS,OAAA,KAAY,OAAA,CAAQ,QAAA;EAAR;EAG/B,MAAA,EAAQ,wBAAA;AAAA"}

package/package.json ADDED Viewed

@@ -0,0 +1,108 @@
+{
+  "name": "cursor-buddy",
+  "version": "0.0.0-beta.2",
+  "description": "AI-powered cursor companion for web apps",
+  "type": "module",
+  "license": "MIT",
+  "homepage": "https://github.com/leojuriolli7/cursor-buddy#readme",
+  "bugs": {
+    "url": "https://github.com/leojuriolli7/cursor-buddy/issues"
+  },
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/leojuriolli7/cursor-buddy.git",
+    "directory": "packages/cursor-buddy"
+  },
+  "keywords": [
+    "ai",
+    "assistant",
+    "cursor",
+    "react",
+    "voice",
+    "screen-capture"
+  ],
+  "sideEffects": false,
+  "scripts": {
+    "build": "tsdown",
+    "dev": "tsdown --watch",
+    "test": "vitest run",
+    "test:watch": "vitest",
+    "typecheck": "tsc --noEmit",
+    "prepack": "pnpm build",
+    "release:check": "pnpm typecheck && npm pack --dry-run",
+    "release:publish": "pnpm release:check && npm publish",
+    "release:patch": "npm version patch",
+    "release:minor": "npm version minor",
+    "release:major": "npm version major"
+  },
+  "files": [
+    "dist",
+    "README.md"
+  ],
+  "publishConfig": {
+    "access": "public"
+  },
+  "main": "./dist/index.mjs",
+  "module": "./dist/index.mjs",
+  "types": "./dist/index.d.mts",
+  "exports": {
+    ".": {
+      "types": "./dist/index.d.mts",
+      "default": "./dist/index.mjs"
+    },
+    "./react": {
+      "types": "./dist/react/index.d.mts",
+      "default": "./dist/react/index.mjs"
+    },
+    "./server": {
+      "types": "./dist/server/index.d.mts",
+      "default": "./dist/server/index.mjs"
+    },
+    "./server/next": {
+      "types": "./dist/server/adapters/next.d.mts",
+      "default": "./dist/server/adapters/next.mjs"
+    }
+  },
+  "typesVersions": {
+    "*": {
+      "react": [
+        "./dist/react/index.d.mts"
+      ],
+      "server": [
+        "./dist/server/index.d.mts"
+      ],
+      "server/next": [
+        "./dist/server/adapters/next.d.mts"
+      ]
+    }
+  },
+  "dependencies": {
+    "@nanostores/react": "^1.1.0",
+    "ai": "^6.0.158",
+    "html2canvas-pro": "^2.0.2",
+    "nanostores": "^1.2.0",
+    "zod": "^3.24.0"
+  },
+  "devDependencies": {
+    "@types/react": "^19.0.8",
+    "@types/react-dom": "^19.2.3",
+    "happy-dom": "^20.9.0",
+    "react": "^19.0.0",
+    "react-dom": "^19.0.0",
+    "tsdown": "^0.21.7",
+    "typescript": "^5.7.3",
+    "vitest": "^3.2.4"
+  },
+  "peerDependencies": {
+    "react": "^18.0.0 || ^19.0.0",
+    "react-dom": "^18.0.0 || ^19.0.0"
+  },
+  "peerDependenciesMeta": {
+    "react": {
+      "optional": true
+    },
+    "react-dom": {
+      "optional": true
+    }
+  }
+}