npm - cursor-buddy - Versions diffs - 0.0.2 → 0.0.4 - Mend

cursor-buddy 0.0.2 → 0.0.4

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (23)

package/dist/client-DJRU6dKB.d.mts +462 -0
package/dist/client-DJRU6dKB.d.mts.map +1 -0
package/dist/client-UXGQt-7f.mjs +2193 -0
package/dist/client-UXGQt-7f.mjs.map +1 -0
package/dist/index.d.mts +2 -2
package/dist/index.mjs +1 -1
package/dist/react/index.d.mts +39 -24
package/dist/react/index.d.mts.map +1 -1
package/dist/react/index.mjs +108 -88
package/dist/react/index.mjs.map +1 -1
package/dist/server/adapters/next.d.mts +1 -1
package/dist/server/index.d.mts +3 -3
package/dist/server/index.mjs +38 -14
package/dist/server/index.mjs.map +1 -1
package/dist/{types-L97cq8UK.d.mts → types-BxBhjZju.d.mts} +12 -5
package/dist/types-BxBhjZju.d.mts.map +1 -0
package/package.json +1 -1
package/README.md +0 -344
package/dist/client-Bd33JD8T.mjs +0 -890
package/dist/client-Bd33JD8T.mjs.map +0 -1
package/dist/client-DKZY5bI1.d.mts +0 -314
package/dist/client-DKZY5bI1.d.mts.map +0 -1
package/dist/types-L97cq8UK.d.mts.map +0 -1

package/dist/{types-L97cq8UK.d.mts → types-BxBhjZju.d.mts} RENAMED Viewed

@@ -7,10 +7,17 @@ import { LanguageModel, SpeechModel, Tool, TranscriptionModel } from "ai";
 interface CursorBuddyHandlerConfig {
   /** AI SDK language model for chat (e.g., openai("gpt-4o")) */
   model: LanguageModel;
-  /** AI SDK speech model for TTS (e.g., openai.speech("tts-1")) */
-  speechModel: SpeechModel;
-  /** AI SDK transcription model (e.g., openai.transcription("whisper-1")) */
-  transcriptionModel: TranscriptionModel;
+  modelProviderMetadata?: Record<string, any>;
+  /**
+   * AI SDK speech model for TTS (e.g., openai.speech("tts-1")).
+   * Optional when clients use browser-only speech.
+   */
+  speechModel?: SpeechModel;
+  /**
+   * AI SDK transcription model (e.g., openai.transcription("whisper-1")).
+   * Optional when clients use browser-only transcription.
+   */
+  transcriptionModel?: TranscriptionModel;
   /**
    * System prompt for the AI. Can be a string or a function that receives
    * the default prompt and returns a modified version.
@@ -34,4 +41,4 @@ interface CursorBuddyHandler {
 }
 //#endregion
 export { CursorBuddyHandlerConfig as n, CursorBuddyHandler as t };
-//# sourceMappingURL=types-L97cq8UK.d.mts.map
+//# sourceMappingURL=types-BxBhjZju.d.mts.map

package/dist/types-BxBhjZju.d.mts.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"types-BxBhjZju.d.mts","names":[],"sources":["../src/server/types.ts"],"mappings":";;;;;AAKA;UAAiB,wBAAA;;EAEf,KAAA,EAAO,aAAA;EACP,qBAAA,GAAwB,MAAA;EAMV;;;;EAAd,WAAA,GAAc,WAAA;EAeA;;;;EATd,kBAAA,GAAqB,kBAAA;EANrB;;;;EAYA,MAAA,cAAoB,GAAA;IAAO,aAAA;EAAA;EAG3B;EAAA,KAAA,GAAQ,MAAA,SAAe,IAAA;EAAA;EAGvB,UAAA;AAAA;;AAMF;;UAAiB,kBAAA;EAEI;EAAnB,OAAA,GAAU,OAAA,EAAS,OAAA,KAAY,OAAA,CAAQ,QAAA;EAAR;EAG/B,MAAA,EAAQ,wBAAA;AAAA"}

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "cursor-buddy",
-  "version": "0.0.2",
+  "version": "0.0.4",
   "description": "AI-powered cursor companion for web apps",
   "type": "module",
   "license": "MIT",

package/README.md DELETED Viewed

@@ -1,344 +0,0 @@
-# cursor-buddy
-AI-powered cursor companion for web apps. Push-to-talk voice assistant that can see your screen and point at things.
-## Features
-- **Push-to-talk voice input** — Hold a hotkey to speak, release to send
-- **Screenshot context** — AI sees your current viewport
-- **Voice responses** — Text-to-speech playback
-- **Cursor pointing** — AI can point at UI elements it references
-- **Voice interruption** — Start talking again to cut off current response
-- **Framework agnostic** — Core client works without React, adapter-based architecture
-- **Customizable** — CSS variables, custom components, headless mode
-## Installation
-```bash
-npm install cursor-buddy
-# or
-pnpm add cursor-buddy
-```
-## Quick Start
-### 1. Server Setup
-Create an API route that handles chat, transcription, and TTS.
-```ts
-// lib/cursor-buddy.ts
-import { createCursorBuddyHandler } from "cursor-buddy/server"
-import { openai } from "@ai-sdk/openai"
-export const cursorBuddy = createCursorBuddyHandler({
-  model: openai("gpt-4o"),
-  speechModel: openai.speech("tts-1"),
-  transcriptionModel: openai.transcription("whisper-1"),
-})
-```
-#### Next.js App Router
-```ts
-// app/api/cursor-buddy/[...path]/route.ts
-import { toNextJsHandler } from "cursor-buddy/server/next"
-import { cursorBuddy } from "@/lib/cursor-buddy"
-export const { GET, POST } = toNextJsHandler(cursorBuddy)
-```
-### 2. Client Setup
-Add the `<CursorBuddy />` component to your app.
-```tsx
-// app/layout.tsx
-import { CursorBuddy } from "cursor-buddy/react"
-export default function RootLayout({ children }) {
-  return (
-    <html>
-      <body>
-        {children}
-        <CursorBuddy endpoint="/api/cursor-buddy" />
-      </body>
-    </html>
-  )
-}
-```
-That's it! Hold **Ctrl+Alt** to speak, release to send.
-## Server Configuration
-```ts
-createCursorBuddyHandler({
-  // Required
-  model: LanguageModel,              // AI SDK chat model
-  speechModel: SpeechModel,          // AI SDK speech model
-  transcriptionModel: TranscriptionModel,  // AI SDK transcription model
-  // Optional
-  system: string | ((ctx) => string),  // Custom system prompt
-  tools: Record<string, Tool>,         // AI SDK tools
-  maxHistory: number,                  // Max conversation history (default: 10)
-})
-```
-### Custom System Prompt
-```ts
-createCursorBuddyHandler({
-  model: openai("gpt-4o"),
-  speechModel: openai.speech("tts-1"),
-  transcriptionModel: openai.transcription("whisper-1"),
-  // Extend the default prompt
-  system: ({ defaultPrompt }) => `
-    ${defaultPrompt}
-    You are helping users navigate a project management dashboard.
-    The sidebar contains: Projects, Tasks, Calendar, Settings.
-  `,
-})
-```
-## Client Configuration
-```tsx
-<CursorBuddy
-  // Required
-  endpoint="/api/cursor-buddy"
-  // Optional
-  hotkey="ctrl+alt"              // Push-to-talk hotkey (default: "ctrl+alt")
-  container={element}            // Portal container (default: document.body)
-  // Custom components
-  cursor={(props) => <CustomCursor {...props} />}
-  speechBubble={(props) => <CustomBubble {...props} />}
-  waveform={(props) => <CustomWaveform {...props} />}
-  // Callbacks
-  onTranscript={(text) => {}}    // Called when speech is transcribed
-  onResponse={(text) => {}}      // Called when AI responds
-  onPoint={(target) => {}}       // Called when AI points at element
-  onStateChange={(state) => {}}  // Called on state change
-  onError={(error) => {}}        // Called on error
-/>
-```
-## Customization
-### CSS Variables
-Cursor buddy styles are customizable via CSS variables. Override them in your stylesheet:
-```css
-:root {
-  /* Cursor colors by state */
-  --cursor-buddy-color-idle: #3b82f6;
-  --cursor-buddy-color-listening: #ef4444;
-  --cursor-buddy-color-processing: #eab308;
-  --cursor-buddy-color-responding: #22c55e;
-  /* Speech bubble */
-  --cursor-buddy-bubble-bg: #ffffff;
-  --cursor-buddy-bubble-text: #1f2937;
-  --cursor-buddy-bubble-radius: 8px;
-  --cursor-buddy-bubble-shadow: 0 4px 12px rgba(0, 0, 0, 0.15);
-  /* Waveform */
-  --cursor-buddy-waveform-color: #ef4444;
-}
-```
-### Custom Components
-Replace default components with your own:
-```tsx
-import { CursorBuddy, type CursorRenderProps } from "cursor-buddy/react"
-function MyCursor({ state, rotation, scale }: CursorRenderProps) {
-  return (
-    <div style={{ transform: `rotate(${rotation}rad) scale(${scale})` }}>
-      {state === "listening" ? "🎤" : "👆"}
-    </div>
-  )
-}
-<CursorBuddy
-  endpoint="/api/cursor-buddy"
-  cursor={(props) => <MyCursor {...props} />}
-/>
-```
-## Headless Mode
-For full control, use the provider and hook directly:
-```tsx
-import {
-  CursorBuddyProvider,
-  useCursorBuddy
-} from "cursor-buddy/react"
-function App() {
-  return (
-    <CursorBuddyProvider endpoint="/api/cursor-buddy">
-      <MyCustomUI />
-    </CursorBuddyProvider>
-  )
-}
-function MyCustomUI() {
-  const {
-    state,           // "idle" | "listening" | "processing" | "responding"
-    transcript,      // Latest user speech
-    response,        // Latest AI response
-    audioLevel,      // 0-1, for waveform visualization
-    isEnabled,
-    isPointing,
-    error,
-    // Actions
-    startListening,
-    stopListening,
-    setEnabled,
-    pointAt,         // Manually point at coordinates
-    dismissPointing,
-    reset,
-  } = useCursorBuddy()
-  return (
-    <div>
-      <p>State: {state}</p>
-      <button
-        onMouseDown={startListening}
-        onMouseUp={stopListening}
-      >
-        Hold to speak
-      </button>
-    </div>
-  )
-}
-```
-## Framework-Agnostic Usage
-For non-React environments, use the core client directly:
-```ts
-import { CursorBuddyClient } from "cursor-buddy"
-const client = new CursorBuddyClient("/api/cursor-buddy", {
-  onStateChange: (state) => console.log("State:", state),
-  onTranscript: (text) => console.log("Transcript:", text),
-  onResponse: (text) => console.log("Response:", text),
-  onError: (err) => console.error("Error:", err),
-})
-// Subscribe to state changes
-client.subscribe(() => {
-  const snapshot = client.getSnapshot()
-  console.log(snapshot)
-})
-// Trigger voice interaction
-client.startListening()
-// ... user speaks ...
-client.stopListening()
-```
-## Render Props Types
-```ts
-interface CursorRenderProps {
-  state: "idle" | "listening" | "processing" | "responding"
-  isPointing: boolean
-  rotation: number   // Radians, direction of travel
-  scale: number      // 1.0 normal, up to 1.3 during flight
-}
-interface SpeechBubbleRenderProps {
-  text: string
-  isVisible: boolean
-}
-interface WaveformRenderProps {
-  audioLevel: number  // 0-1
-  isListening: boolean
-}
-```
-## API Reference
-### Core Exports (`cursor-buddy`)
-| Export | Description |
-|--------|-------------|
-| `CursorBuddyClient` | Framework-agnostic client class |
-| `VoiceState` | Type: `"idle" \| "listening" \| "processing" \| "responding"` |
-| `PointingTarget` | Type: `{ x: number, y: number, label: string }` |
-| `Point` | Type: `{ x: number, y: number }` |
-### Server Exports (`cursor-buddy/server`)
-| Export | Description |
-|--------|-------------|
-| `createCursorBuddyHandler` | Create the main request handler |
-| `DEFAULT_SYSTEM_PROMPT` | Default system prompt for reference |
-| `CursorBuddyHandlerConfig` | Type for handler configuration |
-| `CursorBuddyHandler` | Return type of `createCursorBuddyHandler` |
-### Server Adapters (`cursor-buddy/server/next`)
-| Export | Description |
-|--------|-------------|
-| `toNextJsHandler` | Convert handler to Next.js App Router format |
-### React Exports (`cursor-buddy/react`)
-| Export | Description |
-|--------|-------------|
-| `CursorBuddy` | Drop-in component with built-in UI |
-| `CursorBuddyProvider` | Headless provider for custom UI |
-| `useCursorBuddy` | Hook to access state and actions |
-### Types (`cursor-buddy/react`)
-| Export | Description |
-|--------|-------------|
-| `CursorBuddyProps` | Props for `<CursorBuddy />` |
-| `CursorBuddyProviderProps` | Props for `<CursorBuddyProvider />` |
-| `UseCursorBuddyReturn` | Return type of `useCursorBuddy()` |
-| `CursorRenderProps` | Props passed to custom cursor |
-| `SpeechBubbleRenderProps` | Props passed to custom speech bubble |
-| `WaveformRenderProps` | Props passed to custom waveform |
-## How It Works
-1. User holds the hotkey (Ctrl+Alt)
-2. Microphone captures audio, waveform shows audio level
-3. User releases hotkey
-4. Screenshot of viewport is captured
-5. Audio is transcribed via AI SDK
-6. Screenshot + capture metadata sent to AI model
-7. AI responds with text, optionally including `[POINT:x,y:label]` tag in screenshot-image coordinates
-8. Response is spoken via TTS
-9. If pointing tag present, coordinates are mapped back to the live viewport and the cursor animates to the target location
-10. **If user presses hotkey again at any point, current response is interrupted**
-## TODOs
-- [ ] More test coverage for internal services
-- [ ] Add `muted` prop for TTS control
-- [ ] Faster transcription -> chat -> TTS flow (eg single endpoint instead of 3 calls)
-- [ ] Composition pattern for custom components
-- [ ] Better hotkey registering code
-## License
-MIT