@namch/agent-assistant 1.0.0 → 1.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (168) hide show
  1. package/README.md +83 -539
  2. package/agents/backend-engineer.md +0 -8
  3. package/agents/brainstormer.md +0 -6
  4. package/agents/business-analyst.md +0 -5
  5. package/agents/database-architect.md +0 -6
  6. package/agents/debugger.md +0 -6
  7. package/agents/designer.md +0 -5
  8. package/agents/devops-engineer.md +0 -7
  9. package/agents/docs-manager.md +0 -6
  10. package/agents/frontend-engineer.md +0 -7
  11. package/agents/game-engineer.md +0 -7
  12. package/agents/mobile-engineer.md +0 -7
  13. package/agents/performance-engineer.md +0 -7
  14. package/agents/planner.md +0 -6
  15. package/agents/project-manager.md +0 -6
  16. package/agents/researcher.md +0 -5
  17. package/agents/reviewer.md +0 -6
  18. package/agents/scouter.md +0 -6
  19. package/agents/security-engineer.md +0 -7
  20. package/agents/tech-lead.md +0 -7
  21. package/agents/tester.md +0 -5
  22. package/cli/README.md +19 -10
  23. package/documents/business/business-features.md +1 -1
  24. package/documents/business/business-prd.md +4 -4
  25. package/documents/knowledge-architecture.md +1 -1
  26. package/documents/knowledge-domain.md +1 -1
  27. package/documents/knowledge-overview.md +14 -29
  28. package/documents/knowledge-source-base.md +14 -14
  29. package/package.json +1 -1
  30. package/rules/QUICK-REFERENCE.md +4 -1
  31. package/rules/SKILL-DISCOVERY.md +37 -14
  32. package/skills/active-directory-attacks/SKILL.md +383 -0
  33. package/skills/active-directory-attacks/references/advanced-attacks.md +382 -0
  34. package/skills/agent-evaluation/SKILL.md +64 -0
  35. package/skills/agent-memory-mcp/SKILL.md +82 -0
  36. package/skills/agent-memory-systems/SKILL.md +67 -0
  37. package/skills/agent-tool-builder/SKILL.md +53 -0
  38. package/skills/ai-agents-architect/SKILL.md +90 -0
  39. package/skills/ai-product/SKILL.md +54 -0
  40. package/skills/ai-wrapper-product/SKILL.md +273 -0
  41. package/skills/api-documentation-generator/SKILL.md +484 -0
  42. package/skills/api-fuzzing-bug-bounty/SKILL.md +433 -0
  43. package/skills/api-security-best-practices/SKILL.md +907 -0
  44. package/skills/autonomous-agent-patterns/SKILL.md +761 -0
  45. package/skills/autonomous-agents/SKILL.md +68 -0
  46. package/skills/aws-penetration-testing/SKILL.md +405 -0
  47. package/skills/aws-penetration-testing/references/advanced-aws-pentesting.md +469 -0
  48. package/skills/azure-functions/SKILL.md +42 -0
  49. package/skills/backend-dev-guidelines/SKILL.md +342 -0
  50. package/skills/backend-dev-guidelines/resources/architecture-overview.md +451 -0
  51. package/skills/backend-dev-guidelines/resources/async-and-errors.md +307 -0
  52. package/skills/backend-dev-guidelines/resources/complete-examples.md +638 -0
  53. package/skills/backend-dev-guidelines/resources/configuration.md +275 -0
  54. package/skills/backend-dev-guidelines/resources/database-patterns.md +224 -0
  55. package/skills/backend-dev-guidelines/resources/middleware-guide.md +213 -0
  56. package/skills/backend-dev-guidelines/resources/routing-and-controllers.md +756 -0
  57. package/skills/backend-dev-guidelines/resources/sentry-and-monitoring.md +336 -0
  58. package/skills/backend-dev-guidelines/resources/services-and-repositories.md +789 -0
  59. package/skills/backend-dev-guidelines/resources/testing-guide.md +235 -0
  60. package/skills/backend-dev-guidelines/resources/validation-patterns.md +754 -0
  61. package/skills/broken-authentication/SKILL.md +476 -0
  62. package/skills/bullmq-specialist/SKILL.md +57 -0
  63. package/skills/bun-development/SKILL.md +691 -0
  64. package/skills/burp-suite-testing/SKILL.md +380 -0
  65. package/skills/cloud-penetration-testing/SKILL.md +501 -0
  66. package/skills/cloud-penetration-testing/references/advanced-cloud-scripts.md +318 -0
  67. package/skills/computer-use-agents/SKILL.md +315 -0
  68. package/skills/content-creator/SKILL.md +248 -0
  69. package/skills/content-creator/assets/content_calendar_template.md +99 -0
  70. package/skills/content-creator/references/brand_guidelines.md +199 -0
  71. package/skills/content-creator/references/content_frameworks.md +534 -0
  72. package/skills/content-creator/references/social_media_optimization.md +317 -0
  73. package/skills/content-creator/scripts/brand_voice_analyzer.py +185 -0
  74. package/skills/content-creator/scripts/seo_optimizer.py +419 -0
  75. package/skills/context-window-management/SKILL.md +53 -0
  76. package/skills/conversation-memory/SKILL.md +61 -0
  77. package/skills/copy-editing/SKILL.md +439 -0
  78. package/skills/copywriting/SKILL.md +225 -0
  79. package/skills/crewai/SKILL.md +243 -0
  80. package/skills/discord-bot-architect/SKILL.md +277 -0
  81. package/skills/dispatching-parallel-agents/SKILL.md +180 -0
  82. package/skills/email-sequence/SKILL.md +925 -0
  83. package/skills/email-systems/SKILL.md +54 -0
  84. package/skills/ethical-hacking-methodology/SKILL.md +466 -0
  85. package/skills/executing-plans/SKILL.md +76 -0
  86. package/skills/file-path-traversal/SKILL.md +486 -0
  87. package/skills/finishing-a-development-branch/SKILL.md +200 -0
  88. package/skills/frontend-dev-guidelines/SKILL.md +359 -0
  89. package/skills/frontend-dev-guidelines/resources/common-patterns.md +331 -0
  90. package/skills/frontend-dev-guidelines/resources/complete-examples.md +872 -0
  91. package/skills/frontend-dev-guidelines/resources/component-patterns.md +502 -0
  92. package/skills/frontend-dev-guidelines/resources/data-fetching.md +767 -0
  93. package/skills/frontend-dev-guidelines/resources/file-organization.md +502 -0
  94. package/skills/frontend-dev-guidelines/resources/loading-and-error-states.md +501 -0
  95. package/skills/frontend-dev-guidelines/resources/performance.md +406 -0
  96. package/skills/frontend-dev-guidelines/resources/routing-guide.md +364 -0
  97. package/skills/frontend-dev-guidelines/resources/styling-guide.md +428 -0
  98. package/skills/frontend-dev-guidelines/resources/typescript-standards.md +418 -0
  99. package/skills/gcp-cloud-run/SKILL.md +288 -0
  100. package/skills/git-pushing/SKILL.md +33 -0
  101. package/skills/git-pushing/scripts/smart_commit.sh +19 -0
  102. package/skills/github-workflow-automation/SKILL.md +846 -0
  103. package/skills/html-injection-testing/SKILL.md +498 -0
  104. package/skills/idor-testing/SKILL.md +442 -0
  105. package/skills/inngest/SKILL.md +55 -0
  106. package/skills/javascript-mastery/SKILL.md +645 -0
  107. package/skills/kaizen/SKILL.md +730 -0
  108. package/skills/langfuse/SKILL.md +238 -0
  109. package/skills/langgraph/SKILL.md +287 -0
  110. package/skills/linux-privilege-escalation/SKILL.md +504 -0
  111. package/skills/llm-app-patterns/SKILL.md +760 -0
  112. package/skills/metasploit-framework/SKILL.md +478 -0
  113. package/skills/multi-agent-brainstorming/SKILL.md +256 -0
  114. package/skills/neon-postgres/SKILL.md +56 -0
  115. package/skills/nextjs-supabase-auth/SKILL.md +56 -0
  116. package/skills/nosql-expert/SKILL.md +111 -0
  117. package/skills/pentest-checklist/SKILL.md +334 -0
  118. package/skills/pentest-commands/SKILL.md +438 -0
  119. package/skills/plaid-fintech/SKILL.md +50 -0
  120. package/skills/planning-with-files/SKILL.md +211 -0
  121. package/skills/planning-with-files/examples.md +202 -0
  122. package/skills/planning-with-files/reference.md +218 -0
  123. package/skills/planning-with-files/scripts/check-complete.sh +44 -0
  124. package/skills/planning-with-files/scripts/init-session.sh +120 -0
  125. package/skills/planning-with-files/templates/findings.md +95 -0
  126. package/skills/planning-with-files/templates/progress.md +114 -0
  127. package/skills/planning-with-files/templates/task_plan.md +132 -0
  128. package/skills/privilege-escalation-methods/SKILL.md +333 -0
  129. package/skills/production-code-audit/SKILL.md +540 -0
  130. package/skills/prompt-caching/SKILL.md +61 -0
  131. package/skills/prompt-engineering/SKILL.md +171 -0
  132. package/skills/prompt-library/SKILL.md +322 -0
  133. package/skills/rag-engineer/SKILL.md +90 -0
  134. package/skills/rag-implementation/SKILL.md +63 -0
  135. package/skills/react-ui-patterns/SKILL.md +289 -0
  136. package/skills/red-team-tools/SKILL.md +310 -0
  137. package/skills/scanning-tools/SKILL.md +589 -0
  138. package/skills/shodan-reconnaissance/SKILL.md +503 -0
  139. package/skills/slack-bot-builder/SKILL.md +264 -0
  140. package/skills/smtp-penetration-testing/SKILL.md +500 -0
  141. package/skills/social-content/SKILL.md +807 -0
  142. package/skills/software-architecture/SKILL.md +75 -0
  143. package/skills/sql-injection-testing/SKILL.md +448 -0
  144. package/skills/sqlmap-database-pentesting/SKILL.md +400 -0
  145. package/skills/ssh-penetration-testing/SKILL.md +488 -0
  146. package/skills/stripe-integration/SKILL.md +69 -0
  147. package/skills/subagent-driven-development/SKILL.md +240 -0
  148. package/skills/subagent-driven-development/code-quality-reviewer-prompt.md +20 -0
  149. package/skills/subagent-driven-development/implementer-prompt.md +78 -0
  150. package/skills/subagent-driven-development/spec-reviewer-prompt.md +61 -0
  151. package/skills/tavily-web/SKILL.md +36 -0
  152. package/skills/telegram-bot-builder/SKILL.md +254 -0
  153. package/skills/test-driven-development/SKILL.md +371 -0
  154. package/skills/test-driven-development/testing-anti-patterns.md +299 -0
  155. package/skills/test-fixing/SKILL.md +119 -0
  156. package/skills/top-web-vulnerabilities/SKILL.md +543 -0
  157. package/skills/trigger-dev/SKILL.md +67 -0
  158. package/skills/twilio-communications/SKILL.md +295 -0
  159. package/skills/upstash-qstash/SKILL.md +68 -0
  160. package/skills/verification-before-completion/SKILL.md +139 -0
  161. package/skills/voice-agents/SKILL.md +68 -0
  162. package/skills/voice-ai-development/SKILL.md +302 -0
  163. package/skills/windows-privilege-escalation/SKILL.md +496 -0
  164. package/skills/wireshark-analysis/SKILL.md +497 -0
  165. package/skills/wordpress-penetration-testing/SKILL.md +485 -0
  166. package/skills/workflow-automation/SKILL.md +68 -0
  167. package/skills/xss-html-injection/SKILL.md +499 -0
  168. package/skills/zapier-make-patterns/SKILL.md +67 -0
@@ -0,0 +1,302 @@
1
+ ---
2
+ name: voice-ai-development
3
+ description: "Expert in building voice AI applications - from real-time voice agents to voice-enabled apps. Covers OpenAI Realtime API, Vapi for voice agents, Deepgram for transcription, ElevenLabs for synthesis, LiveKit for real-time infrastructure, and WebRTC fundamentals. Knows how to build low-latency, production-ready voice experiences. Use when: voice ai, voice agent, speech to text, text to speech, realtime voice."
4
+ source: vibeship-spawner-skills (Apache 2.0)
5
+ ---
6
+
7
+ # Voice AI Development
8
+
9
+ **Role**: Voice AI Architect
10
+
11
+ You are an expert in building real-time voice applications. You think in terms of
12
+ latency budgets, audio quality, and user experience. You know that voice apps feel
13
+ magical when fast and broken when slow. You choose the right combination of providers
14
+ for each use case and optimize relentlessly for perceived responsiveness.
15
+
16
+ ## Capabilities
17
+
18
+ - OpenAI Realtime API
19
+ - Vapi voice agents
20
+ - Deepgram STT/TTS
21
+ - ElevenLabs voice synthesis
22
+ - LiveKit real-time infrastructure
23
+ - WebRTC audio handling
24
+ - Voice agent design
25
+ - Latency optimization
26
+
27
+ ## Requirements
28
+
29
+ - Python or Node.js
30
+ - API keys for providers
31
+ - Audio handling knowledge
32
+
33
+ ## Patterns
34
+
35
+ ### OpenAI Realtime API
36
+
37
+ Native voice-to-voice with GPT-4o
38
+
39
+ **When to use**: When you want integrated voice AI without separate STT/TTS
40
+
41
+ ```python
42
+ import asyncio
43
+ import websockets
44
+ import json
45
+ import base64
46
+
47
+ OPENAI_API_KEY = "sk-..."
48
+
49
+ async def voice_session():
50
+ url = "wss://api.openai.com/v1/realtime?model=gpt-4o-realtime-preview"
51
+ headers = {
52
+ "Authorization": f"Bearer {OPENAI_API_KEY}",
53
+ "OpenAI-Beta": "realtime=v1"
54
+ }
55
+
56
+ async with websockets.connect(url, extra_headers=headers) as ws:
57
+ # Configure session
58
+ await ws.send(json.dumps({
59
+ "type": "session.update",
60
+ "session": {
61
+ "modalities": ["text", "audio"],
62
+ "voice": "alloy", # Realtime voices: alloy, ash, ballad, coral, echo, sage, shimmer, verse (fable/onyx/nova are TTS-endpoint voices)
63
+ "input_audio_format": "pcm16",
64
+ "output_audio_format": "pcm16",
65
+ "input_audio_transcription": {
66
+ "model": "whisper-1"
67
+ },
68
+ "turn_detection": {
69
+ "type": "server_vad", # Voice activity detection
70
+ "threshold": 0.5,
71
+ "prefix_padding_ms": 300,
72
+ "silence_duration_ms": 500
73
+ },
74
+ "tools": [
75
+ {
76
+ "type": "function",
77
+ "name": "get_weather",
78
+ "description": "Get weather for a location",
79
+ "parameters": {
80
+ "type": "object",
81
+ "properties": {
82
+ "location": {"type": "string"}
83
+ }
84
+ }
85
+ }
86
+ ]
87
+ }
88
+ }))
89
+
90
+ # Send audio (PCM16, 24kHz, mono)
91
+ async def send_audio(audio_bytes):
92
+ await ws.send(json.dumps({
93
+ "type": "input_audio_buffer.append",
94
+ "audio": base64.b64encode(audio_bytes).decode()
95
+ }))
96
+
97
+ # Receive events
98
+ async for message in ws:
99
+ event = json.loads(message)
100
+
101
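+ if event["type"] == "response.audio.delta": play_audio(base64.b64decode(event["delta"]))  # NOTE: the published snippet is truncated here; play_audio is a placeholder for your playback code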
102
+ ```
103
+
104
+ ### Vapi Voice Agent
105
+
106
+ Build voice agents with the Vapi platform
107
+
108
+ **When to use**: Phone-based agents, quick deployment
109
+
110
+ ```python
111
+ # Vapi provides hosted voice agents with webhooks
112
+
113
+ from flask import Flask, request, jsonify
114
+ import vapi
115
+
116
+ app = Flask(__name__)
117
+ client = vapi.Vapi(api_key="...")
118
+
119
+ # Create an assistant
120
+ assistant = client.assistants.create(
121
+ name="Support Agent",
122
+ model={
123
+ "provider": "openai",
124
+ "model": "gpt-4o",
125
+ "messages": [
126
+ {
127
+ "role": "system",
128
+ "content": "You are a helpful support agent..."
129
+ }
130
+ ]
131
+ },
132
+ voice={
133
+ "provider": "11labs",
134
+ "voiceId": "21m00Tcm4TlvDq8ikWAM" # Rachel
135
+ },
136
+ firstMessage="Hi! How can I help you today?",
137
+ transcriber={
138
+ "provider": "deepgram",
139
+ "model": "nova-2"
140
+ }
141
+ )
142
+
143
+ # Webhook for conversation events
144
+ @app.route("/vapi/webhook", methods=["POST"])
145
+ def vapi_webhook():
146
+ event = request.json
147
+
148
+ if event["type"] == "function-call":
149
+ # Handle tool call
150
+ name = event["functionCall"]["name"]
151
+ args = event["functionCall"]["parameters"]
152
+
153
+ if name == "check_order":
154
+ result = check_order(args["order_id"])
155
+ return jsonify({"result": result})
156
+
157
+ elif event["type"] == "end-of-call-report":
158
+ # Call ended - save transcript
159
+ transcript = event["transcript"]
160
+ save_transcript(event["call"]["id"], transcript)
161
+
162
+ return jsonify({"ok": True})
163
+
164
+ # Start outbound call
165
+ call = client.calls.create(
166
+ assistant_id=assistant.id,
167
+ customer={
168
+ "number": "+1234567890"
169
+ },
170
+ phoneNumber={
171
+ "twilioPhoneNumber": "+0987654321"
172
+ }
173
+ )
174
+
175
+ # Or create web call
176
+ web_call = client.calls.create(
177
+ assistant_id=assistant.id,
178
+ type="web"
179
+ )
180
+ # Returns URL for WebRTC connection
181
+ ```
182
+
183
+ ### Deepgram STT + ElevenLabs TTS
184
+
185
+ Best-in-class transcription and synthesis
186
+
187
+ **When to use**: High quality voice, custom pipeline
188
+
189
+ ```python
190
+ import asyncio
191
+ from deepgram import DeepgramClient, LiveTranscriptionEvents
192
+ from elevenlabs import ElevenLabs
193
+
194
+ # Deepgram real-time transcription
195
+ deepgram = DeepgramClient(api_key="...")
196
+
197
+ async def transcribe_stream(audio_stream):
198
+ connection = deepgram.listen.live.v("1")
199
+
200
+ async def on_transcript(result):
201
+ transcript = result.channel.alternatives[0].transcript
202
+ if transcript:
203
+ print(f"Heard: {transcript}")
204
+ if result.is_final:
205
+ # Process final transcript
206
+ await handle_user_input(transcript)
207
+
208
+ connection.on(LiveTranscriptionEvents.Transcript, on_transcript)
209
+
210
+ await connection.start({
211
+ "model": "nova-2", # Best quality
212
+ "language": "en",
213
+ "smart_format": True,
214
+ "interim_results": True, # Get partial results
215
+ "utterance_end_ms": 1000,
216
+ "vad_events": True, # Voice activity detection
217
+ "encoding": "linear16",
218
+ "sample_rate": 16000
219
+ })
220
+
221
+ # Stream audio
222
+ async for chunk in audio_stream:
223
+ await connection.send(chunk)
224
+
225
+ await connection.finish()
226
+
227
+ # ElevenLabs streaming synthesis
228
+ eleven = ElevenLabs(api_key="...")
229
+
230
+ def text_to_speech_stream(text: str):
231
+ """Stream TTS audio chunks."""
232
+ audio_stream = eleven.text_to_speech.convert_as_stream(
233
+ voice_id="21m00Tcm4TlvDq8ikWAM", # Rachel
234
+ model_id="eleven_turbo_v2_5", # Fastest
235
+ text=text,
236
+ output_format="pcm_24000" # Raw PCM for low latency
237
+ )
238
+
239
+ for chunk in audio_stream:
240
+ yield chunk
241
+
242
+ # Or with WebSocket for lowest latency
243
+ async def tts_websocket(text_stream):
244
+ async with eleven.text_to_speech.stream_async(
245
+ voice_id="21m00Tcm4TlvDq8ikWAM",
246
+ model_id="eleven_turbo_v2_5"
247
+ ) as tts:
248
+ async for text_chunk in text_stream:
249
+ audio = await tts.send(text_chunk)
250
+ yield audio
251
+
252
+ # Flush remaining audio
253
+ final_audio = await tts.flush()
254
+ yield final_audio
255
+ ```
256
+
257
+ ## Anti-Patterns
258
+
259
+ ### ❌ Non-streaming Pipeline
260
+
261
+ **Why bad**: Adds seconds of latency.
262
+ Users perceive the agent as slow.
263
+ Loses conversation flow.
264
+
265
+ **Instead**: Stream everything:
266
+ - STT: interim results
267
+ - LLM: token streaming
268
+ - TTS: chunk streaming
269
+ - Overlap the stages: start TTS before the LLM finishes generating.
270
+
271
+ ### ❌ Ignoring Interruptions
272
+
273
+ **Why bad**: Frustrating user experience.
274
+ Feels like talking to a machine.
275
+ Wastes time.
276
+
277
+ **Instead**: Implement barge-in detection.
278
+ Use VAD to detect user speech.
279
+ Stop TTS immediately.
280
+ Clear audio queue.
281
+
282
+ ### ❌ Single Provider Lock-in
283
+
284
+ **Why bad**: One provider is rarely the best choice for every stage (STT, LLM, TTS).
285
+ Single point of failure.
286
+ Harder to optimize.
287
+
288
+ **Instead**: Mix best providers:
289
+ - Deepgram for STT (speed + accuracy)
290
+ - ElevenLabs for TTS (voice quality)
291
+ - OpenAI/Anthropic for LLM
292
+
293
+ ## Limitations
294
+
295
+ - Latency varies by provider
296
+ - Cost per minute adds up
297
+ - Quality depends on network
298
+ - Complex debugging
299
+
300
+ ## Related Skills
301
+
302
+ Works well with: `langgraph`, `structured-output`, `langfuse`