@laitszkin/apollo-toolkit 3.13.2 → 3.14.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (154) hide show
  1. package/AGENTS.md +7 -7
  2. package/CHANGELOG.md +27 -0
  3. package/CLAUDE.md +8 -8
  4. package/analyse-app-logs/SKILL.md +3 -3
  5. package/bin/apollo-toolkit.ts +7 -0
  6. package/codex/codex-memory-manager/SKILL.md +2 -2
  7. package/codex/learn-skill-from-conversations/SKILL.md +3 -3
  8. package/dist/bin/apollo-toolkit.d.ts +2 -0
  9. package/dist/bin/apollo-toolkit.js +7 -0
  10. package/dist/lib/cli.d.ts +41 -0
  11. package/dist/lib/cli.js +655 -0
  12. package/dist/lib/installer.d.ts +59 -0
  13. package/dist/lib/installer.js +404 -0
  14. package/dist/lib/tool-runner.d.ts +19 -0
  15. package/dist/lib/tool-runner.js +536 -0
  16. package/dist/lib/tools/architecture.d.ts +2 -0
  17. package/dist/lib/tools/architecture.js +34 -0
  18. package/dist/lib/tools/create-specs.d.ts +2 -0
  19. package/dist/lib/tools/create-specs.js +175 -0
  20. package/dist/lib/tools/docs-to-voice.d.ts +2 -0
  21. package/dist/lib/tools/docs-to-voice.js +705 -0
  22. package/dist/lib/tools/enforce-video-aspect-ratio.d.ts +2 -0
  23. package/dist/lib/tools/enforce-video-aspect-ratio.js +312 -0
  24. package/dist/lib/tools/extract-conversations.d.ts +2 -0
  25. package/dist/lib/tools/extract-conversations.js +105 -0
  26. package/dist/lib/tools/extract-pdf-text.d.ts +2 -0
  27. package/dist/lib/tools/extract-pdf-text.js +92 -0
  28. package/dist/lib/tools/filter-logs.d.ts +2 -0
  29. package/dist/lib/tools/filter-logs.js +94 -0
  30. package/dist/lib/tools/find-github-issues.d.ts +2 -0
  31. package/dist/lib/tools/find-github-issues.js +176 -0
  32. package/dist/lib/tools/generate-storyboard-images.d.ts +2 -0
  33. package/dist/lib/tools/generate-storyboard-images.js +419 -0
  34. package/dist/lib/tools/log-cli-utils.d.ts +35 -0
  35. package/dist/lib/tools/log-cli-utils.js +233 -0
  36. package/dist/lib/tools/open-github-issue.d.ts +2 -0
  37. package/dist/lib/tools/open-github-issue.js +750 -0
  38. package/dist/lib/tools/read-github-issue.d.ts +2 -0
  39. package/dist/lib/tools/read-github-issue.js +134 -0
  40. package/dist/lib/tools/render-error-book.d.ts +2 -0
  41. package/dist/lib/tools/render-error-book.js +265 -0
  42. package/dist/lib/tools/render-katex.d.ts +2 -0
  43. package/dist/lib/tools/render-katex.js +294 -0
  44. package/dist/lib/tools/review-threads.d.ts +2 -0
  45. package/dist/lib/tools/review-threads.js +491 -0
  46. package/dist/lib/tools/search-logs.d.ts +2 -0
  47. package/dist/lib/tools/search-logs.js +164 -0
  48. package/dist/lib/tools/sync-memory-index.d.ts +2 -0
  49. package/dist/lib/tools/sync-memory-index.js +113 -0
  50. package/dist/lib/tools/validate-openai-agent-config.d.ts +2 -0
  51. package/dist/lib/tools/validate-openai-agent-config.js +184 -0
  52. package/dist/lib/tools/validate-skill-frontmatter.d.ts +2 -0
  53. package/dist/lib/tools/validate-skill-frontmatter.js +118 -0
  54. package/dist/lib/types.d.ts +82 -0
  55. package/dist/lib/types.js +2 -0
  56. package/dist/lib/updater.d.ts +34 -0
  57. package/dist/lib/updater.js +112 -0
  58. package/dist/lib/utils/format.d.ts +2 -0
  59. package/dist/lib/utils/format.js +6 -0
  60. package/dist/lib/utils/terminal.d.ts +12 -0
  61. package/dist/lib/utils/terminal.js +26 -0
  62. package/docs-to-voice/SKILL.md +0 -1
  63. package/generate-spec/SKILL.md +1 -1
  64. package/katex/SKILL.md +1 -2
  65. package/lib/cli.ts +780 -0
  66. package/lib/installer.ts +466 -0
  67. package/lib/tool-runner.ts +561 -0
  68. package/lib/tools/architecture.ts +34 -0
  69. package/lib/tools/create-specs.ts +204 -0
  70. package/lib/tools/docs-to-voice.ts +799 -0
  71. package/lib/tools/enforce-video-aspect-ratio.ts +368 -0
  72. package/lib/tools/extract-conversations.ts +114 -0
  73. package/lib/tools/extract-pdf-text.ts +99 -0
  74. package/lib/tools/filter-logs.ts +118 -0
  75. package/lib/tools/find-github-issues.ts +211 -0
  76. package/lib/tools/generate-storyboard-images.ts +455 -0
  77. package/lib/tools/log-cli-utils.ts +262 -0
  78. package/lib/tools/open-github-issue.ts +930 -0
  79. package/lib/tools/read-github-issue.ts +179 -0
  80. package/lib/tools/render-error-book.ts +300 -0
  81. package/lib/tools/render-katex.ts +325 -0
  82. package/lib/tools/review-threads.ts +590 -0
  83. package/lib/tools/search-logs.ts +200 -0
  84. package/lib/tools/sync-memory-index.ts +114 -0
  85. package/lib/tools/validate-openai-agent-config.ts +209 -0
  86. package/lib/tools/validate-skill-frontmatter.ts +124 -0
  87. package/lib/types.ts +90 -0
  88. package/lib/updater.ts +165 -0
  89. package/lib/utils/format.ts +7 -0
  90. package/lib/utils/terminal.ts +22 -0
  91. package/open-github-issue/SKILL.md +2 -2
  92. package/optimise-skill/SKILL.md +1 -1
  93. package/package.json +13 -4
  94. package/resources/project-architecture/assets/architecture.css +764 -0
  95. package/resources/project-architecture/assets/viewer.client.js +144 -0
  96. package/resources/project-architecture/index.html +42 -0
  97. package/review-spec-related-changes/SKILL.md +1 -1
  98. package/solve-issues-found-during-review/SKILL.md +2 -1
  99. package/tsconfig.json +28 -0
  100. package/analyse-app-logs/scripts/__pycache__/filter_logs_by_time.cpython-312.pyc +0 -0
  101. package/analyse-app-logs/scripts/__pycache__/log_cli_utils.cpython-312.pyc +0 -0
  102. package/analyse-app-logs/scripts/__pycache__/search_logs.cpython-312.pyc +0 -0
  103. package/analyse-app-logs/scripts/filter_logs_by_time.py +0 -64
  104. package/analyse-app-logs/scripts/log_cli_utils.py +0 -112
  105. package/analyse-app-logs/scripts/search_logs.py +0 -137
  106. package/analyse-app-logs/tests/test_filter_logs_by_time.py +0 -95
  107. package/analyse-app-logs/tests/test_search_logs.py +0 -100
  108. package/codex/codex-memory-manager/scripts/extract_recent_conversations.py +0 -369
  109. package/codex/codex-memory-manager/scripts/sync_memory_index.py +0 -130
  110. package/codex/codex-memory-manager/tests/test_extract_recent_conversations.py +0 -177
  111. package/codex/codex-memory-manager/tests/test_memory_template.py +0 -37
  112. package/codex/codex-memory-manager/tests/test_sync_memory_index.py +0 -84
  113. package/codex/learn-skill-from-conversations/scripts/extract_recent_conversations.py +0 -369
  114. package/codex/learn-skill-from-conversations/tests/test_extract_recent_conversations.py +0 -177
  115. package/docs-to-voice/scripts/__pycache__/docs_to_voice.cpython-312.pyc +0 -0
  116. package/docs-to-voice/scripts/docs_to_voice.py +0 -1385
  117. package/docs-to-voice/scripts/docs_to_voice.sh +0 -11
  118. package/docs-to-voice/tests/test_docs_to_voice_api_max_chars.py +0 -210
  119. package/docs-to-voice/tests/test_docs_to_voice_sentence_timeline.py +0 -115
  120. package/docs-to-voice/tests/test_docs_to_voice_settings.py +0 -43
  121. package/docs-to-voice/tests/test_docs_to_voice_shell_wrapper.py +0 -51
  122. package/docs-to-voice/tests/test_docs_to_voice_speech_rate.py +0 -57
  123. package/generate-spec/scripts/__pycache__/create-specs.cpython-312.pyc +0 -0
  124. package/generate-spec/scripts/create-specs +0 -215
  125. package/generate-spec/tests/test_create_specs.py +0 -200
  126. package/init-project-html/scripts/architecture-bootstrap-render.js +0 -16
  127. package/init-project-html/scripts/architecture.js +0 -296
  128. package/katex/scripts/__pycache__/render_katex.cpython-312.pyc +0 -0
  129. package/katex/scripts/render_katex.py +0 -247
  130. package/katex/scripts/render_katex.sh +0 -11
  131. package/katex/tests/test_render_katex.py +0 -174
  132. package/learning-error-book/scripts/render_error_book_json_to_pdf.py +0 -590
  133. package/learning-error-book/tests/test_render_error_book_json_to_pdf.py +0 -134
  134. package/open-github-issue/scripts/__pycache__/open_github_issue.cpython-312.pyc +0 -0
  135. package/open-github-issue/scripts/open_github_issue.py +0 -705
  136. package/open-github-issue/tests/test_open_github_issue.py +0 -381
  137. package/openai-text-to-image-storyboard/scripts/generate_storyboard_images.py +0 -763
  138. package/openai-text-to-image-storyboard/tests/test_generate_storyboard_images.py +0 -177
  139. package/read-github-issue/scripts/__pycache__/find_issues.cpython-312.pyc +0 -0
  140. package/read-github-issue/scripts/__pycache__/read_issue.cpython-312.pyc +0 -0
  141. package/read-github-issue/scripts/find_issues.py +0 -148
  142. package/read-github-issue/scripts/read_issue.py +0 -108
  143. package/read-github-issue/tests/test_find_issues.py +0 -127
  144. package/read-github-issue/tests/test_read_issue.py +0 -109
  145. package/resolve-review-comments/scripts/__pycache__/review_threads.cpython-312.pyc +0 -0
  146. package/resolve-review-comments/scripts/review_threads.py +0 -425
  147. package/resolve-review-comments/tests/test_review_threads.py +0 -74
  148. package/scripts/validate_openai_agent_config.py +0 -209
  149. package/scripts/validate_skill_frontmatter.py +0 -131
  150. package/text-to-short-video/scripts/__pycache__/enforce_video_aspect_ratio.cpython-312.pyc +0 -0
  151. package/text-to-short-video/scripts/enforce_video_aspect_ratio.py +0 -350
  152. package/text-to-short-video/tests/test_enforce_video_aspect_ratio.py +0 -194
  153. package/weekly-financial-event-report/scripts/extract_pdf_text_pdfkit.swift +0 -99
  154. package/weekly-financial-event-report/tests/test_extract_pdf_text_pdfkit.py +0 -64
@@ -0,0 +1,799 @@
1
+ import { spawn, execSync } from 'node:child_process';
+ import fs from 'node:fs';
+ import http from 'node:http';
+ import https from 'node:https';
+ import os from 'node:os';
+ import path from 'node:path';
+ import type { ToolContext } from '../types';
7
+
8
+ const DEFAULT_API_ENDPOINT =
9
+ 'https://dashscope-intl.aliyuncs.com/api/v1/services/aigc/multimodal-generation/generation';
10
+ const DEFAULT_API_MODEL = 'qwen3-tts';
11
+ const DEFAULT_API_VOICE = 'Cherry';
12
+
13
+ interface DocsToVoiceArgs {
14
+ inputText: string | null;
15
+ inputFile: string | null;
16
+ projectDir: string;
17
+ projectName: string | null;
18
+ outputName: string | null;
19
+ mode: string;
20
+ voice: string | null;
21
+ rate: string | null;
22
+ speechRate: string | null;
23
+ apiEndpoint: string;
24
+ apiModel: string;
25
+ apiVoice: string;
26
+ apiKey: string | null;
27
+ maxChars: string | null;
28
+ noAutoProsody: boolean;
29
+ force: boolean;
30
+ help: boolean;
31
+ }
32
+
33
+ interface TimelineEntry {
34
+ index: number;
35
+ text: string;
36
+ startSeconds: number;
37
+ endSeconds: number;
38
+ startMs: number;
39
+ endMs: number;
40
+ }
41
+
42
+ function parseArgs(args: string[]): DocsToVoiceArgs {
43
+ const parsed: DocsToVoiceArgs = {
44
+ inputText: null,
45
+ inputFile: null,
46
+ projectDir: '.',
47
+ projectName: null,
48
+ outputName: null,
49
+ mode: 'say',
50
+ voice: null,
51
+ rate: null,
52
+ speechRate: null,
53
+ apiEndpoint: DEFAULT_API_ENDPOINT,
54
+ apiModel: DEFAULT_API_MODEL,
55
+ apiVoice: DEFAULT_API_VOICE,
56
+ apiKey: null,
57
+ maxChars: null,
58
+ noAutoProsody: false,
59
+ force: false,
60
+ help: false,
61
+ };
62
+
63
+ for (let i = 0; i < args.length; i++) {
64
+ const arg = args[i];
65
+ if (arg === '--help' || arg === '-h') {
66
+ parsed.help = true;
67
+ continue;
68
+ }
69
+ if (arg.startsWith('--')) {
70
+ const eqIndex = arg.indexOf('=');
71
+ let key: string;
72
+ let value: string;
73
+
74
+ if (eqIndex !== -1) {
75
+ key = arg.slice(2, eqIndex);
76
+ value = arg.slice(eqIndex + 1);
77
+ } else {
78
+ key = arg.slice(2);
79
+ value = args[++i] || '';
80
+ }
81
+
82
+ switch (key) {
83
+ case 'text':
84
+ parsed.inputText = value;
85
+ break;
86
+ case 'input':
87
+ case 'input-file':
88
+ parsed.inputFile = value;
89
+ break;
90
+ case 'project-dir':
91
+ parsed.projectDir = value;
92
+ break;
93
+ case 'project-name':
94
+ parsed.projectName = value;
95
+ break;
96
+ case 'output-name':
97
+ parsed.outputName = value;
98
+ break;
99
+ case 'engine':
100
+ case 'mode':
101
+ parsed.mode = value.toLowerCase();
102
+ break;
103
+ case 'voice':
104
+ parsed.voice = value;
105
+ break;
106
+ case 'rate':
107
+ parsed.rate = value;
108
+ break;
109
+ case 'speech-rate':
110
+ parsed.speechRate = value;
111
+ break;
112
+ case 'api-endpoint':
113
+ parsed.apiEndpoint = value;
114
+ break;
115
+ case 'api-model':
116
+ parsed.apiModel = value;
117
+ break;
118
+ case 'api-voice':
119
+ parsed.apiVoice = value;
120
+ break;
121
+ case 'api-key':
122
+ parsed.apiKey = value;
123
+ break;
124
+ case 'max-chars':
125
+ parsed.maxChars = value;
126
+ break;
127
+ case 'no-auto-prosody':
128
+ parsed.noAutoProsody = true;
129
+ break;
130
+ case 'force':
131
+ parsed.force = true;
132
+ break;
133
+ }
134
+ }
135
+ }
136
+
137
+ return parsed;
138
+ }
139
+
140
+ function readInputText(opts: DocsToVoiceArgs): string {
141
+ if (opts.inputFile) {
142
+ const inputPath = path.resolve(opts.inputFile);
143
+ if (!fs.existsSync(inputPath)) {
144
+ throw new Error(`Input file not found: ${inputPath}`);
145
+ }
146
+ return fs.readFileSync(inputPath, 'utf-8');
147
+ }
148
+ return opts.inputText || '';
149
+ }
150
+
151
+ function splitSentences(rawText: string): string[] {
152
+ const endings = new Set(['。', '!', '?', '!', '?', ';', ';']);
153
+ const sentences: string[] = [];
154
+
155
+ for (const rawLine of rawText.split('\n')) {
156
+ const line = rawLine.trim();
157
+ if (!line) continue;
158
+
159
+ let current: string[] = [];
160
+ for (const char of line) {
161
+ current.push(char);
162
+ if (endings.has(char)) {
163
+ const sentence = current.join('').trim();
164
+ if (sentence) sentences.push(sentence);
165
+ current = [];
166
+ }
167
+ }
168
+ const tail = current.join('').trim();
169
+ if (tail) sentences.push(tail);
170
+ }
171
+
172
+ return sentences;
173
+ }
174
+
175
+ function sentenceWeight(sentence: string): number {
176
+ const compact = sentence.replace(/\s+/g, '');
177
+ if (!compact) return 1.0;
178
+
179
+ let total = 0.0;
180
+ for (const char of compact) {
181
+ if (/[A-Za-z0-9]/.test(char)) {
182
+ total += 0.55;
183
+ } else if (/[一-鿿]/.test(char)) {
184
+ total += 1.0;
185
+ } else if (',,、::'.includes(char)) {
186
+ total += 0.25;
187
+ } else if ('。.!!??;;'.includes(char)) {
188
+ total += 0.45;
189
+ } else {
190
+ total += 0.65;
191
+ }
192
+ }
193
+ return Math.max(total, 1.0);
194
+ }
195
+
196
+ function srtTime(seconds: number): string {
197
+ const ms = Math.max(0, Math.round(seconds * 1000));
198
+ const h = Math.floor(ms / 3600000);
199
+ const m = Math.floor((ms % 3600000) / 60000);
200
+ const s = Math.floor((ms % 60000) / 1000);
201
+ const ml = ms % 1000;
202
+ return `${String(h).padStart(2, '0')}:${String(m).padStart(2, '0')}:${String(s).padStart(2, '0')},${String(ml).padStart(3, '0')}`;
203
+ }
204
+
205
+ function readDurationSeconds(filePath: string): number | null {
206
+ try {
207
+ const ext = path.extname(filePath).toLowerCase();
208
+ if (ext === '.wav') {
209
+ const header = Buffer.alloc(44);
210
+ const fd = fs.openSync(filePath, 'r');
211
+ fs.readSync(fd, header, 0, 44, 0);
212
+ fs.closeSync(fd);
213
+ const dataSize = header.readUInt32LE(40);
214
+ const sampleRate = header.readUInt32LE(24);
215
+ const channels = header.readUInt16LE(22);
216
+ const bitsPerSample = header.readUInt16LE(34);
217
+ const bytesPerSec = sampleRate * channels * (bitsPerSample / 8);
218
+ if (bytesPerSec > 0) {
219
+ return dataSize / bytesPerSec;
220
+ }
221
+ }
222
+ } catch {
223
+ // fallback to afinfo
224
+ }
225
+
226
+ // Try afinfo on macOS
227
+ try {
228
+ const output = execSync(`afinfo "${filePath}" 2>/dev/null`, {
229
+ encoding: 'utf-8',
230
+ timeout: 5000,
231
+ });
232
+ const match = output.match(/estimated duration:\s*([0-9.]+)\s*sec/i) ||
233
+ output.match(/duration:\s*([0-9.]+)\s*sec/i);
234
+ if (match) return parseFloat(match[1]);
235
+ } catch {
236
+ // ignore
237
+ }
238
+
239
+ return null;
240
+ }
241
+
242
/**
 * Write `<audio>.timeline.json` and `<audio>.srt` sentence-timing files
 * next to the generated audio file.
 *
 * Sentence boundaries come from splitSentences(sourceText). Start/end times
 * are derived one of two ways:
 *  - when `sentenceDurations` is supplied and matches the sentence count,
 *    each measured duration is scaled so the sum matches the real audio
 *    length ("sentence-audio" mode);
 *  - otherwise durations are estimated proportionally from per-sentence
 *    character weights ("estimated" mode).
 * The last entry is always pinned to the total audio duration.
 *
 * @param sourceText        original text the audio was generated from
 * @param audioPath         path to the finished audio file
 * @param sentenceDurations measured per-sentence durations in seconds, or null
 */
function writeTimelineFiles(
  sourceText: string,
  audioPath: string,
  sentenceDurations: number[] | null,
): void {
  const sentences = splitSentences(sourceText);
  if (sentences.length === 0) {
    // No recognizable sentences: treat the whole trimmed text as one entry.
    const stripped = sourceText.trim();
    if (stripped) sentences.push(stripped);
  }
  if (sentences.length === 0) return;

  // Fallback estimate of 2s per sentence when the duration probe fails.
  const durationSeconds = readDurationSeconds(audioPath) || sentences.length * 2;

  const entries: TimelineEntry[] = [];
  let cursor = 0;

  if (sentenceDurations && sentenceDurations.length === sentences.length) {
    // Measured mode: rescale measured durations so their sum matches the
    // actual output duration (concat/encoding can shift totals slightly).
    const totalDuration = sentenceDurations.reduce((a, b) => a + b, 0);
    const scale = totalDuration > 0 ? durationSeconds / totalDuration : 1;

    for (let i = 0; i < sentences.length; i++) {
      // Last sentence is forced to end exactly at the audio's end.
      const end = i === sentences.length - 1
        ? durationSeconds
        : cursor + sentenceDurations[i] * scale;
      entries.push({
        index: i + 1,
        text: sentences[i],
        startSeconds: Math.round(cursor * 1000) / 1000,
        endSeconds: Math.round(Math.max(end, cursor) * 1000) / 1000,
        startMs: Math.round(cursor * 1000),
        endMs: Math.round(Math.max(end, cursor) * 1000),
      });
      // Math.max guards against a negative/zero-length interval.
      cursor = Math.max(end, cursor);
    }
  } else {
    // Estimated mode: distribute total duration by character weight.
    const weights = sentences.map(sentenceWeight);
    const totalWeight = weights.reduce((a, b) => a + b, 0) || sentences.length;

    for (let i = 0; i < sentences.length; i++) {
      const end = i === sentences.length - 1
        ? durationSeconds
        : cursor + (durationSeconds * weights[i] / totalWeight);
      entries.push({
        index: i + 1,
        text: sentences[i],
        startSeconds: Math.round(cursor * 1000) / 1000,
        endSeconds: Math.round(Math.max(end, cursor) * 1000) / 1000,
        startMs: Math.round(cursor * 1000),
        endMs: Math.round(Math.max(end, cursor) * 1000),
      });
      cursor = Math.max(end, cursor);
    }
  }

  // Ensure last entry ends at total duration
  if (entries.length > 0) {
    entries[entries.length - 1].endSeconds = Math.round(durationSeconds * 1000) / 1000;
    entries[entries.length - 1].endMs = Math.round(durationSeconds * 1000);
  }

  // Sibling path without the audio extension, e.g. out.wav -> out.
  const timelineBase = audioPath.replace(/\.[^.]+$/, '');

  // Write JSON timeline
  const jsonPayload = {
    audio_file: path.basename(audioPath),
    audio_path: audioPath,
    audio_duration_seconds: Math.round(durationSeconds * 1000) / 1000,
    timing_mode: sentenceDurations ? 'sentence-audio' : 'estimated',
    generated_at: new Date().toISOString(),
    sentences: entries,
  };
  fs.writeFileSync(`${timelineBase}.timeline.json`, JSON.stringify(jsonPayload, null, 2) + '\n', 'utf-8');

  // Write SRT (cue number, time range, text, blank separator)
  const srtLines: string[] = [];
  for (const entry of entries) {
    srtLines.push(String(entry.index));
    srtLines.push(`${srtTime(entry.startSeconds)} --> ${srtTime(entry.endSeconds)}`);
    srtLines.push(entry.text);
    srtLines.push('');
  }
  fs.writeFileSync(`${timelineBase}.srt`, srtLines.join('\n').trim() + '\n', 'utf-8');
}
326
+
327
+ function buildAutoProsodyText(rawText: string): string {
328
+ return rawText
329
+ .replace(/\n{2,}/g, ' [[slnc 260]] ')
330
+ .replace(/\n/g, ' [[slnc 90]] ')
331
+ .replace(/[,,、::]/g, (m) => `${m} [[slnc 120]] `)
332
+ .replace(/[。.]/g, (m) => `${m} [[slnc 180]] `)
333
+ .replace(/[??]/g, (m) => `${m} [[slnc 190]] `)
334
+ .replace(/[!!]/g, (m) => `${m} [[slnc 150]] `)
335
+ .replace(/[ \t]{2,}/g, ' ');
336
+ }
337
+
338
+ function applySpeechRateToAudio(outputPath: string, speechRate: number): void {
339
+ if (Math.abs(speechRate - 1.0) < 1e-9) return;
340
+
341
+ const tmpPath = `${outputPath}.rate_tmp${path.extname(outputPath)}`;
342
+ try {
343
+ execSync(
344
+ `ffmpeg -hide_banner -loglevel error -y -i "${outputPath}" -filter:a "atempo=${speechRate}" "${tmpPath}"`,
345
+ { stdio: 'ignore', timeout: 120000 },
346
+ );
347
+ if (fs.existsSync(tmpPath) && fs.statSync(tmpPath).size > 0) {
348
+ fs.renameSync(tmpPath, outputPath);
349
+ }
350
+ } catch (err: unknown) {
351
+ if (fs.existsSync(tmpPath)) fs.unlinkSync(tmpPath);
352
+ throw new Error(
353
+ `ffmpeg failed while applying --speech-rate: ${err instanceof Error ? err.message : 'unknown error'}`,
354
+ );
355
+ }
356
+ }
357
+
358
+ function splitTextForTts(text: string, maxChars: number | null): string[] {
359
+ text = text.replace(/\r\n/g, '\n').replace(/\r/g, '\n').trim();
360
+ if (!text) return [];
361
+
362
+ if (!maxChars || text.length <= maxChars) return [text];
363
+
364
+ const chunks: string[] = [];
365
+ const paragraphs = text.split(/\n{2,}/).map((p) => p.trim()).filter(Boolean);
366
+
367
+ for (const paragraph of paragraphs) {
368
+ const sentences = paragraph
369
+ .split(/(?<=[。!?!?;;.!?])/)
370
+ .map((s) => s.trim())
371
+ .filter(Boolean);
372
+
373
+ let current = '';
374
+ for (const sentence of sentences) {
375
+ if (sentence.length > maxChars) {
376
+ if (current) {
377
+ chunks.push(current);
378
+ current = '';
379
+ }
380
+ // split oversized sentence
381
+ for (let i = 0; i < sentence.length; i += maxChars) {
382
+ chunks.push(sentence.slice(i, i + maxChars));
383
+ }
384
+ continue;
385
+ }
386
+
387
+ const candidate = current ? `${current} ${sentence}` : sentence;
388
+ if (candidate.length <= maxChars) {
389
+ current = candidate;
390
+ } else {
391
+ chunks.push(current);
392
+ current = sentence;
393
+ }
394
+ }
395
+ if (current) chunks.push(current);
396
+ }
397
+
398
+ return chunks;
399
+ }
400
+
401
+ function concatAudioFiles(partPaths: string[], outputPath: string): void {
402
+ if (partPaths.length === 0) {
403
+ throw new Error('No chunk audio generated for concatenation.');
404
+ }
405
+ if (partPaths.length === 1) {
406
+ fs.copyFileSync(partPaths[0], outputPath);
407
+ return;
408
+ }
409
+
410
+ // Use ffmpeg concat
411
+ const listContent = partPaths.map((p) => `file '${p.replace(/'/g, "'\\''")}'`).join('\n');
412
+ const listFile = path.join(fs.mkdtempSync('docs-to-voice-'), 'concat.txt');
413
+ fs.mkdirSync(path.dirname(listFile), { recursive: true });
414
+ fs.writeFileSync(listFile, listContent + '\n', 'utf-8');
415
+
416
+ try {
417
+ execSync(
418
+ `ffmpeg -hide_banner -loglevel error -y -f concat -safe 0 -i "${listFile}" -c:a copy "${outputPath}"`,
419
+ { stdio: 'ignore', timeout: 120000 },
420
+ );
421
+ } catch (err: unknown) {
422
+ throw new Error(
423
+ `ffmpeg concat failed: ${err instanceof Error ? err.message : 'unknown error'}`,
424
+ );
425
+ } finally {
426
+ try { fs.unlinkSync(listFile); fs.rmdirSync(path.dirname(listFile)); } catch { /* ignore */ }
427
+ }
428
+ }
429
+
430
+ function downloadBinary(url: string, outputPath: string): Promise<void> {
431
+ return new Promise((resolve, reject) => {
432
+ const protocol = url.startsWith('https') ? https : http;
433
+ protocol.get(url, { timeout: 300000 }, (response) => {
434
+ const chunks: Buffer[] = [];
435
+ response.on('data', (chunk: Buffer) => chunks.push(chunk));
436
+ response.on('end', () => {
437
+ fs.writeFileSync(outputPath, Buffer.concat(chunks));
438
+ resolve();
439
+ });
440
+ response.on('error', reject);
441
+ }).on('error', reject);
442
+ });
443
+ }
444
+
445
+ function requestAlibabaCloudTTS(
446
+ endpoint: string,
447
+ apiKey: string,
448
+ model: string,
449
+ voice: string,
450
+ text: string,
451
+ ): Promise<{ audioUrl?: string; audioData?: string; audioFormat?: string }> {
452
+ return new Promise((resolve, reject) => {
453
+ const payload = JSON.stringify({
454
+ model,
455
+ input: { text, voice },
456
+ });
457
+
458
+ const urlObj = new URL(endpoint);
459
+ const client = urlObj.protocol === 'https:' ? https : http;
460
+
461
+ const options = {
462
+ hostname: urlObj.hostname,
463
+ port: urlObj.port || (urlObj.protocol === 'https:' ? 443 : 80),
464
+ path: urlObj.pathname,
465
+ method: 'POST',
466
+ headers: {
467
+ 'Authorization': `Bearer ${apiKey}`,
468
+ 'Content-Type': 'application/json',
469
+ },
470
+ timeout: 300000,
471
+ };
472
+
473
+ const req = client.request(options, (res) => {
474
+ const chunks: Buffer[] = [];
475
+ res.on('data', (chunk: Buffer) => chunks.push(chunk));
476
+ res.on('end', () => {
477
+ const rawPayload = Buffer.concat(chunks).toString('utf-8');
478
+ try {
479
+ const responseJson = JSON.parse(rawPayload);
480
+ const output = responseJson.output || {};
481
+ const audio = output.audio || {};
482
+ const audioUrl = audio.url || '';
483
+ const audioData = audio.data || '';
484
+ const audioFormat = audio.format || audio.mime_type || '';
485
+
486
+ if (!audioUrl && !audioData) {
487
+ reject(new Error('API response does not contain output.audio.url or output.audio.data'));
488
+ return;
489
+ }
490
+
491
+ resolve({ audioUrl, audioData, audioFormat });
492
+ } catch {
493
+ reject(new Error('API response is not valid JSON.'));
494
+ }
495
+ });
496
+ res.on('error', reject);
497
+ });
498
+
499
+ req.on('error', reject);
500
+ req.on('timeout', () => { req.destroy(); reject(new Error('API request timed out')); });
501
+ req.write(payload);
502
+ req.end();
503
+ });
504
+ }
505
+
506
/**
 * CLI entry point for the docs-to-voice tool.
 *
 * Converts input text (from --text or --input-file) into an audio file under
 * `<projectDir>/audio/<projectName>/`, plus `.timeline.json` and `.srt`
 * sentence-timing sidecars, using one of two engines:
 *  - `say`: the macOS `say` command (optionally chunked and concatenated);
 *  - `api`: per-sentence requests to the Alibaba Cloud TTS API.
 *
 * @param args    raw CLI arguments (after the subcommand name)
 * @param context tool context supplying stdout/stderr streams
 * @returns process exit code: 0 on success, 1 on any error
 */
export async function docsToVoiceHandler(args: string[], context: ToolContext): Promise<number> {
  // Fall back to the process streams when the context does not supply them.
  const stdout = context.stdout || process.stdout;
  const stderr = context.stderr || process.stderr;

  try {
    const opts = parseArgs(args);

    if (opts.help) {
      stdout.write(`Usage: apltk docs-to-voice [options]

Convert text into audio and sentence timelines.

Options:
  --input, --input-file <path>  Path to input text file
  --text <string>               Raw text input
  --project-dir <path>          Root project directory (default: .)
  --project-name <name>         Folder name under DIR/audio/
  --output-name <name>          Output filename
  --engine, --mode <mode>       TTS mode: say (default) | api
  --voice <name>                macOS say voice
  --rate <wpm>                  macOS say rate
  --speech-rate <factor>        Speech rate multiplier (e.g. 1.2)
  --api-endpoint <url>          Alibaba Cloud TTS endpoint
  --api-model <name>            Alibaba Cloud model (default: qwen3-tts)
  --api-voice <name>            Alibaba Cloud voice (default: Cherry)
  --api-key <key>               Alibaba Cloud API key
  --max-chars <n>               Max chars per TTS chunk (0 disables)
  --no-auto-prosody             Disable punctuation pause enhancement
  --force                       Overwrite existing files
`);
      return 0;
    }

    if (opts.mode !== 'say' && opts.mode !== 'api') {
      stderr.write('Error: --mode must be one of: say, api\n');
      return 1;
    }

    const sourceText = readInputText(opts);
    if (!sourceText.trim()) {
      stderr.write('Error: No text content found for conversion.\n');
      return 1;
    }

    // Resolve output directory: <projectDir>/audio/<projectName>.
    // projectName defaults to the basename of the resolved project dir.
    const projectDir = path.resolve(opts.projectDir);
    const projectName = opts.projectName || path.basename(projectDir);
    if (!projectName) {
      stderr.write('Error: Unable to determine project name.\n');
      return 1;
    }

    const outputDir = path.join(projectDir, 'audio', projectName);
    fs.mkdirSync(outputDir, { recursive: true });

    // Filesystem-safe timestamp, e.g. 2024-01-02T03-04-05 (first 19 chars).
    const timestamp = new Date().toISOString().replace(/[:.]/g, '-').slice(0, 19);
    const outputName = opts.outputName || `voice-${timestamp}`;
    // A dot anywhere in the name is treated as "caller supplied an extension".
    const hasExtension = outputName.includes('.');

    if (opts.mode === 'say') {
      // macOS say mode
      const textChunks = splitTextForTts(sourceText, opts.maxChars ? parseInt(opts.maxChars, 10) || null : null);
      if (textChunks.length === 0) {
        stderr.write('Error: No text content found for conversion.\n');
        return 1;
      }

      // Check if `say` is available
      try {
        execSync('which say', { stdio: 'ignore' });
      } catch {
        stderr.write("Error: macOS 'say' command not found.\n");
        return 1;
      }

      const finalOutputName = hasExtension ? outputName : `${outputName}.aiff`;
      const outputPath = path.join(outputDir, finalOutputName);

      if (fs.existsSync(outputPath) && !opts.force) {
        stderr.write(`Error: Output already exists: ${outputPath}. Use --force to overwrite.\n`);
        return 1;
      }

      // Build prosody-enhanced text (pause markers) unless disabled.
      const chunks = opts.noAutoProsody ? textChunks : textChunks.map(buildAutoProsodyText);

      if (chunks.length === 1) {
        // Single say command
        const sayArgs = ['-o', outputPath];
        if (opts.voice) sayArgs.push('-v', opts.voice);
        if (opts.rate) sayArgs.push('-r', opts.rate);

        // Text is passed via a temp file (-f) to avoid shell-escaping issues.
        // NOTE(review): mkdtempSync with a bare prefix creates the temp dir
        // relative to cwd — consider path.join(os.tmpdir(), ...). The
        // follow-up mkdirSync is redundant (mkdtempSync already creates it).
        const tmpFile = path.join(fs.mkdtempSync('docs-to-voice-'), 'input.txt');
        fs.mkdirSync(path.dirname(tmpFile), { recursive: true });
        fs.writeFileSync(tmpFile, chunks[0], 'utf-8');
        sayArgs.push('-f', tmpFile);

        try {
          // NOTE(review): quoting only args containing spaces is fragile for
          // paths with other shell metacharacters; spawn with an argv array
          // would be safer.
          execSync(`say ${sayArgs.map((a) => (a.includes(' ') ? `"${a}"` : a)).join(' ')}`, {
            stdio: 'ignore',
            timeout: 300000,
          });
        } catch (err: unknown) {
          const msg = err instanceof Error ? err.message : 'unknown error';
          throw new Error(`say mode failed: ${msg}`);
        } finally {
          try { fs.unlinkSync(tmpFile); fs.rmdirSync(path.dirname(tmpFile)); } catch { /* ignore */ }
        }
      } else {
        // Multiple chunks: generate a part per chunk, then concat with ffmpeg.
        // NOTE(review): same cwd-relative mkdtempSync caveat as above.
        const tempDir = fs.mkdtempSync('docs-to-voice-say-');
        const partPaths: string[] = [];
        const partExt = path.extname(outputPath) || '.aiff';

        try {
          for (let i = 0; i < chunks.length; i++) {
            // Zero-padded part names keep ffmpeg concat order stable.
            const partPath = path.join(tempDir, `part-${String(i + 1).padStart(4, '0')}${partExt}`);
            const sayArgs = ['-o', partPath];
            if (opts.voice) sayArgs.push('-v', opts.voice);
            if (opts.rate) sayArgs.push('-r', opts.rate);

            const tmpFile = path.join(tempDir, `chunk-${i}.txt`);
            fs.writeFileSync(tmpFile, chunks[i], 'utf-8');
            sayArgs.push('-f', tmpFile);

            execSync(
              `say ${sayArgs.map((a) => (a.includes(' ') ? `"${a}"` : a)).join(' ')}`,
              { stdio: 'ignore', timeout: 300000 },
            );
            partPaths.push(partPath);
          }

          concatAudioFiles(partPaths, outputPath);
        } finally {
          try { fs.rmSync(tempDir, { recursive: true }); } catch { /* ignore */ }
        }
      }

      // Apply speech rate if requested (ffmpeg atempo re-encode in place).
      if (opts.speechRate) {
        const rate = parseFloat(opts.speechRate);
        if (rate > 0) applySpeechRateToAudio(outputPath, rate);
      }

      // Write timeline files (estimated timings — no per-sentence durations
      // are available in say mode).
      writeTimelineFiles(sourceText, outputPath, null);
      stdout.write(`${outputPath}\n`);
    } else {
      // API mode
      const apiKey = opts.apiKey;
      if (!apiKey) {
        stderr.write('Error: --api-key is required for api mode.\n');
        return 1;
      }

      const sentences = splitSentences(sourceText);
      if (sentences.length === 0) {
        stderr.write('Error: No text content found for conversion.\n');
        return 1;
      }

      const maxChars = opts.maxChars ? parseInt(opts.maxChars, 10) || null : null;

      // Build request items from sentences. Each item maps back to its
      // sentence index so per-sentence durations can be accumulated even
      // when an oversized sentence is split across several requests.
      interface RequestItem {
        sentenceIndex: number;
        text: string;
      }
      const requestItems: RequestItem[] = [];
      for (let si = 0; si < sentences.length; si++) {
        const sentence = sentences[si];
        if (maxChars && sentence.length > maxChars) {
          for (let i = 0; i < sentence.length; i += maxChars) {
            requestItems.push({ sentenceIndex: si, text: sentence.slice(i, i + maxChars) });
          }
        } else {
          requestItems.push({ sentenceIndex: si, text: sentence });
        }
      }

      if (requestItems.length === 0) {
        stderr.write('Error: No text content found for conversion.\n');
        return 1;
      }

      // NOTE(review): cwd-relative temp dir again — consider os.tmpdir().
      const tempDir = fs.mkdtempSync('docs-to-voice-api-');
      const partPaths: string[] = [];
      let partExt = '';
      // Per-sentence accumulated durations, and whether each sentence's
      // duration could actually be measured from its audio parts.
      const sentenceDurations = new Array(sentences.length).fill(0);
      const sentenceDurationKnown = new Array(sentences.length).fill(true);

      try {
        // Sequential requests: one TTS call (plus optional download) per item.
        for (let i = 0; i < requestItems.length; i++) {
          const item = requestItems[i];
          const apiResult = await requestAlibabaCloudTTS(
            opts.apiEndpoint,
            apiKey,
            opts.apiModel,
            opts.apiVoice,
            item.text,
          );

          // The first chunk's reported format decides the output extension.
          const currentExt = apiResult.audioFormat || 'wav';
          if (!partExt) partExt = currentExt;

          const partPath = path.join(tempDir, `part-${String(i + 1).padStart(4, '0')}.${currentExt}`);
          if (apiResult.audioUrl) {
            await downloadBinary(apiResult.audioUrl, partPath);
          } else if (apiResult.audioData) {
            fs.writeFileSync(partPath, Buffer.from(apiResult.audioData, 'base64'));
          } else {
            throw new Error('No audio data in API response.');
          }

          if (!fs.existsSync(partPath) || fs.statSync(partPath).size === 0) {
            throw new Error(`Failed to generate audio chunk ${i + 1}.`);
          }
          partPaths.push(partPath);

          // Accumulate measured duration per sentence; mark the sentence as
          // "unknown" if any of its parts could not be measured.
          const partDuration = readDurationSeconds(partPath);
          if (partDuration === null || partDuration <= 0) {
            sentenceDurationKnown[item.sentenceIndex] = false;
          } else {
            sentenceDurations[item.sentenceIndex] += partDuration;
          }
        }

        const finalOutputName = hasExtension
          ? outputName
          : `${outputName}.${partExt || 'wav'}`;
        const outputPath = path.join(outputDir, finalOutputName);

        if (fs.existsSync(outputPath) && !opts.force) {
          stderr.write(`Error: Output already exists: ${outputPath}. Use --force to overwrite.\n`);
          return 1;
        }

        concatAudioFiles(partPaths, outputPath);

        // Build timeline durations: use measured per-sentence durations when
        // all are known; otherwise distribute the unmeasured remainder of
        // the total output duration across unknown sentences by text weight.
        let timelineDurations: number[] | null = null;
        const unknownIndexes = sentenceDurationKnown
          .map((known, idx) => (known ? -1 : idx))
          .filter((idx) => idx >= 0);

        if (unknownIndexes.length === 0 && sentenceDurations.reduce((a, b) => a + b, 0) > 0) {
          timelineDurations = sentenceDurations;
        } else if (unknownIndexes.length > 0) {
          const outputDuration = readDurationSeconds(outputPath);
          const knownTotal = sentenceDurations.reduce(
            (sum, val, idx) => (sentenceDurationKnown[idx] ? sum + val : sum),
            0,
          );

          if (outputDuration && outputDuration > knownTotal) {
            const remaining = outputDuration - knownTotal;
            const unknownWeights = unknownIndexes.map((idx) => sentenceWeight(sentences[idx]));
            const totalUnknownWeight = unknownWeights.reduce((a, b) => a + b, 0);

            if (totalUnknownWeight > 0) {
              for (let wi = 0; wi < unknownIndexes.length; wi++) {
                sentenceDurations[unknownIndexes[wi]] +=
                  remaining * (unknownWeights[wi] / totalUnknownWeight);
              }
              timelineDurations = sentenceDurations;
            }
          }
        }

        // Apply speech rate if requested; measured durations shrink by the
        // same factor so the timeline stays in sync with the faster audio.
        if (opts.speechRate) {
          const rate = parseFloat(opts.speechRate);
          if (rate > 0) {
            applySpeechRateToAudio(outputPath, rate);
            if (timelineDurations) {
              timelineDurations = timelineDurations.map((d) => d / rate);
            }
          }
        }

        writeTimelineFiles(sourceText, outputPath, timelineDurations);
        stdout.write(`${outputPath}\n`);
      } finally {
        try { fs.rmSync(tempDir, { recursive: true }); } catch { /* ignore */ }
      }
    }

    return 0;
  } catch (err: unknown) {
    // All failures funnel here: print one error line and exit non-zero.
    const msg = err instanceof Error ? err.message : 'Unknown error';
    stderr.write(`Error: ${msg}\n`);
    return 1;
  }
}