npm - @cyber-dash-tech/revela - Versions diffs - 0.3.0 → 0.3.1 - Mend

@cyber-dash-tech/revela 0.3.0 → 0.3.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (6) hide show

package/README.md +2 -2
package/README.zh-CN.md +2 -2
package/lib/agents/research-prompt.ts +1 -1
package/lib/document-materials/extract.ts +139 -2
package/package.json +1 -1
package/tools/extract-document-materials.ts +2 -2

package/README.md CHANGED Viewed

@@ -2,7 +2,7 @@
 **English** | [中文](README.zh-CN.md)
-[![npm version](https://img.shields.io/npm/v/@cyber-dash-tech/revela)](https://www.npmjs.com/package/@cyber-dash-tech/revela) [![license](https://img.shields.io/npm/l/@cyber-dash-tech/revela)](LICENSE) [![tests](https://img.shields.io/badge/tests-109%20passing-brightgreen)](tests/) [![OpenCode plugin](https://img.shields.io/badge/OpenCode-plugin-blue)](https://opencode.ai) [![Bun](https://img.shields.io/badge/Bun-%E2%89%A51.0-orange)](https://bun.sh)
+[![npm version](https://img.shields.io/npm/v/@cyber-dash-tech/revela)](https://www.npmjs.com/package/@cyber-dash-tech/revela) [![license](https://img.shields.io/npm/l/@cyber-dash-tech/revela)](LICENSE) [![tests](https://img.shields.io/badge/tests-125%20passing-brightgreen)](tests/) [![OpenCode plugin](https://img.shields.io/badge/OpenCode-plugin-blue)](https://opencode.ai) [![Bun](https://img.shields.io/badge/Bun-%E2%89%A51.0-orange)](https://bun.sh)
 <p align="center">
   <img src="assets/img/logo.png" alt="Revela" width="800" />
@@ -19,7 +19,7 @@ Enable it for the current session, assign a presentation task, and the agent can
 - injects a presentation-specific system prompt into your current agent with `/revela enable`
 - builds that prompt from 3 layers: core skill, active domain, active design
-- supports workspace document discovery plus transparent extraction for `.pdf`, `.docx`, `.pptx`, and `.xlsx`
+- supports workspace document discovery, transparent text extraction for `.pdf`, `.docx`, `.pptx`, and `.xlsx`, and cached embedded-material extraction for those formats
 - runs automatic layout QA whenever the agent writes `decks/*.html`
 - exports finished decks to PDF and editable PPTX
 - switches designs and domains locally with zero LLM cost

package/README.zh-CN.md CHANGED Viewed

@@ -2,7 +2,7 @@
 [English](README.md) | **中文**
-[![npm version](https://img.shields.io/npm/v/@cyber-dash-tech/revela)](https://www.npmjs.com/package/@cyber-dash-tech/revela) [![license](https://img.shields.io/npm/l/@cyber-dash-tech/revela)](LICENSE) [![tests](https://img.shields.io/badge/tests-109%20passing-brightgreen)](tests/) [![OpenCode plugin](https://img.shields.io/badge/OpenCode-plugin-blue)](https://opencode.ai) [![Bun](https://img.shields.io/badge/Bun-%E2%89%A51.0-orange)](https://bun.sh)
+[![npm version](https://img.shields.io/npm/v/@cyber-dash-tech/revela)](https://www.npmjs.com/package/@cyber-dash-tech/revela) [![license](https://img.shields.io/npm/l/@cyber-dash-tech/revela)](LICENSE) [![tests](https://img.shields.io/badge/tests-125%20passing-brightgreen)](tests/) [![OpenCode plugin](https://img.shields.io/badge/OpenCode-plugin-blue)](https://opencode.ai) [![Bun](https://img.shields.io/badge/Bun-%E2%89%A51.0-orange)](https://bun.sh)
 <p align="center">
   <img src="assets/img/logo.png" alt="Revela" width="800" />
@@ -19,7 +19,7 @@ Revela 是一个 [OpenCode](https://opencode.ai) 插件，可以把你当前使
 - 通过 `/revela enable` 向当前 agent 注入演示文稿专用 system prompt
 - prompt 由 3 层组成：核心 skill、当前 domain、当前 design
-- 支持工作区文档扫描，以及 `.pdf`、`.docx`、`.pptx`、`.xlsx` 的透明文本提取
+- 支持工作区文档扫描，以及 `.pdf`、`.docx`、`.pptx`、`.xlsx` 的透明文本提取和嵌入素材缓存提取
 - agent 每次写入 `decks/*.html` 时自动执行布局 QA
 - 支持导出成 PDF 和可编辑 PPTX
 - design 和 domain 的切换都在本地完成，不消耗 LLM token

package/lib/agents/research-prompt.ts CHANGED Viewed

@@ -40,7 +40,7 @@ files in the workspace (PDF, Word, Excel, PowerPoint, CSV, text).
 Then select the files relevant to your research axis.
 For every selected file, call **\`revela-extract-document-materials\`** first.
-- \`pptx\`, \`docx\`, and \`xlsx\` will produce a manifest plus extracted text and any available embedded materials
+- \`pdf\`, \`pptx\`, \`docx\`, and \`xlsx\` will produce a manifest plus extracted text and any available embedded materials
 - unsupported file types will be skipped automatically
 After that, use the \`read\` tool on:

package/lib/document-materials/extract.ts CHANGED Viewed

@@ -3,7 +3,10 @@ import { existsSync, mkdirSync, readFileSync, realpathSync, statSync, writeFileS
 import { basename, dirname, extname, isAbsolute, join, relative, resolve } from "path"
 import { DOMParser } from "@xmldom/xmldom"
 import { unzipSync } from "fflate"
+import { Jimp } from "jimp"
+import { extractImages, getDocumentProxy } from "unpdf"
 import { extractDocx } from "../read-hooks/extractors/docx"
+import { extractPdfText } from "../read-hooks/extractors/pdf"
 import { extractPptx } from "../read-hooks/extractors/pptx"
 import { extractXlsx } from "../read-hooks/extractors/xlsx"
@@ -48,7 +51,7 @@ export type PptxSlide = {
 export type DocumentMaterialsResult = {
   status: "processed" | "skipped" | "failed"
   source: string
-  type: "pptx" | "docx" | "xlsx" | "other"
+  type: "pptx" | "docx" | "xlsx" | "pdf" | "other"
   cache_dir?: string
   manifest_path?: string
   text_path?: string
@@ -83,8 +86,11 @@ const SUPPORTED_EXTENSIONS: Record<string, SupportedType> = {
   ".pptx": "pptx",
   ".docx": "docx",
   ".xlsx": "xlsx",
+  ".pdf": "pdf",
 }
+type PdfImageData = Awaited<ReturnType<typeof extractImages>>[number] // One element of the array that unpdf's extractImages() resolves to.
 function normalizeZipTarget(basePath: string, target: string): string {
   const segments = join(dirname(basePath), target).split("/")
   const normalized: string[] = []
@@ -151,6 +157,47 @@ function materialPath(cacheDir: string, workspaceDir: string, ...segments: strin
   return workspaceRelative(join(cacheDir, ...segments), workspaceDir)
 }
+/**
+ * Expand the raw pixel data of an extracted PDF image to 4 bytes per pixel (RGBA).
+ *
+ * - 4 channels: the existing bytes are wrapped in a Buffer view (no copy).
+ * - 3 channels: each RGB triple is copied and given an opaque alpha of 255.
+ * - anything else: one byte per pixel is read and replicated to R, G and B
+ *   (grayscale), again with alpha 255.
+ *
+ * @param image Extracted image exposing `data`, `width`, `height` and `channels`.
+ * @returns A Buffer of `width * height * 4` bytes (or a view of `image.data` for 4-channel input).
+ */
+function toRgbaBuffer(image: PdfImageData): Buffer {
+  const { data, channels, width, height } = image
+
+  // Already RGBA: share the underlying memory instead of copying.
+  if (channels === 4) {
+    return Buffer.from(data.buffer, data.byteOffset, data.byteLength)
+  }
+
+  const totalPixels = width * height
+  const out = Buffer.alloc(totalPixels * 4)
+  const isRgb = channels === 3
+
+  for (let pixel = 0, offset = 0; pixel < totalPixels; pixel++, offset += 4) {
+    if (isRgb) {
+      const base = pixel * 3
+      out[offset] = data[base]!
+      out[offset + 1] = data[base + 1]!
+      out[offset + 2] = data[base + 2]!
+    } else {
+      // Single-sample source: replicate the value across the colour channels.
+      const gray = data[pixel]!
+      out[offset] = gray
+      out[offset + 1] = gray
+      out[offset + 2] = gray
+    }
+    // Source has no alpha channel, so every pixel is fully opaque.
+    out[offset + 3] = 255
+  }
+
+  return out
+}
+/**
+ * Encode an extracted PDF image as PNG.
+ *
+ * The pixel data is first normalised to RGBA via `toRgbaBuffer`, handed to
+ * Jimp as a raw bitmap, and then serialised with the "image/png" MIME type.
+ *
+ * @param image Extracted image (raw pixels plus dimensions).
+ * @returns The PNG file contents.
+ */
+async function encodePdfImageAsPng(image: PdfImageData): Promise<Buffer> {
+  const { width, height } = image
+  const canvas = Jimp.fromBitmap({ data: toRgbaBuffer(image), width, height })
+  return await canvas.getBuffer("image/png")
+}
 function parseXml(files: Record<string, Uint8Array>, path: string): any | null {
   const file = files[path]
   if (!file) return null
@@ -589,6 +636,94 @@ function extractTables(type: SupportedType, textPath: string): DocumentMaterial[
   return [{ path: textPath, source_ref: "workbook", note: "Sheet text and tables extracted to text file" }]
 }
+/**
+ * Export every image that `extractImages` finds in a PDF as a PNG file under
+ * `<cacheDir>/images` and describe each one as a `DocumentMaterial`.
+ *
+ * Files are named `page-NN-image-MM.png` (1-based, zero-padded to two digits).
+ * The `<cacheDir>/images` directory is not created here; the caller must
+ * create it before calling.
+ *
+ * @param buf          Raw PDF bytes.
+ * @param cacheDir     Cache directory for this document.
+ * @param workspaceDir Workspace root, used to build the `path` recorded for each image.
+ * @returns One entry per exported image, in page order.
+ * @throws Whatever the PDF loader, the PNG encoder, or the file write throws.
+ */
+async function extractPdfImages(buf: Buffer, cacheDir: string, workspaceDir: string): Promise<DocumentMaterial[]> {
+  const pdf = await getDocumentProxy(new Uint8Array(buf))
+  const images: DocumentMaterial[] = []
+  try {
+    for (let pageNumber = 1; pageNumber <= pdf.numPages; pageNumber++) {
+      // Computed once per page; reused for the file name, source_ref and page_or_slide.
+      const pageLabel = `page-${String(pageNumber).padStart(2, "0")}`
+      const extracted = await extractImages(pdf, pageNumber)
+      for (let index = 0; index < extracted.length; index++) {
+        const image = extracted[index]!
+        const exportedName = `${pageLabel}-image-${String(index + 1).padStart(2, "0")}.png`
+        const outputPath = join(cacheDir, "images", exportedName)
+        const png = await encodePdfImageAsPng(image)
+        writeFileSync(outputPath, new Uint8Array(png))
+        images.push({
+          path: materialPath(cacheDir, workspaceDir, "images", exportedName),
+          source_ref: `pdf/${pageLabel}/${image.key}`,
+          page_or_slide: pageLabel,
+          note: `Embedded PDF image (${image.width}x${image.height}, ${image.channels} channel${image.channels === 1 ? "" : "s"})`,
+        })
+      }
+    }
+  } finally {
+    // Release the document proxy on success and on failure so repeated
+    // extractions do not keep parsed PDFs alive.
+    await pdf.destroy()
+  }
+  return images
+}
+/**
+ * Extract text and embedded images from a PDF into the workspace-local cache
+ * at `.opencode/revela/doc-materials/<fingerprint>` and return a summary.
+ *
+ * If a readable `manifest.json` already exists for the fingerprint, its
+ * contents are returned without re-extracting. A manifest that cannot be read
+ * or parsed (for example after an interrupted write) is treated as a cache
+ * miss and the document is extracted again, so it does not fail on every call.
+ *
+ * @param filePath     Path of the PDF to process.
+ * @param workspaceDir Workspace root; all returned paths are relative to it.
+ * @returns A "processed" result with text path, images and empty slides/tables.
+ * @throws Whatever text/image extraction or the file writes throw.
+ */
+async function processPdfFile(filePath: string, workspaceDir: string): Promise<DocumentMaterialsResult> {
+  const relativeSource = workspaceRelative(filePath, workspaceDir)
+  const fingerprint = buildFingerprint(filePath)
+  const cacheDir = join(workspaceDir, ".opencode", "revela", "doc-materials", fingerprint)
+  const manifestPath = join(cacheDir, "manifest.json")
+
+  if (existsSync(manifestPath)) {
+    try {
+      const manifest = JSON.parse(readFileSync(manifestPath, "utf-8")) as CachedManifest
+      return {
+        status: "processed",
+        source: manifest.source,
+        type: manifest.type,
+        cache_dir: manifest.cache_dir,
+        manifest_path: manifest.manifest_path,
+        text_path: manifest.text_path,
+        images: manifest.images,
+        skipped_assets: manifest.skipped_assets,
+        slides: manifest.slides,
+        tables: manifest.tables,
+      }
+    } catch {
+      // Unreadable or corrupt manifest: fall through and rebuild the cache entry.
+    }
+  }
+
+  mkdirSync(join(cacheDir, "images"), { recursive: true })
+  mkdirSync(join(cacheDir, "tables"), { recursive: true })
+
+  const buf = readFileSync(filePath)
+  const text = await extractPdfText(buf)
+  const textPath = join(cacheDir, "text.txt")
+  writeFileSync(textPath, `[Extracted from: ${basename(filePath)}]\n\n${text}`, "utf-8")
+  const images = await extractPdfImages(buf, cacheDir, workspaceDir)
+
+  // Workspace-relative paths shared by the returned result and the manifest.
+  const cacheDirRelative = workspaceRelative(cacheDir, workspaceDir)
+  const manifestPathRelative = workspaceRelative(manifestPath, workspaceDir)
+  const textPathRelative = workspaceRelative(textPath, workspaceDir)
+
+  const result: DocumentMaterialsResult = {
+    status: "processed",
+    source: relativeSource,
+    type: "pdf",
+    cache_dir: cacheDirRelative,
+    manifest_path: manifestPathRelative,
+    text_path: textPathRelative,
+    images,
+    skipped_assets: [],
+    slides: [],
+    tables: [],
+  }
+
+  const manifest: CachedManifest = {
+    source: relativeSource,
+    type: "pdf",
+    fingerprint,
+    cache_dir: cacheDirRelative,
+    manifest_path: manifestPathRelative,
+    text_path: textPathRelative,
+    images,
+    skipped_assets: [],
+    slides: [],
+    tables: [],
+  }
+  // Written last: the manifest's presence is what marks the cache entry as usable.
+  writeFileSync(manifestPath, JSON.stringify(manifest, null, 2), "utf-8")
+  return result
+}
 async function processOfficeFile(filePath: string, workspaceDir: string, type: SupportedType): Promise<DocumentMaterialsResult> {
   const relativeSource = workspaceRelative(filePath, workspaceDir)
   const fingerprint = buildFingerprint(filePath)
@@ -683,7 +818,9 @@ export async function extractDocumentMaterials(filePath: string, workspaceDir: s
       }
     }
-    return await processOfficeFile(resolvedFile, workspaceDir, type)
+    return type === "pdf"
+      ? await processPdfFile(resolvedFile, workspaceDir)
+      : await processOfficeFile(resolvedFile, workspaceDir, type)
   } catch (e) {
     return {
       status: "failed",

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@cyber-dash-tech/revela",
-  "version": "0.3.0",
+  "version": "0.3.1",
   "description": "OpenCode plugin that turns AI into an HTML slide deck generator",
   "type": "module",
   "main": "./index.ts",

package/tools/extract-document-materials.ts CHANGED Viewed

@@ -4,12 +4,12 @@ import { extractDocumentMaterials } from "../lib/document-materials/extract"
 export default tool({
   description:
     "Extract reusable materials from a workspace document into a workspace-local cache. " +
-    "Supports pptx, docx, and xlsx. Produces a manifest plus extracted text, embedded images, and available slide/sheet mappings. " +
+    "Supports pdf, pptx, docx, and xlsx. Produces a manifest plus extracted text, embedded images, and available page/slide/sheet mappings. " +
     "Unsupported file types are skipped instead of failing.",
   args: {
     file: tool.schema
       .string()
-      .describe("Document path relative to workspace root. Supports pptx, docx, and xlsx; other file types are skipped."),
+      .describe("Document path relative to workspace root. Supports pdf, pptx, docx, and xlsx; other file types are skipped."),
   },
   async execute(args, context) {
     const workspaceDir = context.directory ?? process.cwd()