npm - @make-u-free/migi - Versions diffs - 0.5.7 → 0.5.9 - Mend

@make-u-free/migi 0.5.7 → 0.5.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (3) hide show

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@make-u-free/migi",
-  "version": "0.5.7",
+  "version": "0.5.9",
   "description": "Your AI right-hand agent. Works anywhere, with any LLM API.",
   "type": "module",
   "bin": {

package/src/agent.js CHANGED Viewed

@@ -61,6 +61,21 @@ ${userNameLine}
 - 「どうしますか？」と聞く前に、自分でできることをやりきる
 - 完了したら1〜2文で報告。途中経過は出さない
+## 文脈の自律的な構築と維持
+### 探索
+- 作業前に、関連フォルダの内容を把握していないと感じたら、list_files で探索する
+- 「このフォルダに何があるか分からない」状態で作業しない
+- 過去の記録・決定事項が不明なときは search_content で能動的に探す
+- 「たぶんこうだろう」で進めるより、read_file で確認してから進める
+### MIGI.md の維持（重要）
+- プロジェクトフォルダで重要な作業をしたら、そのフォルダの MIGI.md を必ず更新する
+- MIGI.md に書く内容: プロジェクト概要・重要な決定・現在の状況・次にやること・参照すべきファイル
+- MIGI.md がないフォルダで初めて作業した場合、作業後に作成する
+- MIGI.md は「次回セッションの自分へのブリーフィング」として書く。読み返したとき即座に文脈が戻るように
+- セッション再開時は、該当フォルダの MIGI.md をまず読んでから作業を始める
 ## メモリと文脈の継続
 ワークスペースメモリは ${cwd}/.migi/memory/ に構造化して保存する:
 - projects.md   ── 進行中の仕事・状況

package/src/tools.js CHANGED Viewed

@@ -128,6 +128,41 @@ export const teamsToolSchema = {
   }
 }
+// ---- Extract embedded images from a PDF (no native dependencies). Scans the raw bytes of `buf` for JPEG and PNG signatures and returns an array of { data, mime } entries, where `data` is the byte range of one image and `mime` is 'image/jpeg' or 'image/png'. ----
+function extractImagesFromPdf(buf) { // buf: the PDF file contents; the visible caller passes the result of readFileSync(path)
+  const images = []
+  let i = 0
+  while (i < buf.length - 1) { // stop one byte early so buf[i + 1] below is always in range
+    // JPEG: starts with FF D8 and ends with FF D9. NOTE(review): only two bytes are checked, so arbitrary binary data containing FF D8 is also treated as a JPEG start — confirm whether that is acceptable.
+    if (buf[i] === 0xFF && buf[i + 1] === 0xD8) {
+      const eoiIdx = buf.indexOf(Buffer.from([0xFF, 0xD9]), i + 2) // first FF D9 after the start marker; NOTE(review): presumably cuts the image short if FF D9 occurs earlier inside it (e.g. an embedded thumbnail) — verify
+      if (eoiIdx === -1) break // NOTE(review): no end marker aborts the whole scan, so any image located after this offset is never returned
+      images.push({ data: buf.slice(i, eoiIdx + 2), mime: 'image/jpeg' }) // + 2 keeps the FF D9 end marker in the slice
+      i = eoiIdx + 2 // resume scanning right after this image
+      continue
+    }
+    // PNG: starts with the 8-byte signature 89 50 4E 47 0D 0A 1A 0A
+    if (
+      i + 7 < buf.length &&
+      buf[i] === 0x89 && buf[i+1] === 0x50 && buf[i+2] === 0x4E && buf[i+3] === 0x47 &&
+      buf[i+4] === 0x0D && buf[i+5] === 0x0A && buf[i+6] === 0x1A && buf[i+7] === 0x0A
+    ) {
+      const iend = buf.indexOf(Buffer.from([0x49, 0x45, 0x4E, 0x44, 0xAE, 0x42, 0x60, 0x82]), i + 8) // ASCII "IEND" followed by the IEND chunk's 4-byte CRC
+      if (iend === -1) break // NOTE(review): same as the JPEG branch — a missing terminator ends the scan entirely
+      images.push({ data: buf.slice(i, iend + 8), mime: 'image/png' }) // + 8 keeps "IEND" and its CRC in the slice
+      i = iend + 8 // resume scanning right after this image
+      continue
+    }
+    i++ // no signature at this offset; advance one byte
+  }
+  return images // in the order the signatures were found; empty when nothing matched
+}
 // ---- diff 表示 ----
 function showDiff(path, oldContent, newContent) {
@@ -184,13 +219,40 @@ export async function executeTool(name, args, opts = {}) {
       // PDF
       if (ext === '.pdf') {
+        const buf = readFileSync(args.path)
+        // Step 1: テキストPDFとして抽出を試みる
         try {
-          const buf = readFileSync(args.path)
           const data = await pdfParse(buf)
-          return data.text?.trim() || '(テキストが抽出できませんでした)'
-        } catch (err) {
-          return `エラー: PDFの解析に失敗しました: ${err.message}`
-        }
+          const text = data.text?.trim()
+          if (text) return text
+        } catch (_) {}
+        // Step 2: 画像PDFとしてVision APIでOCR（ネイティブ依存なし）
+        if (!opts.apiKey) return '(テキストが抽出できませんでした)'
+        const images = extractImagesFromPdf(buf)
+        if (images.length === 0) return '(テキストも画像も抽出できませんでした)'
+        const client = new OpenAI({
+          apiKey: opts.apiKey,
+          ...(httpsAgent ? { httpAgent: httpsAgent } : {})
+        })
+        const targets = images.slice(0, 10)  // 最大10ページ
+        const res = await client.chat.completions.create({
+          model: opts.model || 'gpt-4.1-2025-04-14',
+          messages: [{
+            role: 'user',
+            content: [
+              { type: 'text', text: 'このPDFのページ画像です。すべてのテキストを正確に書き起こしてください。' },
+              ...targets.map(img => ({
+                type: 'image_url',
+                image_url: { url: `data:${img.mime};base64,${img.data.toString('base64')}` }
+              }))
+            ]
+          }],
+          max_tokens: 4000
+        })
+        return res.choices[0].message.content
       }
       // PowerPoint（PPTX）/ Word（DOCX）→ ZIPを展開してXMLからテキスト抽出