npm - devlyn-cli - Versions diffs - 0.5.2 → 0.5.4 - Mend

devlyn-cli 0.5.2 → 0.5.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (35)

package/bin/devlyn.js +1 -0
package/config/commands/devlyn.team-resolve.md +31 -2
package/optional-skills/dokkit/ANALYSIS.md +198 -0
package/optional-skills/dokkit/COMMANDS.md +365 -0
package/optional-skills/dokkit/DOCX-XML.md +76 -0
package/optional-skills/dokkit/EXPORT.md +102 -0
package/optional-skills/dokkit/FILLING.md +377 -0
package/optional-skills/dokkit/HWPX-XML.md +73 -0
package/optional-skills/dokkit/IMAGE-SOURCING.md +127 -0
package/optional-skills/dokkit/INGESTION.md +65 -0
package/optional-skills/dokkit/SKILL.md +153 -0
package/optional-skills/dokkit/STATE.md +60 -0
package/optional-skills/dokkit/references/docx-field-patterns.md +151 -0
package/optional-skills/dokkit/references/docx-structure.md +58 -0
package/optional-skills/dokkit/references/field-detection-patterns.md +130 -0
package/optional-skills/dokkit/references/hwpx-field-patterns.md +461 -0
package/optional-skills/dokkit/references/hwpx-structure.md +159 -0
package/optional-skills/dokkit/references/image-opportunity-heuristics.md +121 -0
package/optional-skills/dokkit/references/image-xml-patterns.md +338 -0
package/optional-skills/dokkit/references/section-image-interleaving.md +346 -0
package/optional-skills/dokkit/references/section-range-detection.md +118 -0
package/optional-skills/dokkit/references/state-schema.md +143 -0
package/optional-skills/dokkit/references/supported-formats.md +67 -0
package/optional-skills/dokkit/scripts/compile_hwpx.py +134 -0
package/optional-skills/dokkit/scripts/detect_fields.py +301 -0
package/optional-skills/dokkit/scripts/detect_fields_hwpx.py +286 -0
package/optional-skills/dokkit/scripts/export_pdf.py +99 -0
package/optional-skills/dokkit/scripts/parse_hwpx.py +185 -0
package/optional-skills/dokkit/scripts/parse_image_with_gemini.py +159 -0
package/optional-skills/dokkit/scripts/parse_xlsx.py +98 -0
package/optional-skills/dokkit/scripts/source_images.py +365 -0
package/optional-skills/dokkit/scripts/validate_docx.py +142 -0
package/optional-skills/dokkit/scripts/validate_hwpx.py +281 -0
package/optional-skills/dokkit/scripts/validate_state.py +132 -0
package/package.json +1 -1

package/optional-skills/dokkit/scripts/parse_image_with_gemini.py ADDED Viewed

@@ -0,0 +1,159 @@
+#!/usr/bin/env python3
+"""Parse image files using Google Gemini Vision API for OCR and content extraction.
+Usage:
+    python parse_image_with_gemini.py <input-image> [--project-dir <dir>]
+Output:
+    JSON to stdout with 'content_md' and 'metadata' fields.
+Requires:
+    GEMINI_API_KEY in .env or environment variables.
+"""
+import base64
+import json
+import os
+import sys
+import urllib.error
+import urllib.request
+from datetime import datetime
+from pathlib import Path
def load_api_key(project_dir: Path) -> str:
    """Load the Gemini API key from the environment or a project ``.env`` file.

    The ``GEMINI_API_KEY`` environment variable takes precedence. When it is
    unset or blank, ``<project_dir>/.env`` is scanned line by line for a
    ``GEMINI_API_KEY=`` assignment. An optional leading ``export `` and one
    pair of matching surrounding quotes are stripped from the value.

    Args:
        project_dir: Directory expected to contain the ``.env`` file.

    Returns:
        The API key, or an empty string when no non-empty key is found.
    """
    key = os.environ.get("GEMINI_API_KEY", "").strip()
    if key:
        return key

    env_path = project_dir / ".env"
    if not env_path.is_file():
        return ""

    # utf-8-sig tolerates a byte-order mark at the start of the file, which
    # would otherwise hide an assignment on the very first line.
    with open(env_path, encoding="utf-8-sig") as f:
        for line in f:
            line = line.strip()
            # Accept the shell-style "export KEY=value" form as well.
            if line.startswith("export "):
                line = line[len("export "):].lstrip()
            if not line.startswith("GEMINI_API_KEY="):
                continue
            value = line.split("=", 1)[1].strip()
            # .env files commonly quote values; the quotes are not part of the key.
            if len(value) >= 2 and value[0] == value[-1] and value[0] in "\"'":
                value = value[1:-1].strip()
            if value:
                return value
    return ""
def parse_image(file_path: str, project_dir: str = ".") -> dict:
    """Extract text from an image via the Gemini Vision API.

    The image is base64-encoded and sent inline to the ``gemini-2.0-flash``
    ``generateContent`` endpoint together with an OCR prompt. Every failure
    (missing key, unreadable file, HTTP/network error, malformed or empty
    response) is reported as ``{"error": "..."}`` rather than raised, so the
    caller can always serialize the result as JSON.

    Args:
        file_path: Path of the image to parse.
        project_dir: Directory searched for a ``.env`` file holding the key.

    Returns:
        On success a dict with ``content_md`` (Markdown text headed by the
        file stem) and ``metadata``; on failure a dict with a single
        ``error`` key.
    """
    path = Path(file_path)
    proj = Path(project_dir).resolve()
    api_key = load_api_key(proj)
    if not api_key:
        return {"error": "GEMINI_API_KEY not configured. Set it in .env or environment."}

    # Read and encode the image; report I/O problems instead of crashing.
    try:
        image_data = base64.b64encode(path.read_bytes()).decode("ascii")
    except OSError as e:
        return {"error": f"Cannot read image file: {e}"}

    # Unknown extensions keep the historical fallback of image/png.
    ext = path.suffix.lower()
    mime_map = {
        ".png": "image/png",
        ".jpg": "image/jpeg",
        ".jpeg": "image/jpeg",
        ".webp": "image/webp",
        ".gif": "image/gif",
    }
    mime_type = mime_map.get(ext, "image/png")

    url = (
        "https://generativelanguage.googleapis.com/v1beta/models/"
        "gemini-2.0-flash:generateContent"
    )
    payload = {
        "contents": [{
            "parts": [
                {"text": (
                    "Extract ALL text from this image. Preserve the layout as much as possible. "
                    "If there are tables, convert them to markdown tables. "
                    "If there are form fields, identify labels and values. "
                    "Output the extracted content as clean markdown. "
                    "Also identify any key-value pairs (like Name: John) and list them at the end "
                    "in a section called '## Extracted Key-Value Pairs' as a markdown table."
                )},
                {"inlineData": {"mimeType": mime_type, "data": image_data}},
            ]
        }]
    }
    req = urllib.request.Request(
        url,
        data=json.dumps(payload).encode("utf-8"),
        headers={"Content-Type": "application/json", "x-goog-api-key": api_key},
        method="POST",
    )
    try:
        with urllib.request.urlopen(req, timeout=60) as resp:
            result = json.loads(resp.read().decode("utf-8"))
    except urllib.error.HTTPError as e:
        # Truncate so a large error page cannot flood the JSON output.
        body = e.read().decode("utf-8", errors="replace")[:500]
        return {"error": f"Gemini API error ({e.code}): {body}"}
    except urllib.error.URLError as e:
        return {"error": f"Gemini API connection error: {e}"}
    except OSError as e:
        # Read timeouts and connection resets while receiving the body are
        # raised as plain OSError subclasses, not wrapped in URLError.
        return {"error": f"Gemini API connection error: {e}"}
    except ValueError as e:
        # JSONDecodeError and UnicodeDecodeError are both ValueError subclasses.
        return {"error": f"Gemini API returned an invalid response: {e}"}

    # Extract text from the first candidate.
    candidates = result.get("candidates", []) if isinstance(result, dict) else []
    if not candidates:
        return {"error": "Gemini returned no response"}
    parts = candidates[0].get("content", {}).get("parts", [])
    extracted_text = "".join(part["text"] for part in parts if "text" in part)
    if not extracted_text.strip():
        return {"error": "No text could be extracted from the image"}

    # Heuristic key-value extraction: any non-heading line of the form
    # "label: value" with a short label; table pipes around either side
    # are stripped.
    key_value_pairs = {}
    for line in extracted_text.split("\n"):
        if ":" not in line or line.startswith("#"):
            continue
        raw_label, _, raw_value = line.partition(":")
        label = raw_label.strip().strip("|").strip()
        value = raw_value.strip().strip("|").strip()
        if label and value and len(label) < 50:
            key_value_pairs[label] = value

    content_md = f"# {path.stem}\n\n{extracted_text}"
    return {
        "content_md": content_md,
        "metadata": {
            "file_name": path.name,
            "file_type": ext.lstrip("."),
            "parse_date": datetime.now().isoformat(),
            "key_value_pairs": key_value_pairs,
            "sections": ["OCR Content"],
            "parse_method": "gemini_vision",
        },
    }
def main():
    """CLI entry point: parse one image and print the result as JSON on stdout.

    Usage: ``parse_image_with_gemini.py <image> [--project-dir <dir>]``.
    Exits with status 1 on a usage error, when the input is not an existing
    file, or when parsing returns an error dict; the error dict is still
    printed to stdout as JSON in the latter two cases.
    """
    if len(sys.argv) < 2:
        print("Usage: python parse_image_with_gemini.py <image> [--project-dir <dir>]",
              file=sys.stderr)
        sys.exit(1)
    file_path = sys.argv[1]
    project_dir = "."
    if "--project-dir" in sys.argv:
        idx = sys.argv.index("--project-dir")
        # A trailing flag with no value keeps the default project dir.
        if idx + 1 < len(sys.argv):
            project_dir = sys.argv[idx + 1]
    # is_file() also rejects directories, which open() could not read anyway.
    if not Path(file_path).is_file():
        print(json.dumps({"error": f"File not found: {file_path}"}, ensure_ascii=False))
        sys.exit(1)
    result = parse_image(file_path, project_dir)
    print(json.dumps(result, ensure_ascii=False, indent=2))
    # Signal failure through the exit status too, as the not-found path does.
    if "error" in result:
        sys.exit(1)


if __name__ == "__main__":
    main()

package/optional-skills/dokkit/scripts/parse_xlsx.py ADDED Viewed

@@ -0,0 +1,98 @@
+#!/usr/bin/env python3
+"""Parse XLSX files into Dokkit's dual-file format (Markdown + JSON sidecar).
+Usage:
+    python parse_xlsx.py <input.xlsx>
+Output:
+    JSON to stdout with 'content_md' and 'metadata' fields.
+Requires:
+    pip install openpyxl
+"""
+import json
+import sys
+from datetime import datetime
+from pathlib import Path
+try:
+    import openpyxl
+except ImportError:
+    print(json.dumps({
+        "error": "openpyxl not installed. Run: pip install openpyxl"
+    }))
+    sys.exit(1)
def parse_xlsx(file_path: str) -> dict:
    """Parse an XLSX workbook into Markdown content plus metadata.

    Each sheet becomes a ``## <sheet name>`` section containing a Markdown
    table whose header is the sheet's first row. Rows after the first whose
    first two cells are both non-blank also feed ``key_value_pairs`` when the
    first cell is a short (< 50 chars), non-numeric label. Later rows and
    sheets overwrite earlier entries with the same label.

    Args:
        file_path: Path of the ``.xlsx`` file to read.

    Returns:
        A dict with ``content_md`` (Markdown headed by the file stem) and
        ``metadata`` (file name, type, parse date, key-value pairs, sheet
        names and sheet count).
    """
    path = Path(file_path)
    wb = openpyxl.load_workbook(path, data_only=True)

    def as_text(cell) -> str:
        # Empty cells come back as None; render them as empty strings.
        return "" if cell is None else str(cell)

    def as_table_cell(text: str) -> str:
        # A raw "|" would start a new column and a line break would end the
        # row, so escape the former and fold the latter into <br>.
        return "<br>".join(text.replace("|", "\\|").splitlines())

    def table_row(cells) -> str:
        return "| " + " | ".join(as_table_cell(c) for c in cells) + " |"

    sections = []
    all_content = []
    key_value_pairs = {}
    try:
        sheet_names = list(wb.sheetnames)
        for sheet_name in sheet_names:
            ws = wb[sheet_name]
            sections.append(sheet_name)
            all_content.append(f"## {sheet_name}\n")
            rows = list(ws.iter_rows(values_only=True))
            if not rows:
                all_content.append("*(empty sheet)*\n")
                continue

            # The first row is always treated as the table header.
            headers = [as_text(c) for c in rows[0]]
            all_content.append(table_row(headers))
            all_content.append("| " + " | ".join(["---"] * len(headers)) + " |")

            for row in rows[1:]:
                cells = [as_text(c) for c in row]
                all_content.append(table_row(cells))
                if len(cells) < 2:
                    continue
                # Key-value pairs keep the raw (unescaped) cell text.
                label = cells[0].strip()
                value = cells[1].strip()
                if (label and value and len(label) < 50
                        and not label.replace(" ", "").isdigit()):
                    key_value_pairs[label] = value
            all_content.append("")
    finally:
        # Release the underlying file handle even if a sheet fails to parse.
        wb.close()

    content_md = f"# {path.stem}\n\n" + "\n".join(all_content)
    return {
        "content_md": content_md,
        "metadata": {
            "file_name": path.name,
            "file_type": "xlsx",
            "parse_date": datetime.now().isoformat(),
            "key_value_pairs": key_value_pairs,
            "sections": sections,
            "sheet_count": len(sheet_names),
        },
    }
def main():
    """CLI entry point: parse one XLSX file and print the result as JSON.

    Usage: ``parse_xlsx.py <input.xlsx>``. Exits with status 1 on a usage
    error, when the input is not an existing file, or when the workbook
    cannot be parsed; in the latter two cases an ``{"error": ...}`` object is
    printed to stdout so the caller always receives JSON.
    """
    if len(sys.argv) != 2:
        print("Usage: python parse_xlsx.py <input.xlsx>", file=sys.stderr)
        sys.exit(1)
    file_path = sys.argv[1]
    # is_file() also rejects directories, which cannot be opened as workbooks.
    if not Path(file_path).is_file():
        print(json.dumps({"error": f"File not found: {file_path}"}, ensure_ascii=False))
        sys.exit(1)
    try:
        result = parse_xlsx(file_path)
    except Exception as e:
        # Top-level boundary: a corrupt or non-XLSX file must still yield
        # the JSON error contract instead of a traceback.
        print(json.dumps({"error": f"Failed to parse XLSX: {e}"}, ensure_ascii=False))
        sys.exit(1)
    print(json.dumps(result, ensure_ascii=False, indent=2))


if __name__ == "__main__":
    main()

package/optional-skills/dokkit/scripts/source_images.py ADDED Viewed

@@ -0,0 +1,365 @@
+#!/usr/bin/env python3
+"""Generate or search images for dokkit template filling.
+Usage:
+    python source_images.py generate \\
+        --prompt "인포그래픽 제목: AI 감정 케어 플랫폼" \\
+        --preset infographic \\
+        --output-dir .dokkit/images/ \\
+        --project-dir . \\
+        [--lang ko] \\
+        [--aspect-ratio 16:9] \\
+        [--no-enhance]
+    python source_images.py search \\
+        --query "company logo example" \\
+        --output-dir .dokkit/images/
+Language options (--lang):
+    ko        Korean only (default). All text in generated images will be Korean.
+    en        English only. All text in generated images will be English.
+    ko+en     Mixed Korean and English. Titles in Korean, technical terms in English.
+    ja        Japanese only.
+    <code>    Any ISO 639-1 language code.
+    <a>+<b>   Mixed: primary language + secondary language.
+Output:
+    Prints __RESULT__ JSON to stdout:
+    {"image_id": "...", "file_path": "...", "source_type": "generated"|"searched"}
+Requires:
+    GEMINI_API_KEY in .env or environment variables.
+"""
+import base64
+import json
+import os
+import sys
+import urllib.error
+import urllib.request
+import uuid
+from pathlib import Path
# Gemini model identifier used for image generation requests.
IMAGE_MODEL = "gemini-3-pro-image-preview"

# Display names, keyed by language code, that get substituted into prompts.
LANG_NAMES = dict(
    ko="한국어",
    en="English",
    ja="日本語",
    zh="中文",
    es="español",
    fr="français",
    de="Deutsch",
    pt="português",
)

# Style presets: each maps a preset name to the style text prepended to the
# prompt and the aspect ratio used when the caller does not override it.
PRESETS = {
    name: {"style": style, "aspect_ratio": ratio}
    for name, style, ratio in (
        (
            "technical_illustration",
            "깔끔한 기술 다이어그램 스타일. 선명한 선, 레이블이 있는 구성요소, 전문적인 색상.",
            "16:9",
        ),
        (
            "infographic",
            "전문적인 인포그래픽 스타일. 아이콘 기반, 깔끔한 레이아웃, 기업용 색상 팔레트.",
            "16:9",
        ),
        (
            "photorealistic",
            "사실적인 사진 스타일. 고품질, 자연스러운 조명.",
            "4:3",
        ),
        (
            "concept",
            "개념적 일러스트레이션 스타일. 추상적/모던, 비즈니스 제안서에 적합.",
            "1:1",
        ),
        (
            "chart",
            "깔끔한 차트/그래프 스타일. 정확한 데이터 시각화, 전문적 색상.",
            "16:9",
        ),
    )
}
def load_api_key(project_dir: Path) -> str:
    """Load the Gemini API key from the environment or a project ``.env`` file.

    The ``GEMINI_API_KEY`` environment variable takes precedence. When it is
    unset or blank, ``<project_dir>/.env`` is scanned line by line for a
    ``GEMINI_API_KEY=`` assignment. An optional leading ``export `` and one
    pair of matching surrounding quotes are stripped from the value.

    Args:
        project_dir: Directory expected to contain the ``.env`` file.

    Returns:
        The API key, or an empty string when no non-empty key is found.
    """
    key = os.environ.get("GEMINI_API_KEY", "").strip()
    if key:
        return key

    env_path = project_dir / ".env"
    if not env_path.is_file():
        return ""

    # utf-8-sig tolerates a byte-order mark at the start of the file, which
    # would otherwise hide an assignment on the very first line.
    with open(env_path, encoding="utf-8-sig") as f:
        for line in f:
            line = line.strip()
            # Accept the shell-style "export KEY=value" form as well.
            if line.startswith("export "):
                line = line[len("export "):].lstrip()
            if not line.startswith("GEMINI_API_KEY="):
                continue
            value = line.split("=", 1)[1].strip()
            # .env files commonly quote values; the quotes are not part of the key.
            if len(value) >= 2 and value[0] == value[-1] and value[0] in "\"'":
                value = value[1:-1].strip()
            if value:
                return value
    return ""
def build_lang_instruction(lang: str) -> str:
    """Build the language-rule paragraph appended to an image prompt.

    ``lang`` is either a single code (``'ko'``, ``'en'``, ``'ja'``, ...) or a
    ``primary+secondary`` pair (``'ko+en'``). Codes are matched
    case-insensitively against ``LANG_NAMES``; unknown codes are inserted
    into the instruction verbatim. Blank halves of a pair are ignored, so
    ``'ko+'`` behaves like ``'ko'``, and a completely blank value falls back
    to ``'ko'``, the default used by ``generate_image``.

    Args:
        lang: Language code, or two codes joined with ``+``.

    Returns:
        Instruction text beginning with two newlines.
    """
    def display_name(code: str) -> str:
        return LANG_NAMES.get(code.lower(), code)

    # Split at the first "+" only, then drop empty halves so that inputs like
    # "ko+" or "+en" never yield a sentence with a missing language name.
    codes = [part.strip() for part in (lang or "").split("+", 1)]
    codes = [code for code in codes if code]
    if not codes:
        codes = ["ko"]

    if len(codes) == 2:
        primary_name = display_name(codes[0])
        secondary_name = display_name(codes[1])
        return (
            f"\n\n[언어 규칙] 이미지의 텍스트는 {primary_name}를 기본으로 하되, "
            f"기술 용어나 고유명사는 {secondary_name}를 사용할 수 있습니다. "
            f"제목과 설명은 반드시 {primary_name}로 작성하세요."
        )

    code = codes[0].lower()
    if code == "ko":
        return (
            "\n\n[언어 규칙] 이미지의 모든 텍스트는 반드시 한국어로만 작성해야 합니다. "
            "영어 텍스트를 절대 사용하지 마세요. 제목, 라벨, 설명, 주석 등 "
            "모든 텍스트 요소를 한국어로 작성하세요."
        )
    if code == "en":
        return (
            "\n\n[Language Rule] All text in the image must be written in English only. "
            "Do not use any other language. Titles, labels, descriptions, and annotations "
            "must all be in English."
        )
    lang_name = display_name(codes[0])
    return (
        f"\n\n[Language Rule] All text in the image must be written in {lang_name} only. "
        f"Do not use any other language."
    )
def enhance_prompt(prompt: str, preset: str, lang: str, no_enhance: bool) -> str:
    """Compose the final prompt from style preset, user prompt and language rule.

    Args:
        prompt: User-provided prompt text.
        preset: Preset name looked up in ``PRESETS``; unknown names add no style.
        lang: Language code passed to ``build_lang_instruction``.
        no_enhance: When true, the preset style line is omitted; the language
            instruction is appended regardless.

    Returns:
        The pieces joined with blank lines, in the order
        style (optional), prompt, language instruction.
    """
    apply_style = (not no_enhance) and preset in PRESETS
    style_section = [f"[스타일] {PRESETS[preset]['style']}"] if apply_style else []
    return "\n\n".join([*style_section, prompt, build_lang_instruction(lang)])
def generate_image(
    prompt: str,
    preset: str,
    output_dir: str,
    project_dir: str = ".",
    lang: str = "ko",
    aspect_ratio: str = "",
    no_enhance: bool = False,
) -> dict:
    """Generate an image with the Gemini image model and save it to disk.

    The prompt is enhanced with the preset style and a language rule, an
    aspect-ratio hint is appended, and the first inline image found in the
    first response candidate is written to ``output_dir`` under a random
    ``gen_<8 hex chars>`` name. Failures are returned as ``{"error": ...}``
    rather than raised.

    Args:
        prompt: Image generation prompt.
        preset: Style preset name (a key of ``PRESETS``).
        output_dir: Directory to save the generated image; created if missing.
        project_dir: Project root (for ``.env`` lookup).
        lang: Language code for text in images.
        aspect_ratio: Aspect ratio override (e.g. ``'16:9'``); when empty the
            preset's ratio is used, falling back to ``'16:9'``.
        no_enhance: Skip preset style enhancement.

    Returns:
        On success a dict with ``image_id``, ``file_path``, ``source_type``,
        ``file_size``, ``lang``, ``preset`` and ``model``; otherwise a dict
        with a single ``error`` key.
    """
    proj = Path(project_dir).resolve()
    api_key = load_api_key(proj)
    if not api_key:
        return {"error": "GEMINI_API_KEY not configured. Set it in .env or environment."}

    full_prompt = enhance_prompt(prompt, preset, lang, no_enhance)

    # Resolve aspect ratio: explicit override > preset default > 16:9.
    if not aspect_ratio and preset in PRESETS:
        aspect_ratio = PRESETS[preset]["aspect_ratio"]
    if not aspect_ratio:
        aspect_ratio = "16:9"

    # The ratio is conveyed to the model as a prompt hint.
    full_prompt += f"\n\n[이미지 비율] {aspect_ratio} 비율로 생성해주세요."

    url = (
        "https://generativelanguage.googleapis.com/v1beta/models/"
        f"{IMAGE_MODEL}:generateContent"
    )
    payload = {
        "contents": [{"parts": [{"text": full_prompt}]}],
        "generationConfig": {"responseModalities": ["image", "text"]},
    }
    # Send the key as a header, not a query parameter, so it does not end up
    # in URLs recorded by proxies, access logs or error messages.
    req = urllib.request.Request(
        url,
        data=json.dumps(payload).encode("utf-8"),
        headers={"Content-Type": "application/json", "x-goog-api-key": api_key},
        method="POST",
    )
    try:
        with urllib.request.urlopen(req, timeout=180) as resp:
            result = json.loads(resp.read().decode("utf-8"))
    except urllib.error.HTTPError as e:
        body = e.read().decode("utf-8", errors="replace")[:500]
        return {"error": f"Gemini API error ({e.code}): {body}"}
    except urllib.error.URLError as e:
        return {"error": f"Gemini API connection error: {e}"}
    except OSError as e:
        # Read timeouts and connection resets while receiving the body are
        # raised as plain OSError subclasses, not wrapped in URLError.
        return {"error": f"Gemini API connection error: {e}"}
    except ValueError as e:
        # JSONDecodeError and UnicodeDecodeError are both ValueError subclasses.
        return {"error": f"Gemini API returned an invalid response: {e}"}

    candidates = result.get("candidates", []) if isinstance(result, dict) else []
    if not candidates:
        return {"error": "Gemini returned no candidates"}

    # Known image MIME types; anything else falls back to the PNG/JPEG guess.
    ext_by_mime = {
        "image/png": ".png",
        "image/jpeg": ".jpg",
        "image/jpg": ".jpg",
        "image/webp": ".webp",
        "image/gif": ".gif",
    }
    parts = candidates[0].get("content", {}).get("parts", [])
    for part in parts:
        inline = part.get("inlineData") if isinstance(part, dict) else None
        if not inline:
            continue
        img_b64 = inline.get("data", "")
        if not img_b64:
            continue
        mime = inline.get("mimeType", "image/png")
        try:
            img_bytes = base64.b64decode(img_b64)
        except ValueError as e:  # binascii.Error subclasses ValueError
            return {"error": f"Gemini returned undecodable image data: {e}"}

        ext = ext_by_mime.get(mime.lower(), ".png" if "png" in mime else ".jpg")
        image_id = f"gen_{uuid.uuid4().hex[:8]}"
        out_path = Path(output_dir)
        file_path = out_path / f"{image_id}{ext}"
        try:
            out_path.mkdir(parents=True, exist_ok=True)
            file_path.write_bytes(img_bytes)
        except OSError as e:
            return {"error": f"Cannot write image file: {e}"}
        return {
            "image_id": image_id,
            "file_path": str(file_path),
            "source_type": "generated",
            "file_size": len(img_bytes),
            "lang": lang,
            "preset": preset,
            "model": IMAGE_MODEL,
        }
    return {"error": "No image data in Gemini response"}
def search_image(query: str, output_dir: str) -> dict:
    """Placeholder for image search; always reports that it is unavailable.

    Neither argument is used. The returned dict carries only an ``error``
    message telling the user to supply images manually.
    """
    message = (
        "Image search is not yet implemented. "
        "Please provide images manually via '/dokkit modify \"use <file>\"'."
    )
    return {"error": message}
def parse_args(argv: list) -> dict:
    """Turn a raw argument vector into an options dict.

    ``argv[1]`` is stored under ``command``. Recognised ``--flag value``
    pairs are stored under their snake_case name, ``--no-enhance`` sets
    ``no_enhance`` to True, and anything else (including a value flag that
    is the last token) is skipped. With fewer than two entries a dict
    holding only a usage ``error`` is returned.
    """
    if len(argv) < 2:
        return {"error": "Usage: source_images.py <generate|search> [options]"}

    # Flags that consume the following token as their value.
    value_flags = {
        "--prompt": "prompt",
        "--preset": "preset",
        "--output-dir": "output_dir",
        "--project-dir": "project_dir",
        "--lang": "lang",
        "--aspect-ratio": "aspect_ratio",
        "--query": "query",
    }

    parsed = {"command": argv[1]}
    total = len(argv)
    pos = 2
    while pos < total:
        token = argv[pos]
        dest = value_flags.get(token)
        if dest is not None and pos + 1 < total:
            parsed[dest] = argv[pos + 1]
            pos += 2
            continue
        if token == "--no-enhance":
            parsed["no_enhance"] = True
        pos += 1
    return parsed
def main():
    """CLI entry point for the ``generate`` and ``search`` commands.

    Usage problems (no command, missing ``--prompt`` / ``--query``) are
    printed as JSON to stderr and exit with status 1. Otherwise the command
    result is printed to stdout prefixed with ``__RESULT__``, and the process
    exits with status 1 when that result contains an ``error`` key.
    """
    def abort(payload: dict) -> None:
        # Usage-level failure: JSON on stderr, no __RESULT__ marker.
        print(json.dumps(payload), file=sys.stderr)
        sys.exit(1)

    args = parse_args(sys.argv)
    if "error" in args:
        abort(args)

    command = args.get("command")
    if command == "generate":
        prompt = args.get("prompt")
        if not prompt:
            abort({"error": "Missing --prompt"})
        result = generate_image(
            prompt=prompt,
            preset=args.get("preset", "infographic"),
            output_dir=args.get("output_dir", ".dokkit/images/"),
            project_dir=args.get("project_dir", "."),
            lang=args.get("lang", "ko"),
            aspect_ratio=args.get("aspect_ratio", ""),
            no_enhance=args.get("no_enhance", False),
        )
    elif command == "search":
        query = args.get("query")
        if not query:
            abort({"error": "Missing --query"})
        result = search_image(
            query=query,
            output_dir=args.get("output_dir", ".dokkit/images/"),
        )
    else:
        result = {"error": f"Unknown command: {command}. Use 'generate' or 'search'."}

    # The __RESULT__ marker lets the calling agent locate the JSON payload.
    serialized = json.dumps(result, ensure_ascii=False)
    print(f"__RESULT__{serialized}")
    if "error" in result:
        sys.exit(1)


if __name__ == "__main__":
    main()