npm - @llm-translate/cli - Versions diffs - 1.0.0-next.1 - Mend

@llm-translate/cli 1.0.0-next.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (157)

package/.dockerignore +51 -0
package/.env.example +33 -0
package/.github/workflows/docs-pages.yml +57 -0
package/.github/workflows/release.yml +49 -0
package/.translaterc.json +44 -0
package/CLAUDE.md +243 -0
package/Dockerfile +55 -0
package/README.md +371 -0
package/RFC.md +1595 -0
package/dist/cli/index.d.ts +2 -0
package/dist/cli/index.js +4494 -0
package/dist/cli/index.js.map +1 -0
package/dist/index.d.ts +1152 -0
package/dist/index.js +3841 -0
package/dist/index.js.map +1 -0
package/docker-compose.yml +56 -0
package/docs/.vitepress/config.ts +161 -0
package/docs/api/agent.md +262 -0
package/docs/api/engine.md +274 -0
package/docs/api/index.md +171 -0
package/docs/api/providers.md +304 -0
package/docs/changelog.md +64 -0
package/docs/cli/dir.md +243 -0
package/docs/cli/file.md +213 -0
package/docs/cli/glossary.md +273 -0
package/docs/cli/index.md +129 -0
package/docs/cli/init.md +158 -0
package/docs/cli/serve.md +211 -0
package/docs/glossary.json +235 -0
package/docs/guide/chunking.md +272 -0
package/docs/guide/configuration.md +139 -0
package/docs/guide/cost-optimization.md +237 -0
package/docs/guide/docker.md +371 -0
package/docs/guide/getting-started.md +150 -0
package/docs/guide/glossary.md +241 -0
package/docs/guide/index.md +86 -0
package/docs/guide/ollama.md +515 -0
package/docs/guide/prompt-caching.md +221 -0
package/docs/guide/providers.md +232 -0
package/docs/guide/quality-control.md +206 -0
package/docs/guide/vitepress-integration.md +265 -0
package/docs/index.md +63 -0
package/docs/ja/api/agent.md +262 -0
package/docs/ja/api/engine.md +274 -0
package/docs/ja/api/index.md +171 -0
package/docs/ja/api/providers.md +304 -0
package/docs/ja/changelog.md +64 -0
package/docs/ja/cli/dir.md +243 -0
package/docs/ja/cli/file.md +213 -0
package/docs/ja/cli/glossary.md +273 -0
package/docs/ja/cli/index.md +111 -0
package/docs/ja/cli/init.md +158 -0
package/docs/ja/guide/chunking.md +271 -0
package/docs/ja/guide/configuration.md +139 -0
package/docs/ja/guide/cost-optimization.md +30 -0
package/docs/ja/guide/getting-started.md +150 -0
package/docs/ja/guide/glossary.md +214 -0
package/docs/ja/guide/index.md +32 -0
package/docs/ja/guide/ollama.md +410 -0
package/docs/ja/guide/prompt-caching.md +221 -0
package/docs/ja/guide/providers.md +232 -0
package/docs/ja/guide/quality-control.md +137 -0
package/docs/ja/guide/vitepress-integration.md +265 -0
package/docs/ja/index.md +58 -0
package/docs/ko/api/agent.md +262 -0
package/docs/ko/api/engine.md +274 -0
package/docs/ko/api/index.md +171 -0
package/docs/ko/api/providers.md +304 -0
package/docs/ko/changelog.md +64 -0
package/docs/ko/cli/dir.md +243 -0
package/docs/ko/cli/file.md +213 -0
package/docs/ko/cli/glossary.md +273 -0
package/docs/ko/cli/index.md +111 -0
package/docs/ko/cli/init.md +158 -0
package/docs/ko/guide/chunking.md +271 -0
package/docs/ko/guide/configuration.md +139 -0
package/docs/ko/guide/cost-optimization.md +30 -0
package/docs/ko/guide/getting-started.md +150 -0
package/docs/ko/guide/glossary.md +214 -0
package/docs/ko/guide/index.md +32 -0
package/docs/ko/guide/ollama.md +410 -0
package/docs/ko/guide/prompt-caching.md +221 -0
package/docs/ko/guide/providers.md +232 -0
package/docs/ko/guide/quality-control.md +137 -0
package/docs/ko/guide/vitepress-integration.md +265 -0
package/docs/ko/index.md +58 -0
package/docs/zh/api/agent.md +262 -0
package/docs/zh/api/engine.md +274 -0
package/docs/zh/api/index.md +171 -0
package/docs/zh/api/providers.md +304 -0
package/docs/zh/changelog.md +64 -0
package/docs/zh/cli/dir.md +243 -0
package/docs/zh/cli/file.md +213 -0
package/docs/zh/cli/glossary.md +273 -0
package/docs/zh/cli/index.md +111 -0
package/docs/zh/cli/init.md +158 -0
package/docs/zh/guide/chunking.md +271 -0
package/docs/zh/guide/configuration.md +139 -0
package/docs/zh/guide/cost-optimization.md +30 -0
package/docs/zh/guide/getting-started.md +150 -0
package/docs/zh/guide/glossary.md +214 -0
package/docs/zh/guide/index.md +32 -0
package/docs/zh/guide/ollama.md +410 -0
package/docs/zh/guide/prompt-caching.md +221 -0
package/docs/zh/guide/providers.md +232 -0
package/docs/zh/guide/quality-control.md +137 -0
package/docs/zh/guide/vitepress-integration.md +265 -0
package/docs/zh/index.md +58 -0
package/package.json +91 -0
package/release.config.mjs +15 -0
package/schemas/glossary.schema.json +110 -0
package/src/cli/commands/dir.ts +469 -0
package/src/cli/commands/file.ts +291 -0
package/src/cli/commands/glossary.ts +221 -0
package/src/cli/commands/init.ts +68 -0
package/src/cli/commands/serve.ts +60 -0
package/src/cli/index.ts +64 -0
package/src/cli/options.ts +59 -0
package/src/core/agent.ts +1119 -0
package/src/core/chunker.ts +391 -0
package/src/core/engine.ts +634 -0
package/src/errors.ts +188 -0
package/src/index.ts +147 -0
package/src/integrations/vitepress.ts +549 -0
package/src/parsers/markdown.ts +383 -0
package/src/providers/claude.ts +259 -0
package/src/providers/interface.ts +109 -0
package/src/providers/ollama.ts +379 -0
package/src/providers/openai.ts +308 -0
package/src/providers/registry.ts +153 -0
package/src/server/index.ts +152 -0
package/src/server/middleware/auth.ts +93 -0
package/src/server/middleware/logger.ts +90 -0
package/src/server/routes/health.ts +84 -0
package/src/server/routes/translate.ts +210 -0
package/src/server/types.ts +138 -0
package/src/services/cache.ts +899 -0
package/src/services/config.ts +217 -0
package/src/services/glossary.ts +247 -0
package/src/types/analysis.ts +164 -0
package/src/types/index.ts +265 -0
package/src/types/modes.ts +121 -0
package/src/types/mqm.ts +157 -0
package/src/utils/logger.ts +141 -0
package/src/utils/tokens.ts +116 -0
package/tests/fixtures/glossaries/ml-glossary.json +53 -0
package/tests/fixtures/input/lynq-installation.ko.md +350 -0
package/tests/fixtures/input/lynq-installation.md +350 -0
package/tests/fixtures/input/simple.ko.md +27 -0
package/tests/fixtures/input/simple.md +27 -0
package/tests/unit/chunker.test.ts +229 -0
package/tests/unit/glossary.test.ts +146 -0
package/tests/unit/markdown.test.ts +205 -0
package/tests/unit/tokens.test.ts +81 -0
package/tsconfig.json +28 -0
package/tsup.config.ts +34 -0
package/vitest.config.ts +16 -0

package/README.md ADDED

@@ -0,0 +1,371 @@
+# llm-translate
+[![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
+[![Node.js](https://img.shields.io/badge/Node.js-20%2B-green.svg)](https://nodejs.org/)
+[![TypeScript](https://img.shields.io/badge/TypeScript-5.x-blue.svg)](https://www.typescriptlang.org/)
+CLI-based document translation tool powered by Large Language Models with glossary enforcement and quality-aware refinement.
+## Highlights
+- **Glossary-Enforced Consistency** - Domain-specific terminology is translated consistently across documents
+- **Self-Refine Quality Loop** - Iterative improvement until target quality threshold is met
+- **Structure Preservation** - AST-based processing maintains Markdown formatting integrity
+- **Unix-Friendly** - Supports stdin/stdout for pipeline integration
+## Installation
+```bash
+npm install -g @llm-translate/cli
+```
+Or run directly with npx:
+```bash
+npx @llm-translate/cli file README.md -s en -t ko
+```
+## Quick Start
+```bash
+# Set your API key
+export ANTHROPIC_API_KEY=your-api-key
+# Translate a single file
+llm-translate file README.md -s en -t ko -o README.ko.md
+# Use stdin/stdout pipeline
+cat doc.md | llm-translate file - -s en -t ja > doc.ja.md
+# With glossary for consistent terminology
+llm-translate file guide.md -s en -t ko -g glossary.json -o guide.ko.md
+```
+## How It Works
+llm-translate uses a **Self-Refine** translation algorithm:
+```mermaid
+flowchart TD
+    A[📄 Input Document] --> B[1. PREPARE]
+    B --> |Load glossary & extract text| C[2. TRANSLATE]
+    C --> |Initial translation with glossary| D[3. EVALUATE]
+    D --> E{Quality >= Threshold?}
+    E --> |Yes| F[✅ Output Translation]
+    E --> |No| G[4. REFLECT]
+    G --> |Generate critique| H[5. IMPROVE]
+    H --> |Apply suggestions| I{Max iterations?}
+    I --> |No| D
+    I --> |Yes| F
+    style A fill:#e1f5fe
+    style F fill:#c8e6c9
+    style E fill:#fff9c4
+    style I fill:#fff9c4
+```
+**Quality Evaluation Criteria:**
+| Criteria | Weight | Description |
+|----------|--------|-------------|
+| Semantic Accuracy | 40% | Meaning preservation from source |
+| Fluency | 25% | Natural expression in target language |
+| Glossary Compliance | 20% | Correct use of glossary terms |
+| Format Preservation | 15% | Markdown structure integrity |
+## CLI Usage
+### `llm-translate file <input> [output]`
+Translate a single file.
+```bash
+# Basic usage
+llm-translate file guide.md -s en -t ko -o guide.ko.md
+# With glossary
+llm-translate file doc.md -s en -t ja -g ./glossary.json
+# Dry run (preview without API calls)
+llm-translate file doc.md -s en -t ko --dry-run
+# JSON output format
+llm-translate file doc.md -s en -t ko --json
+# Adjust quality threshold
+llm-translate file doc.md -s en -t ko --quality 90 --max-iterations 5
+# Verbose output
+llm-translate file doc.md -s en -t ko -v
+```
+**Options:**
+| Option | Description |
+|--------|-------------|
+| `-s, --source-lang <lang>` | Source language code (required) |
+| `-t, --target-lang <lang>` | Target language code (required) |
+| `-o, --output <path>` | Output file path |
+| `-g, --glossary <path>` | Path to glossary JSON file |
+| `-p, --provider <name>` | LLM provider (default: claude) |
+| `-m, --model <name>` | Model name |
+| `-f, --format <type>` | Force format: markdown, html, text |
+| `--quality <number>` | Quality threshold 0-100 (default: 85) |
+| `--max-iterations <n>` | Max refinement iterations (default: 4) |
+| `--chunk-size <tokens>` | Chunk size in tokens (default: 1024) |
+| `--context <text>` | Additional context for translation |
+| `--strict-quality` | Fail if quality threshold not met |
+| `--strict-glossary` | Fail if glossary terms not applied |
+| `--dry-run` | Preview without making API calls |
+| `--json` | Output result as JSON |
+| `--no-cache` | Disable translation cache |
+| `-v, --verbose` | Verbose output |
+| `-q, --quiet` | Suppress non-essential output |
+### `llm-translate init`
+Initialize project configuration.
+```bash
+llm-translate init
+# Creates .translaterc.json with default settings
+```
+### `llm-translate glossary <subcommand>`
+Manage glossary files.
+```bash
+# List all terms
+llm-translate glossary list ./glossary.json
+# List terms for specific language
+llm-translate glossary list ./glossary.json -t ko
+# Validate glossary file
+llm-translate glossary validate ./glossary.json
+# Add a term
+llm-translate glossary add ./glossary.json "machine learning" --target ko:머신러닝
+# Remove a term
+llm-translate glossary remove ./glossary.json "machine learning"
+```
+## Configuration
+Create a `.translaterc.json` file in your project root:
+```json
+{
+  "version": "1.0",
+  "languages": {
+    "source": "en",
+    "targets": ["ko", "ja", "zh"]
+  },
+  "provider": {
+    "default": "claude",
+    "model": "claude-haiku-4-5-20251001"
+  },
+  "quality": {
+    "threshold": 85,
+    "maxIterations": 4
+  },
+  "glossary": {
+    "path": "./glossary.json",
+    "strict": false
+  },
+  "chunking": {
+    "maxTokens": 1024,
+    "overlap": 150
+  }
+}
+```
+Configuration is loaded with this priority:
+1. CLI arguments (highest)
+2. Environment variables
+3. `.translaterc.json`
+4. Defaults (lowest)
+## Glossary Format
+The glossary enforces consistent translation of domain-specific terminology:
+```json
+{
+  "metadata": {
+    "name": "Technical Documentation Glossary",
+    "sourceLang": "en",
+    "targetLangs": ["ko", "ja"],
+    "version": "1.0.0"
+  },
+  "terms": [
+    {
+      "source": "machine learning",
+      "targets": {
+        "ko": "머신러닝",
+        "ja": "機械学習"
+      },
+      "context": "AI/ML domain terminology"
+    },
+    {
+      "source": "API",
+      "targets": {},
+      "doNotTranslate": true
+    },
+    {
+      "source": "frontend",
+      "targets": {
+        "ja": "フロントエンド"
+      },
+      "doNotTranslateFor": ["ko"],
+      "caseSensitive": false
+    }
+  ]
+}
+```
+**Term Options:**
+| Field | Description |
+|-------|-------------|
+| `source` | Source term to match |
+| `targets` | Translation map by language code |
+| `doNotTranslate` | Keep source term for all languages |
+| `doNotTranslateFor` | Keep source term for specific languages |
+| `caseSensitive` | Case-sensitive matching (default: true) |
+| `context` | Usage hint for LLM |
+## Environment Variables
+| Variable | Description |
+|----------|-------------|
+| `ANTHROPIC_API_KEY` | Claude API key |
+| `OPENAI_API_KEY` | OpenAI API key |
+| `OLLAMA_BASE_URL` | Ollama server URL (default: `http://localhost:11434`) |
+## Supported Formats
+| Format | Status | Notes |
+|--------|--------|-------|
+| Markdown | Stable | Full AST-based processing, preserves code blocks, links, tables |
+| Plain Text | Stable | Direct translation |
+| HTML | Planned | Coming soon |
+## Exit Codes
+| Code | Meaning |
+|------|---------|
+| 0 | Success |
+| 1 | General error |
+| 2 | Invalid arguments |
+| 3 | File not found |
+| 4 | Quality threshold not met (with `--strict-quality`) |
+| 5 | Provider/API error |
+| 6 | Glossary validation failed |
+## Development
+### Prerequisites
+- Node.js 20+
+- npm or yarn
+### Setup
+```bash
+# Clone the repository
+git clone https://github.com/selenehyun/llm-translate.git
+cd llm-translate
+# Install dependencies
+npm install
+# Build
+npm run build
+# Run in development mode
+npm run dev
+```
+### Scripts
+```bash
+npm run build       # Build with tsup
+npm run dev         # Watch mode
+npm test            # Run tests
+npm run test:run    # Run tests once
+npm run typecheck   # TypeScript check
+npm run lint        # ESLint
+```
+### Project Structure
+```
+src/
+├── cli/              # CLI entry point and commands
+│   ├── commands/     # file, dir, init, glossary, serve commands
+│   └── options.ts    # Shared CLI options
+├── core/             # Translation engine
+│   ├── engine.ts     # Main translation orchestrator
+│   ├── agent.ts      # Self-refine translation agent
+│   ├── chunker.ts    # Semantic document chunker
+│   └── evaluator.ts  # Quality evaluation
+├── parsers/          # Format-specific parsers
+│   └── markdown.ts   # Markdown AST parser
+├── providers/        # LLM provider adapters
+│   ├── interface.ts  # Provider interface
+│   ├── registry.ts   # Provider registry
+│   ├── claude.ts     # Claude provider
+│   ├── openai.ts     # OpenAI provider
+│   └── ollama.ts     # Ollama provider (local LLMs)
+├── services/         # Supporting services
+│   ├── glossary.ts   # Glossary loading and resolution
+│   ├── config.ts     # Configuration loader
+│   └── cache.ts      # Translation cache
+├── types/            # Type definitions
+└── utils/            # Utilities
+```
+## Roadmap
+### v0.1.0 (Current)
+- [x] Single file translation
+- [x] Claude provider
+- [x] Markdown parser with structure preservation
+- [x] Self-Refine quality loop
+- [x] Glossary enforcement
+- [x] stdin/stdout support
+- [x] Configuration system
+### v0.2.0 (Planned)
+- [ ] OpenAI provider
+- [ ] Ollama provider (local LLMs)
+- [ ] HTML parser
+- [ ] Translation cache
+- [ ] Batch directory processing
+### v0.3.0 (Future)
+- [ ] Parallel file processing
+- [ ] Progress reporting
+- [ ] MCP server integration
+## Contributing
+Contributions are welcome! Please read our contributing guidelines before submitting a PR.
+1. Fork the repository
+2. Create your feature branch (`git checkout -b feature/amazing-feature`)
+3. Commit your changes (`git commit -m 'Add amazing feature'`)
+4. Push to the branch (`git push origin feature/amazing-feature`)
+5. Open a Pull Request
+## License
+MIT License - see [LICENSE](LICENSE) for details.
+## Acknowledgments
+Built with:
+- [Vercel AI SDK](https://sdk.vercel.ai/) - LLM integration
+- [Commander.js](https://github.com/tj/commander.js/) - CLI framework
+- [unified/remark](https://unifiedjs.com/) - Markdown processing
+- [Zod](https://zod.dev/) - Schema validation