npm - kordoc - Versions diffs - 1.7.2 → 1.9.0 - Mend

kordoc 1.7.2 → 1.9.0

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.

Files changed (27)

package/README.md +36 -15
package/dist/chunk-AHW56LNX.js +93 -0
package/dist/chunk-AHW56LNX.js.map +1 -0
package/dist/{chunk-NJ3R7LNR.js → chunk-MDRW3HYC.js} +1165 -234
package/dist/chunk-MDRW3HYC.js.map +1 -0
package/dist/chunk-MOL7MDBG.js +35 -0
package/dist/chunk-MOL7MDBG.js.map +1 -0
package/dist/cli.js +11 -7
package/dist/cli.js.map +1 -1
package/dist/index.cjs +1253 -195
package/dist/index.cjs.map +1 -1
package/dist/index.d.cts +17 -5
package/dist/index.d.ts +17 -5
package/dist/index.js +1248 -194
package/dist/index.js.map +1 -1
package/dist/mcp.js +10 -7
package/dist/mcp.js.map +1 -1
package/dist/page-range-737B4EZW.js +8 -0
package/dist/page-range-737B4EZW.js.map +1 -0
package/dist/provider-A4FHJSID.js +0 -0
package/dist/utils-VU6Z7HNR.js +22 -0
package/dist/utils-VU6Z7HNR.js.map +1 -0
package/dist/{watch-AKTZTPVF.js → watch-5IOZWFDD.js} +13 -5
package/dist/watch-5IOZWFDD.js.map +1 -0
package/package.json +77 -75
package/dist/chunk-NJ3R7LNR.js.map +0 -1
package/dist/watch-AKTZTPVF.js.map +0 -1

package/dist/index.d.cts (changed)

@@ -61,6 +61,7 @@ interface IRTable {
     rows: number;
     cols: number;
     cells: IRCell[][];
+    /** 첫 행을 헤더로 렌더링할지 여부 (현재: rows > 1이면 true — 의미적 감지가 아닌 레이아웃 힌트) */
     hasHeader: boolean;
 }
 interface IRCell {
@@ -124,10 +125,10 @@ interface OutlineItem {
 }
 /** 구조화된 에러 코드 — 프로그래밍적 에러 핸들링용 */
 type ErrorCode = "EMPTY_INPUT" | "UNSUPPORTED_FORMAT" | "ENCRYPTED" | "DRM_PROTECTED" | "CORRUPTED" | "DECOMPRESSION_BOMB" | "ZIP_BOMB" | "IMAGE_BASED_PDF" | "NO_SECTIONS" | "PARSE_ERROR";
-type FileType = "hwpx" | "hwp" | "pdf" | "unknown";
+type FileType = "hwpx" | "hwp" | "pdf" | "xlsx" | "docx" | "unknown";
 interface ParseResultBase {
     fileType: FileType;
-    /** PDF 페이지 수 */
+    /** 페이지/섹션 수 — PDF: 실제 페이지 수, HWP/HWPX: 섹션 수, XLSX: 시트 수 */
     pageCount?: number;
     /** 이미지 기반 PDF 여부 (텍스트 추출 불가) */
     isImageBased?: boolean;
@@ -252,14 +253,21 @@ declare function markdownToHwpx(markdown: string): Promise<ArrayBuffer>;
 /** 매직 바이트 기반 파일 포맷 감지 */
-/** HWPX (ZIP 기반 한컴 문서): PK\x03\x04 */
+/** ZIP 파일 여부: PK\x03\x04 */
+declare function isZipFile(buffer: ArrayBuffer): boolean;
+/** HWPX (ZIP 기반 한컴 문서): PK\x03\x04 — 하위 호환용 */
 declare function isHwpxFile(buffer: ArrayBuffer): boolean;
 /** HWP 5.x (OLE2 바이너리 한컴 문서): \xD0\xCF\x11\xE0 */
 declare function isOldHwpFile(buffer: ArrayBuffer): boolean;
 /** PDF 문서: %PDF */
 declare function isPdfFile(buffer: ArrayBuffer): boolean;
-/** 버퍼로부터 파일 포맷 감지 */
+/** 동기 포맷 감지 — ZIP은 모두 "hwpx"로 반환 (하위 호환) */
 declare function detectFormat(buffer: ArrayBuffer): FileType;
+/**
+ * ZIP 내부 구조 기반 포맷 세분화.
+ * HWPX, XLSX, DOCX 모두 ZIP이므로 내부 파일로 구분.
+ */
+declare function detectZipFormat(buffer: ArrayBuffer): Promise<"hwpx" | "xlsx" | "docx" | "unknown">;
 /** 2-pass colSpan/rowSpan 테이블 빌더 및 Markdown 변환 */
@@ -293,5 +301,9 @@ declare function parseHwpx(buffer: ArrayBuffer, options?: ParseOptions): Promise
 declare function parseHwp(buffer: ArrayBuffer, options?: ParseOptions): Promise<ParseResult>;
 /** PDF 파일에서 텍스트를 추출하여 Markdown으로 변환 */
 declare function parsePdf(buffer: ArrayBuffer, options?: ParseOptions): Promise<ParseResult>;
+/** XLSX 파일을 Markdown으로 변환 */
+declare function parseXlsx(buffer: ArrayBuffer, options?: ParseOptions): Promise<ParseResult>;
+/** DOCX 파일을 Markdown으로 변환 */
+declare function parseDocx(buffer: ArrayBuffer, options?: ParseOptions): Promise<ParseResult>;
-export { type BlockDiff, type BoundingBox, type CellContext, type CellDiff, type DiffChangeType, type DiffResult, type DocumentMetadata, type ErrorCode, type ExtractedImage, type FileType, type FormField, type FormResult, type IRBlock, type IRBlockType, type IRCell, type IRTable, type ImageData, type InlineStyle, type OcrProvider, type OutlineItem, type ParseFailure, type ParseOptions, type ParseResult, type ParseSuccess, type ParseWarning, VERSION, type WarningCode, type WatchOptions, blocksToMarkdown, compare, detectFormat, diffBlocks, extractFormFields, isHwpxFile, isOldHwpFile, isPdfFile, markdownToHwpx, parse, parseHwp, parseHwpx, parsePdf };
+export { type BlockDiff, type BoundingBox, type CellContext, type CellDiff, type DiffChangeType, type DiffResult, type DocumentMetadata, type ErrorCode, type ExtractedImage, type FileType, type FormField, type FormResult, type IRBlock, type IRBlockType, type IRCell, type IRTable, type ImageData, type InlineStyle, type OcrProvider, type OutlineItem, type ParseFailure, type ParseOptions, type ParseResult, type ParseSuccess, type ParseWarning, VERSION, type WarningCode, type WatchOptions, blocksToMarkdown, compare, detectFormat, detectZipFormat, diffBlocks, extractFormFields, isHwpxFile, isOldHwpFile, isPdfFile, isZipFile, markdownToHwpx, parse, parseDocx, parseHwp, parseHwpx, parsePdf, parseXlsx };

package/dist/index.d.ts (changed)

@@ -61,6 +61,7 @@ interface IRTable {
     rows: number;
     cols: number;
     cells: IRCell[][];
+    /** 첫 행을 헤더로 렌더링할지 여부 (현재: rows > 1이면 true — 의미적 감지가 아닌 레이아웃 힌트) */
     hasHeader: boolean;
 }
 interface IRCell {
@@ -124,10 +125,10 @@ interface OutlineItem {
 }
 /** 구조화된 에러 코드 — 프로그래밍적 에러 핸들링용 */
 type ErrorCode = "EMPTY_INPUT" | "UNSUPPORTED_FORMAT" | "ENCRYPTED" | "DRM_PROTECTED" | "CORRUPTED" | "DECOMPRESSION_BOMB" | "ZIP_BOMB" | "IMAGE_BASED_PDF" | "NO_SECTIONS" | "PARSE_ERROR";
-type FileType = "hwpx" | "hwp" | "pdf" | "unknown";
+type FileType = "hwpx" | "hwp" | "pdf" | "xlsx" | "docx" | "unknown";
 interface ParseResultBase {
     fileType: FileType;
-    /** PDF 페이지 수 */
+    /** 페이지/섹션 수 — PDF: 실제 페이지 수, HWP/HWPX: 섹션 수, XLSX: 시트 수 */
     pageCount?: number;
     /** 이미지 기반 PDF 여부 (텍스트 추출 불가) */
     isImageBased?: boolean;
@@ -252,14 +253,21 @@ declare function markdownToHwpx(markdown: string): Promise<ArrayBuffer>;
 /** 매직 바이트 기반 파일 포맷 감지 */
-/** HWPX (ZIP 기반 한컴 문서): PK\x03\x04 */
+/** ZIP 파일 여부: PK\x03\x04 */
+declare function isZipFile(buffer: ArrayBuffer): boolean;
+/** HWPX (ZIP 기반 한컴 문서): PK\x03\x04 — 하위 호환용 */
 declare function isHwpxFile(buffer: ArrayBuffer): boolean;
 /** HWP 5.x (OLE2 바이너리 한컴 문서): \xD0\xCF\x11\xE0 */
 declare function isOldHwpFile(buffer: ArrayBuffer): boolean;
 /** PDF 문서: %PDF */
 declare function isPdfFile(buffer: ArrayBuffer): boolean;
-/** 버퍼로부터 파일 포맷 감지 */
+/** 동기 포맷 감지 — ZIP은 모두 "hwpx"로 반환 (하위 호환) */
 declare function detectFormat(buffer: ArrayBuffer): FileType;
+/**
+ * ZIP 내부 구조 기반 포맷 세분화.
+ * HWPX, XLSX, DOCX 모두 ZIP이므로 내부 파일로 구분.
+ */
+declare function detectZipFormat(buffer: ArrayBuffer): Promise<"hwpx" | "xlsx" | "docx" | "unknown">;
 /** 2-pass colSpan/rowSpan 테이블 빌더 및 Markdown 변환 */
@@ -293,5 +301,9 @@ declare function parseHwpx(buffer: ArrayBuffer, options?: ParseOptions): Promise
 declare function parseHwp(buffer: ArrayBuffer, options?: ParseOptions): Promise<ParseResult>;
 /** PDF 파일에서 텍스트를 추출하여 Markdown으로 변환 */
 declare function parsePdf(buffer: ArrayBuffer, options?: ParseOptions): Promise<ParseResult>;
+/** XLSX 파일을 Markdown으로 변환 */
+declare function parseXlsx(buffer: ArrayBuffer, options?: ParseOptions): Promise<ParseResult>;
+/** DOCX 파일을 Markdown으로 변환 */
+declare function parseDocx(buffer: ArrayBuffer, options?: ParseOptions): Promise<ParseResult>;
-export { type BlockDiff, type BoundingBox, type CellContext, type CellDiff, type DiffChangeType, type DiffResult, type DocumentMetadata, type ErrorCode, type ExtractedImage, type FileType, type FormField, type FormResult, type IRBlock, type IRBlockType, type IRCell, type IRTable, type ImageData, type InlineStyle, type OcrProvider, type OutlineItem, type ParseFailure, type ParseOptions, type ParseResult, type ParseSuccess, type ParseWarning, VERSION, type WarningCode, type WatchOptions, blocksToMarkdown, compare, detectFormat, diffBlocks, extractFormFields, isHwpxFile, isOldHwpFile, isPdfFile, markdownToHwpx, parse, parseHwp, parseHwpx, parsePdf };
+export { type BlockDiff, type BoundingBox, type CellContext, type CellDiff, type DiffChangeType, type DiffResult, type DocumentMetadata, type ErrorCode, type ExtractedImage, type FileType, type FormField, type FormResult, type IRBlock, type IRBlockType, type IRCell, type IRTable, type ImageData, type InlineStyle, type OcrProvider, type OutlineItem, type ParseFailure, type ParseOptions, type ParseResult, type ParseSuccess, type ParseWarning, VERSION, type WarningCode, type WatchOptions, blocksToMarkdown, compare, detectFormat, detectZipFormat, diffBlocks, extractFormFields, isHwpxFile, isOldHwpFile, isPdfFile, isZipFile, markdownToHwpx, parse, parseDocx, parseHwp, parseHwpx, parsePdf, parseXlsx };