@hamster-note/document-parser 0.2.1 → 0.3.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/index.d.ts +26 -2
- package/dist/index.js +14 -1
- package/dist/index.js.map +1 -1
- package/package.json +6 -2
package/dist/index.d.ts
CHANGED
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { IntermediateDocument, Number2 } from "@hamster-note/types";
|
|
1
|
+
import { IntermediateDocument, IntermediateOutline, Number2 } from "@hamster-note/types";
|
|
2
2
|
|
|
3
3
|
//#region src/types/DocumentAnchor.d.ts
|
|
4
4
|
interface DocumentAnchorWithTextId {
|
|
@@ -49,5 +49,29 @@ declare function listRegisteredParsers(): {
|
|
|
49
49
|
parser: DocumentParserConstructor<DocumentParser>;
|
|
50
50
|
}[];
|
|
51
51
|
//#endregion
|
|
52
|
-
|
|
52
|
+
//#region src/Page/index.d.ts
|
|
53
|
+
declare enum RenderViews {
|
|
54
|
+
THUMBNAIL = "thumbnail",
|
|
55
|
+
TEXT = "text",
|
|
56
|
+
}
|
|
57
|
+
interface RenderOptions {
|
|
58
|
+
views: RenderViews[];
|
|
59
|
+
scale: number;
|
|
60
|
+
}
|
|
61
|
+
declare abstract class HamsterPage {
|
|
62
|
+
abstract render(container: HTMLDivElement, options?: RenderOptions): Promise<void>;
|
|
63
|
+
abstract getNumber(): number;
|
|
64
|
+
abstract getSize(scale: number): Number2;
|
|
65
|
+
abstract getPureText(): string;
|
|
66
|
+
}
|
|
67
|
+
//#endregion
|
|
68
|
+
//#region src/Document/index.d.ts
|
|
69
|
+
declare abstract class HamsterDocument {
|
|
70
|
+
abstract getPages(): Promise<HamsterPage[]>;
|
|
71
|
+
abstract getPage(pageNumber: number): Promise<HamsterPage | undefined>;
|
|
72
|
+
abstract getOutline(): Promise<IntermediateOutline | undefined>;
|
|
73
|
+
abstract getCover(): Promise<HTMLCanvasElement | HTMLImageElement>;
|
|
74
|
+
}
|
|
75
|
+
//#endregion
|
|
76
|
+
export { DocumentAnchor, DocumentAnchorWithPosition, DocumentAnchorWithTextId, DocumentParser, DocumentParserConstructor, HamsterDocument, HamsterPage, ParseOptions, ParserInput, RenderOptions, RenderViews, getParserByExt, listRegisteredParsers, parse, registerParser, unregisterParser };
|
|
53
77
|
//# sourceMappingURL=index.d.ts.map
|
package/dist/index.js
CHANGED
|
@@ -62,5 +62,18 @@ function listRegisteredParsers() {
|
|
|
62
62
|
}
|
|
63
63
|
|
|
64
64
|
//#endregion
|
|
65
|
-
|
|
65
|
+
//#region src/Page/index.ts
|
|
66
|
+
let RenderViews = /* @__PURE__ */ function(RenderViews$1) {
|
|
67
|
+
RenderViews$1["THUMBNAIL"] = "thumbnail";
|
|
68
|
+
RenderViews$1["TEXT"] = "text";
|
|
69
|
+
return RenderViews$1;
|
|
70
|
+
}({});
|
|
71
|
+
var HamsterPage = class {};
|
|
72
|
+
|
|
73
|
+
//#endregion
|
|
74
|
+
//#region src/Document/index.ts
|
|
75
|
+
var HamsterDocument = class {};
|
|
76
|
+
|
|
77
|
+
//#endregion
|
|
78
|
+
export { DocumentParser, HamsterDocument, HamsterPage, RenderViews, getParserByExt, listRegisteredParsers, parse, registerParser, unregisterParser };
|
|
66
79
|
//# sourceMappingURL=index.js.map
|
package/dist/index.js.map
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"index.js","names":[],"sources":["../src/Parser/index.ts","../src/register/index.ts"],"sourcesContent":["import type { IntermediateDocument } from '@hamster-note/types'\n\n// 解析器通用输入,兼容 Browser / Worker / Node(Buffer 属于 ArrayBufferView)\nexport type ParserInput = ArrayBuffer | ArrayBufferView | Blob\n\nexport abstract class DocumentParser {\n // 子类必须声明支持的扩展名列表(不带点),用于注册分发\n static readonly exts: readonly string[] = []\n\n /**\n * 将原始输入解析为中间文档结构。\n * - 输入必须是内存态数据(ArrayBuffer / ArrayBufferView / Blob)\n * - 失败时抛出异常;不要返回 undefined。\n */\n abstract encode(input: ParserInput): Promise<IntermediateDocument>\n\n /**\n * 可选:从中间文档逆序列化回原始文件数据。\n * 默认不支持,需要的子类自行实现。\n */\n decode(_intermediateDocument: IntermediateDocument): Promise<ParserInput> {\n return Promise.reject(new Error('decode is not implemented'))\n }\n\n // 将各种输入转换为 ArrayBuffer,方便子类直接消费二进制\n protected static async toArrayBuffer(\n input: ParserInput\n ): Promise<ArrayBuffer> {\n if (input instanceof ArrayBuffer) {\n return input\n }\n if (ArrayBuffer.isView(input)) {\n // 拷贝为独立的 ArrayBuffer,避免 SharedArrayBuffer 兼容性问题\n const buffer = new ArrayBuffer(input.byteLength)\n new Uint8Array(buffer).set(\n new Uint8Array(input.buffer, input.byteOffset, input.byteLength)\n )\n return buffer\n }\n if (typeof Blob !== 'undefined' && input instanceof Blob) {\n return input.arrayBuffer()\n }\n throw new TypeError('Unsupported parser input')\n }\n\n // 子类若需要 Uint8Array,可直接复用\n protected static async toUint8Array(input: ParserInput): Promise<Uint8Array> {\n const buffer = await DocumentParser.toArrayBuffer(input)\n return new Uint8Array(buffer)\n }\n}\n","import type { DocumentParser, ParserInput } from '../Parser/index'\nimport type { IntermediateDocument } from '@hamster-note/types'\n\nexport interface DocumentParserConstructor<\n T extends DocumentParser = DocumentParser\n> {\n new (): T\n readonly exts: readonly string[]\n}\n\nconst parserMap: Map<string, DocumentParserConstructor> = new Map()\n\nconst normalizeExt = (ext: string) => ext.replace(/^\\./, '').toLowerCase()\n\n// 注册解析器:防止重复注册同扩展名的不同类\nexport const registerParser = (Parser: DocumentParserConstructor) => {\n if (!Array.isArray(Parser.exts) || Parser.exts.length === 0) {\n throw new Error('Parser.exts 必须是非空数组')\n }\n Parser.exts.forEach((ext) => {\n const key = normalizeExt(ext)\n const exists = parserMap.get(key)\n if (exists && exists !== Parser) {\n throw new Error(`扩展名 ${key} 已被其他解析器占用`)\n }\n parserMap.set(key, Parser)\n })\n}\n\nexport function unregisterParser(Parser: DocumentParserConstructor) {\n Parser.exts.forEach((ext) => {\n const key = normalizeExt(ext)\n const exists = parserMap.get(key)\n if (exists === Parser) {\n parserMap.delete(key)\n }\n })\n}\n\nexport function getParserByExt(\n ext?: string\n): DocumentParserConstructor | undefined {\n if (!ext) return undefined\n return parserMap.get(normalizeExt(ext))\n}\n\nexport interface ParseOptions {\n filename?: string\n ext?: string\n parser?: DocumentParserConstructor\n}\n\nexport async function parse(\n input: ParserInput,\n options: ParseOptions = {}\n): Promise<IntermediateDocument> {\n const extFromName = options.filename?.split('.').pop()\n const ext = options.ext ?? extFromName\n const Parser = options.parser ?? getParserByExt(ext)\n\n if (!Parser) {\n throw new Error(\n `未找到匹配的解析器,扩展名: ${ext ?? '未知'},已注册: ${[\n ...parserMap.keys()\n ].join(', ')}`\n )\n }\n\n const parser = new Parser()\n return parser.encode(input)\n}\n\n// 便于测试或运行时可观测性\nexport function listRegisteredParsers() {\n return [...parserMap.entries()].map(([ext, ctor]) => ({ ext, parser: ctor }))\n}\n"],"mappings":";AAKA,IAAsB,iBAAtB,MAAsB,eAAe;CAEnC,OAAgB,OAA0B,EAAE;;;;;CAa5C,OAAO,uBAAmE;AACxE,SAAO,QAAQ,uBAAO,IAAI,MAAM,4BAA4B,CAAC;;CAI/D,aAAuB,cACrB,OACsB;AACtB,MAAI,iBAAiB,YACnB,QAAO;AAET,MAAI,YAAY,OAAO,MAAM,EAAE;GAE7B,MAAM,SAAS,IAAI,YAAY,MAAM,WAAW;AAChD,OAAI,WAAW,OAAO,CAAC,IACrB,IAAI,WAAW,MAAM,QAAQ,MAAM,YAAY,MAAM,WAAW,CACjE;AACD,UAAO;;AAET,MAAI,OAAO,SAAS,eAAe,iBAAiB,KAClD,QAAO,MAAM,aAAa;AAE5B,QAAM,IAAI,UAAU,2BAA2B;;CAIjD,aAAuB,aAAa,OAAyC;EAC3E,MAAM,SAAS,MAAM,eAAe,cAAc,MAAM;AACxD,SAAO,IAAI,WAAW,OAAO;;;;;;ACtCjC,MAAM,4BAAoD,IAAI,KAAK;AAEnE,MAAM,gBAAgB,QAAgB,IAAI,QAAQ,OAAO,GAAG,CAAC,aAAa;AAG1E,MAAa,kBAAkB,WAAsC;AACnE,KAAI,CAAC,MAAM,QAAQ,OAAO,KAAK,IAAI,OAAO,KAAK,WAAW,EACxD,OAAM,IAAI,MAAM,sBAAsB;AAExC,QAAO,KAAK,SAAS,QAAQ;EAC3B,MAAM,MAAM,aAAa,IAAI;EAC7B,MAAM,SAAS,UAAU,IAAI,IAAI;AACjC,MAAI,UAAU,WAAW,OACvB,OAAM,IAAI,MAAM,OAAO,IAAI,YAAY;AAEzC,YAAU,IAAI,KAAK,OAAO;GAC1B;;AAGJ,SAAgB,iBAAiB,QAAmC;AAClE,QAAO,KAAK,SAAS,QAAQ;EAC3B,MAAM,MAAM,aAAa,IAAI;AAE7B,MADe,UAAU,IAAI,IAAI,KAClB,OACb,WAAU,OAAO,IAAI;GAEvB;;AAGJ,SAAgB,eACd,KACuC;AACvC,KAAI,CAAC,IAAK,QAAO;AACjB,QAAO,UAAU,IAAI,aAAa,IAAI,CAAC;;AASzC,eAAsB,MACpB,OACA,UAAwB,EAAE,EACK;CAC/B,MAAM,cAAc,QAAQ,UAAU,MAAM,IAAI,CAAC,KAAK;CACtD,MAAM,MAAM,QAAQ,OAAO;CAC3B,MAAM,SAAS,QAAQ,UAAU,eAAe,IAAI;AAEpD,KAAI,CAAC,OACH,OAAM,IAAI,MACR,kBAAkB,OAAO,KAAK,QAAQ,CACpC,GAAG,UAAU,MAAM,CACpB,CAAC,KAAK,KAAK,GACb;AAIH,QADe,IAAI,QAAQ,CACb,OAAO,MAAM;;AAI7B,SAAgB,wBAAwB;AACtC,QAAO,CAAC,GAAG,UAAU,SAAS,CAAC,CAAC,KAAK,CAAC,KAAK,WAAW;EAAE;EAAK,QAAQ;EAAM,EAAE"}
|
|
1
|
+
{"version":3,"file":"index.js","names":[],"sources":["../src/Parser/index.ts","../src/register/index.ts","../src/Page/index.ts","../src/Document/index.ts"],"sourcesContent":["import type { IntermediateDocument } from '@hamster-note/types'\n\n// 解析器通用输入,兼容 Browser / Worker / Node(Buffer 属于 ArrayBufferView)\nexport type ParserInput = ArrayBuffer | ArrayBufferView | Blob\n\nexport abstract class DocumentParser {\n // 子类必须声明支持的扩展名列表(不带点),用于注册分发\n static readonly exts: readonly string[] = []\n\n /**\n * 将原始输入解析为中间文档结构。\n * - 输入必须是内存态数据(ArrayBuffer / ArrayBufferView / Blob)\n * - 失败时抛出异常;不要返回 undefined。\n */\n abstract encode(input: ParserInput): Promise<IntermediateDocument>\n\n /**\n * 可选:从中间文档逆序列化回原始文件数据。\n * 默认不支持,需要的子类自行实现。\n */\n decode(_intermediateDocument: IntermediateDocument): Promise<ParserInput> {\n return Promise.reject(new Error('decode is not implemented'))\n }\n\n // 将各种输入转换为 ArrayBuffer,方便子类直接消费二进制\n protected static async toArrayBuffer(\n input: ParserInput\n ): Promise<ArrayBuffer> {\n if (input instanceof ArrayBuffer) {\n return input\n }\n if (ArrayBuffer.isView(input)) {\n // 拷贝为独立的 ArrayBuffer,避免 SharedArrayBuffer 兼容性问题\n const buffer = new ArrayBuffer(input.byteLength)\n new Uint8Array(buffer).set(\n new Uint8Array(input.buffer, input.byteOffset, input.byteLength)\n )\n return buffer\n }\n if (typeof Blob !== 'undefined' && input instanceof Blob) {\n return input.arrayBuffer()\n }\n throw new TypeError('Unsupported parser input')\n }\n\n // 子类若需要 Uint8Array,可直接复用\n protected static async toUint8Array(input: ParserInput): Promise<Uint8Array> {\n const buffer = await DocumentParser.toArrayBuffer(input)\n return new Uint8Array(buffer)\n }\n}\n","import type { DocumentParser, ParserInput } from '../Parser/index'\nimport type { IntermediateDocument } from '@hamster-note/types'\n\nexport interface DocumentParserConstructor<\n T extends DocumentParser = DocumentParser\n> {\n new (): T\n readonly exts: readonly string[]\n}\n\nconst parserMap: Map<string, DocumentParserConstructor> = new Map()\n\nconst normalizeExt = (ext: string) => ext.replace(/^\\./, '').toLowerCase()\n\n// 注册解析器:防止重复注册同扩展名的不同类\nexport const registerParser = (Parser: DocumentParserConstructor) => {\n if (!Array.isArray(Parser.exts) || Parser.exts.length === 0) {\n throw new Error('Parser.exts 必须是非空数组')\n }\n Parser.exts.forEach((ext) => {\n const key = normalizeExt(ext)\n const exists = parserMap.get(key)\n if (exists && exists !== Parser) {\n throw new Error(`扩展名 ${key} 已被其他解析器占用`)\n }\n parserMap.set(key, Parser)\n })\n}\n\nexport function unregisterParser(Parser: DocumentParserConstructor) {\n Parser.exts.forEach((ext) => {\n const key = normalizeExt(ext)\n const exists = parserMap.get(key)\n if (exists === Parser) {\n parserMap.delete(key)\n }\n })\n}\n\nexport function getParserByExt(\n ext?: string\n): DocumentParserConstructor | undefined {\n if (!ext) return undefined\n return parserMap.get(normalizeExt(ext))\n}\n\nexport interface ParseOptions {\n filename?: string\n ext?: string\n parser?: DocumentParserConstructor\n}\n\nexport async function parse(\n input: ParserInput,\n options: ParseOptions = {}\n): Promise<IntermediateDocument> {\n const extFromName = options.filename?.split('.').pop()\n const ext = options.ext ?? extFromName\n const Parser = options.parser ?? getParserByExt(ext)\n\n if (!Parser) {\n throw new Error(\n `未找到匹配的解析器,扩展名: ${ext ?? '未知'},已注册: ${[\n ...parserMap.keys()\n ].join(', ')}`\n )\n }\n\n const parser = new Parser()\n return parser.encode(input)\n}\n\n// 便于测试或运行时可观测性\nexport function listRegisteredParsers() {\n return [...parserMap.entries()].map(([ext, ctor]) => ({ ext, parser: ctor }))\n}\n","import { Number2 } from '@hamster-note/types'\n\nexport enum RenderViews {\n THUMBNAIL = 'thumbnail',\n TEXT = 'text'\n}\n\nexport interface RenderOptions {\n views: RenderViews[]\n scale: number\n}\n\nexport abstract class HamsterPage {\n abstract render(\n container: HTMLDivElement,\n options?: RenderOptions\n ): Promise<void>\n abstract getNumber(): number\n abstract getSize(scale: number): Number2\n abstract getPureText(): string\n}\n","import { HamsterPage } from '../Page'\nimport { IntermediateOutline } from '@hamster-note/types'\n\nexport abstract class HamsterDocument {\n abstract getPages(): Promise<HamsterPage[]>\n abstract getPage(pageNumber: number): Promise<HamsterPage | undefined>\n abstract getOutline(): Promise<IntermediateOutline | undefined>\n abstract getCover(): Promise<HTMLCanvasElement | HTMLImageElement>\n}\n"],"mappings":";AAKA,IAAsB,iBAAtB,MAAsB,eAAe;CAEnC,OAAgB,OAA0B,EAAE;;;;;CAa5C,OAAO,uBAAmE;AACxE,SAAO,QAAQ,uBAAO,IAAI,MAAM,4BAA4B,CAAC;;CAI/D,aAAuB,cACrB,OACsB;AACtB,MAAI,iBAAiB,YACnB,QAAO;AAET,MAAI,YAAY,OAAO,MAAM,EAAE;GAE7B,MAAM,SAAS,IAAI,YAAY,MAAM,WAAW;AAChD,OAAI,WAAW,OAAO,CAAC,IACrB,IAAI,WAAW,MAAM,QAAQ,MAAM,YAAY,MAAM,WAAW,CACjE;AACD,UAAO;;AAET,MAAI,OAAO,SAAS,eAAe,iBAAiB,KAClD,QAAO,MAAM,aAAa;AAE5B,QAAM,IAAI,UAAU,2BAA2B;;CAIjD,aAAuB,aAAa,OAAyC;EAC3E,MAAM,SAAS,MAAM,eAAe,cAAc,MAAM;AACxD,SAAO,IAAI,WAAW,OAAO;;;;;;ACtCjC,MAAM,4BAAoD,IAAI,KAAK;AAEnE,MAAM,gBAAgB,QAAgB,IAAI,QAAQ,OAAO,GAAG,CAAC,aAAa;AAG1E,MAAa,kBAAkB,WAAsC;AACnE,KAAI,CAAC,MAAM,QAAQ,OAAO,KAAK,IAAI,OAAO,KAAK,WAAW,EACxD,OAAM,IAAI,MAAM,sBAAsB;AAExC,QAAO,KAAK,SAAS,QAAQ;EAC3B,MAAM,MAAM,aAAa,IAAI;EAC7B,MAAM,SAAS,UAAU,IAAI,IAAI;AACjC,MAAI,UAAU,WAAW,OACvB,OAAM,IAAI,MAAM,OAAO,IAAI,YAAY;AAEzC,YAAU,IAAI,KAAK,OAAO;GAC1B;;AAGJ,SAAgB,iBAAiB,QAAmC;AAClE,QAAO,KAAK,SAAS,QAAQ;EAC3B,MAAM,MAAM,aAAa,IAAI;AAE7B,MADe,UAAU,IAAI,IAAI,KAClB,OACb,WAAU,OAAO,IAAI;GAEvB;;AAGJ,SAAgB,eACd,KACuC;AACvC,KAAI,CAAC,IAAK,QAAO;AACjB,QAAO,UAAU,IAAI,aAAa,IAAI,CAAC;;AASzC,eAAsB,MACpB,OACA,UAAwB,EAAE,EACK;CAC/B,MAAM,cAAc,QAAQ,UAAU,MAAM,IAAI,CAAC,KAAK;CACtD,MAAM,MAAM,QAAQ,OAAO;CAC3B,MAAM,SAAS,QAAQ,UAAU,eAAe,IAAI;AAEpD,KAAI,CAAC,OACH,OAAM,IAAI,MACR,kBAAkB,OAAO,KAAK,QAAQ,CACpC,GAAG,UAAU,MAAM,CACpB,CAAC,KAAK,KAAK,GACb;AAIH,QADe,IAAI,QAAQ,CACb,OAAO,MAAM;;AAI7B,SAAgB,wBAAwB;AACtC,QAAO,CAAC,GAAG,UAAU,SAAS,CAAC,CAAC,KAAK,CAAC,KAAK,WAAW;EAAE;EAAK,QAAQ;EAAM,EAAE;;;;;ACxE/E,IAAY,sDAAL;AACL;AACA;;;AAQF,IAAsB,cAAtB,MAAkC;;;;ACTlC,IAAsB,kBAAtB,MAAsC"}
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@hamster-note/document-parser",
|
|
3
|
-
"version": "0.
|
|
3
|
+
"version": "0.3.1",
|
|
4
4
|
"description": "",
|
|
5
5
|
"scripts": {
|
|
6
6
|
"build:all": "rolldown --config rolldown.config.ts",
|
|
@@ -8,10 +8,12 @@
|
|
|
8
8
|
"test": "echo 'no-test'",
|
|
9
9
|
"lint": "echo 'no-lint'"
|
|
10
10
|
},
|
|
11
|
-
"dependencies": {
|
|
11
|
+
"dependencies": {},
|
|
12
|
+
"peerDependencies": {
|
|
12
13
|
"@hamster-note/types": "^0.5.1"
|
|
13
14
|
},
|
|
14
15
|
"devDependencies": {
|
|
16
|
+
"@hamster-note/types": "^0.5.1",
|
|
15
17
|
"@eslint/js": "^9.39.2",
|
|
16
18
|
"rolldown": "^1.0.0-beta.58",
|
|
17
19
|
"rolldown-plugin-dts": "^0.20.0",
|
|
@@ -38,6 +40,8 @@
|
|
|
38
40
|
"exports": {
|
|
39
41
|
".": {
|
|
40
42
|
"types": "./dist/index.d.ts",
|
|
43
|
+
"require": "./dist/index.js",
|
|
44
|
+
"default": "./dist/index.js",
|
|
41
45
|
"import": "./dist/index.js"
|
|
42
46
|
}
|
|
43
47
|
},
|