npm - @ontos-ai/knowhere-sdk - Versions diffs - 0.2.0 → 0.3.0 - Mend

@ontos-ai/knowhere-sdk 0.2.0 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (6)

package/README.md CHANGED

@@ -163,6 +163,83 @@ const jobResult = await client.jobs.wait(job.jobId, {
 const result = await client.jobs.load(jobResult);
 ```
+### Retrieval and Document Lifecycle
+Published documents are queryable through the retrieval API after a job
+finishes. `client.jobs.create(...)` does not return a usable `documentId`;
+persist `jobResult.documentId` after publication if you need to update or
+archive the same document later.
+```typescript
+const job = await client.jobs.create({
+  sourceType: 'url',
+  sourceUrl: 'https://example.com/manual.pdf',
+  namespace: 'support-center',
+});
+const jobResult = await client.jobs.wait(job.jobId);
+const documentId = jobResult.documentId;
+if (!documentId) {
+  throw new Error('Expected documentId after successful publication.');
+}
+console.log(documentId);
+const response = await client.retrieval.query({
+  namespace: 'support-center',
+  query: 'How do I reset Bluetooth pairing?',
+  topK: 5,
+});
+for (const result of response.results) {
+  console.log(result.content);
+  console.log(result.score);
+  console.log(result.source.sourceFileName, result.source.sectionPath);
+}
+```
+Retrieval results use one canonical source object:
+```typescript
+result.content;
+result.chunkType;
+result.score;
+result.assetUrl;
+result.source.documentId;
+result.source.sourceFileName;
+result.source.sectionPath;
+```
+Use `documentId` to update or archive a document:
+```typescript
+const updateJob = await client.jobs.create({
+  sourceType: 'url',
+  sourceUrl: 'https://example.com/manual-v2.pdf',
+  documentId,
+});
+const documents = await client.documents.list({ namespace: 'support-center' });
+const document = await client.documents.get(documentId);
+const archived = await client.documents.archive(documentId);
+console.log(documents.documents.length);
+console.log(document.status);
+console.log(archived.status);
+```
+Follow-up queries can exclude documents or sections for one request:
+```typescript
+const followUp = await client.retrieval.query({
+  namespace: 'support-center',
+  query: 'battery charging',
+  excludeDocumentIds: ['doc_old'],
+  excludeSections: [{ documentId: 'doc_123', sectionPath: 'Appendix / Legal' }],
+});
+```
 ### Error Handling
 ```typescript

package/dist/index.d.mts CHANGED

@@ -41,6 +41,8 @@ interface Job {
     sourceType: string;
     /** Optional custom data identifier */
     dataId?: string;
+    /** Retrieval namespace for the canonical document */
+    namespace?: string;
     /** Job creation timestamp */
     createdAt: Date;
     /** Presigned URL for file upload (if sourceType is 'file') */
@@ -75,6 +77,10 @@ interface JobResult {
     sourceType: string;
     /** Optional custom data identifier */
     dataId?: string;
+    /** Retrieval namespace for the canonical document */
+    namespace?: string;
+    /** Stable document identifier for retrieval/document lifecycle APIs */
+    documentId?: string;
     /** Job creation timestamp */
     createdAt: Date;
     /** Processing progress information */
@@ -157,6 +163,10 @@ interface CreateJobParams {
     fileName?: string;
     /** Optional custom data identifier */
     dataId?: string;
+    /** Retrieval namespace for the canonical document */
+    namespace?: string;
+    /** Existing document identifier when updating a published document */
+    documentId?: string;
     /** Parsing configuration */
     parsingParams?: ParsingParams;
     /** Webhook configuration */
@@ -216,9 +226,13 @@ interface ParseParams {
     /** Generate table summaries */
     summaryTable?: boolean;
     /** Generate text summaries */
-    summaryText?: boolean;
+    summaryTxt?: boolean;
     /** Custom data identifier */
     dataId?: string;
+    /** Retrieval namespace for the canonical document */
+    namespace?: string;
+    /** Existing document identifier when updating a published document */
+    documentId?: string;
     /** Additional fragment description */
     addFragDesc?: string;
     /** Knowledge base directory */
@@ -282,6 +296,30 @@ interface Statistics {
 interface FileIndex {
     [chunkId: string]: string;
 }
+/**
+ * Processing cost details emitted by manifest v2
+ */
+interface ProcessingCost {
+    microDollars?: number;
+    credits?: number;
+}
+/**
+ * Processing timing details emitted by manifest v2
+ */
+interface ProcessingTiming {
+    startedAt?: Date;
+    completedAt?: Date;
+    durationMs?: number;
+}
+/**
+ * Processing metadata emitted by manifest v2
+ */
+interface ProcessingMetadata {
+    pageCount?: number;
+    billingStatus?: string;
+    cost?: ProcessingCost;
+    timing?: ProcessingTiming;
+}
 /**
  * Manifest containing metadata about the parse result
  */
@@ -295,11 +333,29 @@ interface Manifest {
     /** Original source file name */
     sourceFileName: string;
     /** Processing completion date */
-    processingDate: Date;
+    /** Processing completion date (optional: only present if emitted by the worker) */
+    processingDate?: Date;
+    /** Worker-side processing metadata emitted by manifest v2 */
+    processing?: ProcessingMetadata;
     /** Statistics */
     statistics: Statistics;
-    /** File index */
-    files: FileIndex;
+    /** Legacy file index from earlier ZIP manifests */
+    files?: FileIndex;
+}
+/**
+ * Chunk relationship entry (metadata.connect_to per schema v2.1)
+ */
+interface ConnectTo {
+    /** Target chunk_id */
+    target: string;
+    /** Relationship type */
+    relation: 'embeds' | 'related';
+    /** Placeholder ref in content, e.g. '[images/a.png]' (embeds only) */
+    ref?: string;
+    /** Semantic similarity score (related only) */
+    score?: number;
+    /** Shared keywords (related only) */
+    keywords?: string[];
 }
 /**
  * Base chunk properties
@@ -313,6 +369,17 @@ interface BaseChunk {
     content: string;
     /** Relative path in ZIP */
     path: string;
+    /** Page numbers spanned by this chunk when provided by the backend */
+    pageNums?: number[];
+}
+/**
+ * Minimal chunk representation emitted in chunks_slim.json
+ */
+interface SlimChunk {
+    type: 'text' | 'image' | 'table';
+    path: string;
+    content: string;
+    summary?: string;
 }
 /**
  * Text chunk
@@ -321,13 +388,18 @@ interface TextChunk extends BaseChunk {
     type: 'text';
     /** Content length */
     length: number;
-    /** Tokens or token count, depending on backend payload */
-    tokens?: number | string[];
+    /** Extracted tokens from the current backend payload */
+    tokens?: string[];
     /** Extracted keywords */
     keywords?: string[];
     /** Generated summary */
     summary?: string;
-    /** Related chunk IDs */
+    /** Chunk relationships (schema v2.1: metadata.connect_to) */
+    connectTo?: ConnectTo[];
+    /**
+     * @deprecated Use connectTo instead. Retained for backward compatibility.
+     * Previously populated from metadata.relationships which is no longer emitted by the API.
+     */
     relationships?: string[];
 }
 /**
@@ -378,10 +450,18 @@ interface ParseResult {
     manifest: Manifest;
     /** All chunks */
     chunks: Chunk[];
+    /** Minimal chunk projection from chunks_slim.json (if available) */
+    chunksSlim?: SlimChunk[];
     /** Full document as Markdown (if available) */
     fullMarkdown?: string;
     /** Document hierarchy (if available) */
     hierarchy?: unknown;
+    /** Table-of-contents hierarchy hints (if available) */
+    tocHierarchies?: unknown;
+    /** Knowledge-base CSV export (if available) */
+    kbCsv?: string;
+    /** Pre-rendered hierarchy HTML view (if available) */
+    hierarchyViewHtml?: string;
     /** Raw ZIP buffer */
     rawZip: Buffer;
     /** Text chunks only */
@@ -392,6 +472,10 @@ interface ParseResult {
     readonly tableChunks: TableChunk[];
     /** Job ID */
     readonly jobId: string;
+    /** Effective retrieval namespace when loaded from a job result */
+    namespace?: string;
+    /** Canonical document identifier when loaded from a job result */
+    documentId?: string;
     /** Statistics */
     readonly statistics: Statistics;
     /** Find a specific chunk by ID */
@@ -500,12 +584,165 @@ declare class Jobs extends BaseResource {
     private resolveLoadJobResult;
 }
+/**
+ * Section exclusion for follow-up retrieval queries.
+ */
+interface RetrievalSectionExclusion {
+    /** Document containing the section to exclude */
+    documentId: string;
+    /** Human-readable section path to exclude */
+    sectionPath: string;
+}
+/**
+ * Supported retrieval channel names.
+ */
+type RetrievalChannel = 'path' | 'content' | 'term';
+/**
+ * Path filtering mode for retrieval queries.
+ */
+type RetrievalFilterMode = 'delete' | 'keep';
+/**
+ * Retrieval query parameters.
+ */
+interface RetrievalQueryParams {
+    /** Search query text */
+    query: string;
+    /** Retrieval namespace. Defaults to the server's default namespace when omitted. */
+    namespace?: string;
+    /** Maximum number of results to return */
+    topK?: number;
+    /** Chunk type filter: 1=all, 2=text, 3=image, 4=table, 5=text+image, 6=text+table */
+    dataType?: 1 | 2 | 3 | 4 | 5 | 6;
+    /** Path keywords for include/exclude filtering */
+    signalPaths?: string[];
+    /** Signal path filter mode */
+    filterMode?: RetrievalFilterMode;
+    /** Retrieval channels to run. Defaults to all channels when omitted. */
+    channels?: RetrievalChannel[];
+    /** Per-channel weight overrides for reciprocal-rank fusion */
+    channelWeights?: Partial<Record<RetrievalChannel, number>>;
+    /** Enable LLM reranking after channel fusion */
+    rerank?: boolean;
+    /** Minimum retrieval score threshold after fusion */
+    threshold?: number;
+    /** Override the internal per-channel recall count */
+    internalRecallK?: number;
+    /** Documents to exclude for this request only */
+    excludeDocumentIds?: string[];
+    /** Document sections to exclude for this request only */
+    excludeSections?: RetrievalSectionExclusion[];
+}
+/**
+ * Caller-facing source reference attached to a retrieval result.
+ */
+interface RetrievalSource {
+    /** Stable document identifier */
+    documentId?: string;
+    /** Original source file name */
+    sourceFileName?: string;
+    /** Human-readable section path */
+    sectionPath?: string;
+}
+/**
+ * Canonical chunk result returned by retrieval query.
+ */
+interface RetrievalResult {
+    /** Knowledge content to use directly in the caller's answer */
+    content: string;
+    /** Chunk type, for example text, image, or table */
+    chunkType: string;
+    /** Retrieval score returned by the API */
+    score: number;
+    /** Presigned asset URL for media chunks when available */
+    assetUrl?: string;
+    /** Source reference for this result */
+    source: RetrievalSource;
+}
+/**
+ * Response from POST /v1/retrieval/query.
+ */
+interface RetrievalQueryResponse {
+    /** Namespace searched by the API */
+    namespace: string;
+    /** Echoed query text */
+    query: string;
+    /** Retrieval router path used by the API for this query */
+    routerUsed?: string;
+    /** Ranked retrieval results */
+    results: RetrievalResult[];
+}
+/**
+ * Resource for querying published retrieval documents.
+ */
+declare class Retrieval extends BaseResource {
+    /**
+     * Query published documents.
+     */
+    query(params: RetrievalQueryParams): Promise<RetrievalQueryResponse>;
+}
+/**
+ * Canonical document state returned by document lifecycle endpoints.
+ */
+interface Document {
+    /** Stable document identifier */
+    documentId: string;
+    /** Retrieval namespace */
+    namespace: string;
+    /** Current lifecycle status */
+    status: string;
+    /** Current published job result identifier */
+    currentJobResultId?: string;
+    /** Original source file name */
+    sourceFileName?: string;
+    /** Document creation timestamp */
+    createdAt?: Date;
+    /** Last update timestamp */
+    updatedAt?: Date;
+    /** Archive timestamp, when archived */
+    archivedAt?: Date;
+}
+/**
+ * Response from GET /v1/documents.
+ */
+interface DocumentListResponse {
+    /** Namespace listed by the API */
+    namespace: string;
+    /** Documents visible in the namespace */
+    documents: Document[];
+}
+/**
+ * Resource for canonical document lifecycle operations.
+ */
+declare class Documents extends BaseResource {
+    /**
+     * List canonical documents in a namespace.
+     */
+    list(params?: {
+        namespace?: string;
+    }): Promise<DocumentListResponse>;
+    /**
+     * Get one canonical document by ID.
+     */
+    get(documentId: string): Promise<Document>;
+    /**
+     * Archive one canonical document by ID.
+     */
+    archive(documentId: string): Promise<Document>;
+}
 /**
  * Main Knowhere SDK client
  */
 declare class Knowhere {
     /** Jobs resource for low-level API */
     readonly jobs: Jobs;
+    /** Retrieval resource for querying published documents */
+    readonly retrieval: Retrieval;
+    /** Documents resource for canonical document lifecycle operations */
+    readonly documents: Documents;
     private httpClient;
     /**
      * Create a new Knowhere client
@@ -665,4 +902,4 @@ declare class JobFailedError extends KnowhereError {
     constructor(message: string, code: string, jobResult: JobResult);
 }
-export { APIError, AuthenticationError, BadRequestError, type BaseChunk, ChecksumError, type Chunk, ConflictError, type CreateJobParams, type DocType, type FileIndex, GatewayTimeoutError, type ImageChunk, InternalServerError, InvalidStateError, type Job, type JobError, JobFailedError, type JobResult, type JobStatus, Jobs, Knowhere, KnowhereError, type KnowhereOptions, type LoadOptions, type Manifest, NetworkError, NotFoundError, type ParseParams, type ParseResult, type ParsingModel, type ParsingParams, PaymentRequiredError, PermissionDeniedError, type PollProgress, PollingTimeoutError, RateLimitError, ServiceUnavailableError, type Statistics, type TableChunk, type TextChunk, TimeoutError, type UploadParams, type UploadProgress, VERSION, ValidationError, type WaitOptions, type WebhookConfig, Knowhere as default };
+export { APIError, AuthenticationError, BadRequestError, type BaseChunk, ChecksumError, type Chunk, ConflictError, type CreateJobParams, type DocType, type Document, type DocumentListResponse, Documents, type FileIndex, GatewayTimeoutError, type ImageChunk, InternalServerError, InvalidStateError, type Job, type JobError, JobFailedError, type JobResult, type JobStatus, Jobs, Knowhere, KnowhereError, type KnowhereOptions, type LoadOptions, type Manifest, NetworkError, NotFoundError, type ParseParams, type ParseResult, type ParsingModel, type ParsingParams, PaymentRequiredError, PermissionDeniedError, type PollProgress, PollingTimeoutError, RateLimitError, Retrieval, type RetrievalChannel, type RetrievalFilterMode, type RetrievalQueryParams, type RetrievalQueryResponse, type RetrievalResult, type RetrievalSectionExclusion, type RetrievalSource, ServiceUnavailableError, type Statistics, type TableChunk, type TextChunk, TimeoutError, type UploadParams, type UploadProgress, VERSION, ValidationError, type WaitOptions, type WebhookConfig, Knowhere as default };

package/dist/index.d.ts CHANGED

@@ -41,6 +41,8 @@ interface Job {
     sourceType: string;
     /** Optional custom data identifier */
     dataId?: string;
+    /** Retrieval namespace for the canonical document */
+    namespace?: string;
     /** Job creation timestamp */
     createdAt: Date;
     /** Presigned URL for file upload (if sourceType is 'file') */
@@ -75,6 +77,10 @@ interface JobResult {
     sourceType: string;
     /** Optional custom data identifier */
     dataId?: string;
+    /** Retrieval namespace for the canonical document */
+    namespace?: string;
+    /** Stable document identifier for retrieval/document lifecycle APIs */
+    documentId?: string;
     /** Job creation timestamp */
     createdAt: Date;
     /** Processing progress information */
@@ -157,6 +163,10 @@ interface CreateJobParams {
     fileName?: string;
     /** Optional custom data identifier */
     dataId?: string;
+    /** Retrieval namespace for the canonical document */
+    namespace?: string;
+    /** Existing document identifier when updating a published document */
+    documentId?: string;
     /** Parsing configuration */
     parsingParams?: ParsingParams;
     /** Webhook configuration */
@@ -216,9 +226,13 @@ interface ParseParams {
     /** Generate table summaries */
     summaryTable?: boolean;
     /** Generate text summaries */
-    summaryText?: boolean;
+    summaryTxt?: boolean;
     /** Custom data identifier */
     dataId?: string;
+    /** Retrieval namespace for the canonical document */
+    namespace?: string;
+    /** Existing document identifier when updating a published document */
+    documentId?: string;
     /** Additional fragment description */
     addFragDesc?: string;
     /** Knowledge base directory */
@@ -282,6 +296,30 @@ interface Statistics {
 interface FileIndex {
     [chunkId: string]: string;
 }
+/**
+ * Processing cost details emitted by manifest v2
+ */
+interface ProcessingCost {
+    microDollars?: number;
+    credits?: number;
+}
+/**
+ * Processing timing details emitted by manifest v2
+ */
+interface ProcessingTiming {
+    startedAt?: Date;
+    completedAt?: Date;
+    durationMs?: number;
+}
+/**
+ * Processing metadata emitted by manifest v2
+ */
+interface ProcessingMetadata {
+    pageCount?: number;
+    billingStatus?: string;
+    cost?: ProcessingCost;
+    timing?: ProcessingTiming;
+}
 /**
  * Manifest containing metadata about the parse result
  */
@@ -295,11 +333,29 @@ interface Manifest {
     /** Original source file name */
     sourceFileName: string;
     /** Processing completion date */
-    processingDate: Date;
+    /** Processing completion date (optional: only present if emitted by the worker) */
+    processingDate?: Date;
+    /** Worker-side processing metadata emitted by manifest v2 */
+    processing?: ProcessingMetadata;
     /** Statistics */
     statistics: Statistics;
-    /** File index */
-    files: FileIndex;
+    /** Legacy file index from earlier ZIP manifests */
+    files?: FileIndex;
+}
+/**
+ * Chunk relationship entry (metadata.connect_to per schema v2.1)
+ */
+interface ConnectTo {
+    /** Target chunk_id */
+    target: string;
+    /** Relationship type */
+    relation: 'embeds' | 'related';
+    /** Placeholder ref in content, e.g. '[images/a.png]' (embeds only) */
+    ref?: string;
+    /** Semantic similarity score (related only) */
+    score?: number;
+    /** Shared keywords (related only) */
+    keywords?: string[];
 }
 /**
  * Base chunk properties
@@ -313,6 +369,17 @@ interface BaseChunk {
     content: string;
     /** Relative path in ZIP */
     path: string;
+    /** Page numbers spanned by this chunk when provided by the backend */
+    pageNums?: number[];
+}
+/**
+ * Minimal chunk representation emitted in chunks_slim.json
+ */
+interface SlimChunk {
+    type: 'text' | 'image' | 'table';
+    path: string;
+    content: string;
+    summary?: string;
 }
 /**
  * Text chunk
@@ -321,13 +388,18 @@ interface TextChunk extends BaseChunk {
     type: 'text';
     /** Content length */
     length: number;
-    /** Tokens or token count, depending on backend payload */
-    tokens?: number | string[];
+    /** Extracted tokens from the current backend payload */
+    tokens?: string[];
     /** Extracted keywords */
     keywords?: string[];
     /** Generated summary */
     summary?: string;
-    /** Related chunk IDs */
+    /** Chunk relationships (schema v2.1: metadata.connect_to) */
+    connectTo?: ConnectTo[];
+    /**
+     * @deprecated Use connectTo instead. Retained for backward compatibility.
+     * Previously populated from metadata.relationships which is no longer emitted by the API.
+     */
     relationships?: string[];
 }
 /**
@@ -378,10 +450,18 @@ interface ParseResult {
     manifest: Manifest;
     /** All chunks */
     chunks: Chunk[];
+    /** Minimal chunk projection from chunks_slim.json (if available) */
+    chunksSlim?: SlimChunk[];
     /** Full document as Markdown (if available) */
     fullMarkdown?: string;
     /** Document hierarchy (if available) */
     hierarchy?: unknown;
+    /** Table-of-contents hierarchy hints (if available) */
+    tocHierarchies?: unknown;
+    /** Knowledge-base CSV export (if available) */
+    kbCsv?: string;
+    /** Pre-rendered hierarchy HTML view (if available) */
+    hierarchyViewHtml?: string;
     /** Raw ZIP buffer */
     rawZip: Buffer;
     /** Text chunks only */
@@ -392,6 +472,10 @@ interface ParseResult {
     readonly tableChunks: TableChunk[];
     /** Job ID */
     readonly jobId: string;
+    /** Effective retrieval namespace when loaded from a job result */
+    namespace?: string;
+    /** Canonical document identifier when loaded from a job result */
+    documentId?: string;
     /** Statistics */
     readonly statistics: Statistics;
     /** Find a specific chunk by ID */
@@ -500,12 +584,165 @@ declare class Jobs extends BaseResource {
     private resolveLoadJobResult;
 }
+/**
+ * Section exclusion for follow-up retrieval queries.
+ */
+interface RetrievalSectionExclusion {
+    /** Document containing the section to exclude */
+    documentId: string;
+    /** Human-readable section path to exclude */
+    sectionPath: string;
+}
+/**
+ * Supported retrieval channel names.
+ */
+type RetrievalChannel = 'path' | 'content' | 'term';
+/**
+ * Path filtering mode for retrieval queries.
+ */
+type RetrievalFilterMode = 'delete' | 'keep';
+/**
+ * Retrieval query parameters.
+ */
+interface RetrievalQueryParams {
+    /** Search query text */
+    query: string;
+    /** Retrieval namespace. Defaults to the server's default namespace when omitted. */
+    namespace?: string;
+    /** Maximum number of results to return */
+    topK?: number;
+    /** Chunk type filter: 1=all, 2=text, 3=image, 4=table, 5=text+image, 6=text+table */
+    dataType?: 1 | 2 | 3 | 4 | 5 | 6;
+    /** Path keywords for include/exclude filtering */
+    signalPaths?: string[];
+    /** Signal path filter mode */
+    filterMode?: RetrievalFilterMode;
+    /** Retrieval channels to run. Defaults to all channels when omitted. */
+    channels?: RetrievalChannel[];
+    /** Per-channel weight overrides for reciprocal-rank fusion */
+    channelWeights?: Partial<Record<RetrievalChannel, number>>;
+    /** Enable LLM reranking after channel fusion */
+    rerank?: boolean;
+    /** Minimum retrieval score threshold after fusion */
+    threshold?: number;
+    /** Override the internal per-channel recall count */
+    internalRecallK?: number;
+    /** Documents to exclude for this request only */
+    excludeDocumentIds?: string[];
+    /** Document sections to exclude for this request only */
+    excludeSections?: RetrievalSectionExclusion[];
+}
+/**
+ * Caller-facing source reference attached to a retrieval result.
+ */
+interface RetrievalSource {
+    /** Stable document identifier */
+    documentId?: string;
+    /** Original source file name */
+    sourceFileName?: string;
+    /** Human-readable section path */
+    sectionPath?: string;
+}
+/**
+ * Canonical chunk result returned by retrieval query.
+ */
+interface RetrievalResult {
+    /** Knowledge content to use directly in the caller's answer */
+    content: string;
+    /** Chunk type, for example text, image, or table */
+    chunkType: string;
+    /** Retrieval score returned by the API */
+    score: number;
+    /** Presigned asset URL for media chunks when available */
+    assetUrl?: string;
+    /** Source reference for this result */
+    source: RetrievalSource;
+}
+/**
+ * Response from POST /v1/retrieval/query.
+ */
+interface RetrievalQueryResponse {
+    /** Namespace searched by the API */
+    namespace: string;
+    /** Echoed query text */
+    query: string;
+    /** Retrieval router path used by the API for this query */
+    routerUsed?: string;
+    /** Ranked retrieval results */
+    results: RetrievalResult[];
+}
+/**
+ * Resource for querying published retrieval documents.
+ */
+declare class Retrieval extends BaseResource {
+    /**
+     * Query published documents.
+     */
+    query(params: RetrievalQueryParams): Promise<RetrievalQueryResponse>;
+}
+/**
+ * Canonical document state returned by document lifecycle endpoints.
+ */
+interface Document {
+    /** Stable document identifier */
+    documentId: string;
+    /** Retrieval namespace */
+    namespace: string;
+    /** Current lifecycle status */
+    status: string;
+    /** Current published job result identifier */
+    currentJobResultId?: string;
+    /** Original source file name */
+    sourceFileName?: string;
+    /** Document creation timestamp */
+    createdAt?: Date;
+    /** Last update timestamp */
+    updatedAt?: Date;
+    /** Archive timestamp, when archived */
+    archivedAt?: Date;
+}
+/**
+ * Response from GET /v1/documents.
+ */
+interface DocumentListResponse {
+    /** Namespace listed by the API */
+    namespace: string;
+    /** Documents visible in the namespace */
+    documents: Document[];
+}
+/**
+ * Resource for canonical document lifecycle operations.
+ */
+declare class Documents extends BaseResource {
+    /**
+     * List canonical documents in a namespace.
+     */
+    list(params?: {
+        namespace?: string;
+    }): Promise<DocumentListResponse>;
+    /**
+     * Get one canonical document by ID.
+     */
+    get(documentId: string): Promise<Document>;
+    /**
+     * Archive one canonical document by ID.
+     */
+    archive(documentId: string): Promise<Document>;
+}
 /**
  * Main Knowhere SDK client
  */
 declare class Knowhere {
     /** Jobs resource for low-level API */
     readonly jobs: Jobs;
+    /** Retrieval resource for querying published documents */
+    readonly retrieval: Retrieval;
+    /** Documents resource for canonical document lifecycle operations */
+    readonly documents: Documents;
     private httpClient;
     /**
      * Create a new Knowhere client
@@ -665,4 +902,4 @@ declare class JobFailedError extends KnowhereError {
     constructor(message: string, code: string, jobResult: JobResult);
 }
-export { APIError, AuthenticationError, BadRequestError, type BaseChunk, ChecksumError, type Chunk, ConflictError, type CreateJobParams, type DocType, type FileIndex, GatewayTimeoutError, type ImageChunk, InternalServerError, InvalidStateError, type Job, type JobError, JobFailedError, type JobResult, type JobStatus, Jobs, Knowhere, KnowhereError, type KnowhereOptions, type LoadOptions, type Manifest, NetworkError, NotFoundError, type ParseParams, type ParseResult, type ParsingModel, type ParsingParams, PaymentRequiredError, PermissionDeniedError, type PollProgress, PollingTimeoutError, RateLimitError, ServiceUnavailableError, type Statistics, type TableChunk, type TextChunk, TimeoutError, type UploadParams, type UploadProgress, VERSION, ValidationError, type WaitOptions, type WebhookConfig, Knowhere as default };
+export { APIError, AuthenticationError, BadRequestError, type BaseChunk, ChecksumError, type Chunk, ConflictError, type CreateJobParams, type DocType, type Document, type DocumentListResponse, Documents, type FileIndex, GatewayTimeoutError, type ImageChunk, InternalServerError, InvalidStateError, type Job, type JobError, JobFailedError, type JobResult, type JobStatus, Jobs, Knowhere, KnowhereError, type KnowhereOptions, type LoadOptions, type Manifest, NetworkError, NotFoundError, type ParseParams, type ParseResult, type ParsingModel, type ParsingParams, PaymentRequiredError, PermissionDeniedError, type PollProgress, PollingTimeoutError, RateLimitError, Retrieval, type RetrievalChannel, type RetrievalFilterMode, type RetrievalQueryParams, type RetrievalQueryResponse, type RetrievalResult, type RetrievalSectionExclusion, type RetrievalSource, ServiceUnavailableError, type Statistics, type TableChunk, type TextChunk, TimeoutError, type UploadParams, type UploadProgress, VERSION, ValidationError, type WaitOptions, type WebhookConfig, Knowhere as default };

package/dist/index.js CHANGED

@@ -35,6 +35,7 @@ __export(index_exports, {
   BadRequestError: () => BadRequestError,
   ChecksumError: () => ChecksumError,
   ConflictError: () => ConflictError,
+  Documents: () => Documents,
   GatewayTimeoutError: () => GatewayTimeoutError,
   InternalServerError: () => InternalServerError,
   InvalidStateError: () => InvalidStateError,
@@ -48,6 +49,7 @@ __export(index_exports, {
   PermissionDeniedError: () => PermissionDeniedError,
   PollingTimeoutError: () => PollingTimeoutError,
   RateLimitError: () => RateLimitError,
+  Retrieval: () => Retrieval,
   ServiceUnavailableError: () => ServiceUnavailableError,
   TimeoutError: () => TimeoutError,
   VERSION: () => VERSION,
@@ -344,6 +346,15 @@ function enrichJobResult(jobResult) {
   }
   return jobResult;
 }
+function enrichParseResult(parseResult2, scope) {
+  if (scope.namespace !== void 0) {
+    parseResult2.namespace = scope.namespace;
+  }
+  if (scope.documentId !== void 0) {
+    parseResult2.documentId = scope.documentId;
+  }
+  return parseResult2;
+}
 function sanitizePath(path2) {
   let sanitized = path2.replace(/^\/+/, "");
   sanitized = sanitized.replace(/\.\.(\/|\\)/g, "");
@@ -839,11 +850,39 @@ async function parseResult(httpClient, resultUrl, options) {
     const hierarchyContent = await hierarchyFile.async("string");
     hierarchy = JSON.parse(hierarchyContent);
   }
+  let chunksSlim;
+  const chunksSlimFile = zip.file("chunks_slim.json");
+  if (chunksSlimFile) {
+    const chunksSlimContent = await chunksSlimFile.async("string");
+    let chunksSlimData = JSON.parse(chunksSlimContent);
+    chunksSlimData = keysToCamel(chunksSlimData);
+    chunksSlim = extractSlimChunks(chunksSlimData);
+  }
+  let tocHierarchies;
+  const tocHierarchiesFile = zip.file("toc_hierarchies.json");
+  if (tocHierarchiesFile) {
+    const tocHierarchiesContent = await tocHierarchiesFile.async("string");
+    tocHierarchies = keysToCamel(JSON.parse(tocHierarchiesContent));
+  }
+  let kbCsv;
+  const kbCsvFile = zip.file("kb.csv");
+  if (kbCsvFile) {
+    kbCsv = await kbCsvFile.async("string");
+  }
+  let hierarchyViewHtml;
+  const hierarchyViewFile = zip.file("hierarchy_view.html");
+  if (hierarchyViewFile) {
+    hierarchyViewHtml = await hierarchyViewFile.async("string");
+  }
   const result = {
     manifest,
     chunks,
+    chunksSlim,
     fullMarkdown,
     hierarchy,
+    tocHierarchies,
+    kbCsv,
+    hierarchyViewHtml,
     rawZip: zipBuffer,
     get textChunks() {
       return chunks.filter((c) => c.type === "text");
@@ -867,12 +906,30 @@ async function parseResult(httpClient, resultUrl, options) {
       await import_fs2.promises.mkdir(directory, { recursive: true });
       await import_fs2.promises.writeFile((0, import_path.join)(directory, "manifest.json"), JSON.stringify(manifest, null, 2));
       await import_fs2.promises.writeFile((0, import_path.join)(directory, "chunks.json"), JSON.stringify(chunks, null, 2));
+      if (chunksSlim) {
+        await import_fs2.promises.writeFile(
+          (0, import_path.join)(directory, "chunks_slim.json"),
+          JSON.stringify({ chunks: chunksSlim }, null, 2)
+        );
+      }
       if (fullMarkdown) {
         await import_fs2.promises.writeFile((0, import_path.join)(directory, "full.md"), fullMarkdown);
       }
       if (hierarchy) {
         await import_fs2.promises.writeFile((0, import_path.join)(directory, "hierarchy.json"), JSON.stringify(hierarchy, null, 2));
       }
+      if (tocHierarchies) {
+        await import_fs2.promises.writeFile(
+          (0, import_path.join)(directory, "toc_hierarchies.json"),
+          JSON.stringify(tocHierarchies, null, 2)
+        );
+      }
+      if (kbCsv) {
+        await import_fs2.promises.writeFile((0, import_path.join)(directory, "kb.csv"), kbCsv);
+      }
+      if (hierarchyViewHtml) {
+        await import_fs2.promises.writeFile((0, import_path.join)(directory, "hierarchy_view.html"), hierarchyViewHtml);
+      }
       for (const imageChunk of this.imageChunks) {
         await imageChunk.save(directory);
       }
@@ -894,6 +951,15 @@ function extractChunks(payload) {
   }
   return [];
 }
+function extractSlimChunks(payload) {
+  if (Array.isArray(payload)) {
+    return payload;
+  }
+  if (Array.isArray(payload.chunks)) {
+    return payload.chunks;
+  }
+  return [];
+}
 function getChunkMetadata(chunkData) {
   if (!chunkData.metadata) {
     return {};
@@ -904,18 +970,38 @@ function getChunkFilePath(chunkData) {
   const metadata = getChunkMetadata(chunkData);
   return chunkData.filePath ?? metadata.filePath ?? chunkData.path;
 }
+function normalizePageNums(pageNums) {
+  if (!Array.isArray(pageNums)) {
+    return void 0;
+  }
+  const normalized = pageNums.filter((pageNum) => typeof pageNum === "number");
+  return normalized.length > 0 ? normalized : void 0;
+}
+function normalizeTokens(tokens) {
+  if (!Array.isArray(tokens)) {
+    return void 0;
+  }
+  if (!tokens.every((token) => typeof token === "string")) {
+    return void 0;
+  }
+  return tokens;
+}
 function normalizeTextChunk(chunkData) {
   const metadata = getChunkMetadata(chunkData);
+  const connectTo = metadata.connectTo ?? chunkData.connectTo;
+  const relationships = metadata.relationships ?? chunkData.relationships;
   return {
     chunkId: chunkData.chunkId ?? "",
     type: "text",
     content: chunkData.content ?? "",
     path: chunkData.path ?? "",
+    pageNums: normalizePageNums(metadata.pageNums ?? chunkData.pageNums),
     length: metadata.length ?? chunkData.length ?? 0,
-    tokens: metadata.tokens ?? chunkData.tokens,
+    tokens: normalizeTokens(metadata.tokens ?? chunkData.tokens),
     keywords: metadata.keywords ?? chunkData.keywords,
     summary: metadata.summary ?? chunkData.summary,
-    relationships: metadata.relationships ?? chunkData.relationships
+    ...connectTo !== void 0 && { connectTo },
+    ...relationships !== void 0 && { relationships }
   };
 }
 async function processChunk(zip, chunkData) {
@@ -939,6 +1025,7 @@ async function processChunk(zip, chunkData) {
       type: "image",
       content: chunkData.content ?? "",
       path: chunkData.path ?? "",
+      pageNums: normalizePageNums(metadata.pageNums ?? chunkData.pageNums),
       length: metadata.length ?? chunkData.length ?? 0,
       filePath,
       summary: metadata.summary ?? chunkData.summary,
@@ -973,6 +1060,7 @@ async function processChunk(zip, chunkData) {
       type: "table",
       content: chunkData.content ?? "",
       path: chunkData.path ?? "",
+      pageNums: normalizePageNums(metadata.pageNums ?? chunkData.pageNums),
       length: metadata.length ?? chunkData.length ?? 0,
       filePath,
       tableType: metadata.tableType ?? chunkData.tableType,
@@ -998,7 +1086,11 @@ var Jobs = class extends BaseResource {
    * Create a new parsing job
    */
   async create(params) {
-    const job = await this.httpClient.post("/v1/jobs", params);
+    const job = await this.httpClient.post(
+      "/v1/jobs",
+      params
+    );
+    delete job.documentId;
     if (job.uploadUrl) {
       this.pendingUploadJobs.set(job.jobId, job);
     }
@@ -1046,7 +1138,8 @@ var Jobs = class extends BaseResource {
     if (!jobResult.resultUrl) {
       throw new NotFoundError("Result URL not available");
     }
-    return parseResult(this.httpClient, jobResult.resultUrl, options);
+    const result = await parseResult(this.httpClient, jobResult.resultUrl, options);
+    return enrichParseResult(result, jobResult);
   }
   isHttpUrl(value) {
     return /^https?:\/\//i.test(value);
@@ -1097,6 +1190,43 @@ var Jobs = class extends BaseResource {
   }
 };
+// src/resources/retrieval.ts
+var Retrieval = class extends BaseResource {
+  /**
+   * Query published documents.
+   */
+  async query(params) {
+    return this.httpClient.post("/v1/retrieval/query", params);
+  }
+};
+// src/resources/documents.ts
+var Documents = class extends BaseResource {
+  /**
+   * List canonical documents in a namespace.
+   */
+  async list(params) {
+    const requestConfig = params?.namespace ? {
+      params: {
+        namespace: params.namespace
+      }
+    } : void 0;
+    return this.httpClient.get("/v1/documents", requestConfig);
+  }
+  /**
+   * Get one canonical document by ID.
+   */
+  async get(documentId) {
+    return this.httpClient.get(`/v1/documents/${documentId}`);
+  }
+  /**
+   * Archive one canonical document by ID.
+   */
+  async archive(documentId) {
+    return this.httpClient.post(`/v1/documents/${documentId}/archive`);
+  }
+};
 // src/client.ts
 function inferFileName(file, explicitFileName) {
   if (explicitFileName) {
@@ -1116,6 +1246,10 @@ function isReadStream2(file) {
 var Knowhere = class {
   /** Jobs resource for low-level API */
   jobs;
+  /** Retrieval resource for querying published documents */
+  retrieval;
+  /** Documents resource for canonical document lifecycle operations */
+  documents;
   httpClient;
   /**
    * Create a new Knowhere client
@@ -1139,6 +1273,8 @@ var Knowhere = class {
       httpsAgent: options.httpsAgent
     });
     this.jobs = new Jobs(this.httpClient);
+    this.retrieval = new Retrieval(this.httpClient);
+    this.documents = new Documents(this.httpClient);
   }
   /**
    * High-level API: Parse a document and return structured results
@@ -1181,7 +1317,7 @@ var Knowhere = class {
       smartTitleParse: params.smartTitleParse,
       summaryImage: params.summaryImage,
       summaryTable: params.summaryTable,
-      summaryTxt: params.summaryText,
+      summaryTxt: params.summaryTxt,
       addFragDesc: params.addFragDesc,
       kbDir: params.kbDir
     };
@@ -1196,6 +1332,8 @@ var Knowhere = class {
       sourceUrl: params.url,
       fileName: resolvedFileName,
       dataId: params.dataId,
+      namespace: params.namespace,
+      documentId: params.documentId,
       parsingParams: Object.keys(parsingParams).length > 0 ? parsingParams : void 0,
       webhook
     });
@@ -1215,7 +1353,7 @@ var Knowhere = class {
     const result = await this.jobs.load(jobResult, {
       verifyChecksum: params.verifyChecksum
     });
-    return result;
+    return enrichParseResult(result, jobResult);
   }
 };
 // Annotate the CommonJS export names for ESM import in node:
@@ -1225,6 +1363,7 @@ var Knowhere = class {
   BadRequestError,
   ChecksumError,
   ConflictError,
+  Documents,
   GatewayTimeoutError,
   InternalServerError,
   InvalidStateError,
@@ -1238,6 +1377,7 @@ var Knowhere = class {
   PermissionDeniedError,
   PollingTimeoutError,
   RateLimitError,
+  Retrieval,
   ServiceUnavailableError,
   TimeoutError,
   VERSION,

package/dist/index.mjs CHANGED Viewed

@@ -286,6 +286,15 @@ function enrichJobResult(jobResult) {
   }
   return jobResult;
 }
+function enrichParseResult(parseResult2, scope) {
+  if (scope.namespace !== void 0) {
+    parseResult2.namespace = scope.namespace;
+  }
+  if (scope.documentId !== void 0) {
+    parseResult2.documentId = scope.documentId;
+  }
+  return parseResult2;
+}
 function sanitizePath(path2) {
   let sanitized = path2.replace(/^\/+/, "");
   sanitized = sanitized.replace(/\.\.(\/|\\)/g, "");
@@ -781,11 +790,39 @@ async function parseResult(httpClient, resultUrl, options) {
     const hierarchyContent = await hierarchyFile.async("string");
     hierarchy = JSON.parse(hierarchyContent);
   }
+  let chunksSlim;
+  const chunksSlimFile = zip.file("chunks_slim.json");
+  if (chunksSlimFile) {
+    const chunksSlimContent = await chunksSlimFile.async("string");
+    let chunksSlimData = JSON.parse(chunksSlimContent);
+    chunksSlimData = keysToCamel(chunksSlimData);
+    chunksSlim = extractSlimChunks(chunksSlimData);
+  }
+  let tocHierarchies;
+  const tocHierarchiesFile = zip.file("toc_hierarchies.json");
+  if (tocHierarchiesFile) {
+    const tocHierarchiesContent = await tocHierarchiesFile.async("string");
+    tocHierarchies = keysToCamel(JSON.parse(tocHierarchiesContent));
+  }
+  let kbCsv;
+  const kbCsvFile = zip.file("kb.csv");
+  if (kbCsvFile) {
+    kbCsv = await kbCsvFile.async("string");
+  }
+  let hierarchyViewHtml;
+  const hierarchyViewFile = zip.file("hierarchy_view.html");
+  if (hierarchyViewFile) {
+    hierarchyViewHtml = await hierarchyViewFile.async("string");
+  }
   const result = {
     manifest,
     chunks,
+    chunksSlim,
     fullMarkdown,
     hierarchy,
+    tocHierarchies,
+    kbCsv,
+    hierarchyViewHtml,
     rawZip: zipBuffer,
     get textChunks() {
       return chunks.filter((c) => c.type === "text");
@@ -809,12 +846,30 @@ async function parseResult(httpClient, resultUrl, options) {
       await fs2.mkdir(directory, { recursive: true });
       await fs2.writeFile(join(directory, "manifest.json"), JSON.stringify(manifest, null, 2));
       await fs2.writeFile(join(directory, "chunks.json"), JSON.stringify(chunks, null, 2));
+      if (chunksSlim) {
+        await fs2.writeFile(
+          join(directory, "chunks_slim.json"),
+          JSON.stringify({ chunks: chunksSlim }, null, 2)
+        );
+      }
       if (fullMarkdown) {
         await fs2.writeFile(join(directory, "full.md"), fullMarkdown);
       }
       if (hierarchy) {
         await fs2.writeFile(join(directory, "hierarchy.json"), JSON.stringify(hierarchy, null, 2));
       }
+      if (tocHierarchies) {
+        await fs2.writeFile(
+          join(directory, "toc_hierarchies.json"),
+          JSON.stringify(tocHierarchies, null, 2)
+        );
+      }
+      if (kbCsv) {
+        await fs2.writeFile(join(directory, "kb.csv"), kbCsv);
+      }
+      if (hierarchyViewHtml) {
+        await fs2.writeFile(join(directory, "hierarchy_view.html"), hierarchyViewHtml);
+      }
       for (const imageChunk of this.imageChunks) {
         await imageChunk.save(directory);
       }
@@ -836,6 +891,15 @@ function extractChunks(payload) {
   }
   return [];
 }
+function extractSlimChunks(payload) {
+  if (Array.isArray(payload)) {
+    return payload;
+  }
+  if (Array.isArray(payload.chunks)) {
+    return payload.chunks;
+  }
+  return [];
+}
 function getChunkMetadata(chunkData) {
   if (!chunkData.metadata) {
     return {};
@@ -846,18 +910,38 @@ function getChunkFilePath(chunkData) {
   const metadata = getChunkMetadata(chunkData);
   return chunkData.filePath ?? metadata.filePath ?? chunkData.path;
 }
+function normalizePageNums(pageNums) {
+  if (!Array.isArray(pageNums)) {
+    return void 0;
+  }
+  const normalized = pageNums.filter((pageNum) => typeof pageNum === "number");
+  return normalized.length > 0 ? normalized : void 0;
+}
+function normalizeTokens(tokens) {
+  if (!Array.isArray(tokens)) {
+    return void 0;
+  }
+  if (!tokens.every((token) => typeof token === "string")) {
+    return void 0;
+  }
+  return tokens;
+}
 function normalizeTextChunk(chunkData) {
   const metadata = getChunkMetadata(chunkData);
+  const connectTo = metadata.connectTo ?? chunkData.connectTo;
+  const relationships = metadata.relationships ?? chunkData.relationships;
   return {
     chunkId: chunkData.chunkId ?? "",
     type: "text",
     content: chunkData.content ?? "",
     path: chunkData.path ?? "",
+    pageNums: normalizePageNums(metadata.pageNums ?? chunkData.pageNums),
     length: metadata.length ?? chunkData.length ?? 0,
-    tokens: metadata.tokens ?? chunkData.tokens,
+    tokens: normalizeTokens(metadata.tokens ?? chunkData.tokens),
     keywords: metadata.keywords ?? chunkData.keywords,
     summary: metadata.summary ?? chunkData.summary,
-    relationships: metadata.relationships ?? chunkData.relationships
+    ...connectTo !== void 0 && { connectTo },
+    ...relationships !== void 0 && { relationships }
   };
 }
 async function processChunk(zip, chunkData) {
@@ -881,6 +965,7 @@ async function processChunk(zip, chunkData) {
       type: "image",
       content: chunkData.content ?? "",
       path: chunkData.path ?? "",
+      pageNums: normalizePageNums(metadata.pageNums ?? chunkData.pageNums),
       length: metadata.length ?? chunkData.length ?? 0,
       filePath,
       summary: metadata.summary ?? chunkData.summary,
@@ -915,6 +1000,7 @@ async function processChunk(zip, chunkData) {
       type: "table",
       content: chunkData.content ?? "",
       path: chunkData.path ?? "",
+      pageNums: normalizePageNums(metadata.pageNums ?? chunkData.pageNums),
       length: metadata.length ?? chunkData.length ?? 0,
       filePath,
       tableType: metadata.tableType ?? chunkData.tableType,
@@ -940,7 +1026,11 @@ var Jobs = class extends BaseResource {
    * Create a new parsing job
    */
   async create(params) {
-    const job = await this.httpClient.post("/v1/jobs", params);
+    const job = await this.httpClient.post(
+      "/v1/jobs",
+      params
+    );
+    delete job.documentId;
     if (job.uploadUrl) {
       this.pendingUploadJobs.set(job.jobId, job);
     }
@@ -988,7 +1078,8 @@ var Jobs = class extends BaseResource {
     if (!jobResult.resultUrl) {
       throw new NotFoundError("Result URL not available");
     }
-    return parseResult(this.httpClient, jobResult.resultUrl, options);
+    const result = await parseResult(this.httpClient, jobResult.resultUrl, options);
+    return enrichParseResult(result, jobResult);
   }
   isHttpUrl(value) {
     return /^https?:\/\//i.test(value);
@@ -1039,6 +1130,43 @@ var Jobs = class extends BaseResource {
   }
 };
+// src/resources/retrieval.ts
+var Retrieval = class extends BaseResource {
+  /**
+   * Query published documents.
+   */
+  async query(params) {
+    return this.httpClient.post("/v1/retrieval/query", params);
+  }
+};
+// src/resources/documents.ts
+var Documents = class extends BaseResource {
+  /**
+   * List canonical documents in a namespace.
+   */
+  async list(params) {
+    const requestConfig = params?.namespace ? {
+      params: {
+        namespace: params.namespace
+      }
+    } : void 0;
+    return this.httpClient.get("/v1/documents", requestConfig);
+  }
+  /**
+   * Get one canonical document by ID.
+   */
+  async get(documentId) {
+    return this.httpClient.get(`/v1/documents/${documentId}`);
+  }
+  /**
+   * Archive one canonical document by ID.
+   */
+  async archive(documentId) {
+    return this.httpClient.post(`/v1/documents/${documentId}/archive`);
+  }
+};
 // src/client.ts
 function inferFileName(file, explicitFileName) {
   if (explicitFileName) {
@@ -1058,6 +1186,10 @@ function isReadStream2(file) {
 var Knowhere = class {
   /** Jobs resource for low-level API */
   jobs;
+  /** Retrieval resource for querying published documents */
+  retrieval;
+  /** Documents resource for canonical document lifecycle operations */
+  documents;
   httpClient;
   /**
    * Create a new Knowhere client
@@ -1081,6 +1213,8 @@ var Knowhere = class {
       httpsAgent: options.httpsAgent
     });
     this.jobs = new Jobs(this.httpClient);
+    this.retrieval = new Retrieval(this.httpClient);
+    this.documents = new Documents(this.httpClient);
   }
   /**
    * High-level API: Parse a document and return structured results
@@ -1123,7 +1257,7 @@ var Knowhere = class {
       smartTitleParse: params.smartTitleParse,
       summaryImage: params.summaryImage,
       summaryTable: params.summaryTable,
-      summaryTxt: params.summaryText,
+      summaryTxt: params.summaryTxt,
       addFragDesc: params.addFragDesc,
       kbDir: params.kbDir
     };
@@ -1138,6 +1272,8 @@ var Knowhere = class {
       sourceUrl: params.url,
       fileName: resolvedFileName,
       dataId: params.dataId,
+      namespace: params.namespace,
+      documentId: params.documentId,
       parsingParams: Object.keys(parsingParams).length > 0 ? parsingParams : void 0,
       webhook
     });
@@ -1157,7 +1293,7 @@ var Knowhere = class {
     const result = await this.jobs.load(jobResult, {
       verifyChecksum: params.verifyChecksum
     });
-    return result;
+    return enrichParseResult(result, jobResult);
   }
 };
 export {
@@ -1166,6 +1302,7 @@ export {
   BadRequestError,
   ChecksumError,
   ConflictError,
+  Documents,
   GatewayTimeoutError,
   InternalServerError,
   InvalidStateError,
@@ -1179,6 +1316,7 @@ export {
   PermissionDeniedError,
   PollingTimeoutError,
   RateLimitError,
+  Retrieval,
   ServiceUnavailableError,
   TimeoutError,
   VERSION,

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@ontos-ai/knowhere-sdk",
-  "version": "0.2.0",
+  "version": "0.3.0",
   "description": "Official Node.js SDK for Knowhere document parsing API",
   "keywords": [
     "knowhere",