npm - @pdfvector/instance-contract - Versions diffs - 0.0.27 → 0.0.29 - Mend

@pdfvector/instance-contract 0.0.27 → 0.0.29

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (23)

package/.tsc/lib/router/academic/index.d.ts +2 -0
package/.tsc/lib/router/academic/index.js +2 -0
package/.tsc/lib/router/academic/paper-graph.d.ts +85 -0
package/.tsc/lib/router/academic/paper-graph.js +140 -0
package/.tsc/lib/router/academic/similar-papers.d.ts +70 -0
package/.tsc/lib/router/academic/similar-papers.js +139 -0
package/.tsc/lib/router/bankStatement/ask.js +6 -22
package/.tsc/lib/router/bankStatement/extract.js +6 -22
package/.tsc/lib/router/bankStatement/parse.js +5 -15
package/.tsc/lib/router/document/ask.js +6 -22
package/.tsc/lib/router/document/extract.js +6 -22
package/.tsc/lib/router/document/parse.js +6 -22
package/.tsc/lib/router/free/bank-statement-parse.js +4 -11
package/.tsc/lib/router/identity/ask.js +6 -22
package/.tsc/lib/router/identity/extract.js +6 -22
package/.tsc/lib/router/identity/parse.js +5 -15
package/.tsc/lib/router/invoice/ask.js +6 -22
package/.tsc/lib/router/invoice/extract.js +6 -22
package/.tsc/lib/router/invoice/parse.js +5 -15
package/.tsc/lib/supported-mimes.d.ts +29 -0
package/.tsc/lib/supported-mimes.js +122 -0
package/CHANGELOG.md +14 -0
package/package.json +1 -1

package/.tsc/lib/router/document/ask.js CHANGED Viewed

@@ -1,6 +1,7 @@
 import { oc } from "@orpc/contract";
 import { z } from "zod";
 import { pdfvectorModelSchema } from "../../pdfvector-model-schema";
+import { documentAskModelDescription, outputAskModelDescription, supportedFileFormatsDescription, supportedFileMimes, supportedFileTypesLong, } from "../../supported-mimes";
 import { getDefaultSpec } from "./get-default-spec";
 const askInputSchema = z.object({
     url: z
@@ -9,17 +10,9 @@ const askInputSchema = z.object({
         .describe("URL of the document file to fetch and parse"),
     file: z
         .file()
-        .mime([
-        "application/pdf",
-        "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
-        "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet",
-        "text/csv",
-        "application/csv",
-        "image/png",
-        "image/jpeg",
-    ])
+        .mime([...supportedFileMimes])
         .optional()
-        .describe("Document file upload via multipart form-data (PDF, DOCX, XLSX, CSV, PNG, JPG)"),
+        .describe(`Document file upload via multipart form-data (${supportedFileFormatsDescription})`),
     base64: z
         .string()
         .optional()
@@ -32,12 +25,7 @@ const askInputSchema = z.object({
         .enum(["auto", ...pdfvectorModelSchema.options])
         .optional()
         .default("auto")
-        .describe("Model tier for answering the question. " +
-        "'auto' (default): Automatically selects the best tier based on document complexity. " +
-        "'nano': 2 credits/page. Fastest and cheapest. Best for simple questions about straightforward documents. Supports PDF, Word, Excel, CSV. " +
-        "'mini': 4 credits/page. Balanced speed and accuracy. Handles moderately complex questions. Supports PDF, Word, Excel, CSV. " +
-        "'pro': 8 credits/page. High accuracy for nuanced questions about complex documents. Supports PDF, Word, Excel, CSV, Image. " +
-        "'max': 16 credits/page. Maximum accuracy with the most capable models. Best for difficult questions requiring deep reasoning. Supports PDF, Word, Excel, CSV, Image."),
+        .describe(documentAskModelDescription),
     callback: z
         .object({
         url: z
@@ -61,11 +49,7 @@ const askOutputSchema = z
         .number()
         .int()
         .describe("Total number of pages in the document"),
-    model: pdfvectorModelSchema.describe("Model tier used to answer the question. " +
-        "'nano': Fastest, best for simple questions. Supports PDF, Word, Excel, CSV. " +
-        "'mini': Balanced speed and accuracy. Supports PDF, Word, Excel, CSV. " +
-        "'pro': High accuracy for complex questions. Supports PDF, Word, Excel, CSV, Image. " +
-        "'max': Maximum accuracy with deep reasoning. Supports PDF, Word, Excel, CSV, Image."),
+    model: pdfvectorModelSchema.describe(outputAskModelDescription),
     credits: z
         .number()
         .int()
@@ -132,7 +116,7 @@ const requestExamples = {
 export const ask = oc
     .route({
     summary: "Ask a question about a document",
-    description: "Parse a document and answer a question about its content using AI. Supports PDF, Word (.docx), Excel (.xlsx), CSV, and Image (.png, .jpg) files. Files up to 1000 pages and up to 500MB in size. Provide the document via file upload, a public URL, or a base64-encoded string.",
+    description: `Parse a document and answer a question about its content using AI. Supports ${supportedFileTypesLong}. Files up to 1000 pages and up to 500MB in size. Provide the document via file upload, a public URL, or a base64-encoded string.`,
     tags: ["Document"],
     spec: (op) => getDefaultSpec(op, requestExamples),
 })

package/.tsc/lib/router/document/extract.js CHANGED Viewed

@@ -1,6 +1,7 @@
 import { oc } from "@orpc/contract";
 import { z } from "zod";
 import { pdfvectorModelSchema } from "../../pdfvector-model-schema";
+import { documentExtractModelDescription, outputExtractModelDescription, supportedFileFormatsDescription, supportedFileMimes, supportedFileTypesLong, } from "../../supported-mimes";
 import { getDefaultSpec } from "./get-default-spec";
 const extractInputSchema = z.object({
     url: z
@@ -9,17 +10,9 @@ const extractInputSchema = z.object({
         .describe("URL of the document file to fetch and parse"),
     file: z
         .file()
-        .mime([
-        "application/pdf",
-        "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
-        "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet",
-        "text/csv",
-        "application/csv",
-        "image/png",
-        "image/jpeg",
-    ])
+        .mime([...supportedFileMimes])
         .optional()
-        .describe("Document file upload via multipart form-data (PDF, DOCX, XLSX, CSV, PNG, JPG)"),
+        .describe(`Document file upload via multipart form-data (${supportedFileFormatsDescription})`),
     base64: z
         .string()
         .optional()
@@ -59,12 +52,7 @@ const extractInputSchema = z.object({
         .enum(["auto", ...pdfvectorModelSchema.options])
         .optional()
         .default("auto")
-        .describe("Model tier for extracting structured data. " +
-        "'auto' (default): Automatically selects the best tier based on document complexity. " +
-        "'nano': 2 credits/page. Fastest and cheapest. Best for simple documents with straightforward schemas. Supports PDF, Word, Excel, CSV. " +
-        "'mini': 4 credits/page. Balanced speed and accuracy. Handles moderately complex documents and schemas. Supports PDF, Word, Excel, CSV. " +
-        "'pro': 8 credits/page. High accuracy for complex documents with large or nested schemas. Supports PDF, Word, Excel, CSV, Image. " +
-        "'max': 16 credits/page. Maximum accuracy with the most capable models. Best for difficult extractions requiring deep reasoning. Supports PDF, Word, Excel, CSV, Image."),
+        .describe(documentExtractModelDescription),
     callback: z
         .object({
         url: z
@@ -92,11 +80,7 @@ const extractOutputSchema = z
         .number()
         .int()
         .describe("Total number of pages in the document"),
-    model: pdfvectorModelSchema.describe("Model tier used to extract the data. " +
-        "'nano': Fastest, best for simple documents. Supports PDF, Word, Excel, CSV. " +
-        "'mini': Balanced speed and accuracy. Supports PDF, Word, Excel, CSV. " +
-        "'pro': High accuracy for complex documents. Supports PDF, Word, Excel, CSV, Image. " +
-        "'max': Maximum accuracy with deep reasoning. Supports PDF, Word, Excel, CSV, Image."),
+    model: pdfvectorModelSchema.describe(outputExtractModelDescription),
     credits: z
         .number()
         .int()
@@ -175,7 +159,7 @@ const requestExamples = {
 export const extract = oc
     .route({
     summary: "Extract structured data from a document",
-    description: "Parse a document and extract structured data matching a provided JSON Schema using AI. Supports PDF, Word (.docx), Excel (.xlsx), CSV, and Image (.png, .jpg) files. Files up to 1000 pages and up to 500MB in size. Provide the document via file upload, a public URL, or a base64-encoded string.",
+    description: `Parse a document and extract structured data matching a provided JSON Schema using AI. Supports ${supportedFileTypesLong}. Files up to 1000 pages and up to 500MB in size. Provide the document via file upload, a public URL, or a base64-encoded string.`,
     tags: ["Document"],
     spec: (op) => getDefaultSpec(op, requestExamples),
 })

package/.tsc/lib/router/document/parse.js CHANGED Viewed

@@ -1,6 +1,7 @@
 import { oc } from "@orpc/contract";
 import { z } from "zod";
 import { pdfvectorModelSchema } from "../../pdfvector-model-schema";
+import { documentParseModelDescription, outputModelDescription, supportedFileFormatsDescription, supportedFileMimes, supportedFileTypesLong, } from "../../supported-mimes";
 import { getDefaultSpec } from "./get-default-spec";
 const parseInputSchema = z.object({
     url: z
@@ -9,17 +10,9 @@ const parseInputSchema = z.object({
         .describe("URL of the document file to fetch and parse"),
     file: z
         .file()
-        .mime([
-        "application/pdf",
-        "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
-        "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet",
-        "text/csv",
-        "application/csv",
-        "image/png",
-        "image/jpeg",
-    ])
+        .mime([...supportedFileMimes])
         .optional()
-        .describe("Document file upload via multipart form-data (PDF, DOCX, XLSX, CSV, PNG, JPG)"),
+        .describe(`Document file upload via multipart form-data (${supportedFileFormatsDescription})`),
     base64: z
         .string()
         .optional()
@@ -28,12 +21,7 @@ const parseInputSchema = z.object({
         .enum(["auto", ...pdfvectorModelSchema.options])
         .optional()
         .default("auto")
-        .describe("Model tier for parsing. " +
-        "'auto' (default): Automatically selects the best parsing strategy with intelligent fallback. File up to 1000 pages, up to 500MB in size. Supports PDF, Word, Excel, CSV, Image. " +
-        "'nano': 1 credit/page. For simple documents with plain text content. File up to 30 pages, up to 10MB in size. Supports PDF, Word, Excel, CSV. " +
-        "'mini': 2 credits/page. For documents with tables and structured content. File up to 30 pages, up to 10MB in size. Supports PDF, Word, Excel, CSV. " +
-        "'pro': 4 credits/page. For documents up to 30 pages with tables, handwritten text, figures, math, and Arabic. File up to 30 pages, up to 40MB in size. Supports PDF, Word, Excel, CSV, Image. " +
-        "'max': 8 credits/page. For large documents with full Pro capabilities plus enhanced multilingual support. File up to 1000 pages, up to 500MB in size. Supports PDF, Word, Excel, CSV, Image."),
+        .describe(documentParseModelDescription),
     callback: z
         .object({
         url: z
@@ -53,11 +41,7 @@ const parseInputSchema = z.object({
 const parseOutputSchema = z.object({
     markdown: z.string().describe("Extracted text content from the document"),
     pageCount: z.number().int().describe("Total number of pages in the document"),
-    model: pdfvectorModelSchema.describe("Model tier used to parse the document. " +
-        "'nano': Fastest, best for simple documents. Supports PDF, Word, Excel, CSV. " +
-        "'mini': Balanced speed and accuracy. Supports PDF, Word, Excel, CSV. " +
-        "'pro': High accuracy for complex documents. Supports PDF, Word, Excel, CSV, Image. " +
-        "'max': Maximum accuracy with deep reasoning. Supports PDF, Word, Excel, CSV, Image."),
+    model: pdfvectorModelSchema.describe(outputModelDescription),
     credits: z
         .number()
         .int()
@@ -120,7 +104,7 @@ const requestExamples = {
 export const parse = oc
     .route({
     summary: "Parse a document",
-    description: "Extract text and page count from a document. Supports PDF, Word (.docx), Excel (.xlsx), CSV, and Image (.png, .jpg) files. Provide the document via file upload, a public URL, or a base64-encoded string.",
+    description: `Extract text and page count from a document. Supports ${supportedFileTypesLong}. Provide the document via file upload, a public URL, or a base64-encoded string.`,
     tags: ["Document"],
     spec: (op) => getDefaultSpec(op, requestExamples),
 })

package/.tsc/lib/router/free/bank-statement-parse.js CHANGED Viewed

@@ -1,5 +1,6 @@
 import { oc } from "@orpc/contract";
 import { z } from "zod";
+import { supportedFileFormatsDescription, supportedFileMimes, supportedFileTypesLong, } from "../../supported-mimes";
 const inputSchema = z.object({
     url: z
         .url()
@@ -7,17 +8,9 @@ const inputSchema = z.object({
         .describe("URL of the bank statement file to fetch and parse"),
     file: z
         .file()
-        .mime([
-        "application/pdf",
-        "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
-        "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet",
-        "text/csv",
-        "application/csv",
-        "image/png",
-        "image/jpeg",
-    ])
+        .mime([...supportedFileMimes])
         .optional()
-        .describe("Bank statement file upload via multipart form-data (PDF, DOCX, XLSX, CSV, PNG, JPG)"),
+        .describe(`Bank statement file upload via multipart form-data (${supportedFileFormatsDescription})`),
     base64: z
         .string()
         .optional()
@@ -70,7 +63,7 @@ const responseExample = {
 export const bankStatementParse = oc
     .route({
     summary: "Free: Parse a bank statement",
-    description: "Extract text and structured data from a bank statement. Supports PDF, Word, Excel, CSV, and Image files. Free tier: max 5 pages, max 5 MB. Rate limited to 5 requests per IP per day.",
+    description: `Extract text and structured data from a bank statement. Supports ${supportedFileTypesLong}. Free tier: max 5 pages, max 5 MB. Rate limited to 5 requests per IP per day.`,
     tags: ["Free"],
     spec: (op) => {
         op.security = [];

package/.tsc/lib/router/identity/ask.js CHANGED Viewed

@@ -1,6 +1,7 @@
 import { oc } from "@orpc/contract";
 import { z } from "zod";
 import { pdfvectorModelSchema } from "../../pdfvector-model-schema";
+import { outputAskModelDescription, specializedAskModelDescription, supportedFileFormatsDescription, supportedFileMimes, supportedFileTypesLong, } from "../../supported-mimes";
 import { getDefaultSpec } from "./get-default-spec";
 const specializedModelSchema = z
     .enum(["auto", ...pdfvectorModelSchema.options])
@@ -12,17 +13,9 @@ const askInputSchema = z.object({
         .describe("URL of the identity document file to fetch and parse"),
     file: z
         .file()
-        .mime([
-        "application/pdf",
-        "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
-        "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet",
-        "text/csv",
-        "application/csv",
-        "image/png",
-        "image/jpeg",
-    ])
+        .mime([...supportedFileMimes])
         .optional()
-        .describe("Identity document file upload via multipart form-data (PDF, DOCX, XLSX, CSV, PNG, JPG)"),
+        .describe(`Identity document file upload via multipart form-data (${supportedFileFormatsDescription})`),
     base64: z
         .string()
         .optional()
@@ -31,12 +24,7 @@ const askInputSchema = z.object({
         .string()
         .min(4, "question must be at least 4 characters")
         .describe("The question to answer about the identity document"),
-    model: specializedModelSchema.describe("Model tier for answering the question. " +
-        "'auto' (default): Automatically selects the best tier based on document complexity. " +
-        "'nano': 6 credits/page. Fastest and cheapest. Best for simple questions about straightforward documents. Supports PDF, Word, Excel, CSV. " +
-        "'mini': 10 credits/page. Balanced speed and accuracy. Handles moderately complex questions. Supports PDF, Word, Excel, CSV. " +
-        "'pro': 14 credits/page. High accuracy for nuanced questions about complex documents. Supports PDF, Word, Excel, CSV, Image. " +
-        "'max': 18 credits/page. Maximum accuracy with the most capable models. Best for difficult questions requiring deep reasoning. Supports PDF, Word, Excel, CSV, Image."),
+    model: specializedModelSchema.describe(specializedAskModelDescription),
     callback: z
         .object({
         url: z
@@ -56,11 +44,7 @@ const askInputSchema = z.object({
 const askOutputSchema = z.object({
     markdown: z.string().describe("The answer to the question"),
     pageCount: z.number().int().describe("Total number of pages in the document"),
-    model: pdfvectorModelSchema.describe("Model tier used to answer the question. " +
-        "'nano': Fastest, best for simple questions. Supports PDF, Word, Excel, CSV. " +
-        "'mini': Balanced speed and accuracy. Supports PDF, Word, Excel, CSV. " +
-        "'pro': High accuracy for complex questions. Supports PDF, Word, Excel, CSV, Image. " +
-        "'max': Maximum accuracy with deep reasoning. Supports PDF, Word, Excel, CSV, Image."),
+    model: pdfvectorModelSchema.describe(outputAskModelDescription),
     credits: z
         .number()
         .int()
@@ -93,7 +77,7 @@ const requestExamples = {
 export const ask = oc
     .route({
     summary: "Ask a question about an identity document",
-    description: "Parse an identity document and answer a question about its content using AI. Supports PDF, Word (.docx), Excel (.xlsx), CSV, and Image (.png, .jpg) files. Provide the document via file upload, a public URL, or a base64-encoded string.",
+    description: `Parse an identity document and answer a question about its content using AI. Supports ${supportedFileTypesLong}. Provide the document via file upload, a public URL, or a base64-encoded string.`,
     tags: ["Identity"],
     spec: (op) => getDefaultSpec(op, requestExamples),
 })

package/.tsc/lib/router/identity/extract.js CHANGED Viewed

@@ -1,6 +1,7 @@
 import { oc } from "@orpc/contract";
 import { z } from "zod";
 import { pdfvectorModelSchema } from "../../pdfvector-model-schema";
+import { outputExtractModelDescription, specializedExtractModelDescription, supportedFileFormatsDescription, supportedFileMimes, supportedFileTypesLong, } from "../../supported-mimes";
 import { getDefaultSpec } from "./get-default-spec";
 const specializedModelSchema = z
     .enum(["auto", ...pdfvectorModelSchema.options])
@@ -12,17 +13,9 @@ const extractInputSchema = z.object({
         .describe("URL of the identity document file to fetch and parse"),
     file: z
         .file()
-        .mime([
-        "application/pdf",
-        "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
-        "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet",
-        "text/csv",
-        "application/csv",
-        "image/png",
-        "image/jpeg",
-    ])
+        .mime([...supportedFileMimes])
         .optional()
-        .describe("Identity document file upload via multipart form-data (PDF, DOCX, XLSX, CSV, PNG, JPG)"),
+        .describe(`Identity document file upload via multipart form-data (${supportedFileFormatsDescription})`),
     base64: z
         .string()
         .optional()
@@ -57,12 +50,7 @@ const extractInputSchema = z.object({
         }),
     ])
         .describe("JSON Schema describing the structure of the data to extract from the identity document. Can be a JSON object or a JSON string."),
-    model: specializedModelSchema.describe("Model tier for extracting structured data. " +
-        "'auto' (default): Automatically selects the best tier based on document complexity. " +
-        "'nano': 6 credits/page. Fastest and cheapest. Best for simple documents with straightforward schemas. Supports PDF, Word, Excel, CSV. " +
-        "'mini': 10 credits/page. Balanced speed and accuracy. Handles moderately complex documents and schemas. Supports PDF, Word, Excel, CSV. " +
-        "'pro': 14 credits/page. High accuracy for complex documents with large or nested schemas. Supports PDF, Word, Excel, CSV, Image. " +
-        "'max': 18 credits/page. Maximum accuracy with the most capable models. Best for difficult extractions requiring deep reasoning. Supports PDF, Word, Excel, CSV, Image."),
+    model: specializedModelSchema.describe(specializedExtractModelDescription),
     callback: z
         .object({
         url: z
@@ -86,11 +74,7 @@ const extractOutputSchema = z.object({
         (typeof val !== "object" || Object.keys(val).length > 0), { message: "Extracted data must not be empty" })
         .describe("Extracted structured data matching the provided JSON Schema"),
     pageCount: z.number().int().describe("Total number of pages in the document"),
-    model: pdfvectorModelSchema.describe("Model tier used to extract the data. " +
-        "'nano': Fastest, best for simple documents. Supports PDF, Word, Excel, CSV. " +
-        "'mini': Balanced speed and accuracy. Supports PDF, Word, Excel, CSV. " +
-        "'pro': High accuracy for complex documents. Supports PDF, Word, Excel, CSV, Image. " +
-        "'max': Maximum accuracy with deep reasoning. Supports PDF, Word, Excel, CSV, Image."),
+    model: pdfvectorModelSchema.describe(outputExtractModelDescription),
     credits: z
         .number()
         .int()
@@ -125,7 +109,7 @@ const requestExamples = {
 export const extract = oc
     .route({
     summary: "Extract structured data from an identity document",
-    description: "Parse an identity document and extract structured data matching a provided JSON Schema using AI. Supports PDF, Word (.docx), Excel (.xlsx), CSV, and Image (.png, .jpg) files. Provide the document via file upload, a public URL, or a base64-encoded string.",
+    description: `Parse an identity document and extract structured data matching a provided JSON Schema using AI. Supports ${supportedFileTypesLong}. Provide the document via file upload, a public URL, or a base64-encoded string.`,
     tags: ["Identity"],
     spec: (op) => getDefaultSpec(op, requestExamples),
 })

package/.tsc/lib/router/identity/parse.js CHANGED Viewed

@@ -1,5 +1,6 @@
 import { oc } from "@orpc/contract";
 import { z } from "zod";
+import { specializedParseModelDescription, supportedFileFormatsDescription, supportedFileMimes, supportedFileTypesLong, } from "../../supported-mimes";
 import { getDefaultSpec } from "./get-default-spec";
 const specializedParseModelSchema = z
     .enum(["pro", "max", "auto"], {
@@ -13,25 +14,14 @@ const parseInputSchema = z.object({
         .describe("URL of the identity document file to fetch and parse"),
     file: z
         .file()
-        .mime([
-        "application/pdf",
-        "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
-        "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet",
-        "text/csv",
-        "application/csv",
-        "image/png",
-        "image/jpeg",
-    ])
+        .mime([...supportedFileMimes])
         .optional()
-        .describe("Identity document file upload via multipart form-data (PDF, DOCX, XLSX, CSV, PNG, JPG)"),
+        .describe(`Identity document file upload via multipart form-data (${supportedFileFormatsDescription})`),
     base64: z
         .string()
         .optional()
         .describe("Base64-encoded identity document file content"),
-    model: specializedParseModelSchema.describe("Model tier for parsing. " +
-        "'auto' (default): Automatically selects the best parsing strategy with intelligent fallback. " +
-        "'pro': 6 credits/page. Extracts structured identity document fields with standard accuracy. " +
-        "'max': 10 credits/page. Extracts structured identity document fields with highest accuracy."),
+    model: specializedParseModelSchema.describe(specializedParseModelDescription("identity document")),
     callback: z
         .object({
         url: z
@@ -101,7 +91,7 @@ const requestExamples = {
 export const parse = oc
     .route({
     summary: "Parse an identity document",
-    description: "Extract text and structured data from an identity document. Supports PDF, Word (.docx), Excel (.xlsx), CSV, and Image (.png, .jpg) files. Provide the document via file upload, a public URL, or a base64-encoded string.",
+    description: `Extract text and structured data from an identity document. Supports ${supportedFileTypesLong}. Provide the document via file upload, a public URL, or a base64-encoded string.`,
     tags: ["Identity"],
     spec: (op) => getDefaultSpec(op, requestExamples),
 })

package/.tsc/lib/router/invoice/ask.js CHANGED Viewed

@@ -1,6 +1,7 @@
 import { oc } from "@orpc/contract";
 import { z } from "zod";
 import { pdfvectorModelSchema } from "../../pdfvector-model-schema";
+import { outputAskModelDescription, specializedAskModelDescription, supportedFileFormatsDescription, supportedFileMimes, supportedFileTypesLong, } from "../../supported-mimes";
 import { getDefaultSpec } from "./get-default-spec";
 const specializedModelSchema = z
     .enum(["auto", ...pdfvectorModelSchema.options])
@@ -12,28 +13,15 @@ const askInputSchema = z.object({
         .describe("URL of the invoice file to fetch and parse"),
     file: z
         .file()
-        .mime([
-        "application/pdf",
-        "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
-        "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet",
-        "text/csv",
-        "application/csv",
-        "image/png",
-        "image/jpeg",
-    ])
+        .mime([...supportedFileMimes])
         .optional()
-        .describe("Invoice file upload via multipart form-data (PDF, DOCX, XLSX, CSV, PNG, JPG)"),
+        .describe(`Invoice file upload via multipart form-data (${supportedFileFormatsDescription})`),
     base64: z.string().optional().describe("Base64-encoded invoice file content"),
     question: z
         .string()
         .min(4, "question must be at least 4 characters")
         .describe("The question to answer about the invoice"),
-    model: specializedModelSchema.describe("Model tier for answering the question. " +
-        "'auto' (default): Automatically selects the best tier based on document complexity. " +
-        "'nano': 6 credits/page. Fastest and cheapest. Best for simple questions about straightforward documents. Supports PDF, Word, Excel, CSV. " +
-        "'mini': 10 credits/page. Balanced speed and accuracy. Handles moderately complex questions. Supports PDF, Word, Excel, CSV. " +
-        "'pro': 14 credits/page. High accuracy for nuanced questions about complex documents. Supports PDF, Word, Excel, CSV, Image. " +
-        "'max': 18 credits/page. Maximum accuracy with the most capable models. Best for difficult questions requiring deep reasoning. Supports PDF, Word, Excel, CSV, Image."),
+    model: specializedModelSchema.describe(specializedAskModelDescription),
     callback: z
         .object({
         url: z
@@ -53,11 +41,7 @@ const askInputSchema = z.object({
 const askOutputSchema = z.object({
     markdown: z.string().describe("The answer to the question"),
     pageCount: z.number().int().describe("Total number of pages in the document"),
-    model: pdfvectorModelSchema.describe("Model tier used to answer the question. " +
-        "'nano': Fastest, best for simple questions. Supports PDF, Word, Excel, CSV. " +
-        "'mini': Balanced speed and accuracy. Supports PDF, Word, Excel, CSV. " +
-        "'pro': High accuracy for complex questions. Supports PDF, Word, Excel, CSV, Image. " +
-        "'max': Maximum accuracy with deep reasoning. Supports PDF, Word, Excel, CSV, Image."),
+    model: pdfvectorModelSchema.describe(outputAskModelDescription),
     credits: z
         .number()
         .int()
@@ -83,7 +67,7 @@ const requestExamples = {
 export const ask = oc
     .route({
     summary: "Ask a question about an invoice",
-    description: "Parse an invoice and answer a question about its content using AI. Supports PDF, Word (.docx), Excel (.xlsx), CSV, and Image (.png, .jpg) files. Provide the document via file upload, a public URL, or a base64-encoded string.",
+    description: `Parse an invoice and answer a question about its content using AI. Supports ${supportedFileTypesLong}. Provide the document via file upload, a public URL, or a base64-encoded string.`,
     tags: ["Invoice"],
     spec: (op) => getDefaultSpec(op, requestExamples),
 })

package/.tsc/lib/router/invoice/extract.js CHANGED Viewed

@@ -1,6 +1,7 @@
 import { oc } from "@orpc/contract";
 import { z } from "zod";
 import { pdfvectorModelSchema } from "../../pdfvector-model-schema";
+import { outputExtractModelDescription, specializedExtractModelDescription, supportedFileFormatsDescription, supportedFileMimes, supportedFileTypesLong, } from "../../supported-mimes";
 import { getDefaultSpec } from "./get-default-spec";
 const specializedModelSchema = z
     .enum(["auto", ...pdfvectorModelSchema.options])
@@ -12,17 +13,9 @@ const extractInputSchema = z.object({
         .describe("URL of the invoice file to fetch and parse"),
     file: z
         .file()
-        .mime([
-        "application/pdf",
-        "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
-        "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet",
-        "text/csv",
-        "application/csv",
-        "image/png",
-        "image/jpeg",
-    ])
+        .mime([...supportedFileMimes])
         .optional()
-        .describe("Invoice file upload via multipart form-data (PDF, DOCX, XLSX, CSV, PNG, JPG)"),
+        .describe(`Invoice file upload via multipart form-data (${supportedFileFormatsDescription})`),
     base64: z.string().optional().describe("Base64-encoded invoice file content"),
     prompt: z
         .string()
@@ -54,12 +47,7 @@ const extractInputSchema = z.object({
         }),
     ])
         .describe("JSON Schema describing the structure of the data to extract from the invoice. Can be a JSON object or a JSON string."),
-    model: specializedModelSchema.describe("Model tier for extracting structured data. " +
-        "'auto' (default): Automatically selects the best tier based on document complexity. " +
-        "'nano': 6 credits/page. Fastest and cheapest. Best for simple documents with straightforward schemas. Supports PDF, Word, Excel, CSV. " +
-        "'mini': 10 credits/page. Balanced speed and accuracy. Handles moderately complex documents and schemas. Supports PDF, Word, Excel, CSV. " +
-        "'pro': 14 credits/page. High accuracy for complex documents with large or nested schemas. Supports PDF, Word, Excel, CSV, Image. " +
-        "'max': 18 credits/page. Maximum accuracy with the most capable models. Best for difficult extractions requiring deep reasoning. Supports PDF, Word, Excel, CSV, Image."),
+    model: specializedModelSchema.describe(specializedExtractModelDescription),
     callback: z
         .object({
         url: z
@@ -83,11 +71,7 @@ const extractOutputSchema = z.object({
         (typeof val !== "object" || Object.keys(val).length > 0), { message: "Extracted data must not be empty" })
         .describe("Extracted structured data matching the provided JSON Schema"),
     pageCount: z.number().int().describe("Total number of pages in the document"),
-    model: pdfvectorModelSchema.describe("Model tier used to extract the data. " +
-        "'nano': Fastest, best for simple documents. Supports PDF, Word, Excel, CSV. " +
-        "'mini': Balanced speed and accuracy. Supports PDF, Word, Excel, CSV. " +
-        "'pro': High accuracy for complex documents. Supports PDF, Word, Excel, CSV, Image. " +
-        "'max': Maximum accuracy with deep reasoning. Supports PDF, Word, Excel, CSV, Image."),
+    model: pdfvectorModelSchema.describe(outputExtractModelDescription),
     credits: z
         .number()
         .int()
@@ -131,7 +115,7 @@ const requestExamples = {
 export const extract = oc
     .route({
     summary: "Extract structured data from an invoice",
-    description: "Parse an invoice and extract structured data matching a provided JSON Schema using AI. Supports PDF, Word (.docx), Excel (.xlsx), CSV, and Image (.png, .jpg) files. Provide the document via file upload, a public URL, or a base64-encoded string.",
+    description: `Parse an invoice and extract structured data matching a provided JSON Schema using AI. Supports ${supportedFileTypesLong}. Provide the document via file upload, a public URL, or a base64-encoded string.`,
     tags: ["Invoice"],
     spec: (op) => getDefaultSpec(op, requestExamples),
 })

package/.tsc/lib/router/invoice/parse.js CHANGED Viewed

@@ -1,5 +1,6 @@
 import { oc } from "@orpc/contract";
 import { z } from "zod";
+import { specializedParseModelDescription, supportedFileFormatsDescription, supportedFileMimes, supportedFileTypesLong, } from "../../supported-mimes";
 import { getDefaultSpec } from "./get-default-spec";
 const specializedParseModelSchema = z
     .enum(["pro", "max", "auto"], {
@@ -13,22 +14,11 @@ const parseInputSchema = z.object({
         .describe("URL of the invoice file to fetch and parse"),
     file: z
         .file()
-        .mime([
-        "application/pdf",
-        "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
-        "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet",
-        "text/csv",
-        "application/csv",
-        "image/png",
-        "image/jpeg",
-    ])
+        .mime([...supportedFileMimes])
         .optional()
-        .describe("Invoice file upload via multipart form-data (PDF, DOCX, XLSX, CSV, PNG, JPG)"),
+        .describe(`Invoice file upload via multipart form-data (${supportedFileFormatsDescription})`),
     base64: z.string().optional().describe("Base64-encoded invoice file content"),
-    model: specializedParseModelSchema.describe("Model tier for parsing. " +
-        "'auto' (default): Automatically selects the best parsing strategy with intelligent fallback. " +
-        "'pro': 6 credits/page. Extracts structured invoice fields with standard accuracy. " +
-        "'max': 10 credits/page. Extracts structured invoice fields with highest accuracy and fallback."),
+    model: specializedParseModelSchema.describe(specializedParseModelDescription("invoice")),
     callback: z
         .object({
         url: z
@@ -92,7 +82,7 @@ const requestExamples = {
 export const parse = oc
     .route({
     summary: "Parse an invoice",
-    description: "Extract text and structured data from an invoice. Supports PDF, Word (.docx), Excel (.xlsx), CSV, and Image (.png, .jpg) files. Provide the document via file upload, a public URL, or a base64-encoded string.",
+    description: `Extract text and structured data from an invoice. Supports ${supportedFileTypesLong}. Provide the document via file upload, a public URL, or a base64-encoded string.`,
     tags: ["Invoice"],
     spec: (op) => getDefaultSpec(op, requestExamples),
 })

package/.tsc/lib/supported-mimes.d.ts ADDED Viewed

@@ -0,0 +1,29 @@
+/**
+ * All MIME types accepted for file uploads across all API endpoints.
+ * Single source of truth — imported by all contract schemas.
+ */
+export declare const supportedFileMimes: readonly ["application/pdf", "application/vnd.openxmlformats-officedocument.wordprocessingml.document", "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet", "application/vnd.openxmlformats-officedocument.presentationml.presentation", "text/csv", "application/csv", "image/png", "image/jpeg", "image/tiff", "image/bmp", "image/heif", "image/heic", "text/plain", "text/markdown", "text/tab-separated-values", "text/xml", "application/xml", "application/rtf", "text/rtf", "text/html", "application/epub+zip", "application/vnd.oasis.opendocument.text", "application/vnd.oasis.opendocument.spreadsheet", "application/vnd.oasis.opendocument.presentation", "application/x-bibtex"];
+export declare const supportedFileFormatsDescription = "PDF, DOCX, XLSX, PPTX, CSV, PNG, JPG, TIFF, BMP, HEIF, TXT, MD, TSV, XML, RTF, HTML, ODT, ODS, ODP, EPUB, BIB, RIS, NBIB, ENW";
+/**
+ * Human-readable description of supported file types with extensions.
+ * Used in route-level API descriptions.
+ */
+export declare const supportedFileTypesLong: string;
+/** Model tier descriptions for document parse endpoints. */
+export declare const documentParseModelDescription: string;
+/** Model tier descriptions for document extract endpoints. */
+export declare const documentExtractModelDescription: string;
+/** Model tier descriptions for document ask endpoints. */
+export declare const documentAskModelDescription: string;
+/** Model tier descriptions for invoice/identity/bankStatement parse endpoints (pro/max/auto only). */
+export declare const specializedParseModelDescription: (type: string) => string;
+/** Model tier descriptions for invoice/identity/bankStatement extract endpoints. */
+export declare const specializedExtractModelDescription: string;
+/** Model tier descriptions for invoice/identity/bankStatement ask endpoints. */
+export declare const specializedAskModelDescription: string;
+/** Output model description for parse results. */
+export declare const outputModelDescription: string;
+/** Output model description for extract results. */
+export declare const outputExtractModelDescription: string;
+/** Output model description for ask results. */
+export declare const outputAskModelDescription: string;