@exulu/backend 1.57.0 → 1.58.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -630,7 +630,7 @@ async function processDocument(
630
630
  source: filePath,
631
631
  }
632
632
 
633
- const stripped = filePath.split('.').pop()?.trim();
633
+ const stripped = filePath.split('.').pop()?.trim().toLowerCase();
634
634
  let result: ProcessorOutput;
635
635
  switch (stripped) {
636
636
  case 'txt':
@@ -1017,7 +1017,7 @@ export async function documentProcessor({
1017
1017
  supportedTypes = ['pdf', 'docx', 'doc', 'txt', 'md', 'jpg', 'jpeg', 'png', 'gif', 'webp'];
1018
1018
  break;
1019
1019
  case "officeparser":
1020
- supportedTypes = [];
1020
+ supportedTypes = ['docx', 'pptx', 'xlsx', 'odt', 'odp', 'ods', 'pdf', 'rtf', 'csv', 'md', 'html'];
1021
1021
  break;
1022
1022
  case "liteparse":
1023
1023
  supportedTypes = ['pdf', 'doc', 'docx', 'docm', 'odt', 'rtf', 'ppt', 'pptx', 'pptm', 'odp', 'xls', 'xlsx', 'xlsm', 'ods', 'csv', 'tsv'];
@@ -1027,8 +1027,8 @@ export async function documentProcessor({
1027
1027
  break;
1028
1028
  }
1029
1029
 
1030
- if (!supportedTypes.includes(fileType)) {
1031
- throw new Error(`[EXULU] Unsupported file type: ${fileType} for Exulu document processor, the ${config?.processor.name} processor only supports the following file types: ${supportedTypes.join(', ')}.`);
1030
+ if (!supportedTypes.includes(fileType.toLowerCase())) {
1031
+ throw new Error(`[EXULU] Unsupported file type: ${fileType.toLowerCase()} for Exulu document processor, the ${config?.processor.name} processor only supports the following file types: ${supportedTypes.join(', ')}.`);
1032
1032
  }
1033
1033
 
1034
1034
  // Process document with VLM validation enabled
@@ -1043,7 +1043,6 @@ export async function documentProcessor({
1043
1043
 
1044
1044
  return content.json;
1045
1045
 
1046
-
1047
1046
  } catch (error) {
1048
1047
  console.error('Error during chunking:', error);
1049
1048
  throw error;
@@ -2,3 +2,4 @@ docling
2
2
  transformers
3
3
  pyinstaller
4
4
  docling-hierarchical-pdf
5
+ defusedxml
package/ee/workers.ts CHANGED
@@ -405,6 +405,9 @@ export const createWorkers = async (
405
405
  // not part of the database, so remove it here before
406
406
  // we update the item in the db.
407
407
  delete processorResult.field;
408
+ // fts is a generated column (tsvector GENERATED ALWAYS AS ... STORED)
409
+ // and Postgres rejects any explicit update to it.
410
+ delete processorResult.fts;
408
411
 
409
412
  // Memory optimization: For large processor results (e.g., documents),
410
413
  // extract only the fields we need for the database update to avoid
package/package.json CHANGED
@@ -1,7 +1,7 @@
1
1
  {
2
2
  "name": "@exulu/backend",
3
3
  "author": "Qventu Bv.",
4
- "version": "1.57.0",
4
+ "version": "1.58.0",
5
5
  "main": "./dist/index.js",
6
6
  "private": false,
7
7
  "publishConfig": {
@@ -88,8 +88,8 @@
88
88
  "dependencies": {
89
89
  "@ai-sdk/anthropic": "^3.0.23",
90
90
  "@ai-sdk/azure": "^3.0.53",
91
- "@ai-sdk/cerebras": "^2.0.29",
92
- "@ai-sdk/google-vertex": "^4.0.28",
91
+ "@ai-sdk/cerebras": "^2.0.51",
92
+ "@ai-sdk/google-vertex": "^4.0.136",
93
93
  "@ai-sdk/openai": "^3.0.18",
94
94
  "@ai-sdk/openai-compatible": "^2.0.37",
95
95
  "@anthropic-ai/sandbox-runtime": "^0.0.49",