@botpress/api 0.50.1 → 0.50.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/src/gen/state.ts CHANGED
@@ -10548,6 +10548,10 @@ export const state = {
10548
10548
  "minimum": 50,
10549
10549
  "maximum": 2000,
10550
10550
  "description": "The minimum length a standalone paragraph should have. If a paragraph is shorter than this, it will be merged with the next immediate paragraph."
10551
+ },
10552
+ "smartCleanup": {
10553
+ "type": "boolean",
10554
+ "description": "(Team/Enterprise plan only, charged as AI Spend) Enabling this will use a lightweight/inexpensive LLM to clean up the extracted content of PDF files before indexing them to increase the quality of the stored vectors, as PDFs often store raw text in unusual ways which, when extracted, may result in formatting issues (e.g. broken sentences/paragraphs, unexpected headings, garbled characters, etc.) that can affect retrieval performance for certain user queries if left untouched.\n\nNotes:\n- This feature is only available in Team and Enterprise plans.\n- This feature is only available for PDF files. If the file isn't a PDF, this setting will be ignored and no AI Spend will be incurred.\n- We recommend using this feature for PDFs that have custom layouts or design. For simple text-based PDFs like documents and books, this feature is usually not necessary.\n- The smart cleanup takes some time to perform due to the LLM calls involved, so enabling it will increase the total time it takes to index the file.\n- We take steps to prevent the original text from being fundamentally changed, but due to the nature of LLMs this could theoretically still happen, so it's recommended to review the passages generated for the file after indexing to ensure the content is still accurate.\n- This feature is limited to the first 30 pages or 20 KB of text in the PDF file (whichever comes first). If the file has more content than these limits, the rest of the file will be indexed as-is without any cleanup. If you need to clean up the content of the entire file, consider splitting it into smaller files."
10551
10555
  }
10552
10556
  },
10553
10557
  "additionalProperties": false
@@ -10580,7 +10584,7 @@ export const state = {
10580
10584
  "enable": {
10581
10585
  "default": false,
10582
10586
  "type": "boolean",
10583
- "description": "Create summaries for this file and index them as standalone vectors. Enabling this option will incur in AI Spend cost (charged to the workspace of the bot) to generate the summaries based on the amount of content in the file and the summarization model used. Please note that this feature is only available in Team/Enterprise plans."
10587
+ "description": "(Team/Enterprise plan only, charged as AI Spend) Create summaries for this file and index them as standalone vectors. Enabling this option will incur AI Spend cost (charged to the workspace of the bot) to generate the summaries based on the amount of content in the file and the summarization model used.\n\nPlease note that this feature is only available in Team and Enterprise plans."
10584
10588
  },
10585
10589
  "modelType": {
10586
10590
  "default": "balanced",
@@ -12427,7 +12431,7 @@ export const state = {
12427
12431
  "title": "Botpress API",
12428
12432
  "description": "API for Botpress Cloud",
12429
12433
  "server": "https://api.botpress.cloud",
12430
- "version": "0.50.1",
12434
+ "version": "0.50.2",
12431
12435
  "prefix": "v1"
12432
12436
  },
12433
12437
  "errors": [