@arbidocs/client 0.3.46 → 0.3.48

This diff shows the contents of publicly available package versions as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
package/dist/index.d.cts CHANGED
@@ -2350,7 +2350,7 @@ interface components {
2350
2350
  * @default {
2351
2351
  * "API_TYPE": "remote",
2352
2352
  * "ENABLE_THINKING": true,
2353
- * "MODEL_NAME": "GLM5@Fireworks",
2353
+ * "MODEL_NAME": "Premium",
2354
2354
  * "SYSTEM_INSTRUCTION": "You are a code execution agent. You write and run code to accomplish tasks.\n\nYou have access to an execute_code tool that runs code in a sandboxed Docker container.\n\nThe sandbox has:\n- Python 3.12 with numpy, pandas, matplotlib, requests, beautifulsoup4,\n httpx, pillow, sympy, pyyaml (plus uv for installing more)\n- Node.js 22 with TypeScript (ts-node) and npm\n- Bash with git, curl, wget, jq, sqlite3, build-essential\n- Network access (can pip/npm install additional packages)\n\nInstructions:\n1. Write clean, correct code to accomplish the user's task\n2. Always call execute_code to run your code — never guess the output\n3. If execution errors, analyze the traceback, fix the code, and retry\n4. Once you have the correct output, respond with ONLY the final result\n\nKeep code simple and direct. Prefer Python unless the task specifically requires another language.",
2355
2355
  * "TEMPERATURE": 0.2,
2356
2356
  * "MAX_TOKENS": 8000,
@@ -2400,8 +2400,7 @@ interface components {
2400
2400
  /**
2401
2401
  * @default {
2402
2402
  * "MAX_CHUNK_TOKENS": 1200,
2403
- * "TOKENIZER_TYPE": "huggingface",
2404
- * "TOKENIZER_NAME": "Qwen/Qwen3-Embedding-0.6B"
2403
+ * "TOKENIZER_NAME": "cl100k_base"
2405
2404
  * }
2406
2405
  */
2407
2406
  Chunker: components['schemas']['ChunkerConfig'];
@@ -2762,21 +2761,14 @@ interface components {
2762
2761
  ChunkerConfig: {
2763
2762
  /**
2764
2763
  * Max Chunk Tokens
2765
- * @description Maximum tokens per chunk. The tokenizer used depends on TOKENIZER_TYPE.
2764
+ * @description Maximum tokens per chunk. Enforces a hard upper bound on chunk size; the tiktoken encoding is model-agnostic and used only for counting.
2766
2765
  * @default 1200
2767
2766
  */
2768
2767
  MAX_CHUNK_TOKENS: number;
2769
- /**
2770
- * Tokenizer Type
2771
- * @description Tokenizer backend: 'tiktoken' for OpenAI models (cl100k_base, etc.) or 'huggingface' for HF models (Qwen3-Embedding, etc.).
2772
- * @default huggingface
2773
- * @enum {string}
2774
- */
2775
- TOKENIZER_TYPE: 'tiktoken' | 'huggingface';
2776
2768
  /**
2777
2769
  * Tokenizer Name
2778
- * @description Tokenizer name. For tiktoken: 'cl100k_base', 'o200k_base', etc. For huggingface: model name like 'Qwen/Qwen3-Embedding-0.6B'.
2779
- * @default Qwen/Qwen3-Embedding-0.6B
2770
+ * @description Name of the tiktoken encoding used for chunk-size counting (e.g. 'cl100k_base', 'o200k_base').
2771
+ * @default cl100k_base
2780
2772
  */
2781
2773
  TOKENIZER_NAME: string;
2782
2774
  };
@@ -2820,7 +2812,7 @@ interface components {
2820
2812
  /**
2821
2813
  * Model Name
2822
2814
  * @description Model for code generation. Should be a strong coding model.
2823
- * @default GLM5@Fireworks
2815
+ * @default Premium
2824
2816
  */
2825
2817
  MODEL_NAME: string;
2826
2818
  /**
@@ -3410,8 +3402,8 @@ interface components {
3410
3402
  * @description A pair of documents identified as near-duplicates by centroid similarity.
3411
3403
  */
3412
3404
  DocSimPair: {
3413
- doc_a: components['schemas']['DocResponse'];
3414
- doc_b: components['schemas']['DocResponse'];
3405
+ doc_a: components['schemas']['DocSimSummary'];
3406
+ doc_b: components['schemas']['DocSimSummary'];
3415
3407
  /** Similarity */
3416
3408
  similarity: number;
3417
3409
  };
@@ -3425,6 +3417,16 @@ interface components {
3425
3417
  /** Pairs */
3426
3418
  pairs: components['schemas']['DocSimPair'][];
3427
3419
  };
3420
+ /**
3421
+ * DocSimSummary
3422
+ * @description Lightweight document summary for the similar-documents endpoint.
3423
+ */
3424
+ DocSimSummary: {
3425
+ /** External Id */
3426
+ external_id: string;
3427
+ /** File Name */
3428
+ file_name?: string | null;
3429
+ };
3428
3430
  /**
3429
3431
  * DocTagResponse
3430
3432
  * @description Response for doctag operations - the link between a document and a tag.
@@ -7117,6 +7119,11 @@ interface components {
7117
7119
  * @default false
7118
7120
  */
7119
7121
  show_agent_sessions: boolean;
7122
+ /**
7123
+ * Use S3 Direct Upload
7124
+ * @default false
7125
+ */
7126
+ use_s3_direct_upload: boolean;
7120
7127
  /**
7121
7128
  * Hide Online Status
7122
7129
  * @default false
@@ -7161,6 +7168,8 @@ interface components {
7161
7168
  show_pa_mode?: boolean | null;
7162
7169
  /** Show Agent Sessions */
7163
7170
  show_agent_sessions?: boolean | null;
7171
+ /** Use S3 Direct Upload */
7172
+ use_s3_direct_upload?: boolean | null;
7164
7173
  /** Hide Online Status */
7165
7174
  hide_online_status?: boolean | null;
7166
7175
  /** Muted Users */
@@ -8676,7 +8685,7 @@ interface operations {
8676
8685
  get_similar_documents: {
8677
8686
  parameters: {
8678
8687
  query?: {
8679
- /** @description Minimum similarity score (default 0.92 for near-duplicates) */
8688
+ /** @description Minimum similarity score (default 0.95 for near-duplicates) */
8680
8689
  threshold?: number;
8681
8690
  /** @description Filter pairs involving a specific document */
8682
8691
  doc_ext_id?: string | null;
package/dist/index.d.ts CHANGED
@@ -2350,7 +2350,7 @@ interface components {
2350
2350
  * @default {
2351
2351
  * "API_TYPE": "remote",
2352
2352
  * "ENABLE_THINKING": true,
2353
- * "MODEL_NAME": "GLM5@Fireworks",
2353
+ * "MODEL_NAME": "Premium",
2354
2354
  * "SYSTEM_INSTRUCTION": "You are a code execution agent. You write and run code to accomplish tasks.\n\nYou have access to an execute_code tool that runs code in a sandboxed Docker container.\n\nThe sandbox has:\n- Python 3.12 with numpy, pandas, matplotlib, requests, beautifulsoup4,\n httpx, pillow, sympy, pyyaml (plus uv for installing more)\n- Node.js 22 with TypeScript (ts-node) and npm\n- Bash with git, curl, wget, jq, sqlite3, build-essential\n- Network access (can pip/npm install additional packages)\n\nInstructions:\n1. Write clean, correct code to accomplish the user's task\n2. Always call execute_code to run your code — never guess the output\n3. If execution errors, analyze the traceback, fix the code, and retry\n4. Once you have the correct output, respond with ONLY the final result\n\nKeep code simple and direct. Prefer Python unless the task specifically requires another language.",
2355
2355
  * "TEMPERATURE": 0.2,
2356
2356
  * "MAX_TOKENS": 8000,
@@ -2400,8 +2400,7 @@ interface components {
2400
2400
  /**
2401
2401
  * @default {
2402
2402
  * "MAX_CHUNK_TOKENS": 1200,
2403
- * "TOKENIZER_TYPE": "huggingface",
2404
- * "TOKENIZER_NAME": "Qwen/Qwen3-Embedding-0.6B"
2403
+ * "TOKENIZER_NAME": "cl100k_base"
2405
2404
  * }
2406
2405
  */
2407
2406
  Chunker: components['schemas']['ChunkerConfig'];
@@ -2762,21 +2761,14 @@ interface components {
2762
2761
  ChunkerConfig: {
2763
2762
  /**
2764
2763
  * Max Chunk Tokens
2765
- * @description Maximum tokens per chunk. The tokenizer used depends on TOKENIZER_TYPE.
2764
+ * @description Maximum tokens per chunk. Enforces a hard upper bound on chunk size; the tiktoken encoding is model-agnostic and used only for counting.
2766
2765
  * @default 1200
2767
2766
  */
2768
2767
  MAX_CHUNK_TOKENS: number;
2769
- /**
2770
- * Tokenizer Type
2771
- * @description Tokenizer backend: 'tiktoken' for OpenAI models (cl100k_base, etc.) or 'huggingface' for HF models (Qwen3-Embedding, etc.).
2772
- * @default huggingface
2773
- * @enum {string}
2774
- */
2775
- TOKENIZER_TYPE: 'tiktoken' | 'huggingface';
2776
2768
  /**
2777
2769
  * Tokenizer Name
2778
- * @description Tokenizer name. For tiktoken: 'cl100k_base', 'o200k_base', etc. For huggingface: model name like 'Qwen/Qwen3-Embedding-0.6B'.
2779
- * @default Qwen/Qwen3-Embedding-0.6B
2770
+ * @description Name of the tiktoken encoding used for chunk-size counting (e.g. 'cl100k_base', 'o200k_base').
2771
+ * @default cl100k_base
2780
2772
  */
2781
2773
  TOKENIZER_NAME: string;
2782
2774
  };
@@ -2820,7 +2812,7 @@ interface components {
2820
2812
  /**
2821
2813
  * Model Name
2822
2814
  * @description Model for code generation. Should be a strong coding model.
2823
- * @default GLM5@Fireworks
2815
+ * @default Premium
2824
2816
  */
2825
2817
  MODEL_NAME: string;
2826
2818
  /**
@@ -3410,8 +3402,8 @@ interface components {
3410
3402
  * @description A pair of documents identified as near-duplicates by centroid similarity.
3411
3403
  */
3412
3404
  DocSimPair: {
3413
- doc_a: components['schemas']['DocResponse'];
3414
- doc_b: components['schemas']['DocResponse'];
3405
+ doc_a: components['schemas']['DocSimSummary'];
3406
+ doc_b: components['schemas']['DocSimSummary'];
3415
3407
  /** Similarity */
3416
3408
  similarity: number;
3417
3409
  };
@@ -3425,6 +3417,16 @@ interface components {
3425
3417
  /** Pairs */
3426
3418
  pairs: components['schemas']['DocSimPair'][];
3427
3419
  };
3420
+ /**
3421
+ * DocSimSummary
3422
+ * @description Lightweight document summary for the similar-documents endpoint.
3423
+ */
3424
+ DocSimSummary: {
3425
+ /** External Id */
3426
+ external_id: string;
3427
+ /** File Name */
3428
+ file_name?: string | null;
3429
+ };
3428
3430
  /**
3429
3431
  * DocTagResponse
3430
3432
  * @description Response for doctag operations - the link between a document and a tag.
@@ -7117,6 +7119,11 @@ interface components {
7117
7119
  * @default false
7118
7120
  */
7119
7121
  show_agent_sessions: boolean;
7122
+ /**
7123
+ * Use S3 Direct Upload
7124
+ * @default false
7125
+ */
7126
+ use_s3_direct_upload: boolean;
7120
7127
  /**
7121
7128
  * Hide Online Status
7122
7129
  * @default false
@@ -7161,6 +7168,8 @@ interface components {
7161
7168
  show_pa_mode?: boolean | null;
7162
7169
  /** Show Agent Sessions */
7163
7170
  show_agent_sessions?: boolean | null;
7171
+ /** Use S3 Direct Upload */
7172
+ use_s3_direct_upload?: boolean | null;
7164
7173
  /** Hide Online Status */
7165
7174
  hide_online_status?: boolean | null;
7166
7175
  /** Muted Users */
@@ -8676,7 +8685,7 @@ interface operations {
8676
8685
  get_similar_documents: {
8677
8686
  parameters: {
8678
8687
  query?: {
8679
- /** @description Minimum similarity score (default 0.92 for near-duplicates) */
8688
+ /** @description Minimum similarity score (default 0.95 for near-duplicates) */
8680
8689
  threshold?: number;
8681
8690
  /** @description Filter pairs involving a specific document */
8682
8691
  doc_ext_id?: string | null;
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@arbidocs/client",
3
- "version": "0.3.46",
3
+ "version": "0.3.48",
4
4
  "description": "TypeScript SDK for the ARBI API — zero-knowledge auth, E2E encryption, and type-safe REST client",
5
5
  "type": "module",
6
6
  "main": "dist/index.cjs",