carbon_ruby_sdk 0.2.16 → 0.2.18
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/Gemfile.lock +16 -20
- data/README.md +28 -7
- data/lib/carbon_ruby_sdk/api/embeddings_api.rb +6 -2
- data/lib/carbon_ruby_sdk/api/files_api.rb +15 -4
- data/lib/carbon_ruby_sdk/api/integrations_api.rb +8 -8
- data/lib/carbon_ruby_sdk/models/file_sync_config.rb +11 -1
- data/lib/carbon_ruby_sdk/models/file_sync_config_nullable.rb +11 -1
- data/lib/carbon_ruby_sdk/models/get_embedding_documents_body.rb +18 -5
- data/lib/carbon_ruby_sdk/models/o_auth_url_request.rb +2 -2
- data/lib/carbon_ruby_sdk/models/object_type.rb +42 -0
- data/lib/carbon_ruby_sdk/models/organization_user_files_to_sync_filters.rb +18 -5
- data/lib/carbon_ruby_sdk/models/sent_webhook_payload.rb +276 -0
- data/lib/carbon_ruby_sdk/models/sent_webhook_payload_object.rb +235 -0
- data/lib/carbon_ruby_sdk/models/sent_webhook_payload_object_additional_information.rb +101 -0
- data/lib/carbon_ruby_sdk/models/sent_webhook_payload_object_object_id.rb +103 -0
- data/lib/carbon_ruby_sdk/models/sent_webhook_request_body.rb +215 -0
- data/lib/carbon_ruby_sdk/models/sync_files_request.rb +1 -1
- data/lib/carbon_ruby_sdk/models/sync_options.rb +1 -1
- data/lib/carbon_ruby_sdk/models/transcription_service.rb +36 -0
- data/lib/carbon_ruby_sdk/models/transcription_service_nullable.rb +36 -0
- data/lib/carbon_ruby_sdk/models/upload_file_from_url_input.rb +11 -1
- data/lib/carbon_ruby_sdk/version.rb +1 -1
- data/lib/carbon_ruby_sdk.rb +8 -0
- data/spec/api/files_api_spec.rb +1 -0
- data/spec/models/file_sync_config_nullable_spec.rb +6 -0
- data/spec/models/file_sync_config_spec.rb +6 -0
- data/spec/models/get_embedding_documents_body_spec.rb +6 -0
- data/spec/models/object_type_spec.rb +22 -0
- data/spec/models/organization_user_files_to_sync_filters_spec.rb +6 -0
- data/spec/models/sent_webhook_payload_object_additional_information_spec.rb +25 -0
- data/spec/models/sent_webhook_payload_object_object_id_spec.rb +25 -0
- data/spec/models/sent_webhook_payload_object_spec.rb +40 -0
- data/spec/models/sent_webhook_payload_spec.rb +50 -0
- data/spec/models/sent_webhook_request_body_spec.rb +28 -0
- data/spec/models/transcription_service_nullable_spec.rb +22 -0
- data/spec/models/transcription_service_spec.rb +22 -0
- data/spec/models/upload_file_from_url_input_spec.rb +6 -0
- metadata +27 -3
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 621a55f88f43768897cf3086257a2c73bb47a8417043d4576e9097069c979a75
|
4
|
+
data.tar.gz: 8a19d96655e5c7230b5dc1d4d34ed2faae53b270e78a973ffae5396041c8ed40
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 610cc7b260e629e544ae15e90b0120276403d5beb06936613b6cc7956272a3761c596ad8d8cb34ad2d91b66b1ba55ebdf25fcf2606139ea3976eae842bb98823
|
7
|
+
data.tar.gz: 8d082ccc3c69fe4b64f47462f3b97cfab0ea508b2cba1cac9db5efc4975461f823d40c39a5ce9e610d09a3ab37a20397770fd6d634c7bb54c32d24587ab2b32a
|
data/Gemfile.lock
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
PATH
|
2
2
|
remote: .
|
3
3
|
specs:
|
4
|
-
carbon_ruby_sdk (0.2.
|
4
|
+
carbon_ruby_sdk (0.2.17)
|
5
5
|
faraday (>= 1.0.1, < 3.0)
|
6
6
|
faraday-multipart (~> 1.0, >= 1.0.4)
|
7
7
|
|
@@ -15,9 +15,8 @@ GEM
|
|
15
15
|
irb (>= 1.5.0)
|
16
16
|
reline (>= 0.3.1)
|
17
17
|
diff-lcs (1.5.1)
|
18
|
-
faraday (2.
|
18
|
+
faraday (2.9.0)
|
19
19
|
faraday-net_http (>= 2.0, < 3.2)
|
20
|
-
logger
|
21
20
|
faraday-multipart (1.0.4)
|
22
21
|
multipart-post (~> 2)
|
23
22
|
faraday-net_http (3.1.0)
|
@@ -25,13 +24,12 @@ GEM
|
|
25
24
|
io-console (0.7.2)
|
26
25
|
irb (1.6.4)
|
27
26
|
reline (>= 0.3.0)
|
28
|
-
|
29
|
-
|
30
|
-
multipart-post (2.4.1)
|
27
|
+
method_source (1.0.0)
|
28
|
+
multipart-post (2.4.0)
|
31
29
|
net-http (0.4.1)
|
32
30
|
uri
|
33
|
-
parallel (1.
|
34
|
-
parser (3.3.
|
31
|
+
parallel (1.24.0)
|
32
|
+
parser (3.3.0.5)
|
35
33
|
ast (~> 2.4.1)
|
36
34
|
racc
|
37
35
|
pry (0.14.2)
|
@@ -40,24 +38,23 @@ GEM
|
|
40
38
|
pry-byebug (3.10.1)
|
41
39
|
byebug (~> 11.0)
|
42
40
|
pry (>= 0.13, < 0.15)
|
43
|
-
racc (1.
|
41
|
+
racc (1.7.3)
|
44
42
|
rainbow (3.1.1)
|
45
43
|
rake (13.0.6)
|
46
|
-
regexp_parser (2.9.
|
47
|
-
reline (0.5.
|
44
|
+
regexp_parser (2.9.0)
|
45
|
+
reline (0.5.0)
|
48
46
|
io-console (~> 0.5)
|
49
|
-
rexml (3.
|
50
|
-
strscan
|
47
|
+
rexml (3.2.6)
|
51
48
|
rspec (3.13.0)
|
52
49
|
rspec-core (~> 3.13.0)
|
53
50
|
rspec-expectations (~> 3.13.0)
|
54
51
|
rspec-mocks (~> 3.13.0)
|
55
52
|
rspec-core (3.13.0)
|
56
53
|
rspec-support (~> 3.13.0)
|
57
|
-
rspec-expectations (3.13.
|
54
|
+
rspec-expectations (3.13.0)
|
58
55
|
diff-lcs (>= 1.2.0, < 2.0)
|
59
56
|
rspec-support (~> 3.13.0)
|
60
|
-
rspec-mocks (3.13.
|
57
|
+
rspec-mocks (3.13.0)
|
61
58
|
diff-lcs (>= 1.2.0, < 2.0)
|
62
59
|
rspec-support (~> 3.13.0)
|
63
60
|
rspec-support (3.13.1)
|
@@ -70,15 +67,14 @@ GEM
|
|
70
67
|
rubocop-ast (>= 1.2.0, < 2.0)
|
71
68
|
ruby-progressbar (~> 1.7)
|
72
69
|
unicode-display_width (>= 1.4.0, < 3.0)
|
73
|
-
rubocop-ast (1.31.
|
74
|
-
parser (>= 3.3.
|
70
|
+
rubocop-ast (1.31.2)
|
71
|
+
parser (>= 3.3.0.4)
|
75
72
|
ruby-progressbar (1.13.0)
|
76
|
-
strscan (3.1.0)
|
77
73
|
unicode-display_width (2.5.0)
|
78
74
|
uri (0.13.0)
|
79
75
|
|
80
76
|
PLATFORMS
|
81
|
-
arm64-darwin-
|
77
|
+
arm64-darwin-22
|
82
78
|
|
83
79
|
DEPENDENCIES
|
84
80
|
carbon_ruby_sdk!
|
@@ -90,4 +86,4 @@ DEPENDENCIES
|
|
90
86
|
rubocop (~> 1.12.1)
|
91
87
|
|
92
88
|
BUNDLED WITH
|
93
|
-
2.
|
89
|
+
2.4.19
|
data/README.md
CHANGED
@@ -6,7 +6,7 @@
|
|
6
6
|
|
7
7
|
Connect external data to LLMs, no matter the source.
|
8
8
|
|
9
|
-
[![npm](https://img.shields.io/badge/gem-v0.2.
|
9
|
+
[![npm](https://img.shields.io/badge/gem-v0.2.18-blue)](https://rubygems.org/gems/carbon_ruby_sdk/versions/0.2.18)
|
10
10
|
|
11
11
|
</div>
|
12
12
|
|
@@ -91,7 +91,7 @@ Connect external data to LLMs, no matter the source.
|
|
91
91
|
Add to Gemfile:
|
92
92
|
|
93
93
|
```ruby
|
94
|
-
gem 'carbon_ruby_sdk', '~> 0.2.
|
94
|
+
gem 'carbon_ruby_sdk', '~> 0.2.18'
|
95
95
|
```
|
96
96
|
|
97
97
|
## Getting Started<a id="getting-started"></a>
|
@@ -385,6 +385,9 @@ result = carbon.embeddings.get_documents(
|
|
385
385
|
rerank: {
|
386
386
|
"model" => "model_example",
|
387
387
|
},
|
388
|
+
file_types_at_source: [
|
389
|
+
"string_example"
|
390
|
+
],
|
388
391
|
)
|
389
392
|
p result
|
390
393
|
```
|
@@ -449,6 +452,10 @@ default, this is set to false. If true, the search may return more accurate
|
|
449
452
|
results, but may take longer to complete.
|
450
453
|
|
451
454
|
##### rerank: [`RerankParamsNullable`](./lib/carbon_ruby_sdk/models/rerank_params_nullable.rb)<a id="rerank-rerankparamsnullablelibcarbon_ruby_sdkmodelsrerank_params_nullablerb"></a>
|
455
|
+
##### file_types_at_source: Array<[`HelpdeskFileTypes`](./lib/carbon_ruby_sdk/models/helpdesk_file_types.rb)><a id="file_types_at_source-array"></a>
|
456
|
+
Filter files based on their type at the source (for example help center tickets
|
457
|
+
and articles)
|
458
|
+
|
452
459
|
#### 🔄 Return<a id="🔄-return"></a>
|
453
460
|
|
454
461
|
[DocumentResponseList](./lib/carbon_ruby_sdk/models/document_response_list.rb)
|
@@ -1071,6 +1078,7 @@ result = carbon.files.upload(
|
|
1071
1078
|
max_items_per_chunk: 1,
|
1072
1079
|
parse_pdf_tables_with_ocr: false,
|
1073
1080
|
detect_audio_language: false,
|
1081
|
+
transcription_service: "assemblyai",
|
1074
1082
|
media_type: "TEXT",
|
1075
1083
|
split_rows: false,
|
1076
1084
|
)
|
@@ -1118,6 +1126,10 @@ Whether to use rich table parsing when `use_ocr` is enabled.
|
|
1118
1126
|
##### detect_audio_language: `Boolean`<a id="detect_audio_language-boolean"></a>
|
1119
1127
|
Whether to automatically detect the language of the uploaded audio file.
|
1120
1128
|
|
1129
|
+
##### transcription_service: [`TranscriptionServiceNullable`](./lib/carbon_ruby_sdk/models/transcription_service_nullable.rb)<a id="transcription_service-transcriptionservicenullablelibcarbon_ruby_sdkmodelstranscription_service_nullablerb"></a>
|
1130
|
+
The transcription service to use for audio files. If no service is specified,
|
1131
|
+
'deepgram' will be used.
|
1132
|
+
|
1121
1133
|
##### media_type: [`FileContentTypesNullable`](./lib/carbon_ruby_sdk/models/file_content_types_nullable.rb)<a id="media_type-filecontenttypesnullablelibcarbon_ruby_sdkmodelsfile_content_types_nullablerb"></a>
|
1122
1134
|
The media type of the file. If not provided, it will be inferred from the file
|
1123
1135
|
extension.
|
@@ -1160,6 +1172,7 @@ result = carbon.files.upload_from_url(
|
|
1160
1172
|
max_items_per_chunk: 1,
|
1161
1173
|
parse_pdf_tables_with_ocr: false,
|
1162
1174
|
detect_audio_language: false,
|
1175
|
+
transcription_service: "assemblyai",
|
1163
1176
|
media_type: "TEXT",
|
1164
1177
|
split_rows: false,
|
1165
1178
|
)
|
@@ -1183,6 +1196,7 @@ Number of objects per chunk. For csv, tsv, xlsx, and json files only.
|
|
1183
1196
|
|
1184
1197
|
##### parse_pdf_tables_with_ocr: `Boolean`<a id="parse_pdf_tables_with_ocr-boolean"></a>
|
1185
1198
|
##### detect_audio_language: `Boolean`<a id="detect_audio_language-boolean"></a>
|
1199
|
+
##### transcription_service: [`TranscriptionServiceNullable`](./lib/carbon_ruby_sdk/models/transcription_service_nullable.rb)<a id="transcription_service-transcriptionservicenullablelibcarbon_ruby_sdkmodelstranscription_service_nullablerb"></a>
|
1186
1200
|
##### media_type: [`FileContentTypesNullable`](./lib/carbon_ruby_sdk/models/file_content_types_nullable.rb)<a id="media_type-filecontenttypesnullablelibcarbon_ruby_sdkmodelsfile_content_types_nullablerb"></a>
|
1187
1201
|
##### split_rows: `Boolean`<a id="split_rows-boolean"></a>
|
1188
1202
|
#### 🔄 Return<a id="🔄-return"></a>
|
@@ -1300,7 +1314,7 @@ result = carbon.integrations.connect_data_source(
|
|
1300
1314
|
"prepend_filename_to_chunks" => false,
|
1301
1315
|
"sync_files_on_connection" => true,
|
1302
1316
|
"set_page_as_boundary" => false,
|
1303
|
-
"request_id" => "
|
1317
|
+
"request_id" => "f5e8c193-f7e1-4e45-9be5-6aa157dfe3c3",
|
1304
1318
|
"enable_file_picker" => true,
|
1305
1319
|
"sync_source_items" => true,
|
1306
1320
|
"incremental_sync" => false,
|
@@ -1354,6 +1368,7 @@ result = carbon.integrations.connect_freshdesk(
|
|
1354
1368
|
"auto_synced_source_types" => ["ARTICLE"],
|
1355
1369
|
"sync_attachments" => false,
|
1356
1370
|
"detect_audio_language" => false,
|
1371
|
+
"transcription_service" => "assemblyai",
|
1357
1372
|
"split_rows" => false,
|
1358
1373
|
},
|
1359
1374
|
)
|
@@ -1520,7 +1535,7 @@ result = carbon.integrations.get_oauth_url(
|
|
1520
1535
|
set_page_as_boundary: false,
|
1521
1536
|
data_source_id: 1,
|
1522
1537
|
connecting_new_account: false,
|
1523
|
-
request_id: "
|
1538
|
+
request_id: "c4055754-ba2d-4f57-a990-6e990abbbd90",
|
1524
1539
|
use_ocr: false,
|
1525
1540
|
parse_pdf_tables_with_ocr: false,
|
1526
1541
|
enable_file_picker: true,
|
@@ -1530,6 +1545,7 @@ result = carbon.integrations.get_oauth_url(
|
|
1530
1545
|
"auto_synced_source_types" => ["ARTICLE"],
|
1531
1546
|
"sync_attachments" => false,
|
1532
1547
|
"detect_audio_language" => false,
|
1548
|
+
"transcription_service" => "assemblyai",
|
1533
1549
|
"split_rows" => false,
|
1534
1550
|
},
|
1535
1551
|
)
|
@@ -1581,7 +1597,7 @@ Enable OCR for files that support it. Supported formats: pdf
|
|
1581
1597
|
##### parse_pdf_tables_with_ocr: `Boolean`<a id="parse_pdf_tables_with_ocr-boolean"></a>
|
1582
1598
|
##### enable_file_picker: `Boolean`<a id="enable_file_picker-boolean"></a>
|
1583
1599
|
Enable integration's file picker for sources that support it. Supported sources:
|
1584
|
-
BOX,
|
1600
|
+
BOX, DROPBOX, GOOGLE_DRIVE, ONEDRIVE, SHAREPOINT
|
1585
1601
|
|
1586
1602
|
##### sync_source_items: `Boolean`<a id="sync_source_items-boolean"></a>
|
1587
1603
|
Enabling this flag will fetch all available content from the source to be listed
|
@@ -1887,7 +1903,7 @@ result = carbon.integrations.sync_confluence(
|
|
1887
1903
|
prepend_filename_to_chunks: false,
|
1888
1904
|
max_items_per_chunk: 1,
|
1889
1905
|
set_page_as_boundary: false,
|
1890
|
-
request_id: "
|
1906
|
+
request_id: "991e89b6-1e71-41e1-bdc4-4dd475f21696",
|
1891
1907
|
use_ocr: false,
|
1892
1908
|
parse_pdf_tables_with_ocr: false,
|
1893
1909
|
incremental_sync: false,
|
@@ -1895,6 +1911,7 @@ result = carbon.integrations.sync_confluence(
|
|
1895
1911
|
"auto_synced_source_types" => ["ARTICLE"],
|
1896
1912
|
"sync_attachments" => false,
|
1897
1913
|
"detect_audio_language" => false,
|
1914
|
+
"transcription_service" => "assemblyai",
|
1898
1915
|
"split_rows" => false,
|
1899
1916
|
},
|
1900
1917
|
)
|
@@ -1992,7 +2009,7 @@ result = carbon.integrations.sync_files(
|
|
1992
2009
|
prepend_filename_to_chunks: false,
|
1993
2010
|
max_items_per_chunk: 1,
|
1994
2011
|
set_page_as_boundary: false,
|
1995
|
-
request_id: "
|
2012
|
+
request_id: "991e89b6-1e71-41e1-bdc4-4dd475f21696",
|
1996
2013
|
use_ocr: false,
|
1997
2014
|
parse_pdf_tables_with_ocr: false,
|
1998
2015
|
incremental_sync: false,
|
@@ -2000,6 +2017,7 @@ result = carbon.integrations.sync_files(
|
|
2000
2017
|
"auto_synced_source_types" => ["ARTICLE"],
|
2001
2018
|
"sync_attachments" => false,
|
2002
2019
|
"detect_audio_language" => false,
|
2020
|
+
"transcription_service" => "assemblyai",
|
2003
2021
|
"split_rows" => false,
|
2004
2022
|
},
|
2005
2023
|
)
|
@@ -2202,6 +2220,7 @@ result = carbon.integrations.sync_gmail(
|
|
2202
2220
|
"auto_synced_source_types" => ["ARTICLE"],
|
2203
2221
|
"sync_attachments" => false,
|
2204
2222
|
"detect_audio_language" => false,
|
2223
|
+
"transcription_service" => "assemblyai",
|
2205
2224
|
"split_rows" => false,
|
2206
2225
|
},
|
2207
2226
|
incremental_sync: false,
|
@@ -2321,6 +2340,7 @@ result = carbon.integrations.sync_outlook(
|
|
2321
2340
|
"auto_synced_source_types" => ["ARTICLE"],
|
2322
2341
|
"sync_attachments" => false,
|
2323
2342
|
"detect_audio_language" => false,
|
2343
|
+
"transcription_service" => "assemblyai",
|
2324
2344
|
"split_rows" => false,
|
2325
2345
|
},
|
2326
2346
|
incremental_sync: false,
|
@@ -2464,6 +2484,7 @@ result = carbon.integrations.sync_s3_files(
|
|
2464
2484
|
"auto_synced_source_types" => ["ARTICLE"],
|
2465
2485
|
"sync_attachments" => false,
|
2466
2486
|
"detect_audio_language" => false,
|
2487
|
+
"transcription_service" => "assemblyai",
|
2467
2488
|
"split_rows" => false,
|
2468
2489
|
},
|
2469
2490
|
)
|
@@ -131,9 +131,10 @@ module Carbon
|
|
131
131
|
# @param include_file_level_metadata [Boolean] Flag to control whether or not to include file-level metadata in the response. This metadata will be included in the `content_metadata` field of each document along with chunk/embedding level metadata.
|
132
132
|
# @param high_accuracy [Boolean] Flag to control whether or not to perform a high accuracy embedding search. By default, this is set to false. If true, the search may return more accurate results, but may take longer to complete.
|
133
133
|
# @param rerank [RerankParamsNullable]
|
134
|
+
# @param file_types_at_source [Array<HelpdeskFileTypes>] Filter files based on their type at the source (for example help center tickets and articles)
|
134
135
|
# @param body [GetEmbeddingDocumentsBody]
|
135
136
|
# @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
|
136
|
-
def get_documents(query:, k:, tags: SENTINEL, query_vector: SENTINEL, file_ids: SENTINEL, parent_file_ids: SENTINEL, include_all_children: false, tags_v2: SENTINEL, include_tags: SENTINEL, include_vectors: SENTINEL, include_raw_file: SENTINEL, hybrid_search: SENTINEL, hybrid_search_tuning_parameters: SENTINEL, media_type: SENTINEL, embedding_model: 'OPENAI', include_file_level_metadata: false, high_accuracy: false, rerank: SENTINEL, extra: {})
|
137
|
+
def get_documents(query:, k:, tags: SENTINEL, query_vector: SENTINEL, file_ids: SENTINEL, parent_file_ids: SENTINEL, include_all_children: false, tags_v2: SENTINEL, include_tags: SENTINEL, include_vectors: SENTINEL, include_raw_file: SENTINEL, hybrid_search: SENTINEL, hybrid_search_tuning_parameters: SENTINEL, media_type: SENTINEL, embedding_model: 'OPENAI', include_file_level_metadata: false, high_accuracy: false, rerank: SENTINEL, file_types_at_source: SENTINEL, extra: {})
|
137
138
|
_body = {}
|
138
139
|
_body[:tags] = tags if tags != SENTINEL
|
139
140
|
_body[:query] = query if query != SENTINEL
|
@@ -153,6 +154,7 @@ module Carbon
|
|
153
154
|
_body[:include_file_level_metadata] = include_file_level_metadata if include_file_level_metadata != SENTINEL
|
154
155
|
_body[:high_accuracy] = high_accuracy if high_accuracy != SENTINEL
|
155
156
|
_body[:rerank] = rerank if rerank != SENTINEL
|
157
|
+
_body[:file_types_at_source] = file_types_at_source if file_types_at_source != SENTINEL
|
156
158
|
get_embedding_documents_body = _body
|
157
159
|
api_response = get_documents_with_http_info_impl(get_embedding_documents_body, extra)
|
158
160
|
api_response.data
|
@@ -273,9 +275,10 @@ module Carbon
|
|
273
275
|
# @param include_file_level_metadata [Boolean] Flag to control whether or not to include file-level metadata in the response. This metadata will be included in the `content_metadata` field of each document along with chunk/embedding level metadata.
|
274
276
|
# @param high_accuracy [Boolean] Flag to control whether or not to perform a high accuracy embedding search. By default, this is set to false. If true, the search may return more accurate results, but may take longer to complete.
|
275
277
|
# @param rerank [RerankParamsNullable]
|
278
|
+
# @param file_types_at_source [Array<HelpdeskFileTypes>] Filter files based on their type at the source (for example help center tickets and articles)
|
276
279
|
# @param body [GetEmbeddingDocumentsBody]
|
277
280
|
# @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
|
278
|
-
def get_documents_with_http_info(query:, k:, tags: SENTINEL, query_vector: SENTINEL, file_ids: SENTINEL, parent_file_ids: SENTINEL, include_all_children: false, tags_v2: SENTINEL, include_tags: SENTINEL, include_vectors: SENTINEL, include_raw_file: SENTINEL, hybrid_search: SENTINEL, hybrid_search_tuning_parameters: SENTINEL, media_type: SENTINEL, embedding_model: 'OPENAI', include_file_level_metadata: false, high_accuracy: false, rerank: SENTINEL, extra: {})
|
281
|
+
def get_documents_with_http_info(query:, k:, tags: SENTINEL, query_vector: SENTINEL, file_ids: SENTINEL, parent_file_ids: SENTINEL, include_all_children: false, tags_v2: SENTINEL, include_tags: SENTINEL, include_vectors: SENTINEL, include_raw_file: SENTINEL, hybrid_search: SENTINEL, hybrid_search_tuning_parameters: SENTINEL, media_type: SENTINEL, embedding_model: 'OPENAI', include_file_level_metadata: false, high_accuracy: false, rerank: SENTINEL, file_types_at_source: SENTINEL, extra: {})
|
279
282
|
_body = {}
|
280
283
|
_body[:tags] = tags if tags != SENTINEL
|
281
284
|
_body[:query] = query if query != SENTINEL
|
@@ -295,6 +298,7 @@ module Carbon
|
|
295
298
|
_body[:include_file_level_metadata] = include_file_level_metadata if include_file_level_metadata != SENTINEL
|
296
299
|
_body[:high_accuracy] = high_accuracy if high_accuracy != SENTINEL
|
297
300
|
_body[:rerank] = rerank if rerank != SENTINEL
|
301
|
+
_body[:file_types_at_source] = file_types_at_source if file_types_at_source != SENTINEL
|
298
302
|
get_embedding_documents_body = _body
|
299
303
|
get_documents_with_http_info_impl(get_embedding_documents_body, extra)
|
300
304
|
end
|
@@ -1177,11 +1177,12 @@ module Carbon
|
|
1177
1177
|
# @param max_items_per_chunk [Integer] Number of objects per chunk. For csv, tsv, xlsx, and json files only.
|
1178
1178
|
# @param parse_pdf_tables_with_ocr [Boolean] Whether to use rich table parsing when `use_ocr` is enabled.
|
1179
1179
|
# @param detect_audio_language [Boolean] Whether to automatically detect the language of the uploaded audio file.
|
1180
|
+
# @param transcription_service [TranscriptionServiceNullable] The transcription service to use for audio files. If no service is specified, 'deepgram' will be used.
|
1180
1181
|
# @param media_type [FileContentTypesNullable] The media type of the file. If not provided, it will be inferred from the file extension.
|
1181
1182
|
# @param split_rows [Boolean] Whether to split tabular rows into chunks. Currently only valid for CSV, TSV, and XLSX files.
|
1182
1183
|
# @param body [BodyCreateUploadFileUploadfilePost]
|
1183
1184
|
# @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
|
1184
|
-
def upload(file:, chunk_size: SENTINEL, chunk_overlap: SENTINEL, skip_embedding_generation: false, set_page_as_boundary: false, embedding_model: 'OPENAI', use_ocr: false, generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, parse_pdf_tables_with_ocr: false, detect_audio_language: false, media_type: SENTINEL, split_rows: false, extra: {})
|
1185
|
+
def upload(file:, chunk_size: SENTINEL, chunk_overlap: SENTINEL, skip_embedding_generation: false, set_page_as_boundary: false, embedding_model: 'OPENAI', use_ocr: false, generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, parse_pdf_tables_with_ocr: false, detect_audio_language: false, transcription_service: SENTINEL, media_type: SENTINEL, split_rows: false, extra: {})
|
1185
1186
|
_body = {}
|
1186
1187
|
_body[:file] = file if file != SENTINEL
|
1187
1188
|
body_create_upload_file_uploadfile_post = _body
|
@@ -1196,6 +1197,7 @@ module Carbon
|
|
1196
1197
|
extra[:max_items_per_chunk] = max_items_per_chunk if max_items_per_chunk != SENTINEL
|
1197
1198
|
extra[:parse_pdf_tables_with_ocr] = parse_pdf_tables_with_ocr if parse_pdf_tables_with_ocr != SENTINEL
|
1198
1199
|
extra[:detect_audio_language] = detect_audio_language if detect_audio_language != SENTINEL
|
1200
|
+
extra[:transcription_service] = transcription_service if transcription_service != SENTINEL
|
1199
1201
|
extra[:media_type] = media_type if media_type != SENTINEL
|
1200
1202
|
extra[:split_rows] = split_rows if split_rows != SENTINEL
|
1201
1203
|
api_response = upload_with_http_info_impl(file, body_create_upload_file_uploadfile_post, extra)
|
@@ -1242,11 +1244,12 @@ module Carbon
|
|
1242
1244
|
# @param max_items_per_chunk [Integer] Number of objects per chunk. For csv, tsv, xlsx, and json files only.
|
1243
1245
|
# @param parse_pdf_tables_with_ocr [Boolean] Whether to use rich table parsing when `use_ocr` is enabled.
|
1244
1246
|
# @param detect_audio_language [Boolean] Whether to automatically detect the language of the uploaded audio file.
|
1247
|
+
# @param transcription_service [TranscriptionServiceNullable] The transcription service to use for audio files. If no service is specified, 'deepgram' will be used.
|
1245
1248
|
# @param media_type [FileContentTypesNullable] The media type of the file. If not provided, it will be inferred from the file extension.
|
1246
1249
|
# @param split_rows [Boolean] Whether to split tabular rows into chunks. Currently only valid for CSV, TSV, and XLSX files.
|
1247
1250
|
# @param body [BodyCreateUploadFileUploadfilePost]
|
1248
1251
|
# @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
|
1249
|
-
def upload_with_http_info(file:, chunk_size: SENTINEL, chunk_overlap: SENTINEL, skip_embedding_generation: false, set_page_as_boundary: false, embedding_model: 'OPENAI', use_ocr: false, generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, parse_pdf_tables_with_ocr: false, detect_audio_language: false, media_type: SENTINEL, split_rows: false, extra: {})
|
1252
|
+
def upload_with_http_info(file:, chunk_size: SENTINEL, chunk_overlap: SENTINEL, skip_embedding_generation: false, set_page_as_boundary: false, embedding_model: 'OPENAI', use_ocr: false, generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, parse_pdf_tables_with_ocr: false, detect_audio_language: false, transcription_service: SENTINEL, media_type: SENTINEL, split_rows: false, extra: {})
|
1250
1253
|
_body = {}
|
1251
1254
|
_body[:file] = file if file != SENTINEL
|
1252
1255
|
body_create_upload_file_uploadfile_post = _body
|
@@ -1261,6 +1264,7 @@ module Carbon
|
|
1261
1264
|
extra[:max_items_per_chunk] = max_items_per_chunk if max_items_per_chunk != SENTINEL
|
1262
1265
|
extra[:parse_pdf_tables_with_ocr] = parse_pdf_tables_with_ocr if parse_pdf_tables_with_ocr != SENTINEL
|
1263
1266
|
extra[:detect_audio_language] = detect_audio_language if detect_audio_language != SENTINEL
|
1267
|
+
extra[:transcription_service] = transcription_service if transcription_service != SENTINEL
|
1264
1268
|
extra[:media_type] = media_type if media_type != SENTINEL
|
1265
1269
|
extra[:split_rows] = split_rows if split_rows != SENTINEL
|
1266
1270
|
upload_with_http_info_impl(file, body_create_upload_file_uploadfile_post, extra)
|
@@ -1282,6 +1286,7 @@ module Carbon
|
|
1282
1286
|
# @option opts [Integer] :max_items_per_chunk Number of objects per chunk. For csv, tsv, xlsx, and json files only.
|
1283
1287
|
# @option opts [Boolean] :parse_pdf_tables_with_ocr Whether to use rich table parsing when `use_ocr` is enabled. (default to false)
|
1284
1288
|
# @option opts [Boolean] :detect_audio_language Whether to automatically detect the language of the uploaded audio file. (default to false)
|
1289
|
+
# @option opts [TranscriptionServiceNullable] :transcription_service The transcription service to use for audio files. If no service is specified, 'deepgram' will be used.
|
1285
1290
|
# @option opts [FileContentTypesNullable] :media_type The media type of the file. If not provided, it will be inferred from the file extension.
|
1286
1291
|
# @option opts [Boolean] :split_rows Whether to split tabular rows into chunks. Currently only valid for CSV, TSV, and XLSX files. (default to false)
|
1287
1292
|
# @return [UserFile]
|
@@ -1306,6 +1311,7 @@ module Carbon
|
|
1306
1311
|
# @option opts [Integer] :max_items_per_chunk Number of objects per chunk. For csv, tsv, xlsx, and json files only.
|
1307
1312
|
# @option opts [Boolean] :parse_pdf_tables_with_ocr Whether to use rich table parsing when `use_ocr` is enabled. (default to false)
|
1308
1313
|
# @option opts [Boolean] :detect_audio_language Whether to automatically detect the language of the uploaded audio file. (default to false)
|
1314
|
+
# @option opts [TranscriptionServiceNullable] :transcription_service The transcription service to use for audio files. If no service is specified, 'deepgram' will be used.
|
1309
1315
|
# @option opts [FileContentTypesNullable] :media_type The media type of the file. If not provided, it will be inferred from the file extension.
|
1310
1316
|
# @option opts [Boolean] :split_rows Whether to split tabular rows into chunks. Currently only valid for CSV, TSV, and XLSX files. (default to false)
|
1311
1317
|
# @return [APIResponse] data is UserFile, status code, headers and response
|
@@ -1337,6 +1343,7 @@ module Carbon
|
|
1337
1343
|
query_params[:'max_items_per_chunk'] = opts[:'max_items_per_chunk'] if !opts[:'max_items_per_chunk'].nil?
|
1338
1344
|
query_params[:'parse_pdf_tables_with_ocr'] = opts[:'parse_pdf_tables_with_ocr'] if !opts[:'parse_pdf_tables_with_ocr'].nil?
|
1339
1345
|
query_params[:'detect_audio_language'] = opts[:'detect_audio_language'] if !opts[:'detect_audio_language'].nil?
|
1346
|
+
query_params[:'transcription_service'] = opts[:'transcription_service'] if !opts[:'transcription_service'].nil?
|
1340
1347
|
query_params[:'media_type'] = opts[:'media_type'] if !opts[:'media_type'].nil?
|
1341
1348
|
query_params[:'split_rows'] = opts[:'split_rows'] if !opts[:'split_rows'].nil?
|
1342
1349
|
|
@@ -1396,11 +1403,12 @@ module Carbon
|
|
1396
1403
|
# @param max_items_per_chunk [Integer] Number of objects per chunk. For csv, tsv, xlsx, and json files only.
|
1397
1404
|
# @param parse_pdf_tables_with_ocr [Boolean]
|
1398
1405
|
# @param detect_audio_language [Boolean]
|
1406
|
+
# @param transcription_service [TranscriptionServiceNullable]
|
1399
1407
|
# @param media_type [FileContentTypesNullable]
|
1400
1408
|
# @param split_rows [Boolean]
|
1401
1409
|
# @param body [UploadFileFromUrlInput]
|
1402
1410
|
# @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
|
1403
|
-
def upload_from_url(url:, file_name: SENTINEL, chunk_size: SENTINEL, chunk_overlap: SENTINEL, skip_embedding_generation: false, set_page_as_boundary: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, use_textract: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, parse_pdf_tables_with_ocr: false, detect_audio_language: false, media_type: SENTINEL, split_rows: false, extra: {})
|
1411
|
+
def upload_from_url(url:, file_name: SENTINEL, chunk_size: SENTINEL, chunk_overlap: SENTINEL, skip_embedding_generation: false, set_page_as_boundary: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, use_textract: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, parse_pdf_tables_with_ocr: false, detect_audio_language: false, transcription_service: SENTINEL, media_type: SENTINEL, split_rows: false, extra: {})
|
1404
1412
|
_body = {}
|
1405
1413
|
_body[:url] = url if url != SENTINEL
|
1406
1414
|
_body[:file_name] = file_name if file_name != SENTINEL
|
@@ -1415,6 +1423,7 @@ module Carbon
|
|
1415
1423
|
_body[:max_items_per_chunk] = max_items_per_chunk if max_items_per_chunk != SENTINEL
|
1416
1424
|
_body[:parse_pdf_tables_with_ocr] = parse_pdf_tables_with_ocr if parse_pdf_tables_with_ocr != SENTINEL
|
1417
1425
|
_body[:detect_audio_language] = detect_audio_language if detect_audio_language != SENTINEL
|
1426
|
+
_body[:transcription_service] = transcription_service if transcription_service != SENTINEL
|
1418
1427
|
_body[:media_type] = media_type if media_type != SENTINEL
|
1419
1428
|
_body[:split_rows] = split_rows if split_rows != SENTINEL
|
1420
1429
|
upload_file_from_url_input = _body
|
@@ -1437,11 +1446,12 @@ module Carbon
|
|
1437
1446
|
# @param max_items_per_chunk [Integer] Number of objects per chunk. For csv, tsv, xlsx, and json files only.
|
1438
1447
|
# @param parse_pdf_tables_with_ocr [Boolean]
|
1439
1448
|
# @param detect_audio_language [Boolean]
|
1449
|
+
# @param transcription_service [TranscriptionServiceNullable]
|
1440
1450
|
# @param media_type [FileContentTypesNullable]
|
1441
1451
|
# @param split_rows [Boolean]
|
1442
1452
|
# @param body [UploadFileFromUrlInput]
|
1443
1453
|
# @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
|
1444
|
-
def upload_from_url_with_http_info(url:, file_name: SENTINEL, chunk_size: SENTINEL, chunk_overlap: SENTINEL, skip_embedding_generation: false, set_page_as_boundary: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, use_textract: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, parse_pdf_tables_with_ocr: false, detect_audio_language: false, media_type: SENTINEL, split_rows: false, extra: {})
|
1454
|
+
def upload_from_url_with_http_info(url:, file_name: SENTINEL, chunk_size: SENTINEL, chunk_overlap: SENTINEL, skip_embedding_generation: false, set_page_as_boundary: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, use_textract: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, parse_pdf_tables_with_ocr: false, detect_audio_language: false, transcription_service: SENTINEL, media_type: SENTINEL, split_rows: false, extra: {})
|
1445
1455
|
_body = {}
|
1446
1456
|
_body[:url] = url if url != SENTINEL
|
1447
1457
|
_body[:file_name] = file_name if file_name != SENTINEL
|
@@ -1456,6 +1466,7 @@ module Carbon
|
|
1456
1466
|
_body[:max_items_per_chunk] = max_items_per_chunk if max_items_per_chunk != SENTINEL
|
1457
1467
|
_body[:parse_pdf_tables_with_ocr] = parse_pdf_tables_with_ocr if parse_pdf_tables_with_ocr != SENTINEL
|
1458
1468
|
_body[:detect_audio_language] = detect_audio_language if detect_audio_language != SENTINEL
|
1469
|
+
_body[:transcription_service] = transcription_service if transcription_service != SENTINEL
|
1459
1470
|
_body[:media_type] = media_type if media_type != SENTINEL
|
1460
1471
|
_body[:split_rows] = split_rows if split_rows != SENTINEL
|
1461
1472
|
upload_file_from_url_input = _body
|
@@ -653,13 +653,13 @@ module Carbon
|
|
653
653
|
# @param request_id [String] This request id will be added to all files that get synced using the generated OAuth URL
|
654
654
|
# @param use_ocr [Boolean] Enable OCR for files that support it. Supported formats: pdf
|
655
655
|
# @param parse_pdf_tables_with_ocr [Boolean]
|
656
|
-
# @param enable_file_picker [Boolean] Enable integration's file picker for sources that support it. Supported sources: BOX,
|
656
|
+
# @param enable_file_picker [Boolean] Enable integration's file picker for sources that support it. Supported sources: BOX, DROPBOX, GOOGLE_DRIVE, ONEDRIVE, SHAREPOINT
|
657
657
|
# @param sync_source_items [Boolean] Enabling this flag will fetch all available content from the source to be listed via list items endpoint
|
658
658
|
# @param incremental_sync [Boolean] Only sync files if they have not already been synced or if the embedding properties have changed. This flag is currently supported by ONEDRIVE, GOOGLE_DRIVE, BOX, DROPBOX, INTERCOM, GMAIL, OUTLOOK. It will be ignored for other data sources.
|
659
659
|
# @param file_sync_config [FileSyncConfigNullable]
|
660
660
|
# @param body [OAuthURLRequest]
|
661
661
|
# @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
|
662
|
-
def get_oauth_url(service:, tags: SENTINEL, scope: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', zendesk_subdomain: SENTINEL, microsoft_tenant: SENTINEL, sharepoint_site_name: SENTINEL, confluence_subdomain: SENTINEL, generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, salesforce_domain: SENTINEL, sync_files_on_connection: true, set_page_as_boundary: false, data_source_id: SENTINEL, connecting_new_account: false, request_id: '
|
662
|
+
def get_oauth_url(service:, tags: SENTINEL, scope: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', zendesk_subdomain: SENTINEL, microsoft_tenant: SENTINEL, sharepoint_site_name: SENTINEL, confluence_subdomain: SENTINEL, generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, salesforce_domain: SENTINEL, sync_files_on_connection: true, set_page_as_boundary: false, data_source_id: SENTINEL, connecting_new_account: false, request_id: 'c4055754-ba2d-4f57-a990-6e990abbbd90', use_ocr: false, parse_pdf_tables_with_ocr: false, enable_file_picker: true, sync_source_items: true, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
|
663
663
|
_body = {}
|
664
664
|
_body[:tags] = tags if tags != SENTINEL
|
665
665
|
_body[:scope] = scope if scope != SENTINEL
|
@@ -721,13 +721,13 @@ module Carbon
|
|
721
721
|
# @param request_id [String] This request id will be added to all files that get synced using the generated OAuth URL
|
722
722
|
# @param use_ocr [Boolean] Enable OCR for files that support it. Supported formats: pdf
|
723
723
|
# @param parse_pdf_tables_with_ocr [Boolean]
|
724
|
-
# @param enable_file_picker [Boolean] Enable integration's file picker for sources that support it. Supported sources: BOX,
|
724
|
+
# @param enable_file_picker [Boolean] Enable integration's file picker for sources that support it. Supported sources: BOX, DROPBOX, GOOGLE_DRIVE, ONEDRIVE, SHAREPOINT
|
725
725
|
# @param sync_source_items [Boolean] Enabling this flag will fetch all available content from the source to be listed via list items endpoint
|
726
726
|
# @param incremental_sync [Boolean] Only sync files if they have not already been synced or if the embedding properties have changed. This flag is currently supported by ONEDRIVE, GOOGLE_DRIVE, BOX, DROPBOX, INTERCOM, GMAIL, OUTLOOK. It will be ignored for other data sources.
|
727
727
|
# @param file_sync_config [FileSyncConfigNullable]
|
728
728
|
# @param body [OAuthURLRequest]
|
729
729
|
# @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
|
730
|
-
def get_oauth_url_with_http_info(service:, tags: SENTINEL, scope: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', zendesk_subdomain: SENTINEL, microsoft_tenant: SENTINEL, sharepoint_site_name: SENTINEL, confluence_subdomain: SENTINEL, generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, salesforce_domain: SENTINEL, sync_files_on_connection: true, set_page_as_boundary: false, data_source_id: SENTINEL, connecting_new_account: false, request_id: '
|
730
|
+
def get_oauth_url_with_http_info(service:, tags: SENTINEL, scope: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', zendesk_subdomain: SENTINEL, microsoft_tenant: SENTINEL, sharepoint_site_name: SENTINEL, confluence_subdomain: SENTINEL, generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, salesforce_domain: SENTINEL, sync_files_on_connection: true, set_page_as_boundary: false, data_source_id: SENTINEL, connecting_new_account: false, request_id: 'c4055754-ba2d-4f57-a990-6e990abbbd90', use_ocr: false, parse_pdf_tables_with_ocr: false, enable_file_picker: true, sync_source_items: true, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
|
731
731
|
_body = {}
|
732
732
|
_body[:tags] = tags if tags != SENTINEL
|
733
733
|
_body[:scope] = scope if scope != SENTINEL
|
@@ -1646,7 +1646,7 @@ module Carbon
|
|
1646
1646
|
# @param file_sync_config [FileSyncConfigNullable]
|
1647
1647
|
# @param body [SyncFilesRequest]
|
1648
1648
|
# @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
|
1649
|
-
def sync_confluence(data_source_id:, ids:, tags: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, set_page_as_boundary: false, request_id: '
|
1649
|
+
def sync_confluence(data_source_id:, ids:, tags: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, set_page_as_boundary: false, request_id: '991e89b6-1e71-41e1-bdc4-4dd475f21696', use_ocr: false, parse_pdf_tables_with_ocr: false, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
|
1650
1650
|
_body = {}
|
1651
1651
|
_body[:tags] = tags if tags != SENTINEL
|
1652
1652
|
_body[:data_source_id] = data_source_id if data_source_id != SENTINEL
|
@@ -1696,7 +1696,7 @@ module Carbon
|
|
1696
1696
|
# @param file_sync_config [FileSyncConfigNullable]
|
1697
1697
|
# @param body [SyncFilesRequest]
|
1698
1698
|
# @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
|
1699
|
-
def sync_confluence_with_http_info(data_source_id:, ids:, tags: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, set_page_as_boundary: false, request_id: '
|
1699
|
+
def sync_confluence_with_http_info(data_source_id:, ids:, tags: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, set_page_as_boundary: false, request_id: '991e89b6-1e71-41e1-bdc4-4dd475f21696', use_ocr: false, parse_pdf_tables_with_ocr: false, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
|
1700
1700
|
_body = {}
|
1701
1701
|
_body[:tags] = tags if tags != SENTINEL
|
1702
1702
|
_body[:data_source_id] = data_source_id if data_source_id != SENTINEL
|
@@ -1904,7 +1904,7 @@ module Carbon
|
|
1904
1904
|
# @param file_sync_config [FileSyncConfigNullable]
|
1905
1905
|
# @param body [SyncFilesRequest]
|
1906
1906
|
# @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
|
1907
|
-
def sync_files(data_source_id:, ids:, tags: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, set_page_as_boundary: false, request_id: '
|
1907
|
+
def sync_files(data_source_id:, ids:, tags: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, set_page_as_boundary: false, request_id: '991e89b6-1e71-41e1-bdc4-4dd475f21696', use_ocr: false, parse_pdf_tables_with_ocr: false, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
|
1908
1908
|
_body = {}
|
1909
1909
|
_body[:tags] = tags if tags != SENTINEL
|
1910
1910
|
_body[:data_source_id] = data_source_id if data_source_id != SENTINEL
|
@@ -1952,7 +1952,7 @@ module Carbon
|
|
1952
1952
|
# @param file_sync_config [FileSyncConfigNullable]
|
1953
1953
|
# @param body [SyncFilesRequest]
|
1954
1954
|
# @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
|
1955
|
-
def sync_files_with_http_info(data_source_id:, ids:, tags: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, set_page_as_boundary: false, request_id: '
|
1955
|
+
def sync_files_with_http_info(data_source_id:, ids:, tags: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, set_page_as_boundary: false, request_id: '991e89b6-1e71-41e1-bdc4-4dd475f21696', use_ocr: false, parse_pdf_tables_with_ocr: false, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
|
1956
1956
|
_body = {}
|
1957
1957
|
_body[:tags] = tags if tags != SENTINEL
|
1958
1958
|
_body[:data_source_id] = data_source_id if data_source_id != SENTINEL
|
@@ -20,6 +20,8 @@ module Carbon
|
|
20
20
|
# Detect audio language before transcription for audio files
|
21
21
|
attr_accessor :detect_audio_language
|
22
22
|
|
23
|
+
attr_accessor :transcription_service
|
24
|
+
|
23
25
|
# Whether to split tabular rows into chunks. Currently only valid for CSV, TSV, and XLSX files.
|
24
26
|
attr_accessor :split_rows
|
25
27
|
|
@@ -29,6 +31,7 @@ module Carbon
|
|
29
31
|
:'auto_synced_source_types' => :'auto_synced_source_types',
|
30
32
|
:'sync_attachments' => :'sync_attachments',
|
31
33
|
:'detect_audio_language' => :'detect_audio_language',
|
34
|
+
:'transcription_service' => :'transcription_service',
|
32
35
|
:'split_rows' => :'split_rows'
|
33
36
|
}
|
34
37
|
end
|
@@ -44,6 +47,7 @@ module Carbon
|
|
44
47
|
:'auto_synced_source_types' => :'Array<HelpdeskFileTypes>',
|
45
48
|
:'sync_attachments' => :'Boolean',
|
46
49
|
:'detect_audio_language' => :'Boolean',
|
50
|
+
:'transcription_service' => :'TranscriptionServiceNullable',
|
47
51
|
:'split_rows' => :'Boolean'
|
48
52
|
}
|
49
53
|
end
|
@@ -51,6 +55,7 @@ module Carbon
|
|
51
55
|
# List of attributes with nullable: true
|
52
56
|
def self.openapi_nullable
|
53
57
|
Set.new([
|
58
|
+
:'transcription_service',
|
54
59
|
])
|
55
60
|
end
|
56
61
|
|
@@ -87,6 +92,10 @@ module Carbon
|
|
87
92
|
self.detect_audio_language = false
|
88
93
|
end
|
89
94
|
|
95
|
+
if attributes.key?(:'transcription_service')
|
96
|
+
self.transcription_service = attributes[:'transcription_service']
|
97
|
+
end
|
98
|
+
|
90
99
|
if attributes.key?(:'split_rows')
|
91
100
|
self.split_rows = attributes[:'split_rows']
|
92
101
|
else
|
@@ -115,6 +124,7 @@ module Carbon
|
|
115
124
|
auto_synced_source_types == o.auto_synced_source_types &&
|
116
125
|
sync_attachments == o.sync_attachments &&
|
117
126
|
detect_audio_language == o.detect_audio_language &&
|
127
|
+
transcription_service == o.transcription_service &&
|
118
128
|
split_rows == o.split_rows
|
119
129
|
end
|
120
130
|
|
@@ -127,7 +137,7 @@ module Carbon
|
|
127
137
|
# Calculates hash code according to all attributes.
|
128
138
|
# @return [Integer] Hash code
|
129
139
|
def hash
|
130
|
-
[auto_synced_source_types, sync_attachments, detect_audio_language, split_rows].hash
|
140
|
+
[auto_synced_source_types, sync_attachments, detect_audio_language, transcription_service, split_rows].hash
|
131
141
|
end
|
132
142
|
|
133
143
|
# Builds the object from hash
|
@@ -21,6 +21,8 @@ module Carbon
|
|
21
21
|
# Detect audio language before transcription for audio files
|
22
22
|
attr_accessor :detect_audio_language
|
23
23
|
|
24
|
+
attr_accessor :transcription_service
|
25
|
+
|
24
26
|
# Whether to split tabular rows into chunks. Currently only valid for CSV, TSV, and XLSX files.
|
25
27
|
attr_accessor :split_rows
|
26
28
|
|
@@ -30,6 +32,7 @@ module Carbon
|
|
30
32
|
:'auto_synced_source_types' => :'auto_synced_source_types',
|
31
33
|
:'sync_attachments' => :'sync_attachments',
|
32
34
|
:'detect_audio_language' => :'detect_audio_language',
|
35
|
+
:'transcription_service' => :'transcription_service',
|
33
36
|
:'split_rows' => :'split_rows'
|
34
37
|
}
|
35
38
|
end
|
@@ -45,6 +48,7 @@ module Carbon
|
|
45
48
|
:'auto_synced_source_types' => :'Array<HelpdeskFileTypes>',
|
46
49
|
:'sync_attachments' => :'Boolean',
|
47
50
|
:'detect_audio_language' => :'Boolean',
|
51
|
+
:'transcription_service' => :'TranscriptionServiceNullable',
|
48
52
|
:'split_rows' => :'Boolean'
|
49
53
|
}
|
50
54
|
end
|
@@ -52,6 +56,7 @@ module Carbon
|
|
52
56
|
# List of attributes with nullable: true
|
53
57
|
def self.openapi_nullable
|
54
58
|
Set.new([
|
59
|
+
:'transcription_service',
|
55
60
|
])
|
56
61
|
end
|
57
62
|
|
@@ -88,6 +93,10 @@ module Carbon
|
|
88
93
|
self.detect_audio_language = false
|
89
94
|
end
|
90
95
|
|
96
|
+
if attributes.key?(:'transcription_service')
|
97
|
+
self.transcription_service = attributes[:'transcription_service']
|
98
|
+
end
|
99
|
+
|
91
100
|
if attributes.key?(:'split_rows')
|
92
101
|
self.split_rows = attributes[:'split_rows']
|
93
102
|
else
|
@@ -116,6 +125,7 @@ module Carbon
|
|
116
125
|
auto_synced_source_types == o.auto_synced_source_types &&
|
117
126
|
sync_attachments == o.sync_attachments &&
|
118
127
|
detect_audio_language == o.detect_audio_language &&
|
128
|
+
transcription_service == o.transcription_service &&
|
119
129
|
split_rows == o.split_rows
|
120
130
|
end
|
121
131
|
|
@@ -128,7 +138,7 @@ module Carbon
|
|
128
138
|
# Calculates hash code according to all attributes.
|
129
139
|
# @return [Integer] Hash code
|
130
140
|
def hash
|
131
|
-
[auto_synced_source_types, sync_attachments, detect_audio_language, split_rows].hash
|
141
|
+
[auto_synced_source_types, sync_attachments, detect_audio_language, transcription_service, split_rows].hash
|
132
142
|
end
|
133
143
|
|
134
144
|
# Builds the object from hash
|