RubyGems - carbon_ruby_sdk - Versions diffs - 0.2.2 → 0.2.4 - Mend

carbon_ruby_sdk 0.2.2 → 0.2.4

Files changed (18) hide show

checksums.yaml +4 -4
data/Gemfile.lock +1 -1
data/README.md +27 -7
data/lib/carbon_ruby_sdk/api/files_api.rb +15 -4
data/lib/carbon_ruby_sdk/api/integrations_api.rb +8 -8
data/lib/carbon_ruby_sdk/api/utilities_api.rb +10 -2
data/lib/carbon_ruby_sdk/models/o_auth_url_request.rb +2 -2
data/lib/carbon_ruby_sdk/models/sitemap_scrape_request.rb +60 -4
data/lib/carbon_ruby_sdk/models/sync_files_request.rb +1 -1
data/lib/carbon_ruby_sdk/models/sync_options.rb +1 -1
data/lib/carbon_ruby_sdk/models/upload_file_from_url_input.rb +16 -5
data/lib/carbon_ruby_sdk/models/webscrape_request.rb +32 -4
data/lib/carbon_ruby_sdk/version.rb +1 -1
data/spec/api/files_api_spec.rb +1 -0
data/spec/models/sitemap_scrape_request_spec.rb +12 -0
data/spec/models/upload_file_from_url_input_spec.rb +6 -0
data/spec/models/webscrape_request_spec.rb +6 -0
metadata +2 -2

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: 48a58cba1f17ea688e80ef5572f4944be16851ffe4ab0bed12010fe0f8b12f3e
-  data.tar.gz: 637e68cdedc5092c2c3de53c87f99b732cb2ba2eea49f6e0296220cd741dc217
+  metadata.gz: f36c299546586666be2828957b23ea39f49cffb5f16a0934aab82aaf29d0b1c7
+  data.tar.gz: f3299f1ee7db27666209ef10411d43190e8769fba5a852aa609c6ab4721d4dec
 SHA512:
-  metadata.gz: a3ca1057eaaa76eac67308c1f22a46828e1abc53732e8ab309d4d9fe53f87a59cd9712e9d541d2ef7f3b05854dbef675ab80fbf38ea7cd2b54b1cb2cab41f002
-  data.tar.gz: 4354aafdeb4fdd30b24c74b266b0c839eadcba4776590a412b77f54bff85465e49f734e538bc634f3d176d20c1157932a9dc7470acb3cbebc3572619bdceb0e2
+  metadata.gz: 42689eebf092d715da57445f2ec9a2e98dd367a6f610b34de15928f8cf7e2f0333a9492bddb40ec5996ff84cbe04907bbad0b83e9e742140af25fd524b208a0e
+  data.tar.gz: 22d020e4ea8811d8e5595b62eb3ea3917df41a10e5c1ee6e0d251eb946061b4a24ff1f2f20b579e3be4ae1e91dd7c319c0107e55290b88ad64c96f3662425293

data/Gemfile.lock CHANGED Viewed

@@ -1,7 +1,7 @@
 PATH
   remote: .
   specs:
-    carbon_ruby_sdk (0.2.1)
+    carbon_ruby_sdk (0.2.4)
       faraday (>= 1.0.1, < 3.0)
       faraday-multipart (~> 1.0, >= 1.0.4)

data/README.md CHANGED Viewed

@@ -6,7 +6,7 @@
 Connect external data to LLMs, no matter the source.
-[![npm](https://img.shields.io/badge/gem-v0.2.2-blue)](https://rubygems.org/gems/carbon_ruby_sdk/versions/0.2.2)
+[![npm](https://img.shields.io/badge/gem-v0.2.4-blue)](https://rubygems.org/gems/carbon_ruby_sdk/versions/0.2.4)
 </div>
@@ -86,7 +86,7 @@ Connect external data to LLMs, no matter the source.
 Add to Gemfile:
 ```ruby
-gem 'carbon_ruby_sdk', '~> 0.2.2'
+gem 'carbon_ruby_sdk', '~> 0.2.4'
 ```
 ## Getting Started<a id="getting-started"></a>
@@ -999,6 +999,7 @@ result = carbon.files.upload(
   parse_pdf_tables_with_ocr: false,
   detect_audio_language: false,
   media_type: "TEXT",
+  split_rows: false,
 )
 p result
 ```
@@ -1048,6 +1049,10 @@ Whether to automatically detect the language of the uploaded audio file.
 The media type of the file. If not provided, it will be inferred from the file
 extension.
+##### split_rows: `Boolean`<a id="split_rows-boolean"></a>
+Whether to split tabular rows into chunks. Currently only valid for CSV, TSV,
+and XLSX files.
 #### 🔄 Return<a id="🔄-return"></a>
 [UserFile](./lib/carbon_ruby_sdk/models/user_file.rb)
@@ -1083,6 +1088,7 @@ result = carbon.files.upload_from_url(
   parse_pdf_tables_with_ocr: false,
   detect_audio_language: false,
   media_type: "TEXT",
+  split_rows: false,
 )
 p result
 ```
@@ -1105,6 +1111,7 @@ Number of objects per chunk. For csv, tsv, xlsx, and json files only.
 ##### parse_pdf_tables_with_ocr: `Boolean`<a id="parse_pdf_tables_with_ocr-boolean"></a>
 ##### detect_audio_language: `Boolean`<a id="detect_audio_language-boolean"></a>
 ##### media_type: [`FileContentTypesNullable`](./lib/carbon_ruby_sdk/models/file_content_types_nullable.rb)<a id="media_type-filecontenttypesnullablelibcarbon_ruby_sdkmodelsfile_content_types_nullablerb"></a>
+##### split_rows: `Boolean`<a id="split_rows-boolean"></a>
 #### 🔄 Return<a id="🔄-return"></a>
 [UserFile](./lib/carbon_ruby_sdk/models/user_file.rb)
@@ -1240,7 +1247,7 @@ result = carbon.integrations.connect_data_source(
         "prepend_filename_to_chunks" => false,
         "sync_files_on_connection" => true,
         "set_page_as_boundary" => false,
-        "request_id" => "368135ce-5cca-4fb5-a19d-42b9a409af35",
+        "request_id" => "07144230-657d-40ab-9fb5-89095bf3fc65",
         "enable_file_picker" => true,
         "sync_source_items" => true,
         "incremental_sync" => false,
@@ -1459,7 +1466,7 @@ result = carbon.integrations.get_oauth_url(
   set_page_as_boundary: false,
   data_source_id: 1,
   connecting_new_account: false,
-  request_id: "2e662fad-1193-4482-a2d7-ec7b821a9d2b",
+  request_id: "b7620173-662c-4ae7-bb61-2e6ffd8619f5",
   use_ocr: false,
   parse_pdf_tables_with_ocr: false,
   enable_file_picker: true,
@@ -1519,7 +1526,7 @@ Enable OCR for files that support it. Supported formats: pdf
 ##### parse_pdf_tables_with_ocr: `Boolean`<a id="parse_pdf_tables_with_ocr-boolean"></a>
 ##### enable_file_picker: `Boolean`<a id="enable_file_picker-boolean"></a>
 Enable integration's file picker for sources that support it. Supported sources:
-SHAREPOINT, BOX, ONEDRIVE, GOOGLE_DRIVE, DROPBOX
+DROPBOX, ONEDRIVE, BOX, GOOGLE_DRIVE, SHAREPOINT
 ##### sync_source_items: `Boolean`<a id="sync_source_items-boolean"></a>
 Enabling this flag will fetch all available content from the source to be listed
@@ -1781,7 +1788,7 @@ result = carbon.integrations.sync_confluence(
   prepend_filename_to_chunks: false,
   max_items_per_chunk: 1,
   set_page_as_boundary: false,
-  request_id: "dd2130b5-0f9f-4f3a-b450-f3fa458763ae",
+  request_id: "b2c5c595-0cfb-4ec3-96ff-87158c2b6207",
   use_ocr: false,
   parse_pdf_tables_with_ocr: false,
   incremental_sync: false,
@@ -1884,7 +1891,7 @@ result = carbon.integrations.sync_files(
   prepend_filename_to_chunks: false,
   max_items_per_chunk: 1,
   set_page_as_boundary: false,
-  request_id: "dd2130b5-0f9f-4f3a-b450-f3fa458763ae",
+  request_id: "b2c5c595-0cfb-4ec3-96ff-87158c2b6207",
   use_ocr: false,
   parse_pdf_tables_with_ocr: false,
   incremental_sync: false,
@@ -2741,6 +2748,8 @@ result = carbon.utilities.scrape_sitemap(
   css_classes_to_skip: [],
   css_selectors_to_skip: [],
   embedding_model: "OPENAI",
+  url_paths_to_include: [],
+  url_paths_to_exclude: [],
 )
 p result
 ```
@@ -2760,6 +2769,16 @@ p result
 ##### css_classes_to_skip: Array<`String`><a id="css_classes_to_skip-array"></a>
 ##### css_selectors_to_skip: Array<`String`><a id="css_selectors_to_skip-array"></a>
 ##### embedding_model: [`EmbeddingGenerators`](./lib/carbon_ruby_sdk/models/embedding_generators.rb)<a id="embedding_model-embeddinggeneratorslibcarbon_ruby_sdkmodelsembedding_generatorsrb"></a>
+##### url_paths_to_include: Array<`String`><a id="url_paths_to_include-array"></a>
+URL subpaths or directories that you want to include. For example, if you want to
+include only URLs that start with /questions on stackoverflow.com, add
+/questions/ to this input.
+##### url_paths_to_exclude: Array<`String`><a id="url_paths_to_exclude-array"></a>
+URL subpaths or directories that you want to exclude. For example, if you want to
+exclude URLs that start with /questions on stackoverflow.com, add
+/questions/ to this input.
 #### 🌐 Endpoint<a id="🌐-endpoint"></a>
 `/scrape_sitemap` `POST`
@@ -2799,6 +2818,7 @@ result = carbon.utilities.scrape_web(
             "css_classes_to_skip" => [],
             "css_selectors_to_skip" => [],
             "embedding_model" => "OPENAI",
+            "url_paths_to_include" => [],
         }
     ],
 )

data/lib/carbon_ruby_sdk/api/files_api.rb CHANGED Viewed

@@ -1174,9 +1174,10 @@ module Carbon
     # @param parse_pdf_tables_with_ocr [Boolean] Whether to use rich table parsing when `use_ocr` is enabled.
     # @param detect_audio_language [Boolean] Whether to automatically detect the language of the uploaded audio file.
     # @param media_type [FileContentTypesNullable] The media type of the file. If not provided, it will be inferred from the file extension.
+    # @param split_rows [Boolean] Whether to split tabular rows into chunks. Currently only valid for CSV, TSV, and XLSX files.
     # @param body [BodyCreateUploadFileUploadfilePost]
     # @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
-    def upload(file:, chunk_size: SENTINEL, chunk_overlap: SENTINEL, skip_embedding_generation: false, set_page_as_boundary: false, embedding_model: 'OPENAI', use_ocr: false, generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, parse_pdf_tables_with_ocr: false, detect_audio_language: false, media_type: SENTINEL, extra: {})
+    def upload(file:, chunk_size: SENTINEL, chunk_overlap: SENTINEL, skip_embedding_generation: false, set_page_as_boundary: false, embedding_model: 'OPENAI', use_ocr: false, generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, parse_pdf_tables_with_ocr: false, detect_audio_language: false, media_type: SENTINEL, split_rows: false, extra: {})
       _body = {}
       _body[:file] = file if file != SENTINEL
       body_create_upload_file_uploadfile_post = _body
@@ -1192,6 +1193,7 @@ module Carbon
       extra[:parse_pdf_tables_with_ocr] = parse_pdf_tables_with_ocr if parse_pdf_tables_with_ocr != SENTINEL
       extra[:detect_audio_language] = detect_audio_language if detect_audio_language != SENTINEL
       extra[:media_type] = media_type if media_type != SENTINEL
+      extra[:split_rows] = split_rows if split_rows != SENTINEL
       api_response = upload_with_http_info_impl(file, body_create_upload_file_uploadfile_post, extra)
       api_response.data
     end
@@ -1237,9 +1239,10 @@ module Carbon
     # @param parse_pdf_tables_with_ocr [Boolean] Whether to use rich table parsing when `use_ocr` is enabled.
     # @param detect_audio_language [Boolean] Whether to automatically detect the language of the uploaded audio file.
     # @param media_type [FileContentTypesNullable] The media type of the file. If not provided, it will be inferred from the file extension.
+    # @param split_rows [Boolean] Whether to split tabular rows into chunks. Currently only valid for CSV, TSV, and XLSX files.
     # @param body [BodyCreateUploadFileUploadfilePost]
     # @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
-    def upload_with_http_info(file:, chunk_size: SENTINEL, chunk_overlap: SENTINEL, skip_embedding_generation: false, set_page_as_boundary: false, embedding_model: 'OPENAI', use_ocr: false, generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, parse_pdf_tables_with_ocr: false, detect_audio_language: false, media_type: SENTINEL, extra: {})
+    def upload_with_http_info(file:, chunk_size: SENTINEL, chunk_overlap: SENTINEL, skip_embedding_generation: false, set_page_as_boundary: false, embedding_model: 'OPENAI', use_ocr: false, generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, parse_pdf_tables_with_ocr: false, detect_audio_language: false, media_type: SENTINEL, split_rows: false, extra: {})
       _body = {}
       _body[:file] = file if file != SENTINEL
       body_create_upload_file_uploadfile_post = _body
@@ -1255,6 +1258,7 @@ module Carbon
       extra[:parse_pdf_tables_with_ocr] = parse_pdf_tables_with_ocr if parse_pdf_tables_with_ocr != SENTINEL
       extra[:detect_audio_language] = detect_audio_language if detect_audio_language != SENTINEL
       extra[:media_type] = media_type if media_type != SENTINEL
+      extra[:split_rows] = split_rows if split_rows != SENTINEL
       upload_with_http_info_impl(file, body_create_upload_file_uploadfile_post, extra)
     end
@@ -1275,6 +1279,7 @@ module Carbon
     # @option opts [Boolean] :parse_pdf_tables_with_ocr Whether to use rich table parsing when `use_ocr` is enabled. (default to false)
     # @option opts [Boolean] :detect_audio_language Whether to automatically detect the language of the uploaded audio file. (default to false)
     # @option opts [FileContentTypesNullable] :media_type The media type of the file. If not provided, it will be inferred from the file extension.
+    # @option opts [Boolean] :split_rows Whether to split tabular rows into chunks. Currently only valid for CSV, TSV, and XLSX files. (default to false)
     # @return [UserFile]
     private def upload_impl(file, body_create_upload_file_uploadfile_post, opts = {})
       data, _status_code, _headers = upload_with_http_info(file, body_create_upload_file_uploadfile_post, opts)
@@ -1298,6 +1303,7 @@ module Carbon
     # @option opts [Boolean] :parse_pdf_tables_with_ocr Whether to use rich table parsing when `use_ocr` is enabled. (default to false)
     # @option opts [Boolean] :detect_audio_language Whether to automatically detect the language of the uploaded audio file. (default to false)
     # @option opts [FileContentTypesNullable] :media_type The media type of the file. If not provided, it will be inferred from the file extension.
+    # @option opts [Boolean] :split_rows Whether to split tabular rows into chunks. Currently only valid for CSV, TSV, and XLSX files. (default to false)
     # @return [APIResponse] data is UserFile, status code, headers and response
     private def upload_with_http_info_impl(file, body_create_upload_file_uploadfile_post, opts = {})
       if @api_client.config.debugging
@@ -1328,6 +1334,7 @@ module Carbon
       query_params[:'parse_pdf_tables_with_ocr'] = opts[:'parse_pdf_tables_with_ocr'] if !opts[:'parse_pdf_tables_with_ocr'].nil?
       query_params[:'detect_audio_language'] = opts[:'detect_audio_language'] if !opts[:'detect_audio_language'].nil?
       query_params[:'media_type'] = opts[:'media_type'] if !opts[:'media_type'].nil?
+      query_params[:'split_rows'] = opts[:'split_rows'] if !opts[:'split_rows'].nil?
       # header parameters
       header_params = opts[:header_params] || {}
@@ -1386,9 +1393,10 @@ module Carbon
     # @param parse_pdf_tables_with_ocr [Boolean]
     # @param detect_audio_language [Boolean]
     # @param media_type [FileContentTypesNullable]
+    # @param split_rows [Boolean]
     # @param body [UploadFileFromUrlInput]
     # @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
-    def upload_from_url(url:, file_name: SENTINEL, chunk_size: SENTINEL, chunk_overlap: SENTINEL, skip_embedding_generation: false, set_page_as_boundary: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, use_textract: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, parse_pdf_tables_with_ocr: false, detect_audio_language: false, media_type: SENTINEL, extra: {})
+    def upload_from_url(url:, file_name: SENTINEL, chunk_size: SENTINEL, chunk_overlap: SENTINEL, skip_embedding_generation: false, set_page_as_boundary: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, use_textract: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, parse_pdf_tables_with_ocr: false, detect_audio_language: false, media_type: SENTINEL, split_rows: false, extra: {})
       _body = {}
       _body[:url] = url if url != SENTINEL
       _body[:file_name] = file_name if file_name != SENTINEL
@@ -1404,6 +1412,7 @@ module Carbon
       _body[:parse_pdf_tables_with_ocr] = parse_pdf_tables_with_ocr if parse_pdf_tables_with_ocr != SENTINEL
       _body[:detect_audio_language] = detect_audio_language if detect_audio_language != SENTINEL
       _body[:media_type] = media_type if media_type != SENTINEL
+      _body[:split_rows] = split_rows if split_rows != SENTINEL
       upload_file_from_url_input = _body
       api_response = upload_from_url_with_http_info_impl(upload_file_from_url_input, extra)
       api_response.data
@@ -1425,9 +1434,10 @@ module Carbon
     # @param parse_pdf_tables_with_ocr [Boolean]
     # @param detect_audio_language [Boolean]
     # @param media_type [FileContentTypesNullable]
+    # @param split_rows [Boolean]
     # @param body [UploadFileFromUrlInput]
     # @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
-    def upload_from_url_with_http_info(url:, file_name: SENTINEL, chunk_size: SENTINEL, chunk_overlap: SENTINEL, skip_embedding_generation: false, set_page_as_boundary: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, use_textract: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, parse_pdf_tables_with_ocr: false, detect_audio_language: false, media_type: SENTINEL, extra: {})
+    def upload_from_url_with_http_info(url:, file_name: SENTINEL, chunk_size: SENTINEL, chunk_overlap: SENTINEL, skip_embedding_generation: false, set_page_as_boundary: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, use_textract: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, parse_pdf_tables_with_ocr: false, detect_audio_language: false, media_type: SENTINEL, split_rows: false, extra: {})
       _body = {}
       _body[:url] = url if url != SENTINEL
       _body[:file_name] = file_name if file_name != SENTINEL
@@ -1443,6 +1453,7 @@ module Carbon
       _body[:parse_pdf_tables_with_ocr] = parse_pdf_tables_with_ocr if parse_pdf_tables_with_ocr != SENTINEL
       _body[:detect_audio_language] = detect_audio_language if detect_audio_language != SENTINEL
       _body[:media_type] = media_type if media_type != SENTINEL
+      _body[:split_rows] = split_rows if split_rows != SENTINEL
       upload_file_from_url_input = _body
       upload_from_url_with_http_info_impl(upload_file_from_url_input, extra)
     end

data/lib/carbon_ruby_sdk/api/integrations_api.rb CHANGED Viewed

@@ -653,13 +653,13 @@ module Carbon
     # @param request_id [String] This request id will be added to all files that get synced using the generated OAuth URL
     # @param use_ocr [Boolean] Enable OCR for files that support it. Supported formats: pdf
     # @param parse_pdf_tables_with_ocr [Boolean]
-    # @param enable_file_picker [Boolean] Enable integration's file picker for sources that support it. Supported sources: SHAREPOINT, BOX, ONEDRIVE, GOOGLE_DRIVE, DROPBOX
+    # @param enable_file_picker [Boolean] Enable integration's file picker for sources that support it. Supported sources: DROPBOX, ONEDRIVE, BOX, GOOGLE_DRIVE, SHAREPOINT
     # @param sync_source_items [Boolean] Enabling this flag will fetch all available content from the source to be listed via list items endpoint
     # @param incremental_sync [Boolean] Only sync files if they have not already been synced or if the embedding properties have changed. This flag is currently supported by ONEDRIVE, GOOGLE_DRIVE, BOX, DROPBOX. It will be ignored for other data sources.
     # @param file_sync_config [FileSyncConfigNullable]
     # @param body [OAuthURLRequest]
     # @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
-    def get_oauth_url(service:, tags: SENTINEL, scope: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', zendesk_subdomain: SENTINEL, microsoft_tenant: SENTINEL, sharepoint_site_name: SENTINEL, confluence_subdomain: SENTINEL, generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, salesforce_domain: SENTINEL, sync_files_on_connection: true, set_page_as_boundary: false, data_source_id: SENTINEL, connecting_new_account: false, request_id: '2e662fad-1193-4482-a2d7-ec7b821a9d2b', use_ocr: false, parse_pdf_tables_with_ocr: false, enable_file_picker: true, sync_source_items: true, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
+    def get_oauth_url(service:, tags: SENTINEL, scope: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', zendesk_subdomain: SENTINEL, microsoft_tenant: SENTINEL, sharepoint_site_name: SENTINEL, confluence_subdomain: SENTINEL, generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, salesforce_domain: SENTINEL, sync_files_on_connection: true, set_page_as_boundary: false, data_source_id: SENTINEL, connecting_new_account: false, request_id: 'b7620173-662c-4ae7-bb61-2e6ffd8619f5', use_ocr: false, parse_pdf_tables_with_ocr: false, enable_file_picker: true, sync_source_items: true, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
       _body = {}
       _body[:tags] = tags if tags != SENTINEL
       _body[:scope] = scope if scope != SENTINEL
@@ -721,13 +721,13 @@ module Carbon
     # @param request_id [String] This request id will be added to all files that get synced using the generated OAuth URL
     # @param use_ocr [Boolean] Enable OCR for files that support it. Supported formats: pdf
     # @param parse_pdf_tables_with_ocr [Boolean]
-    # @param enable_file_picker [Boolean] Enable integration's file picker for sources that support it. Supported sources: SHAREPOINT, BOX, ONEDRIVE, GOOGLE_DRIVE, DROPBOX
+    # @param enable_file_picker [Boolean] Enable integration's file picker for sources that support it. Supported sources: DROPBOX, ONEDRIVE, BOX, GOOGLE_DRIVE, SHAREPOINT
     # @param sync_source_items [Boolean] Enabling this flag will fetch all available content from the source to be listed via list items endpoint
     # @param incremental_sync [Boolean] Only sync files if they have not already been synced or if the embedding properties have changed. This flag is currently supported by ONEDRIVE, GOOGLE_DRIVE, BOX, DROPBOX. It will be ignored for other data sources.
     # @param file_sync_config [FileSyncConfigNullable]
     # @param body [OAuthURLRequest]
     # @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
-    def get_oauth_url_with_http_info(service:, tags: SENTINEL, scope: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', zendesk_subdomain: SENTINEL, microsoft_tenant: SENTINEL, sharepoint_site_name: SENTINEL, confluence_subdomain: SENTINEL, generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, salesforce_domain: SENTINEL, sync_files_on_connection: true, set_page_as_boundary: false, data_source_id: SENTINEL, connecting_new_account: false, request_id: '2e662fad-1193-4482-a2d7-ec7b821a9d2b', use_ocr: false, parse_pdf_tables_with_ocr: false, enable_file_picker: true, sync_source_items: true, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
+    def get_oauth_url_with_http_info(service:, tags: SENTINEL, scope: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', zendesk_subdomain: SENTINEL, microsoft_tenant: SENTINEL, sharepoint_site_name: SENTINEL, confluence_subdomain: SENTINEL, generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, salesforce_domain: SENTINEL, sync_files_on_connection: true, set_page_as_boundary: false, data_source_id: SENTINEL, connecting_new_account: false, request_id: 'b7620173-662c-4ae7-bb61-2e6ffd8619f5', use_ocr: false, parse_pdf_tables_with_ocr: false, enable_file_picker: true, sync_source_items: true, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
       _body = {}
       _body[:tags] = tags if tags != SENTINEL
       _body[:scope] = scope if scope != SENTINEL
@@ -1523,7 +1523,7 @@ module Carbon
     # @param file_sync_config [FileSyncConfigNullable]
     # @param body [SyncFilesRequest]
     # @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
-    def sync_confluence(data_source_id:, ids:, tags: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, set_page_as_boundary: false, request_id: 'dd2130b5-0f9f-4f3a-b450-f3fa458763ae', use_ocr: false, parse_pdf_tables_with_ocr: false, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
+    def sync_confluence(data_source_id:, ids:, tags: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, set_page_as_boundary: false, request_id: 'b2c5c595-0cfb-4ec3-96ff-87158c2b6207', use_ocr: false, parse_pdf_tables_with_ocr: false, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
       _body = {}
       _body[:tags] = tags if tags != SENTINEL
       _body[:data_source_id] = data_source_id if data_source_id != SENTINEL
@@ -1571,7 +1571,7 @@ module Carbon
     # @param file_sync_config [FileSyncConfigNullable]
     # @param body [SyncFilesRequest]
     # @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
-    def sync_confluence_with_http_info(data_source_id:, ids:, tags: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, set_page_as_boundary: false, request_id: 'dd2130b5-0f9f-4f3a-b450-f3fa458763ae', use_ocr: false, parse_pdf_tables_with_ocr: false, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
+    def sync_confluence_with_http_info(data_source_id:, ids:, tags: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, set_page_as_boundary: false, request_id: 'b2c5c595-0cfb-4ec3-96ff-87158c2b6207', use_ocr: false, parse_pdf_tables_with_ocr: false, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
       _body = {}
       _body[:tags] = tags if tags != SENTINEL
       _body[:data_source_id] = data_source_id if data_source_id != SENTINEL
@@ -1779,7 +1779,7 @@ module Carbon
     # @param file_sync_config [FileSyncConfigNullable]
     # @param body [SyncFilesRequest]
     # @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
-    def sync_files(data_source_id:, ids:, tags: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, set_page_as_boundary: false, request_id: 'dd2130b5-0f9f-4f3a-b450-f3fa458763ae', use_ocr: false, parse_pdf_tables_with_ocr: false, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
+    def sync_files(data_source_id:, ids:, tags: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, set_page_as_boundary: false, request_id: 'b2c5c595-0cfb-4ec3-96ff-87158c2b6207', use_ocr: false, parse_pdf_tables_with_ocr: false, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
       _body = {}
       _body[:tags] = tags if tags != SENTINEL
       _body[:data_source_id] = data_source_id if data_source_id != SENTINEL
@@ -1827,7 +1827,7 @@ module Carbon
     # @param file_sync_config [FileSyncConfigNullable]
     # @param body [SyncFilesRequest]
     # @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
-    def sync_files_with_http_info(data_source_id:, ids:, tags: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, set_page_as_boundary: false, request_id: 'dd2130b5-0f9f-4f3a-b450-f3fa458763ae', use_ocr: false, parse_pdf_tables_with_ocr: false, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
+    def sync_files_with_http_info(data_source_id:, ids:, tags: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, embedding_model: 'OPENAI', generate_sparse_vectors: false, prepend_filename_to_chunks: false, max_items_per_chunk: SENTINEL, set_page_as_boundary: false, request_id: 'b2c5c595-0cfb-4ec3-96ff-87158c2b6207', use_ocr: false, parse_pdf_tables_with_ocr: false, incremental_sync: false, file_sync_config: SENTINEL, extra: {})
       _body = {}
       _body[:tags] = tags if tags != SENTINEL
       _body[:data_source_id] = data_source_id if data_source_id != SENTINEL

data/lib/carbon_ruby_sdk/api/utilities_api.rb CHANGED Viewed

@@ -342,9 +342,11 @@ module Carbon
     # @param css_classes_to_skip [Array<String>]
     # @param css_selectors_to_skip [Array<String>]
     # @param embedding_model [EmbeddingGenerators]
+    # @param url_paths_to_include [Array<String>] URL subpaths or directories that you want to include. For example, if you want to include only URLs that start with /questions on stackoverflow.com, add /questions/ to this input.
+    # @param url_paths_to_exclude [Array<String>] URL subpaths or directories that you want to exclude. For example, if you want to exclude URLs that start with /questions on stackoverflow.com, add /questions/ to this input.
     # @param body [SitemapScrapeRequest]
     # @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
-    def scrape_sitemap(url:, tags: SENTINEL, max_pages_to_scrape: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, enable_auto_sync: false, generate_sparse_vectors: false, prepend_filename_to_chunks: false, html_tags_to_skip: SENTINEL, css_classes_to_skip: SENTINEL, css_selectors_to_skip: SENTINEL, embedding_model: 'OPENAI', extra: {})
+    def scrape_sitemap(url:, tags: SENTINEL, max_pages_to_scrape: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, enable_auto_sync: false, generate_sparse_vectors: false, prepend_filename_to_chunks: false, html_tags_to_skip: SENTINEL, css_classes_to_skip: SENTINEL, css_selectors_to_skip: SENTINEL, embedding_model: 'OPENAI', url_paths_to_include: SENTINEL, url_paths_to_exclude: SENTINEL, extra: {})
       _body = {}
       _body[:tags] = tags if tags != SENTINEL
       _body[:url] = url if url != SENTINEL
@@ -359,6 +361,8 @@ module Carbon
       _body[:css_classes_to_skip] = css_classes_to_skip if css_classes_to_skip != SENTINEL
       _body[:css_selectors_to_skip] = css_selectors_to_skip if css_selectors_to_skip != SENTINEL
       _body[:embedding_model] = embedding_model if embedding_model != SENTINEL
+      _body[:url_paths_to_include] = url_paths_to_include if url_paths_to_include != SENTINEL
+      _body[:url_paths_to_exclude] = url_paths_to_exclude if url_paths_to_exclude != SENTINEL
       sitemap_scrape_request = _body
       api_response = scrape_sitemap_with_http_info_impl(sitemap_scrape_request, extra)
       api_response.data
@@ -387,9 +391,11 @@ module Carbon
     # @param css_classes_to_skip [Array<String>]
     # @param css_selectors_to_skip [Array<String>]
     # @param embedding_model [EmbeddingGenerators]
+    # @param url_paths_to_include [Array<String>] URL subpaths or directories that you want to include. For example if you want to only include URLs that start with /questions in stackoverflow.com, you will add /questions/ in this input
+    # @param url_paths_to_exclude [Array<String>] URL subpaths or directories that you want to exclude. For example if you want to exclude URLs that start with /questions in stackoverflow.com, you will add /questions/ in this input
     # @param body [SitemapScrapeRequest]
     # @param [Hash] extra additional parameters to pass along through :header_params, :query_params, or parameter name
-    def scrape_sitemap_with_http_info(url:, tags: SENTINEL, max_pages_to_scrape: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, enable_auto_sync: false, generate_sparse_vectors: false, prepend_filename_to_chunks: false, html_tags_to_skip: SENTINEL, css_classes_to_skip: SENTINEL, css_selectors_to_skip: SENTINEL, embedding_model: 'OPENAI', extra: {})
+    def scrape_sitemap_with_http_info(url:, tags: SENTINEL, max_pages_to_scrape: SENTINEL, chunk_size: 1500, chunk_overlap: 20, skip_embedding_generation: false, enable_auto_sync: false, generate_sparse_vectors: false, prepend_filename_to_chunks: false, html_tags_to_skip: SENTINEL, css_classes_to_skip: SENTINEL, css_selectors_to_skip: SENTINEL, embedding_model: 'OPENAI', url_paths_to_include: SENTINEL, url_paths_to_exclude: SENTINEL, extra: {})
       _body = {}
       _body[:tags] = tags if tags != SENTINEL
       _body[:url] = url if url != SENTINEL
@@ -404,6 +410,8 @@ module Carbon
       _body[:css_classes_to_skip] = css_classes_to_skip if css_classes_to_skip != SENTINEL
       _body[:css_selectors_to_skip] = css_selectors_to_skip if css_selectors_to_skip != SENTINEL
       _body[:embedding_model] = embedding_model if embedding_model != SENTINEL
+      _body[:url_paths_to_include] = url_paths_to_include if url_paths_to_include != SENTINEL
+      _body[:url_paths_to_exclude] = url_paths_to_exclude if url_paths_to_exclude != SENTINEL
       sitemap_scrape_request = _body
       scrape_sitemap_with_http_info_impl(sitemap_scrape_request, extra)
     end

data/lib/carbon_ruby_sdk/models/o_auth_url_request.rb CHANGED Viewed

@@ -61,7 +61,7 @@ module Carbon
     attr_accessor :parse_pdf_tables_with_ocr
-    # Enable integration's file picker for sources that support it. Supported sources: SHAREPOINT, BOX, ONEDRIVE, GOOGLE_DRIVE, DROPBOX
+    # Enable integration's file picker for sources that support it. Supported sources: DROPBOX, ONEDRIVE, BOX, GOOGLE_DRIVE, SHAREPOINT
     attr_accessor :enable_file_picker
     # Enabling this flag will fetch all available content from the source to be listed via list items endpoint
@@ -279,7 +279,7 @@ module Carbon
       if attributes.key?(:'request_id')
         self.request_id = attributes[:'request_id']
       else
-        self.request_id = '2e662fad-1193-4482-a2d7-ec7b821a9d2b'
+        self.request_id = 'b7620173-662c-4ae7-bb61-2e6ffd8619f5'
       end
       if attributes.key?(:'use_ocr')

data/lib/carbon_ruby_sdk/models/sitemap_scrape_request.rb CHANGED Viewed

@@ -37,6 +37,12 @@ module Carbon
     attr_accessor :embedding_model
+    # URL subpaths or directories that you want to include. For example if you want to only include URLs that start with /questions in stackoverflow.com, you will add /questions/ in this input
+    attr_accessor :url_paths_to_include
+    # URL subpaths or directories that you want to exclude. For example if you want to exclude URLs that start with /questions in stackoverflow.com, you will add /questions/ in this input
+    attr_accessor :url_paths_to_exclude
     # Attribute mapping from ruby-style variable name to JSON key.
     def self.attribute_map
       {
@@ -52,7 +58,9 @@ module Carbon
         :'html_tags_to_skip' => :'html_tags_to_skip',
         :'css_classes_to_skip' => :'css_classes_to_skip',
         :'css_selectors_to_skip' => :'css_selectors_to_skip',
-        :'embedding_model' => :'embedding_model'
+        :'embedding_model' => :'embedding_model',
+        :'url_paths_to_include' => :'url_paths_to_include',
+        :'url_paths_to_exclude' => :'url_paths_to_exclude'
       }
     end
@@ -76,7 +84,9 @@ module Carbon
         :'html_tags_to_skip' => :'Array<String>',
         :'css_classes_to_skip' => :'Array<String>',
         :'css_selectors_to_skip' => :'Array<String>',
-        :'embedding_model' => :'EmbeddingGenerators'
+        :'embedding_model' => :'EmbeddingGenerators',
+        :'url_paths_to_include' => :'Array<String>',
+        :'url_paths_to_exclude' => :'Array<String>'
       }
     end
@@ -94,6 +104,8 @@ module Carbon
         :'html_tags_to_skip',
         :'css_classes_to_skip',
         :'css_selectors_to_skip',
+        :'url_paths_to_include',
+        :'url_paths_to_exclude'
       ])
     end
@@ -185,6 +197,18 @@ module Carbon
       else
         self.embedding_model = 'OPENAI'
       end
+      if attributes.key?(:'url_paths_to_include')
+        if (value = attributes[:'url_paths_to_include']).is_a?(Array)
+          self.url_paths_to_include = value
+        end
+      end
+      if attributes.key?(:'url_paths_to_exclude')
+        if (value = attributes[:'url_paths_to_exclude']).is_a?(Array)
+          self.url_paths_to_exclude = value
+        end
+      end
     end
     # Show invalid properties with the reasons. Usually used together with valid?
@@ -199,6 +223,14 @@ module Carbon
         invalid_properties.push('invalid value for "max_pages_to_scrape", must be greater than or equal to 1.')
       end
+      if !@url_paths_to_include.nil? && @url_paths_to_include.length > 10
+        invalid_properties.push('invalid value for "url_paths_to_include", number of items must be less than or equal to 10.')
+      end
+      if !@url_paths_to_exclude.nil? && @url_paths_to_exclude.length > 10
+        invalid_properties.push('invalid value for "url_paths_to_exclude", number of items must be less than or equal to 10.')
+      end
       invalid_properties
     end
@@ -207,6 +239,8 @@ module Carbon
     def valid?
       return false if @url.nil?
       return false if !@max_pages_to_scrape.nil? && @max_pages_to_scrape < 1
+      return false if !@url_paths_to_include.nil? && @url_paths_to_include.length > 10
+      return false if !@url_paths_to_exclude.nil? && @url_paths_to_exclude.length > 10
       true
     end
@@ -220,6 +254,26 @@ module Carbon
       @max_pages_to_scrape = max_pages_to_scrape
     end
+    # Custom attribute writer method with validation
+    # @param [Object] url_paths_to_include Value to be assigned
+    def url_paths_to_include=(url_paths_to_include)
+      if !url_paths_to_include.nil? && url_paths_to_include.length > 10
+        fail ArgumentError, 'invalid value for "url_paths_to_include", number of items must be less than or equal to 10.'
+      end
+      @url_paths_to_include = url_paths_to_include
+    end
+    # Custom attribute writer method with validation
+    # @param [Object] url_paths_to_exclude Value to be assigned
+    def url_paths_to_exclude=(url_paths_to_exclude)
+      if !url_paths_to_exclude.nil? && url_paths_to_exclude.length > 10
+        fail ArgumentError, 'invalid value for "url_paths_to_exclude", number of items must be less than or equal to 10.'
+      end
+      @url_paths_to_exclude = url_paths_to_exclude
+    end
     # Checks equality by comparing each attribute.
     # @param [Object] Object to be compared
     def ==(o)
@@ -237,7 +291,9 @@ module Carbon
           html_tags_to_skip == o.html_tags_to_skip &&
           css_classes_to_skip == o.css_classes_to_skip &&
           css_selectors_to_skip == o.css_selectors_to_skip &&
-          embedding_model == o.embedding_model
+          embedding_model == o.embedding_model &&
+          url_paths_to_include == o.url_paths_to_include &&
+          url_paths_to_exclude == o.url_paths_to_exclude
     end
     # @see the `==` method
@@ -249,7 +305,7 @@ module Carbon
     # Calculates hash code according to all attributes.
     # @return [Integer] Hash code
     def hash
-      [tags, url, max_pages_to_scrape, chunk_size, chunk_overlap, skip_embedding_generation, enable_auto_sync, generate_sparse_vectors, prepend_filename_to_chunks, html_tags_to_skip, css_classes_to_skip, css_selectors_to_skip, embedding_model].hash
+      [tags, url, max_pages_to_scrape, chunk_size, chunk_overlap, skip_embedding_generation, enable_auto_sync, generate_sparse_vectors, prepend_filename_to_chunks, html_tags_to_skip, css_classes_to_skip, css_selectors_to_skip, embedding_model, url_paths_to_include, url_paths_to_exclude].hash
     end
     # Builds the object from hash

data/lib/carbon_ruby_sdk/models/sync_files_request.rb CHANGED Viewed

@@ -187,7 +187,7 @@ module Carbon
       if attributes.key?(:'request_id')
         self.request_id = attributes[:'request_id']
       else
-        self.request_id = 'dd2130b5-0f9f-4f3a-b450-f3fa458763ae'
+        self.request_id = 'b2c5c595-0cfb-4ec3-96ff-87158c2b6207'
       end
       if attributes.key?(:'use_ocr')

data/lib/carbon_ruby_sdk/models/sync_options.rb CHANGED Viewed

@@ -182,7 +182,7 @@ module Carbon
       if attributes.key?(:'request_id')
         self.request_id = attributes[:'request_id']
       else
-        self.request_id = '368135ce-5cca-4fb5-a19d-42b9a409af35'
+        self.request_id = '07144230-657d-40ab-9fb5-89095bf3fc65'
       end
       if attributes.key?(:'enable_file_picker')

data/lib/carbon_ruby_sdk/models/upload_file_from_url_input.rb CHANGED Viewed

@@ -40,6 +40,8 @@ module Carbon
     attr_accessor :media_type
+    attr_accessor :split_rows
     # Attribute mapping from ruby-style variable name to JSON key.
     def self.attribute_map
       {
@@ -56,7 +58,8 @@ module Carbon
         :'max_items_per_chunk' => :'max_items_per_chunk',
         :'parse_pdf_tables_with_ocr' => :'parse_pdf_tables_with_ocr',
         :'detect_audio_language' => :'detect_audio_language',
-        :'media_type' => :'media_type'
+        :'media_type' => :'media_type',
+        :'split_rows' => :'split_rows'
       }
     end
@@ -81,7 +84,8 @@ module Carbon
         :'max_items_per_chunk' => :'Integer',
         :'parse_pdf_tables_with_ocr' => :'Boolean',
         :'detect_audio_language' => :'Boolean',
-        :'media_type' => :'FileContentTypesNullable'
+        :'media_type' => :'FileContentTypesNullable',
+        :'split_rows' => :'Boolean'
       }
     end
@@ -92,7 +96,7 @@ module Carbon
         :'chunk_size',
         :'chunk_overlap',
         :'max_items_per_chunk',
-        :'media_type'
+        :'media_type',
       ])
     end
@@ -182,6 +186,12 @@ module Carbon
       if attributes.key?(:'media_type')
         self.media_type = attributes[:'media_type']
       end
+      if attributes.key?(:'split_rows')
+        self.split_rows = attributes[:'split_rows']
+      else
+        self.split_rows = false
+      end
     end
     # Show invalid properties with the reasons. Usually used together with valid?
@@ -220,7 +230,8 @@ module Carbon
           max_items_per_chunk == o.max_items_per_chunk &&
           parse_pdf_tables_with_ocr == o.parse_pdf_tables_with_ocr &&
           detect_audio_language == o.detect_audio_language &&
-          media_type == o.media_type
+          media_type == o.media_type &&
+          split_rows == o.split_rows
     end
     # @see the `==` method
@@ -232,7 +243,7 @@ module Carbon
     # Calculates hash code according to all attributes.
     # @return [Integer] Hash code
     def hash
-      [url, file_name, chunk_size, chunk_overlap, skip_embedding_generation, set_page_as_boundary, embedding_model, generate_sparse_vectors, use_textract, prepend_filename_to_chunks, max_items_per_chunk, parse_pdf_tables_with_ocr, detect_audio_language, media_type].hash
+      [url, file_name, chunk_size, chunk_overlap, skip_embedding_generation, set_page_as_boundary, embedding_model, generate_sparse_vectors, use_textract, prepend_filename_to_chunks, max_items_per_chunk, parse_pdf_tables_with_ocr, detect_audio_language, media_type, split_rows].hash
     end
     # Builds the object from hash

data/lib/carbon_ruby_sdk/models/webscrape_request.rb CHANGED Viewed

@@ -39,6 +39,9 @@ module Carbon
     attr_accessor :embedding_model
+    # URL subpaths or directories that you want to include. For example if you want to only include URLs that start with /questions in stackoverflow.com, you will add /questions/ in this input
+    attr_accessor :url_paths_to_include
     # Attribute mapping from ruby-style variable name to JSON key.
     def self.attribute_map
       {
@@ -55,7 +58,8 @@ module Carbon
         :'html_tags_to_skip' => :'html_tags_to_skip',
         :'css_classes_to_skip' => :'css_classes_to_skip',
         :'css_selectors_to_skip' => :'css_selectors_to_skip',
-        :'embedding_model' => :'embedding_model'
+        :'embedding_model' => :'embedding_model',
+        :'url_paths_to_include' => :'url_paths_to_include'
       }
     end
@@ -80,7 +84,8 @@ module Carbon
         :'html_tags_to_skip' => :'Array<String>',
         :'css_classes_to_skip' => :'Array<String>',
         :'css_selectors_to_skip' => :'Array<String>',
-        :'embedding_model' => :'EmbeddingGenerators'
+        :'embedding_model' => :'EmbeddingGenerators',
+        :'url_paths_to_include' => :'Array<String>'
       }
     end
@@ -99,6 +104,7 @@ module Carbon
         :'html_tags_to_skip',
         :'css_classes_to_skip',
         :'css_selectors_to_skip',
+        :'url_paths_to_include'
       ])
     end
@@ -198,6 +204,12 @@ module Carbon
       else
         self.embedding_model = 'OPENAI'
       end
+      if attributes.key?(:'url_paths_to_include')
+        if (value = attributes[:'url_paths_to_include']).is_a?(Array)
+          self.url_paths_to_include = value
+        end
+      end
     end
     # Show invalid properties with the reasons. Usually used together with valid?
@@ -216,6 +228,10 @@ module Carbon
         invalid_properties.push('invalid value for "max_pages_to_scrape", must be greater than or equal to 1.')
       end
+      if !@url_paths_to_include.nil? && @url_paths_to_include.length > 10
+        invalid_properties.push('invalid value for "url_paths_to_include", number of items must be less than or equal to 10.')
+      end
       invalid_properties
     end
@@ -225,6 +241,7 @@ module Carbon
       return false if @url.nil?
       return false if !@recursion_depth.nil? && @recursion_depth < 0
       return false if !@max_pages_to_scrape.nil? && @max_pages_to_scrape < 1
+      return false if !@url_paths_to_include.nil? && @url_paths_to_include.length > 10
       true
     end
@@ -248,6 +265,16 @@ module Carbon
       @max_pages_to_scrape = max_pages_to_scrape
     end
+    # Custom attribute writer method with validation
+    # @param [Object] url_paths_to_include Value to be assigned
+    def url_paths_to_include=(url_paths_to_include)
+      if !url_paths_to_include.nil? && url_paths_to_include.length > 10
+        fail ArgumentError, 'invalid value for "url_paths_to_include", number of items must be less than or equal to 10.'
+      end
+      @url_paths_to_include = url_paths_to_include
+    end
     # Checks equality by comparing each attribute.
     # @param [Object] Object to be compared
     def ==(o)
@@ -266,7 +293,8 @@ module Carbon
           html_tags_to_skip == o.html_tags_to_skip &&
           css_classes_to_skip == o.css_classes_to_skip &&
           css_selectors_to_skip == o.css_selectors_to_skip &&
-          embedding_model == o.embedding_model
+          embedding_model == o.embedding_model &&
+          url_paths_to_include == o.url_paths_to_include
     end
     # @see the `==` method
@@ -278,7 +306,7 @@ module Carbon
     # Calculates hash code according to all attributes.
     # @return [Integer] Hash code
     def hash
-      [tags, url, recursion_depth, max_pages_to_scrape, chunk_size, chunk_overlap, skip_embedding_generation, enable_auto_sync, generate_sparse_vectors, prepend_filename_to_chunks, html_tags_to_skip, css_classes_to_skip, css_selectors_to_skip, embedding_model].hash
+      [tags, url, recursion_depth, max_pages_to_scrape, chunk_size, chunk_overlap, skip_embedding_generation, enable_auto_sync, generate_sparse_vectors, prepend_filename_to_chunks, html_tags_to_skip, css_classes_to_skip, css_selectors_to_skip, embedding_model, url_paths_to_include].hash
     end
     # Builds the object from hash

data/lib/carbon_ruby_sdk/version.rb CHANGED Viewed

@@ -7,5 +7,5 @@ The version of the OpenAPI document: 1.0.0
 =end
 module Carbon
-  VERSION = '0.2.2'
+  VERSION = '0.2.4'
 end

data/spec/api/files_api_spec.rb CHANGED Viewed

@@ -159,6 +159,7 @@ describe 'FilesApi' do
   # @option opts [Boolean] :parse_pdf_tables_with_ocr Whether to use rich table parsing when `use_ocr` is enabled.
   # @option opts [Boolean] :detect_audio_language Whether to automatically detect the language of the uploaded audio file.
   # @option opts [FileContentTypesNullable] :media_type The media type of the file. If not provided, it will be inferred from the file extension.
+  # @option opts [Boolean] :split_rows Whether to split tabular rows into chunks. Currently only valid for CSV, TSV, and XLSX files.
   # @return [UserFile]
   describe 'upload test' do
     it 'should work' do

data/spec/models/sitemap_scrape_request_spec.rb CHANGED Viewed

@@ -97,4 +97,16 @@ describe Carbon::SitemapScrapeRequest do
     end
   end
+  describe 'test attribute "url_paths_to_include"' do
+    it 'should work' do
+      # assertion here. ref: https://www.relishapp.com/rspec/rspec-expectations/docs/built-in-matchers
+    end
+  end
+  describe 'test attribute "url_paths_to_exclude"' do
+    it 'should work' do
+      # assertion here. ref: https://www.relishapp.com/rspec/rspec-expectations/docs/built-in-matchers
+    end
+  end
 end

data/spec/models/upload_file_from_url_input_spec.rb CHANGED Viewed

@@ -103,4 +103,10 @@ describe Carbon::UploadFileFromUrlInput do
     end
   end
+  describe 'test attribute "split_rows"' do
+    it 'should work' do
+      # assertion here. ref: https://www.relishapp.com/rspec/rspec-expectations/docs/built-in-matchers
+    end
+  end
 end

data/spec/models/webscrape_request_spec.rb CHANGED Viewed

@@ -103,4 +103,10 @@ describe Carbon::WebscrapeRequest do
     end
   end
+  describe 'test attribute "url_paths_to_include"' do
+    it 'should work' do
+      # assertion here. ref: https://www.relishapp.com/rspec/rspec-expectations/docs/built-in-matchers
+    end
+  end
 end

metadata CHANGED Viewed

@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: carbon_ruby_sdk
 version: !ruby/object:Gem::Version
-  version: 0.2.2
+  version: 0.2.4
 platform: ruby
 authors:
 - Konfig
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2024-06-01 00:00:00.000000000 Z
+date: 2024-06-07 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: faraday