PyPI - cartography-client - Versions diffs - 0.0.1__py3-none-any.whl - Mend

cartography-client 0.0.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of cartography-client might be problematic. Click here for more details.

Files changed (70)

cartography/__init__.py +100 -0
cartography/_base_client.py +1995 -0
cartography/_client.py +444 -0
cartography/_compat.py +219 -0
cartography/_constants.py +14 -0
cartography/_exceptions.py +108 -0
cartography/_files.py +123 -0
cartography/_models.py +829 -0
cartography/_qs.py +150 -0
cartography/_resource.py +43 -0
cartography/_response.py +832 -0
cartography/_streaming.py +333 -0
cartography/_types.py +219 -0
cartography/_utils/__init__.py +57 -0
cartography/_utils/_logs.py +25 -0
cartography/_utils/_proxy.py +65 -0
cartography/_utils/_reflection.py +42 -0
cartography/_utils/_resources_proxy.py +24 -0
cartography/_utils/_streams.py +12 -0
cartography/_utils/_sync.py +86 -0
cartography/_utils/_transform.py +447 -0
cartography/_utils/_typing.py +151 -0
cartography/_utils/_utils.py +422 -0
cartography/_version.py +4 -0
cartography/lib/.keep +4 -0
cartography/py.typed +0 -0
cartography/resources/__init__.py +89 -0
cartography/resources/api_info.py +135 -0
cartography/resources/crawl.py +279 -0
cartography/resources/download.py +376 -0
cartography/resources/health.py +143 -0
cartography/resources/scrape.py +331 -0
cartography/resources/workflows/__init__.py +33 -0
cartography/resources/workflows/request/__init__.py +33 -0
cartography/resources/workflows/request/crawl.py +295 -0
cartography/resources/workflows/request/request.py +221 -0
cartography/resources/workflows/workflows.py +274 -0
cartography/types/__init__.py +23 -0
cartography/types/api_info_retrieve_response.py +8 -0
cartography/types/bulk_download_result.py +23 -0
cartography/types/bulk_scrape_result.py +19 -0
cartography/types/crawl_create_graph_params.py +46 -0
cartography/types/crawl_create_graph_response.py +37 -0
cartography/types/download_create_bulk_params.py +37 -0
cartography/types/download_create_bulk_response.py +41 -0
cartography/types/download_create_single_params.py +32 -0
cartography/types/download_create_single_response.py +21 -0
cartography/types/downloader_type.py +7 -0
cartography/types/health_check_response.py +8 -0
cartography/types/scrape_engine_param.py +28 -0
cartography/types/scrape_scrape_bulk_params.py +33 -0
cartography/types/scrape_scrape_bulk_response.py +41 -0
cartography/types/scrape_scrape_single_params.py +17 -0
cartography/types/scrape_scrape_single_response.py +23 -0
cartography/types/wait_until.py +7 -0
cartography/types/workflow_describe_response.py +8 -0
cartography/types/workflow_results_response.py +8 -0
cartography/types/workflows/__init__.py +6 -0
cartography/types/workflows/request/__init__.py +9 -0
cartography/types/workflows/request/crawl_create_bulk_params.py +14 -0
cartography/types/workflows/request/crawl_create_bulk_response.py +22 -0
cartography/types/workflows/request/crawl_create_params.py +32 -0
cartography/types/workflows/request/crawl_request_param.py +32 -0
cartography/types/workflows/request/workflow_result.py +11 -0
cartography/types/workflows/request_create_download_params.py +18 -0
cartography/types/workflows/request_create_download_response.py +8 -0
cartography_client-0.0.1.dist-info/METADATA +399 -0
cartography_client-0.0.1.dist-info/RECORD +70 -0
cartography_client-0.0.1.dist-info/WHEEL +4 -0
cartography_client-0.0.1.dist-info/licenses/LICENSE +201 -0

cartography/resources/download.py ADDED Viewed

@@ -0,0 +1,376 @@
+# File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
+from __future__ import annotations
+from typing import List, Optional
+import httpx
+from ..types import WaitUntil, DownloaderType, download_create_bulk_params, download_create_single_params
+from .._types import NOT_GIVEN, Body, Query, Headers, NotGiven
+from .._utils import maybe_transform, async_maybe_transform
+from .._compat import cached_property
+from .._resource import SyncAPIResource, AsyncAPIResource
+from .._response import (
+    to_raw_response_wrapper,
+    to_streamed_response_wrapper,
+    async_to_raw_response_wrapper,
+    async_to_streamed_response_wrapper,
+)
+from .._base_client import make_request_options
+from ..types.wait_until import WaitUntil
+from ..types.downloader_type import DownloaderType
+from ..types.download_create_bulk_response import DownloadCreateBulkResponse
+from ..types.download_create_single_response import DownloadCreateSingleResponse
+# Public names of this module: the synchronous and asynchronous download resources.
+__all__ = ["DownloadResource", "AsyncDownloadResource"]
+class DownloadResource(SyncAPIResource):
+    @cached_property
+    def with_raw_response(self) -> DownloadResourceWithRawResponse:
+        """
+        This property can be used as a prefix for any HTTP method call to return
+        the raw response object instead of the parsed content.
+        For more information, see https://www.github.com/evrimai/cartography-client#accessing-raw-response-data-eg-headers
+        """
+        return DownloadResourceWithRawResponse(self)
+    @cached_property
+    def with_streaming_response(self) -> DownloadResourceWithStreamingResponse:
+        """
+        An alternative to `.with_raw_response` that doesn't eagerly read the response body.
+        For more information, see https://www.github.com/evrimai/cartography-client#with_streaming_response
+        """
+        return DownloadResourceWithStreamingResponse(self)
+    def create_bulk(
+        self,
+        *,
+        crawl_id: str,
+        s3_bucket: str,
+        urls: List[str],
+        batch_size: int | NotGiven = NOT_GIVEN,
+        debug: bool | NotGiven = NOT_GIVEN,
+        downloader_type: DownloaderType | NotGiven = NOT_GIVEN,
+        max_workers: int | NotGiven = NOT_GIVEN,
+        wait_until: WaitUntil | NotGiven = NOT_GIVEN,
+        # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
+        # The extra values given here take precedence over values defined on the client or passed to this method.
+        extra_headers: Headers | None = None,
+        extra_query: Query | None = None,
+        extra_body: Body | None = None,
+        timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
+    ) -> DownloadCreateBulkResponse:
+        """
+        Bulk download multiple files with checkpointing to S3
+        Requires permission: download:write
+        Args:
+          crawl_id: Unique identifier for this crawl
+          s3_bucket: S3 bucket for storage and checkpoints
+          urls: List of URLs to download
+          batch_size: URLs per batch
+          debug: Enable debug information
+          downloader_type: Available downloader types
+          max_workers: Maximum concurrent workers
+          wait_until: When to consider downloads complete
+          extra_headers: Send extra headers
+          extra_query: Add additional query parameters to the request
+          extra_body: Add additional JSON properties to the request
+          timeout: Override the client-level default timeout for this request, in seconds
+        """
+        return self._post(
+            "/download/bulk",
+            body=maybe_transform(
+                {
+                    "crawl_id": crawl_id,
+                    "s3_bucket": s3_bucket,
+                    "urls": urls,
+                    "batch_size": batch_size,
+                    "debug": debug,
+                    "downloader_type": downloader_type,
+                    "max_workers": max_workers,
+                    "wait_until": wait_until,
+                },
+                download_create_bulk_params.DownloadCreateBulkParams,
+            ),
+            options=make_request_options(
+                extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
+            ),
+            cast_to=DownloadCreateBulkResponse,
+        )
+    def create_single(
+        self,
+        *,
+        s3_bucket: str,
+        url: str,
+        downloader_type: DownloaderType | NotGiven = NOT_GIVEN,
+        s3_key: Optional[str] | NotGiven = NOT_GIVEN,
+        api_timeout: int | NotGiven = NOT_GIVEN,
+        wait_until: WaitUntil | NotGiven = NOT_GIVEN,
+        # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
+        # The extra values given here take precedence over values defined on the client or passed to this method.
+        extra_headers: Headers | None = None,
+        extra_query: Query | None = None,
+        extra_body: Body | None = None,
+        timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
+    ) -> DownloadCreateSingleResponse:
+        """
+        Download a single file to S3
+        Requires permission: download:write
+        Args:
+          s3_bucket: S3 bucket for storage
+          url: URL to download
+          downloader_type: Available downloader types
+          s3_key: S3 key for the file
+          api_timeout: Timeout in milliseconds
+          wait_until: When to consider download complete
+          extra_headers: Send extra headers
+          extra_query: Add additional query parameters to the request
+          extra_body: Add additional JSON properties to the request
+          timeout: Override the client-level default timeout for this request, in seconds
+        """
+        return self._post(
+            "/download/single",
+            body=maybe_transform(
+                {
+                    "s3_bucket": s3_bucket,
+                    "url": url,
+                    "downloader_type": downloader_type,
+                    "s3_key": s3_key,
+                    "api_timeout": api_timeout,
+                    "wait_until": wait_until,
+                },
+                download_create_single_params.DownloadCreateSingleParams,
+            ),
+            options=make_request_options(
+                extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
+            ),
+            cast_to=DownloadCreateSingleResponse,
+        )
+class AsyncDownloadResource(AsyncAPIResource):
+    @cached_property
+    def with_raw_response(self) -> AsyncDownloadResourceWithRawResponse:
+        """
+        This property can be used as a prefix for any HTTP method call to return
+        the raw response object instead of the parsed content.
+        For more information, see https://www.github.com/evrimai/cartography-client#accessing-raw-response-data-eg-headers
+        """
+        return AsyncDownloadResourceWithRawResponse(self)
+    @cached_property
+    def with_streaming_response(self) -> AsyncDownloadResourceWithStreamingResponse:
+        """
+        An alternative to `.with_raw_response` that doesn't eagerly read the response body.
+        For more information, see https://www.github.com/evrimai/cartography-client#with_streaming_response
+        """
+        return AsyncDownloadResourceWithStreamingResponse(self)
+    async def create_bulk(
+        self,
+        *,
+        crawl_id: str,
+        s3_bucket: str,
+        urls: List[str],
+        batch_size: int | NotGiven = NOT_GIVEN,
+        debug: bool | NotGiven = NOT_GIVEN,
+        downloader_type: DownloaderType | NotGiven = NOT_GIVEN,
+        max_workers: int | NotGiven = NOT_GIVEN,
+        wait_until: WaitUntil | NotGiven = NOT_GIVEN,
+        # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
+        # The extra values given here take precedence over values defined on the client or passed to this method.
+        extra_headers: Headers | None = None,
+        extra_query: Query | None = None,
+        extra_body: Body | None = None,
+        timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
+    ) -> DownloadCreateBulkResponse:
+        """
+        Bulk download multiple files with checkpointing to S3
+        Requires permission: download:write
+        Args:
+          crawl_id: Unique identifier for this crawl
+          s3_bucket: S3 bucket for storage and checkpoints
+          urls: List of URLs to download
+          batch_size: URLs per batch
+          debug: Enable debug information
+          downloader_type: Available downloader types
+          max_workers: Maximum concurrent workers
+          wait_until: When to consider downloads complete
+          extra_headers: Send extra headers
+          extra_query: Add additional query parameters to the request
+          extra_body: Add additional JSON properties to the request
+          timeout: Override the client-level default timeout for this request, in seconds
+        """
+        return await self._post(
+            "/download/bulk",
+            body=await async_maybe_transform(
+                {
+                    "crawl_id": crawl_id,
+                    "s3_bucket": s3_bucket,
+                    "urls": urls,
+                    "batch_size": batch_size,
+                    "debug": debug,
+                    "downloader_type": downloader_type,
+                    "max_workers": max_workers,
+                    "wait_until": wait_until,
+                },
+                download_create_bulk_params.DownloadCreateBulkParams,
+            ),
+            options=make_request_options(
+                extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
+            ),
+            cast_to=DownloadCreateBulkResponse,
+        )
+    async def create_single(
+        self,
+        *,
+        s3_bucket: str,
+        url: str,
+        downloader_type: DownloaderType | NotGiven = NOT_GIVEN,
+        s3_key: Optional[str] | NotGiven = NOT_GIVEN,
+        api_timeout: int | NotGiven = NOT_GIVEN,
+        wait_until: WaitUntil | NotGiven = NOT_GIVEN,
+        # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
+        # The extra values given here take precedence over values defined on the client or passed to this method.
+        extra_headers: Headers | None = None,
+        extra_query: Query | None = None,
+        extra_body: Body | None = None,
+        timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
+    ) -> DownloadCreateSingleResponse:
+        """
+        Download a single file to S3
+        Requires permission: download:write
+        Args:
+          s3_bucket: S3 bucket for storage
+          url: URL to download
+          downloader_type: Available downloader types
+          s3_key: S3 key for the file
+          api_timeout: Timeout in milliseconds
+          wait_until: When to consider download complete
+          extra_headers: Send extra headers
+          extra_query: Add additional query parameters to the request
+          extra_body: Add additional JSON properties to the request
+          timeout: Override the client-level default timeout for this request, in seconds
+        """
+        return await self._post(
+            "/download/single",
+            body=await async_maybe_transform(
+                {
+                    "s3_bucket": s3_bucket,
+                    "url": url,
+                    "downloader_type": downloader_type,
+                    "s3_key": s3_key,
+                    "api_timeout": api_timeout,
+                    "wait_until": wait_until,
+                },
+                download_create_single_params.DownloadCreateSingleParams,
+            ),
+            options=make_request_options(
+                extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
+            ),
+            cast_to=DownloadCreateSingleResponse,
+        )
+class DownloadResourceWithRawResponse:
+    def __init__(self, download: DownloadResource) -> None:
+        self._download = download
+        self.create_bulk = to_raw_response_wrapper(
+            download.create_bulk,
+        )
+        self.create_single = to_raw_response_wrapper(
+            download.create_single,
+        )
+class AsyncDownloadResourceWithRawResponse:
+    def __init__(self, download: AsyncDownloadResource) -> None:
+        self._download = download
+        self.create_bulk = async_to_raw_response_wrapper(
+            download.create_bulk,
+        )
+        self.create_single = async_to_raw_response_wrapper(
+            download.create_single,
+        )
+class DownloadResourceWithStreamingResponse:
+    def __init__(self, download: DownloadResource) -> None:
+        self._download = download
+        self.create_bulk = to_streamed_response_wrapper(
+            download.create_bulk,
+        )
+        self.create_single = to_streamed_response_wrapper(
+            download.create_single,
+        )
+class AsyncDownloadResourceWithStreamingResponse:
+    def __init__(self, download: AsyncDownloadResource) -> None:
+        self._download = download
+        self.create_bulk = async_to_streamed_response_wrapper(
+            download.create_bulk,
+        )
+        self.create_single = async_to_streamed_response_wrapper(
+            download.create_single,
+        )

cartography/resources/health.py ADDED Viewed

@@ -0,0 +1,143 @@
+# File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
+from __future__ import annotations
+import httpx
+from .._types import NOT_GIVEN, Body, Query, Headers, NotGiven
+from .._compat import cached_property
+from .._resource import SyncAPIResource, AsyncAPIResource
+from .._response import (
+    to_raw_response_wrapper,
+    to_streamed_response_wrapper,
+    async_to_raw_response_wrapper,
+    async_to_streamed_response_wrapper,
+)
+from .._base_client import make_request_options
+from ..types.health_check_response import HealthCheckResponse
+# Public names of this module: the synchronous and asynchronous health resources.
+__all__ = ["HealthResource", "AsyncHealthResource"]
+class HealthResource(SyncAPIResource):
+    @cached_property
+    def with_raw_response(self) -> HealthResourceWithRawResponse:
+        """
+        This property can be used as a prefix for any HTTP method call to return
+        the raw response object instead of the parsed content.
+        For more information, see https://www.github.com/evrimai/cartography-client#accessing-raw-response-data-eg-headers
+        """
+        return HealthResourceWithRawResponse(self)
+    @cached_property
+    def with_streaming_response(self) -> HealthResourceWithStreamingResponse:
+        """
+        An alternative to `.with_raw_response` that doesn't eagerly read the response body.
+        For more information, see https://www.github.com/evrimai/cartography-client#with_streaming_response
+        """
+        return HealthResourceWithStreamingResponse(self)
+    def check(
+        self,
+        *,
+        # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
+        # The extra values given here take precedence over values defined on the client or passed to this method.
+        extra_headers: Headers | None = None,
+        extra_query: Query | None = None,
+        extra_body: Body | None = None,
+        timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
+    ) -> HealthCheckResponse:
+        """
+        Health check endpoint
+        Returns server status and basic information
+        """
+        return self._get(
+            "/health/",
+            options=make_request_options(
+                extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
+            ),
+            cast_to=HealthCheckResponse,
+        )
+class AsyncHealthResource(AsyncAPIResource):
+    @cached_property
+    def with_raw_response(self) -> AsyncHealthResourceWithRawResponse:
+        """
+        This property can be used as a prefix for any HTTP method call to return
+        the raw response object instead of the parsed content.
+        For more information, see https://www.github.com/evrimai/cartography-client#accessing-raw-response-data-eg-headers
+        """
+        return AsyncHealthResourceWithRawResponse(self)
+    @cached_property
+    def with_streaming_response(self) -> AsyncHealthResourceWithStreamingResponse:
+        """
+        An alternative to `.with_raw_response` that doesn't eagerly read the response body.
+        For more information, see https://www.github.com/evrimai/cartography-client#with_streaming_response
+        """
+        return AsyncHealthResourceWithStreamingResponse(self)
+    async def check(
+        self,
+        *,
+        # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
+        # The extra values given here take precedence over values defined on the client or passed to this method.
+        extra_headers: Headers | None = None,
+        extra_query: Query | None = None,
+        extra_body: Body | None = None,
+        timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
+    ) -> HealthCheckResponse:
+        """
+        Health check endpoint
+        Returns server status and basic information
+        """
+        return await self._get(
+            "/health/",
+            options=make_request_options(
+                extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
+            ),
+            cast_to=HealthCheckResponse,
+        )
+class HealthResourceWithRawResponse:
+    def __init__(self, health: HealthResource) -> None:
+        self._health = health
+        self.check = to_raw_response_wrapper(
+            health.check,
+        )
+class AsyncHealthResourceWithRawResponse:
+    def __init__(self, health: AsyncHealthResource) -> None:
+        self._health = health
+        self.check = async_to_raw_response_wrapper(
+            health.check,
+        )
+class HealthResourceWithStreamingResponse:
+    def __init__(self, health: HealthResource) -> None:
+        self._health = health
+        self.check = to_streamed_response_wrapper(
+            health.check,
+        )
+class AsyncHealthResourceWithStreamingResponse:
+    def __init__(self, health: AsyncHealthResource) -> None:
+        self._health = health
+        self.check = async_to_streamed_response_wrapper(
+            health.check,
+        )