classifyre-cli 0.4.33__tar.gz → 0.4.35__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/.gitignore +3 -0
- classifyre_cli-0.4.35/.turbo/turbo-build.log +3 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/PKG-INFO +1 -1
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/package.json +1 -1
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/pyproject.toml +33 -1
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/models/generated_input.py +804 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/outputs/rest.py +1 -3
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/base.py +1 -3
- classifyre_cli-0.4.35/src/sources/delta_lake/__init__.py +3 -0
- classifyre_cli-0.4.35/src/sources/delta_lake/source.py +139 -0
- classifyre_cli-0.4.35/src/sources/elasticsearch/__init__.py +3 -0
- classifyre_cli-0.4.35/src/sources/elasticsearch/source.py +31 -0
- classifyre_cli-0.4.35/src/sources/hudi/__init__.py +3 -0
- classifyre_cli-0.4.35/src/sources/hudi/source.py +98 -0
- classifyre_cli-0.4.35/src/sources/iceberg/__init__.py +3 -0
- classifyre_cli-0.4.35/src/sources/iceberg/source.py +148 -0
- classifyre_cli-0.4.35/src/sources/kafka/__init__.py +3 -0
- classifyre_cli-0.4.35/src/sources/kafka/source.py +362 -0
- classifyre_cli-0.4.35/src/sources/meilisearch/__init__.py +3 -0
- classifyre_cli-0.4.35/src/sources/meilisearch/source.py +353 -0
- classifyre_cli-0.4.35/src/sources/opensearch/__init__.py +3 -0
- classifyre_cli-0.4.35/src/sources/opensearch/source.py +32 -0
- classifyre_cli-0.4.35/src/sources/search_engine_base.py +345 -0
- classifyre_cli-0.4.35/src/sources/spark_base.py +413 -0
- classifyre_cli-0.4.35/src/sources/spark_catalog/__init__.py +3 -0
- classifyre_cli-0.4.35/src/sources/spark_catalog/source.py +93 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/tabular_base.py +4 -1
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/utils/dependency_groups.py +5 -0
- classifyre_cli-0.4.35/src/utils/spark_runtime.py +56 -0
- classifyre_cli-0.4.35/tests/_spark_fakes.py +125 -0
- classifyre_cli-0.4.35/tests/test_delta_lake_source.py +96 -0
- classifyre_cli-0.4.35/tests/test_elasticsearch_source.py +238 -0
- classifyre_cli-0.4.35/tests/test_hudi_source.py +72 -0
- classifyre_cli-0.4.35/tests/test_iceberg_source.py +95 -0
- classifyre_cli-0.4.35/tests/test_kafka_source.py +192 -0
- classifyre_cli-0.4.35/tests/test_meilisearch_source.py +255 -0
- classifyre_cli-0.4.35/tests/test_opensearch_source.py +228 -0
- classifyre_cli-0.4.35/tests/test_spark_catalog_source.py +71 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/uv.lock +851 -689
- classifyre_cli-0.4.33/.turbo/turbo-build.log +0 -3
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/.python-version +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/README.md +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/main.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/scripts/generate_models.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/config.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/base.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/broken_links/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/broken_links/detector.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/config.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/content/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/custom/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/custom/detector.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/custom/extractor.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/custom/runners/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/custom/runners/_base.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/custom/runners/_factory.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/custom/runners/_feature_extraction.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/custom/runners/_gliner2.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/custom/runners/_image_classification.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/custom/runners/_llm.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/custom/runners/_object_detection.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/custom/runners/_regex.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/custom/runners/_text_classification.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/custom/trainer.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/dependencies.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/pii/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/pii/detector.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/secrets/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/secrets/detector.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/threat/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/threat/code_security_detector.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/detectors/threat/yara_detector.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/main.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/models/generated_detectors.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/models/generated_single_asset_scan_results.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/outputs/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/outputs/base.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/outputs/console.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/outputs/factory.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/outputs/file.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/pipeline/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/pipeline/content_provider.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/pipeline/detector_pipeline.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/pipeline/parsed_content_provider.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/pipeline/worker_pool.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sandbox/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sandbox/runner.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/asset_metadata.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/atlassian_common.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/azure_blob_storage/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/azure_blob_storage/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/confluence/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/confluence/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/databricks/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/databricks/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/dependencies.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/email/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/email/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/google_cloud_storage/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/google_cloud_storage/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/hive/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/hive/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/jira/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/jira/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/mongodb/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/mongodb/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/mssql/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/mssql/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/mysql/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/mysql/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/neo4j/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/neo4j/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/notion/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/notion/client.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/notion/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/object_storage/base.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/oracle/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/oracle/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/postgresql/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/postgresql/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/powerbi/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/powerbi/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/recipe_normalizer.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/s3_compatible_storage/README.md +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/s3_compatible_storage/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/s3_compatible_storage/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/servicedesk/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/servicedesk/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/slack/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/slack/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/snowflake/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/snowflake/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/sqlite/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/sqlite/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/tableau/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/tableau/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/tabular_utils.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/wordpress/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/wordpress/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/youtube/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/sources/youtube/source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/telemetry.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/utils/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/utils/content_extraction.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/utils/embedded_images.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/utils/file_metadata.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/utils/file_parser.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/utils/file_to_images.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/utils/hashing.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/utils/resources.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/utils/transcription.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/utils/uv_sync.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/src/utils/validation.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/conftest.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/broken_links/test_broken_links_detector.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/conftest.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/content/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/custom/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/custom/conftest.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/custom/test_invoice_extraction.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/custom/test_llm_runner.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/custom/test_pipeline_integration.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/custom/test_regex_runner.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/custom/test_transformer_runners.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/pii/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/pii/conftest.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/pii/sample_invoice.pdf +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/pii/test_pii_detector.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/pii/test_pii_detector_extended.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/secrets/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/secrets/test_secrets_detector.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/secrets/test_secrets_detector_extended.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/test_base_detector.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/test_custom_detector_examples_runtime.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/test_detector_catalog_commercial.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/test_detector_pipeline_types.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/test_detector_schema_examples.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/test_detector_types.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/test_phase2_detectors.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/test_registry.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/threat/__init__.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/threat/test_code_security_detector.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/detectors/threat/test_yara_detector.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/integration/test_wordpress_broken_links_detector.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/integration/test_wordpress_links_assets.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/pipeline/test_detector_pipeline.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/pipeline/test_worker_pool.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_assets_metadata_catalog.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_azure_blob_storage_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_base_source_attachment.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_base_source_sampling.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_config.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_confluence_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_custom_extractor.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_databricks_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_dependency_groups.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_email_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_google_cloud_storage_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_hashing.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_hive_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_jira_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_mongodb_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_mssql_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_mysql_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_neo4j_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_notion_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_oracle_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_outputs.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_postgresql_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_powerbi_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_recipe_normalizer.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_s3_compatible_storage_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_sampling_automatic.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_sandbox_runner.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_servicedesk_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_slack_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_snowflake_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_source_dependency_groups.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_sqlite_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_tableau_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_tabular_automatic_sampling.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_tabular_utils.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_uv_sync.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_wordpress_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_youtube_source.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/test_youtube_source_integration.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/utils/test_content_extraction.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/utils/test_embedded_images.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/utils/test_file_metadata.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/utils/test_file_parser.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/utils/test_file_to_images.py +0 -0
- {classifyre_cli-0.4.33 → classifyre_cli-0.4.35}/tests/utils/test_transcription.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
[project]
|
|
2
2
|
name = "classifyre-cli"
|
|
3
|
-
version = "0.4.33"
|
|
3
|
+
version = "0.4.35"
|
|
4
4
|
description = "Classifyre CLI — scan and classify unstructured data sources"
|
|
5
5
|
readme = "README.md"
|
|
6
6
|
requires-python = ">=3.12"
|
|
@@ -202,6 +202,38 @@ youtube = [
|
|
|
202
202
|
"yt-dlp>=2025.1.0",
|
|
203
203
|
"youtube-transcript-api>=1.0.0",
|
|
204
204
|
]
|
|
205
|
+
spark = [
|
|
206
|
+
# Shared PySpark runtime for the lakehouse sources. Requires a JDK (Java 21
|
|
207
|
+
# LTS) on the host; format JARs (Delta/Iceberg/Hudi) are resolved at runtime
|
|
208
|
+
# via spark.jars.packages (see SPARK_* env vars). Pinned to the Spark 4.1
|
|
209
|
+
# minor so the format-JAR coordinates below stay version-matched.
|
|
210
|
+
#
|
|
211
|
+
# The `connect` extra pulls in pandas>=2.2, pyarrow, and grpcio, which the
|
|
212
|
+
# Spark Connect client (Spark Catalog via sc:// URLs) hard-requires at session
|
|
213
|
+
# build time. Classic/local Spark (Delta/Hudi/Iceberg) does not need them, but
|
|
214
|
+
# they share this group, so we ship the client deps once for all of them.
|
|
215
|
+
"pyspark[connect]>=4.1,<4.2",
|
|
216
|
+
]
|
|
217
|
+
delta-lake = [
|
|
218
|
+
{ include-group = "spark" },
|
|
219
|
+
"delta-spark>=4.0",
|
|
220
|
+
]
|
|
221
|
+
hudi = [
|
|
222
|
+
# Hudi Spark integration ships as Maven JARs configured via
|
|
223
|
+
# SPARK_JARS_PACKAGES; only the shared PySpark runtime is needed here.
|
|
224
|
+
{ include-group = "spark" },
|
|
225
|
+
]
|
|
226
|
+
spark-catalog = [
|
|
227
|
+
{ include-group = "spark" },
|
|
228
|
+
]
|
|
229
|
+
iceberg = [
|
|
230
|
+
# Inspected through Spark (iceberg-spark-runtime JARs via SPARK_JARS_PACKAGES),
|
|
231
|
+
# sharing the JVM the other lakehouse sources already require.
|
|
232
|
+
{ include-group = "spark" },
|
|
233
|
+
]
|
|
234
|
+
kafka = [
|
|
235
|
+
"kafka-python>=2.0",
|
|
236
|
+
]
|
|
205
237
|
otel = [
|
|
206
238
|
"opentelemetry-sdk>=1.42.0",
|
|
207
239
|
"opentelemetry-exporter-otlp-proto-http>=1.27.0",
|