openmetadata-ingestion 1.5.4.1__py3-none-any.whl → 1.5.6.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of openmetadata-ingestion might be problematic. Click here for more details.
- metadata/data_quality/validations/runtime_param_setter/table_diff_params_setter.py +2 -1
- metadata/examples/workflows/salesforce.yaml +1 -0
- metadata/generated/schema/analytics/__init__.py +1 -1
- metadata/generated/schema/analytics/basic.py +1 -1
- metadata/generated/schema/analytics/reportData.py +1 -1
- metadata/generated/schema/analytics/reportDataType/__init__.py +1 -1
- metadata/generated/schema/analytics/reportDataType/aggregatedCostAnalysisReportData.py +1 -1
- metadata/generated/schema/analytics/reportDataType/entityReportData.py +1 -1
- metadata/generated/schema/analytics/reportDataType/rawCostAnalysisReportData.py +1 -1
- metadata/generated/schema/analytics/reportDataType/webAnalyticEntityViewReportData.py +1 -1
- metadata/generated/schema/analytics/reportDataType/webAnalyticUserActivityReportData.py +1 -1
- metadata/generated/schema/analytics/webAnalyticEvent.py +1 -1
- metadata/generated/schema/analytics/webAnalyticEventData.py +1 -1
- metadata/generated/schema/analytics/webAnalyticEventType/__init__.py +1 -1
- metadata/generated/schema/analytics/webAnalyticEventType/customEvent.py +1 -1
- metadata/generated/schema/analytics/webAnalyticEventType/pageViewEvent.py +1 -1
- metadata/generated/schema/api/__init__.py +1 -1
- metadata/generated/schema/api/addGlossaryToAssetsRequest.py +1 -1
- metadata/generated/schema/api/analytics/__init__.py +1 -1
- metadata/generated/schema/api/analytics/createWebAnalyticEvent.py +1 -1
- metadata/generated/schema/api/automations/__init__.py +1 -1
- metadata/generated/schema/api/automations/createWorkflow.py +1 -1
- metadata/generated/schema/api/bulkAssets.py +1 -1
- metadata/generated/schema/api/classification/__init__.py +1 -1
- metadata/generated/schema/api/classification/createClassification.py +1 -1
- metadata/generated/schema/api/classification/createTag.py +1 -1
- metadata/generated/schema/api/classification/loadTags.py +1 -1
- metadata/generated/schema/api/createBot.py +1 -1
- metadata/generated/schema/api/createEventPublisherJob.py +1 -1
- metadata/generated/schema/api/createType.py +1 -1
- metadata/generated/schema/api/data/__init__.py +1 -1
- metadata/generated/schema/api/data/createAPICollection.py +1 -1
- metadata/generated/schema/api/data/createAPIEndpoint.py +1 -1
- metadata/generated/schema/api/data/createChart.py +1 -1
- metadata/generated/schema/api/data/createContainer.py +1 -1
- metadata/generated/schema/api/data/createCustomProperty.py +1 -1
- metadata/generated/schema/api/data/createDashboard.py +1 -1
- metadata/generated/schema/api/data/createDashboardDataModel.py +1 -1
- metadata/generated/schema/api/data/createDatabase.py +1 -1
- metadata/generated/schema/api/data/createDatabaseSchema.py +1 -1
- metadata/generated/schema/api/data/createGlossary.py +1 -1
- metadata/generated/schema/api/data/createGlossaryTerm.py +1 -1
- metadata/generated/schema/api/data/createMlModel.py +1 -1
- metadata/generated/schema/api/data/createPipeline.py +1 -1
- metadata/generated/schema/api/data/createQuery.py +1 -1
- metadata/generated/schema/api/data/createSearchIndex.py +1 -1
- metadata/generated/schema/api/data/createStoredProcedure.py +1 -1
- metadata/generated/schema/api/data/createTable.py +1 -1
- metadata/generated/schema/api/data/createTableProfile.py +1 -1
- metadata/generated/schema/api/data/createTopic.py +1 -1
- metadata/generated/schema/api/data/loadGlossary.py +1 -1
- metadata/generated/schema/api/data/restoreEntity.py +1 -1
- metadata/generated/schema/api/dataInsight/__init__.py +1 -1
- metadata/generated/schema/api/dataInsight/createDataInsightChart.py +1 -1
- metadata/generated/schema/api/dataInsight/custom/__init__.py +1 -1
- metadata/generated/schema/api/dataInsight/custom/createDataInsightCustomChart.py +1 -1
- metadata/generated/schema/api/dataInsight/kpi/__init__.py +1 -1
- metadata/generated/schema/api/dataInsight/kpi/createKpiRequest.py +1 -1
- metadata/generated/schema/api/docStore/__init__.py +1 -1
- metadata/generated/schema/api/docStore/createDocument.py +1 -1
- metadata/generated/schema/api/domains/__init__.py +1 -1
- metadata/generated/schema/api/domains/createDataProduct.py +1 -1
- metadata/generated/schema/api/domains/createDomain.py +1 -1
- metadata/generated/schema/api/feed/__init__.py +1 -1
- metadata/generated/schema/api/feed/closeTask.py +1 -1
- metadata/generated/schema/api/feed/createPost.py +1 -1
- metadata/generated/schema/api/feed/createSuggestion.py +1 -1
- metadata/generated/schema/api/feed/createThread.py +1 -1
- metadata/generated/schema/api/feed/resolveTask.py +1 -1
- metadata/generated/schema/api/feed/threadCount.py +1 -1
- metadata/generated/schema/api/lineage/__init__.py +1 -1
- metadata/generated/schema/api/lineage/addLineage.py +1 -1
- metadata/generated/schema/api/openMetadataServerVersion.py +1 -1
- metadata/generated/schema/api/policies/__init__.py +1 -1
- metadata/generated/schema/api/policies/createPolicy.py +1 -1
- metadata/generated/schema/api/services/__init__.py +1 -1
- metadata/generated/schema/api/services/createApiService.py +1 -1
- metadata/generated/schema/api/services/createDashboardService.py +1 -1
- metadata/generated/schema/api/services/createDatabaseService.py +1 -1
- metadata/generated/schema/api/services/createMessagingService.py +1 -1
- metadata/generated/schema/api/services/createMetadataService.py +1 -1
- metadata/generated/schema/api/services/createMlModelService.py +1 -1
- metadata/generated/schema/api/services/createPipelineService.py +1 -1
- metadata/generated/schema/api/services/createSearchService.py +1 -1
- metadata/generated/schema/api/services/createStorageService.py +1 -1
- metadata/generated/schema/api/services/ingestionPipelines/__init__.py +1 -1
- metadata/generated/schema/api/services/ingestionPipelines/createIngestionPipeline.py +1 -1
- metadata/generated/schema/api/setOwner.py +1 -1
- metadata/generated/schema/api/teams/__init__.py +1 -1
- metadata/generated/schema/api/teams/createPersona.py +1 -1
- metadata/generated/schema/api/teams/createRole.py +1 -1
- metadata/generated/schema/api/teams/createTeam.py +1 -1
- metadata/generated/schema/api/teams/createUser.py +1 -1
- metadata/generated/schema/api/tests/__init__.py +1 -1
- metadata/generated/schema/api/tests/createCustomMetric.py +1 -1
- metadata/generated/schema/api/tests/createLogicalTestCases.py +1 -1
- metadata/generated/schema/api/tests/createTestCase.py +1 -1
- metadata/generated/schema/api/tests/createTestCaseResolutionStatus.py +1 -1
- metadata/generated/schema/api/tests/createTestDefinition.py +1 -1
- metadata/generated/schema/api/tests/createTestSuite.py +1 -1
- metadata/generated/schema/api/voteRequest.py +1 -1
- metadata/generated/schema/auth/__init__.py +1 -1
- metadata/generated/schema/auth/basicAuth.py +1 -1
- metadata/generated/schema/auth/basicLoginRequest.py +1 -1
- metadata/generated/schema/auth/changePasswordRequest.py +1 -1
- metadata/generated/schema/auth/createPersonalToken.py +1 -1
- metadata/generated/schema/auth/emailRequest.py +1 -1
- metadata/generated/schema/auth/emailVerificationToken.py +1 -1
- metadata/generated/schema/auth/generateToken.py +1 -1
- metadata/generated/schema/auth/jwtAuth.py +1 -1
- metadata/generated/schema/auth/loginRequest.py +1 -1
- metadata/generated/schema/auth/logoutRequest.py +1 -1
- metadata/generated/schema/auth/passwordResetRequest.py +1 -1
- metadata/generated/schema/auth/passwordResetToken.py +1 -1
- metadata/generated/schema/auth/personalAccessToken.py +1 -1
- metadata/generated/schema/auth/refreshToken.py +1 -1
- metadata/generated/schema/auth/registrationRequest.py +1 -1
- metadata/generated/schema/auth/revokePersonalToken.py +1 -1
- metadata/generated/schema/auth/revokeToken.py +1 -1
- metadata/generated/schema/auth/serviceTokenEnum.py +1 -1
- metadata/generated/schema/auth/ssoAuth.py +1 -1
- metadata/generated/schema/auth/tokenRefreshRequest.py +1 -1
- metadata/generated/schema/configuration/__init__.py +1 -1
- metadata/generated/schema/configuration/appsPrivateConfiguration.py +1 -1
- metadata/generated/schema/configuration/authConfig.py +1 -1
- metadata/generated/schema/configuration/authenticationConfiguration.py +1 -1
- metadata/generated/schema/configuration/authorizerConfiguration.py +1 -1
- metadata/generated/schema/configuration/changeEventConfiguration.py +1 -1
- metadata/generated/schema/configuration/dataQualityConfiguration.py +1 -1
- metadata/generated/schema/configuration/elasticSearchConfiguration.py +1 -1
- metadata/generated/schema/configuration/eventHandlerConfiguration.py +1 -1
- metadata/generated/schema/configuration/fernetConfiguration.py +1 -1
- metadata/generated/schema/configuration/jwtTokenConfiguration.py +1 -1
- metadata/generated/schema/configuration/kafkaEventConfiguration.py +1 -1
- metadata/generated/schema/configuration/ldapConfiguration.py +1 -1
- metadata/generated/schema/configuration/ldapTrustStoreConfig/__init__.py +1 -1
- metadata/generated/schema/configuration/ldapTrustStoreConfig/customTrustManagerConfig.py +1 -1
- metadata/generated/schema/configuration/ldapTrustStoreConfig/hostNameConfig.py +1 -1
- metadata/generated/schema/configuration/ldapTrustStoreConfig/jvmDefaultConfig.py +1 -1
- metadata/generated/schema/configuration/ldapTrustStoreConfig/trustAllConfig.py +1 -1
- metadata/generated/schema/configuration/ldapTrustStoreConfig/truststoreConfig.py +1 -1
- metadata/generated/schema/configuration/limitsConfiguration.py +1 -1
- metadata/generated/schema/configuration/loginConfiguration.py +1 -1
- metadata/generated/schema/configuration/logoConfiguration.py +1 -1
- metadata/generated/schema/configuration/pipelineServiceClientConfiguration.py +1 -1
- metadata/generated/schema/configuration/profilerConfiguration.py +1 -1
- metadata/generated/schema/configuration/slackAppConfiguration.py +1 -1
- metadata/generated/schema/configuration/taskNotificationConfiguration.py +1 -1
- metadata/generated/schema/configuration/testResultNotificationConfiguration.py +1 -1
- metadata/generated/schema/configuration/themeConfiguration.py +1 -1
- metadata/generated/schema/configuration/uiThemePreference.py +1 -1
- metadata/generated/schema/dataInsight/__init__.py +1 -1
- metadata/generated/schema/dataInsight/custom/__init__.py +1 -1
- metadata/generated/schema/dataInsight/custom/dataInsightCustomChart.py +1 -1
- metadata/generated/schema/dataInsight/custom/dataInsightCustomChartResult.py +1 -1
- metadata/generated/schema/dataInsight/custom/dataInsightCustomChartResultList.py +1 -1
- metadata/generated/schema/dataInsight/custom/formulaHolder.py +1 -1
- metadata/generated/schema/dataInsight/custom/lineChart.py +1 -1
- metadata/generated/schema/dataInsight/custom/summaryCard.py +1 -1
- metadata/generated/schema/dataInsight/dataInsightChart.py +1 -1
- metadata/generated/schema/dataInsight/dataInsightChartResult.py +1 -1
- metadata/generated/schema/dataInsight/kpi/__init__.py +1 -1
- metadata/generated/schema/dataInsight/kpi/basic.py +1 -1
- metadata/generated/schema/dataInsight/kpi/kpi.py +1 -1
- metadata/generated/schema/dataInsight/type/__init__.py +1 -1
- metadata/generated/schema/dataInsight/type/aggregatedUnusedAssetsCount.py +1 -1
- metadata/generated/schema/dataInsight/type/aggregatedUnusedAssetsSize.py +1 -1
- metadata/generated/schema/dataInsight/type/aggregatedUsedVsUnusedAssetsCount.py +1 -1
- metadata/generated/schema/dataInsight/type/aggregatedUsedVsUnusedAssetsSize.py +1 -1
- metadata/generated/schema/dataInsight/type/dailyActiveUsers.py +1 -1
- metadata/generated/schema/dataInsight/type/mostActiveUsers.py +1 -1
- metadata/generated/schema/dataInsight/type/mostViewedEntities.py +1 -1
- metadata/generated/schema/dataInsight/type/pageViewsByEntities.py +1 -1
- metadata/generated/schema/dataInsight/type/unusedAssets.py +1 -1
- metadata/generated/schema/email/__init__.py +1 -1
- metadata/generated/schema/email/emailRequest.py +1 -1
- metadata/generated/schema/email/emailTemplate.py +1 -1
- metadata/generated/schema/email/emailTemplatePlaceholder.py +1 -1
- metadata/generated/schema/email/smtpSettings.py +1 -1
- metadata/generated/schema/email/templateValidationReponse.py +1 -1
- metadata/generated/schema/entity/__init__.py +1 -1
- metadata/generated/schema/entity/applications/__init__.py +1 -1
- metadata/generated/schema/entity/applications/app.py +1 -1
- metadata/generated/schema/entity/applications/appRunRecord.py +1 -1
- metadata/generated/schema/entity/applications/configuration/__init__.py +1 -1
- metadata/generated/schema/entity/applications/configuration/applicationConfig.py +1 -1
- metadata/generated/schema/entity/applications/configuration/external/__init__.py +1 -1
- metadata/generated/schema/entity/applications/configuration/external/automator/__init__.py +1 -1
- metadata/generated/schema/entity/applications/configuration/external/automator/addDescriptionAction.py +1 -1
- metadata/generated/schema/entity/applications/configuration/external/automator/addDomainAction.py +1 -1
- metadata/generated/schema/entity/applications/configuration/external/automator/addOwnerAction.py +1 -1
- metadata/generated/schema/entity/applications/configuration/external/automator/addTagsAction.py +1 -1
- metadata/generated/schema/entity/applications/configuration/external/automator/addTierAction.py +1 -1
- metadata/generated/schema/entity/applications/configuration/external/automator/lineagePropagationAction.py +1 -1
- metadata/generated/schema/entity/applications/configuration/external/automator/mlTaggingAction.py +1 -1
- metadata/generated/schema/entity/applications/configuration/external/automator/removeDescriptionAction.py +1 -1
- metadata/generated/schema/entity/applications/configuration/external/automator/removeDomainAction.py +1 -1
- metadata/generated/schema/entity/applications/configuration/external/automator/removeOwnerAction.py +1 -1
- metadata/generated/schema/entity/applications/configuration/external/automator/removeTagsAction.py +1 -1
- metadata/generated/schema/entity/applications/configuration/external/automator/removeTierAction.py +1 -1
- metadata/generated/schema/entity/applications/configuration/external/automatorAppConfig.py +1 -1
- metadata/generated/schema/entity/applications/configuration/external/metaPilotAppConfig.py +1 -1
- metadata/generated/schema/entity/applications/configuration/internal/__init__.py +1 -1
- metadata/generated/schema/entity/applications/configuration/internal/dataInsightsAppConfig.py +1 -1
- metadata/generated/schema/entity/applications/configuration/internal/dataInsightsReportAppConfig.py +1 -1
- metadata/generated/schema/entity/applications/configuration/internal/searchIndexingAppConfig.py +8 -1
- metadata/generated/schema/entity/applications/configuration/private/external/__init__.py +1 -1
- metadata/generated/schema/entity/applications/configuration/private/external/metaPilotAppPrivateConfig.py +1 -1
- metadata/generated/schema/entity/applications/createAppRequest.py +1 -1
- metadata/generated/schema/entity/applications/jobStatus.py +1 -1
- metadata/generated/schema/entity/applications/liveExecutionContext.py +1 -1
- metadata/generated/schema/entity/applications/marketplace/__init__.py +1 -1
- metadata/generated/schema/entity/applications/marketplace/appMarketPlaceDefinition.py +1 -1
- metadata/generated/schema/entity/applications/marketplace/createAppMarketPlaceDefinitionReq.py +1 -1
- metadata/generated/schema/entity/applications/scheduledExecutionContext.py +1 -1
- metadata/generated/schema/entity/automations/__init__.py +1 -1
- metadata/generated/schema/entity/automations/testServiceConnection.py +1 -1
- metadata/generated/schema/entity/automations/workflow.py +1 -1
- metadata/generated/schema/entity/bot.py +1 -1
- metadata/generated/schema/entity/classification/__init__.py +1 -1
- metadata/generated/schema/entity/classification/classification.py +1 -1
- metadata/generated/schema/entity/classification/tag.py +1 -1
- metadata/generated/schema/entity/data/__init__.py +1 -1
- metadata/generated/schema/entity/data/apiCollection.py +1 -1
- metadata/generated/schema/entity/data/apiEndpoint.py +1 -1
- metadata/generated/schema/entity/data/chart.py +1 -1
- metadata/generated/schema/entity/data/container.py +1 -1
- metadata/generated/schema/entity/data/dashboard.py +1 -1
- metadata/generated/schema/entity/data/dashboardDataModel.py +1 -1
- metadata/generated/schema/entity/data/database.py +1 -1
- metadata/generated/schema/entity/data/databaseSchema.py +1 -1
- metadata/generated/schema/entity/data/glossary.py +1 -1
- metadata/generated/schema/entity/data/glossaryTerm.py +1 -1
- metadata/generated/schema/entity/data/metrics.py +1 -1
- metadata/generated/schema/entity/data/mlmodel.py +1 -1
- metadata/generated/schema/entity/data/pipeline.py +1 -1
- metadata/generated/schema/entity/data/query.py +1 -1
- metadata/generated/schema/entity/data/report.py +1 -1
- metadata/generated/schema/entity/data/searchIndex.py +1 -1
- metadata/generated/schema/entity/data/storedProcedure.py +1 -1
- metadata/generated/schema/entity/data/table.py +1 -1
- metadata/generated/schema/entity/data/topic.py +1 -1
- metadata/generated/schema/entity/docStore/__init__.py +1 -1
- metadata/generated/schema/entity/docStore/document.py +1 -1
- metadata/generated/schema/entity/domains/__init__.py +1 -1
- metadata/generated/schema/entity/domains/dataProduct.py +1 -1
- metadata/generated/schema/entity/domains/domain.py +1 -1
- metadata/generated/schema/entity/events/__init__.py +1 -1
- metadata/generated/schema/entity/events/webhook.py +1 -1
- metadata/generated/schema/entity/feed/__init__.py +1 -1
- metadata/generated/schema/entity/feed/assets.py +1 -1
- metadata/generated/schema/entity/feed/customProperty.py +1 -1
- metadata/generated/schema/entity/feed/description.py +1 -1
- metadata/generated/schema/entity/feed/domain.py +1 -1
- metadata/generated/schema/entity/feed/entityInfo.py +1 -1
- metadata/generated/schema/entity/feed/owner.py +1 -1
- metadata/generated/schema/entity/feed/suggestion.py +1 -1
- metadata/generated/schema/entity/feed/tag.py +1 -1
- metadata/generated/schema/entity/feed/testCaseResult.py +1 -1
- metadata/generated/schema/entity/feed/thread.py +1 -1
- metadata/generated/schema/entity/policies/__init__.py +1 -1
- metadata/generated/schema/entity/policies/accessControl/__init__.py +1 -1
- metadata/generated/schema/entity/policies/accessControl/resourceDescriptor.py +1 -1
- metadata/generated/schema/entity/policies/accessControl/resourcePermission.py +1 -1
- metadata/generated/schema/entity/policies/accessControl/rule.py +1 -1
- metadata/generated/schema/entity/policies/filters.py +1 -1
- metadata/generated/schema/entity/policies/policy.py +1 -1
- metadata/generated/schema/entity/services/__init__.py +1 -1
- metadata/generated/schema/entity/services/apiService.py +1 -1
- metadata/generated/schema/entity/services/connections/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/apiService/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/apiService/restConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/common/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/common/sslCertPaths.py +1 -1
- metadata/generated/schema/entity/services/connections/common/sslCertValues.py +1 -1
- metadata/generated/schema/entity/services/connections/common/sslConfig.py +1 -1
- metadata/generated/schema/entity/services/connections/connectionBasicType.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/customDashboardConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/domoDashboardConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/lightdashConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/lookerConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/metabaseConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/modeConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/mstrConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/powerBIConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/powerbi/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/powerbi/azureConfig.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/powerbi/bucketDetails.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/powerbi/gcsConfig.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/powerbi/s3Config.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/qlikCloudConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/qlikSenseConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/quickSightConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/redashConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/supersetConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/dashboard/tableauConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/database/athenaConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/azureSQLConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/bigQueryConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/bigTableConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/clickhouseConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/common/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/database/common/azureConfig.py +1 -1
- metadata/generated/schema/entity/services/connections/database/common/basicAuth.py +1 -1
- metadata/generated/schema/entity/services/connections/database/common/iamAuthConfig.py +1 -1
- metadata/generated/schema/entity/services/connections/database/common/jwtAuth.py +1 -1
- metadata/generated/schema/entity/services/connections/database/couchbaseConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/customDatabaseConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/databricksConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/datalake/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/database/datalake/azureConfig.py +1 -1
- metadata/generated/schema/entity/services/connections/database/datalake/gcsConfig.py +1 -1
- metadata/generated/schema/entity/services/connections/database/datalake/s3Config.py +1 -1
- metadata/generated/schema/entity/services/connections/database/datalakeConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/db2Connection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/deltaLakeConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/deltalake/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/database/deltalake/metastoreConfig.py +1 -1
- metadata/generated/schema/entity/services/connections/database/deltalake/storageConfig.py +1 -1
- metadata/generated/schema/entity/services/connections/database/domoDatabaseConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/dorisConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/druidConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/dynamoDBConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/glueConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/greenplumConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/hiveConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/iceberg/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/database/iceberg/dynamoDbCatalogConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/iceberg/glueCatalogConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/iceberg/hiveCatalogConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/iceberg/icebergCatalog.py +1 -1
- metadata/generated/schema/entity/services/connections/database/iceberg/icebergFileSystem.py +1 -1
- metadata/generated/schema/entity/services/connections/database/iceberg/restCatalogConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/icebergConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/impalaConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/mariaDBConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/mongoDBConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/mssqlConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/mysqlConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/oracleConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/pinotDBConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/postgresConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/prestoConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/redshiftConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/salesforceConnection.py +9 -1
- metadata/generated/schema/entity/services/connections/database/sapErpConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/sapHana/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/database/sapHana/sapHanaHDBConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/sapHana/sapHanaSQLConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/sapHanaConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/sasConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/singleStoreConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/snowflakeConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/sqliteConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/synapseConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/teradataConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/trinoConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/unityCatalogConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/database/verticaConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/messaging/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/messaging/customMessagingConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/messaging/kafkaConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/messaging/kinesisConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/messaging/pulsarConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/messaging/redpandaConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/messaging/saslMechanismType.py +1 -1
- metadata/generated/schema/entity/services/connections/metadata/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/metadata/alationConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/metadata/alationSinkConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/metadata/amundsenConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/metadata/atlasConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/metadata/metadataESConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/metadata/openMetadataConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/mlmodel/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/mlmodel/customMlModelConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/mlmodel/mlflowConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/mlmodel/sageMakerConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/mlmodel/sklearnConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/mlmodel/vertexaiConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/pipeline/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/pipeline/airbyteConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/pipeline/airflowConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/pipeline/backendConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/pipeline/customPipelineConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/pipeline/dagsterConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/pipeline/databricksPipelineConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/pipeline/dbtCloudConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/pipeline/domoPipelineConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/pipeline/fivetranConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/pipeline/flinkConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/pipeline/gluePipelineConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/pipeline/kafkaConnectConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/pipeline/nifiConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/pipeline/openLineageConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/pipeline/sparkConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/pipeline/splineConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/search/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/search/customSearchConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/search/elasticSearch/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/search/elasticSearch/apiAuth.py +1 -1
- metadata/generated/schema/entity/services/connections/search/elasticSearch/basicAuth.py +1 -1
- metadata/generated/schema/entity/services/connections/search/elasticSearchConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/search/openSearchConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/serviceConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/storage/__init__.py +1 -1
- metadata/generated/schema/entity/services/connections/storage/adlsConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/storage/customStorageConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/storage/gcsConnection.py +1 -1
- metadata/generated/schema/entity/services/connections/storage/s3Connection.py +1 -1
- metadata/generated/schema/entity/services/connections/testConnectionDefinition.py +1 -1
- metadata/generated/schema/entity/services/connections/testConnectionResult.py +1 -1
- metadata/generated/schema/entity/services/dashboardService.py +1 -1
- metadata/generated/schema/entity/services/databaseService.py +1 -1
- metadata/generated/schema/entity/services/ingestionPipelines/__init__.py +1 -1
- metadata/generated/schema/entity/services/ingestionPipelines/ingestionPipeline.py +1 -1
- metadata/generated/schema/entity/services/ingestionPipelines/pipelineServiceClientResponse.py +1 -1
- metadata/generated/schema/entity/services/ingestionPipelines/status.py +1 -1
- metadata/generated/schema/entity/services/messagingService.py +1 -1
- metadata/generated/schema/entity/services/metadataService.py +1 -1
- metadata/generated/schema/entity/services/mlmodelService.py +1 -1
- metadata/generated/schema/entity/services/pipelineService.py +1 -1
- metadata/generated/schema/entity/services/searchService.py +1 -1
- metadata/generated/schema/entity/services/serviceType.py +1 -1
- metadata/generated/schema/entity/services/storageService.py +1 -1
- metadata/generated/schema/entity/teams/__init__.py +1 -1
- metadata/generated/schema/entity/teams/persona.py +1 -1
- metadata/generated/schema/entity/teams/role.py +1 -1
- metadata/generated/schema/entity/teams/team.py +1 -1
- metadata/generated/schema/entity/teams/teamHierarchy.py +1 -1
- metadata/generated/schema/entity/teams/user.py +1 -1
- metadata/generated/schema/entity/type.py +1 -1
- metadata/generated/schema/entity/utils/__init__.py +1 -1
- metadata/generated/schema/entity/utils/entitiesCount.py +1 -1
- metadata/generated/schema/entity/utils/servicesCount.py +1 -1
- metadata/generated/schema/entity/utils/supersetApiConnection.py +1 -1
- metadata/generated/schema/events/__init__.py +1 -1
- metadata/generated/schema/events/alertMetrics.py +1 -1
- metadata/generated/schema/events/api/__init__.py +1 -1
- metadata/generated/schema/events/api/createEventSubscription.py +1 -1
- metadata/generated/schema/events/api/testEventSubscriptionDestination.py +1 -1
- metadata/generated/schema/events/emailAlertConfig.py +1 -1
- metadata/generated/schema/events/eventFilterRule.py +1 -1
- metadata/generated/schema/events/eventSubscription.py +1 -1
- metadata/generated/schema/events/eventSubscriptionOffset.py +1 -1
- metadata/generated/schema/events/failedEvent.py +1 -1
- metadata/generated/schema/events/filterResourceDescriptor.py +1 -1
- metadata/generated/schema/events/subscriptionResourceDescriptor.py +1 -1
- metadata/generated/schema/metadataIngestion/__init__.py +1 -1
- metadata/generated/schema/metadataIngestion/application.py +1 -1
- metadata/generated/schema/metadataIngestion/applicationPipeline.py +1 -1
- metadata/generated/schema/metadataIngestion/dashboardServiceMetadataPipeline.py +1 -1
- metadata/generated/schema/metadataIngestion/dataInsightPipeline.py +1 -1
- metadata/generated/schema/metadataIngestion/databaseServiceMetadataPipeline.py +1 -1
- metadata/generated/schema/metadataIngestion/databaseServiceProfilerPipeline.py +1 -1
- metadata/generated/schema/metadataIngestion/databaseServiceQueryLineagePipeline.py +1 -1
- metadata/generated/schema/metadataIngestion/databaseServiceQueryUsagePipeline.py +1 -1
- metadata/generated/schema/metadataIngestion/dbtPipeline.py +1 -1
- metadata/generated/schema/metadataIngestion/dbtconfig/__init__.py +1 -1
- metadata/generated/schema/metadataIngestion/dbtconfig/dbtAzureConfig.py +1 -1
- metadata/generated/schema/metadataIngestion/dbtconfig/dbtBucketDetails.py +1 -1
- metadata/generated/schema/metadataIngestion/dbtconfig/dbtCloudConfig.py +1 -1
- metadata/generated/schema/metadataIngestion/dbtconfig/dbtGCSConfig.py +1 -1
- metadata/generated/schema/metadataIngestion/dbtconfig/dbtHttpConfig.py +1 -1
- metadata/generated/schema/metadataIngestion/dbtconfig/dbtLocalConfig.py +1 -1
- metadata/generated/schema/metadataIngestion/dbtconfig/dbtS3Config.py +1 -1
- metadata/generated/schema/metadataIngestion/messagingServiceMetadataPipeline.py +1 -1
- metadata/generated/schema/metadataIngestion/metadataToElasticSearchPipeline.py +1 -1
- metadata/generated/schema/metadataIngestion/mlmodelServiceMetadataPipeline.py +1 -1
- metadata/generated/schema/metadataIngestion/pipelineServiceMetadataPipeline.py +1 -1
- metadata/generated/schema/metadataIngestion/searchServiceMetadataPipeline.py +1 -1
- metadata/generated/schema/metadataIngestion/storage/__init__.py +1 -1
- metadata/generated/schema/metadataIngestion/storage/containerMetadataConfig.py +1 -1
- metadata/generated/schema/metadataIngestion/storage/manifestMetadataConfig.py +1 -1
- metadata/generated/schema/metadataIngestion/storage/storageBucketDetails.py +1 -1
- metadata/generated/schema/metadataIngestion/storage/storageMetadataADLSConfig.py +1 -1
- metadata/generated/schema/metadataIngestion/storage/storageMetadataGCSConfig.py +1 -1
- metadata/generated/schema/metadataIngestion/storage/storageMetadataHttpConfig.py +1 -1
- metadata/generated/schema/metadataIngestion/storage/storageMetadataLocalConfig.py +1 -1
- metadata/generated/schema/metadataIngestion/storage/storageMetadataS3Config.py +1 -1
- metadata/generated/schema/metadataIngestion/storageServiceMetadataPipeline.py +1 -1
- metadata/generated/schema/metadataIngestion/testSuitePipeline.py +1 -1
- metadata/generated/schema/metadataIngestion/workflow.py +1 -1
- metadata/generated/schema/monitoring/__init__.py +1 -1
- metadata/generated/schema/monitoring/eventMonitorProvider.py +1 -1
- metadata/generated/schema/security/__init__.py +1 -1
- metadata/generated/schema/security/client/__init__.py +1 -1
- metadata/generated/schema/security/client/auth0SSOClientConfig.py +1 -1
- metadata/generated/schema/security/client/azureSSOClientConfig.py +1 -1
- metadata/generated/schema/security/client/customOidcSSOClientConfig.py +1 -1
- metadata/generated/schema/security/client/googleSSOClientConfig.py +1 -1
- metadata/generated/schema/security/client/oidcClientConfig.py +1 -1
- metadata/generated/schema/security/client/oktaSSOClientConfig.py +1 -1
- metadata/generated/schema/security/client/openMetadataJWTClientConfig.py +1 -1
- metadata/generated/schema/security/client/samlSSOClientConfig.py +1 -1
- metadata/generated/schema/security/credentials/__init__.py +1 -1
- metadata/generated/schema/security/credentials/accessTokenAuth.py +1 -1
- metadata/generated/schema/security/credentials/apiAccessTokenAuth.py +1 -1
- metadata/generated/schema/security/credentials/awsCredentials.py +1 -1
- metadata/generated/schema/security/credentials/azureCredentials.py +1 -1
- metadata/generated/schema/security/credentials/basicAuth.py +1 -1
- metadata/generated/schema/security/credentials/bitbucketCredentials.py +1 -1
- metadata/generated/schema/security/credentials/gcpCredentials.py +1 -1
- metadata/generated/schema/security/credentials/gcpExternalAccount.py +1 -1
- metadata/generated/schema/security/credentials/gcpValues.py +1 -1
- metadata/generated/schema/security/credentials/gitCredentials.py +1 -1
- metadata/generated/schema/security/credentials/githubCredentials.py +1 -1
- metadata/generated/schema/security/credentials/gitlabCredentials.py +1 -1
- metadata/generated/schema/security/sasl/__init__.py +1 -1
- metadata/generated/schema/security/sasl/saslClientConfig.py +1 -1
- metadata/generated/schema/security/secrets/__init__.py +1 -1
- metadata/generated/schema/security/secrets/secretsManagerClientLoader.py +1 -1
- metadata/generated/schema/security/secrets/secretsManagerConfiguration.py +1 -1
- metadata/generated/schema/security/secrets/secretsManagerProvider.py +1 -1
- metadata/generated/schema/security/securityConfiguration.py +1 -1
- metadata/generated/schema/security/ssl/__init__.py +1 -1
- metadata/generated/schema/security/ssl/validateSSLClientConfig.py +1 -1
- metadata/generated/schema/security/ssl/verifySSLConfig.py +1 -1
- metadata/generated/schema/settings/__init__.py +1 -1
- metadata/generated/schema/settings/settings.py +1 -1
- metadata/generated/schema/system/__init__.py +1 -1
- metadata/generated/schema/system/entityError.py +1 -1
- metadata/generated/schema/system/eventPublisherJob.py +2 -2
- metadata/generated/schema/system/indexingError.py +1 -1
- metadata/generated/schema/system/limitsResponse.py +1 -1
- metadata/generated/schema/system/ui/__init__.py +1 -1
- metadata/generated/schema/system/ui/knowledgePanel.py +1 -1
- metadata/generated/schema/system/ui/page.py +1 -1
- metadata/generated/schema/system/validationResponse.py +1 -1
- metadata/generated/schema/tests/__init__.py +1 -1
- metadata/generated/schema/tests/assigned.py +1 -1
- metadata/generated/schema/tests/basic.py +1 -1
- metadata/generated/schema/tests/customMetric.py +1 -1
- metadata/generated/schema/tests/dataQualityReport.py +1 -1
- metadata/generated/schema/tests/resolved.py +1 -1
- metadata/generated/schema/tests/testCase.py +1 -1
- metadata/generated/schema/tests/testCaseResolutionStatus.py +1 -1
- metadata/generated/schema/tests/testDefinition.py +1 -1
- metadata/generated/schema/tests/testSuite.py +1 -1
- metadata/generated/schema/type/__init__.py +1 -1
- metadata/generated/schema/type/apiSchema.py +1 -1
- metadata/generated/schema/type/auditLog.py +1 -1
- metadata/generated/schema/type/basic.py +1 -1
- metadata/generated/schema/type/bulkOperationResult.py +1 -1
- metadata/generated/schema/type/changeEvent.py +1 -1
- metadata/generated/schema/type/changeEventType.py +1 -1
- metadata/generated/schema/type/collectionDescriptor.py +1 -1
- metadata/generated/schema/type/csvDocumentation.py +1 -1
- metadata/generated/schema/type/csvErrorType.py +1 -1
- metadata/generated/schema/type/csvFile.py +1 -1
- metadata/generated/schema/type/csvImportResult.py +1 -1
- metadata/generated/schema/type/customProperties/__init__.py +1 -1
- metadata/generated/schema/type/customProperties/complexTypes.py +1 -1
- metadata/generated/schema/type/customProperties/enumConfig.py +1 -1
- metadata/generated/schema/type/customProperty.py +1 -1
- metadata/generated/schema/type/dailyCount.py +1 -1
- metadata/generated/schema/type/databaseConnectionConfig.py +1 -1
- metadata/generated/schema/type/entityHierarchy.py +1 -1
- metadata/generated/schema/type/entityHistory.py +1 -1
- metadata/generated/schema/type/entityLineage.py +1 -1
- metadata/generated/schema/type/entityReference.py +1 -1
- metadata/generated/schema/type/entityReferenceList.py +1 -1
- metadata/generated/schema/type/entityRelationship.py +1 -1
- metadata/generated/schema/type/entityUsage.py +1 -1
- metadata/generated/schema/type/filterPattern.py +1 -1
- metadata/generated/schema/type/function.py +1 -1
- metadata/generated/schema/type/include.py +1 -1
- metadata/generated/schema/type/jdbcConnection.py +1 -1
- metadata/generated/schema/type/lifeCycle.py +1 -1
- metadata/generated/schema/type/paging.py +1 -1
- metadata/generated/schema/type/profile.py +1 -1
- metadata/generated/schema/type/queryParserData.py +1 -1
- metadata/generated/schema/type/reaction.py +1 -1
- metadata/generated/schema/type/schedule.py +1 -1
- metadata/generated/schema/type/schema.py +1 -1
- metadata/generated/schema/type/tableQuery.py +1 -1
- metadata/generated/schema/type/tableUsageCount.py +1 -1
- metadata/generated/schema/type/tagLabel.py +1 -1
- metadata/generated/schema/type/usageDetails.py +1 -1
- metadata/generated/schema/type/usageRequest.py +1 -1
- metadata/generated/schema/type/votes.py +1 -1
- metadata/ingestion/ometa/mixins/lineage_mixin.py +22 -6
- metadata/ingestion/sink/metadata_rest.py +2 -2
- metadata/ingestion/source/dashboard/powerbi/metadata.py +6 -20
- metadata/ingestion/source/database/bigquery/connection.py +2 -28
- metadata/ingestion/source/database/dbt/dbt_service.py +47 -1
- metadata/ingestion/source/database/iceberg/catalog/rest.py +1 -1
- metadata/ingestion/source/database/redshift/connection.py +2 -9
- metadata/ingestion/source/database/redshift/queries.py +3 -5
- metadata/ingestion/source/database/redshift/utils.py +1 -1
- metadata/ingestion/source/database/salesforce/connection.py +5 -3
- metadata/ingestion/source/database/snowflake/connection.py +1 -6
- metadata/ingestion/source/database/snowflake/queries.py +0 -4
- metadata/ingestion/source/metadata/alationsink/metadata.py +77 -10
- metadata/ingestion/source/pipeline/dbtcloud/metadata.py +1 -1
- metadata/pii/ner.py +19 -1
- metadata/pii/processor.py +1 -1
- metadata/pii/scanners/ner_scanner.py +24 -5
- metadata/profiler/api/models.py +13 -2
- metadata/profiler/metrics/composed/null_ratio.py +5 -4
- metadata/profiler/orm/functions/table_metric_computer.py +2 -0
- metadata/profiler/orm/types/custom_hex_byte_string.py +16 -3
- metadata/profiler/processor/core.py +12 -5
- metadata/profiler/processor/models.py +19 -24
- metadata/workflow/base.py +1 -0
- metadata/workflow/profiler.py +15 -2
- {openmetadata_ingestion-1.5.4.1.dist-info → openmetadata_ingestion-1.5.6.0.dist-info}/METADATA +363 -359
- {openmetadata_ingestion-1.5.4.1.dist-info → openmetadata_ingestion-1.5.6.0.dist-info}/RECORD +613 -613
- {openmetadata_ingestion-1.5.4.1.dist-info → openmetadata_ingestion-1.5.6.0.dist-info}/LICENSE +0 -0
- {openmetadata_ingestion-1.5.4.1.dist-info → openmetadata_ingestion-1.5.6.0.dist-info}/WHEEL +0 -0
- {openmetadata_ingestion-1.5.4.1.dist-info → openmetadata_ingestion-1.5.6.0.dist-info}/entry_points.txt +0 -0
- {openmetadata_ingestion-1.5.4.1.dist-info → openmetadata_ingestion-1.5.6.0.dist-info}/top_level.txt +0 -0
|
@@ -14,11 +14,17 @@ AlationSink source to extract metadata
|
|
|
14
14
|
"""
|
|
15
15
|
|
|
16
16
|
import traceback
|
|
17
|
-
from typing import Iterable, Optional
|
|
17
|
+
from typing import Iterable, List, Optional
|
|
18
18
|
|
|
19
19
|
from metadata.generated.schema.entity.data.database import Database
|
|
20
20
|
from metadata.generated.schema.entity.data.databaseSchema import DatabaseSchema
|
|
21
|
-
from metadata.generated.schema.entity.data.table import
|
|
21
|
+
from metadata.generated.schema.entity.data.table import (
|
|
22
|
+
Column,
|
|
23
|
+
Constraint,
|
|
24
|
+
ConstraintType,
|
|
25
|
+
Table,
|
|
26
|
+
TableConstraint,
|
|
27
|
+
)
|
|
22
28
|
from metadata.generated.schema.entity.services.connections.metadata.alationSinkConnection import (
|
|
23
29
|
AlationSinkConnection,
|
|
24
30
|
)
|
|
@@ -108,7 +114,9 @@ class AlationsinkSource(Source):
|
|
|
108
114
|
),
|
|
109
115
|
),
|
|
110
116
|
db_username="Test",
|
|
111
|
-
title=
|
|
117
|
+
title=om_database.displayName
|
|
118
|
+
if om_database.displayName
|
|
119
|
+
else model_str(om_database.name),
|
|
112
120
|
description=model_str(om_database.description),
|
|
113
121
|
)
|
|
114
122
|
except Exception as exc:
|
|
@@ -129,7 +137,9 @@ class AlationsinkSource(Source):
|
|
|
129
137
|
key=fqn._build( # pylint: disable=protected-access
|
|
130
138
|
str(alation_datasource_id), model_str(om_schema.name)
|
|
131
139
|
),
|
|
132
|
-
title=
|
|
140
|
+
title=om_schema.displayName
|
|
141
|
+
if om_schema.displayName
|
|
142
|
+
else model_str(om_schema.name),
|
|
133
143
|
description=model_str(om_schema.description),
|
|
134
144
|
)
|
|
135
145
|
except Exception as exc:
|
|
@@ -150,7 +160,9 @@ class AlationsinkSource(Source):
|
|
|
150
160
|
key=fqn._build( # pylint: disable=protected-access
|
|
151
161
|
str(alation_datasource_id), schema_name, model_str(om_table.name)
|
|
152
162
|
),
|
|
153
|
-
title=
|
|
163
|
+
title=om_table.displayName
|
|
164
|
+
if om_table.displayName
|
|
165
|
+
else model_str(om_table.name),
|
|
154
166
|
description=model_str(om_table.description),
|
|
155
167
|
table_type=TABLE_TYPE_MAPPER.get(om_table.tableType, "TABLE"),
|
|
156
168
|
sql=om_table.schemaDefinition,
|
|
@@ -162,14 +174,60 @@ class AlationsinkSource(Source):
|
|
|
162
174
|
)
|
|
163
175
|
return None
|
|
164
176
|
|
|
165
|
-
def
|
|
177
|
+
def _update_foreign_key(
|
|
178
|
+
self,
|
|
179
|
+
alation_datasource_id: int,
|
|
180
|
+
om_column: Column,
|
|
181
|
+
table_constraints: Optional[List[TableConstraint]],
|
|
182
|
+
column_index: ColumnIndex,
|
|
183
|
+
):
|
|
184
|
+
"""
|
|
185
|
+
Method to update the foreign key metadata in columns index
|
|
186
|
+
"""
|
|
187
|
+
try:
|
|
188
|
+
for table_constraint in table_constraints or []:
|
|
189
|
+
if table_constraint.constraintType == ConstraintType.FOREIGN_KEY:
|
|
190
|
+
for i, constraint_column in enumerate(
|
|
191
|
+
table_constraint.columns or []
|
|
192
|
+
):
|
|
193
|
+
if constraint_column == model_str(om_column.name):
|
|
194
|
+
column_index.isForeignKey = True
|
|
195
|
+
# update the service name of OM with the alation datasource id in the column FQN
|
|
196
|
+
splitted_col_fqn = fqn.split(
|
|
197
|
+
model_str(table_constraint.referredColumns[i])
|
|
198
|
+
)
|
|
199
|
+
splitted_col_fqn[0] = str(alation_datasource_id)
|
|
200
|
+
column_index.referencedColumnId = (
|
|
201
|
+
fqn._build( # pylint: disable=protected-access
|
|
202
|
+
*splitted_col_fqn
|
|
203
|
+
)
|
|
204
|
+
)
|
|
205
|
+
break
|
|
206
|
+
except Exception as exc:
|
|
207
|
+
logger.debug(traceback.format_exc())
|
|
208
|
+
logger.warning(
|
|
209
|
+
f"Failed to update foreign key for {model_str(om_column.name)}: {exc}"
|
|
210
|
+
)
|
|
211
|
+
|
|
212
|
+
def _get_column_index(
|
|
213
|
+
self,
|
|
214
|
+
alation_datasource_id: int,
|
|
215
|
+
om_column: Column,
|
|
216
|
+
table_constraints: Optional[List[TableConstraint]],
|
|
217
|
+
) -> Optional[ColumnIndex]:
|
|
166
218
|
"""
|
|
167
219
|
Method to get the alation column index
|
|
168
220
|
"""
|
|
169
221
|
column_index = ColumnIndex()
|
|
170
222
|
try:
|
|
223
|
+
# Attach the primary key
|
|
171
224
|
if om_column.constraint == Constraint.PRIMARY_KEY:
|
|
172
|
-
|
|
225
|
+
column_index.isPrimaryKey = True
|
|
226
|
+
|
|
227
|
+
# Attach the foreign key
|
|
228
|
+
self._update_foreign_key(
|
|
229
|
+
alation_datasource_id, om_column, table_constraints, column_index
|
|
230
|
+
)
|
|
173
231
|
except Exception as exc:
|
|
174
232
|
logger.debug(traceback.format_exc())
|
|
175
233
|
logger.warning(
|
|
@@ -199,6 +257,7 @@ class AlationsinkSource(Source):
|
|
|
199
257
|
schema_name: str,
|
|
200
258
|
table_name: str,
|
|
201
259
|
om_column: Column,
|
|
260
|
+
table_constraints: Optional[List[TableConstraint]],
|
|
202
261
|
) -> Optional[CreateColumnRequest]:
|
|
203
262
|
"""
|
|
204
263
|
Method to form the CreateColumnRequest object
|
|
@@ -211,13 +270,19 @@ class AlationsinkSource(Source):
|
|
|
211
270
|
table_name,
|
|
212
271
|
model_str(om_column.name),
|
|
213
272
|
),
|
|
214
|
-
column_type=om_column.
|
|
215
|
-
|
|
273
|
+
column_type=om_column.dataTypeDisplay.lower()
|
|
274
|
+
if om_column.dataTypeDisplay
|
|
275
|
+
else om_column.dataType.value.lower(),
|
|
276
|
+
title=om_column.displayName
|
|
277
|
+
if om_column.displayName
|
|
278
|
+
else model_str(om_column.name),
|
|
216
279
|
description=model_str(om_column.description),
|
|
217
280
|
position=str(om_column.ordinalPosition)
|
|
218
281
|
if om_column.ordinalPosition
|
|
219
282
|
else None,
|
|
220
|
-
index=self._get_column_index(
|
|
283
|
+
index=self._get_column_index(
|
|
284
|
+
alation_datasource_id, om_column, table_constraints
|
|
285
|
+
),
|
|
221
286
|
nullable=self._check_nullable_column(om_column),
|
|
222
287
|
)
|
|
223
288
|
except Exception as exc:
|
|
@@ -241,6 +306,7 @@ class AlationsinkSource(Source):
|
|
|
241
306
|
schema_name=schema_name,
|
|
242
307
|
table_name=model_str(om_table.name),
|
|
243
308
|
om_column=om_column,
|
|
309
|
+
table_constraints=om_table.tableConstraints,
|
|
244
310
|
)
|
|
245
311
|
if create_column_request:
|
|
246
312
|
create_requests.root.append(create_column_request)
|
|
@@ -266,6 +332,7 @@ class AlationsinkSource(Source):
|
|
|
266
332
|
entity=Table,
|
|
267
333
|
skip_on_failure=True,
|
|
268
334
|
params={"database": model_str(om_schema.fullyQualifiedName)},
|
|
335
|
+
fields=["tableConstraints, columns"],
|
|
269
336
|
)
|
|
270
337
|
)
|
|
271
338
|
create_requests = CreateTableRequestList(root=[])
|
|
@@ -314,7 +314,7 @@ class DbtcloudSource(PipelineServiceSource):
|
|
|
314
314
|
timestamp=Timestamp(
|
|
315
315
|
datetime_to_ts(
|
|
316
316
|
datetime.strptime(
|
|
317
|
-
pipeline_details.created_at, "%Y-%m-%
|
|
317
|
+
pipeline_details.created_at, "%Y-%m-%d %H:%M:%S.%f%z"
|
|
318
318
|
)
|
|
319
319
|
if pipeline_details.created_at
|
|
320
320
|
else None
|
metadata/pii/ner.py
CHANGED
|
@@ -51,7 +51,8 @@ class NEREntity(Enum):
|
|
|
51
51
|
UK_NHS = TagType.SENSITIVE.value
|
|
52
52
|
|
|
53
53
|
# Spain
|
|
54
|
-
|
|
54
|
+
ES_NIF = TagType.SENSITIVE.value
|
|
55
|
+
ES_NIE = TagType.SENSITIVE.value
|
|
55
56
|
|
|
56
57
|
# Italy
|
|
57
58
|
IT_FISCAL_CODE = TagType.SENSITIVE.value
|
|
@@ -60,8 +61,25 @@ class NEREntity(Enum):
|
|
|
60
61
|
IT_PASSPORT = TagType.SENSITIVE.value
|
|
61
62
|
IT_IDENTITY_CARD = TagType.SENSITIVE.value
|
|
62
63
|
|
|
64
|
+
# Poland
|
|
65
|
+
PL_PESEL = TagType.SENSITIVE.value
|
|
66
|
+
|
|
67
|
+
# Singapore
|
|
68
|
+
SG_NRIC_FIN = TagType.SENSITIVE.value
|
|
69
|
+
SG_UEN = TagType.SENSITIVE.value
|
|
70
|
+
|
|
63
71
|
# Australia
|
|
64
72
|
AU_ABN = TagType.SENSITIVE.value
|
|
65
73
|
AU_ACN = TagType.SENSITIVE.value
|
|
66
74
|
AU_TFN = TagType.SENSITIVE.value
|
|
67
75
|
AU_MEDICARE = TagType.SENSITIVE.value
|
|
76
|
+
|
|
77
|
+
# India
|
|
78
|
+
IN_PAN = TagType.SENSITIVE.value
|
|
79
|
+
IN_AADHAAR = TagType.SENSITIVE.value
|
|
80
|
+
IN_VEHICLE_REGISTRATION = TagType.SENSITIVE.value
|
|
81
|
+
IN_VOTER = TagType.SENSITIVE.value
|
|
82
|
+
IN_PASSPORT = TagType.SENSITIVE.value
|
|
83
|
+
|
|
84
|
+
# Finland
|
|
85
|
+
FI_PERSONAL_IDENTITY_CODE = TagType.SENSITIVE.value
|
metadata/pii/processor.py
CHANGED
|
@@ -14,6 +14,7 @@ NER Scanner based on Presidio.
|
|
|
14
14
|
Supported Entities https://microsoft.github.io/presidio/supported_entities/
|
|
15
15
|
"""
|
|
16
16
|
import json
|
|
17
|
+
import logging
|
|
17
18
|
import traceback
|
|
18
19
|
from collections import defaultdict
|
|
19
20
|
from typing import Any, Dict, List, Optional, Tuple, Union
|
|
@@ -26,9 +27,11 @@ from metadata.pii.models import TagAndConfidence
|
|
|
26
27
|
from metadata.pii.ner import NEREntity
|
|
27
28
|
from metadata.pii.scanners.base import BaseScanner
|
|
28
29
|
from metadata.utils import fqn
|
|
29
|
-
from metadata.utils.logger import pii_logger
|
|
30
|
+
from metadata.utils.logger import METADATA_LOGGER, pii_logger
|
|
30
31
|
|
|
31
32
|
logger = pii_logger()
|
|
33
|
+
SUPPORTED_LANG = "en"
|
|
34
|
+
PRESIDIO_LOGGER = "presidio-analyzer"
|
|
32
35
|
|
|
33
36
|
|
|
34
37
|
class StringAnalysis(BaseModel):
|
|
@@ -40,11 +43,16 @@ class StringAnalysis(BaseModel):
|
|
|
40
43
|
appearances: int
|
|
41
44
|
|
|
42
45
|
|
|
46
|
+
class NLPEngineModel(BaseModel):
|
|
47
|
+
"""Required to pass the nlp_engine as {"lang_code": "en", "model_name": "en_core_web_lg"}"""
|
|
48
|
+
|
|
49
|
+
lang_code: str
|
|
50
|
+
model_name: str
|
|
51
|
+
|
|
52
|
+
|
|
43
53
|
# pylint: disable=import-outside-toplevel
|
|
44
54
|
class NERScanner(BaseScanner):
|
|
45
|
-
"""
|
|
46
|
-
Based on https://microsoft.github.io/presidio/
|
|
47
|
-
"""
|
|
55
|
+
"""Based on https://microsoft.github.io/presidio/"""
|
|
48
56
|
|
|
49
57
|
def __init__(self):
|
|
50
58
|
import spacy
|
|
@@ -60,8 +68,19 @@ class NERScanner(BaseScanner):
|
|
|
60
68
|
download(SPACY_EN_MODEL)
|
|
61
69
|
spacy.load(SPACY_EN_MODEL)
|
|
62
70
|
|
|
71
|
+
nlp_engine_model = NLPEngineModel(
|
|
72
|
+
lang_code=SUPPORTED_LANG, model_name=SPACY_EN_MODEL
|
|
73
|
+
)
|
|
74
|
+
|
|
75
|
+
# Set the presidio logger to talk less about internal entities unless we are debugging
|
|
76
|
+
logging.getLogger(PRESIDIO_LOGGER).setLevel(
|
|
77
|
+
logging.INFO
|
|
78
|
+
if logging.getLogger(METADATA_LOGGER).level == logging.DEBUG
|
|
79
|
+
else logging.ERROR
|
|
80
|
+
)
|
|
81
|
+
|
|
63
82
|
self.analyzer = AnalyzerEngine(
|
|
64
|
-
nlp_engine=SpacyNlpEngine(models=
|
|
83
|
+
nlp_engine=SpacyNlpEngine(models=[nlp_engine_model.model_dump()])
|
|
65
84
|
)
|
|
66
85
|
|
|
67
86
|
@staticmethod
|
metadata/profiler/api/models.py
CHANGED
|
@@ -17,9 +17,10 @@ multiple profilers per table and columns.
|
|
|
17
17
|
"""
|
|
18
18
|
from typing import List, Optional, Type, Union
|
|
19
19
|
|
|
20
|
-
from pydantic import ConfigDict
|
|
20
|
+
from pydantic import ConfigDict, Field
|
|
21
21
|
from sqlalchemy import Column
|
|
22
22
|
from sqlalchemy.orm import DeclarativeMeta
|
|
23
|
+
from typing_extensions import Annotated
|
|
23
24
|
|
|
24
25
|
from metadata.config.common import ConfigModel
|
|
25
26
|
from metadata.generated.schema.api.data.createTableProfile import (
|
|
@@ -37,6 +38,7 @@ from metadata.generated.schema.entity.services.connections.connectionBasicType i
|
|
|
37
38
|
)
|
|
38
39
|
from metadata.generated.schema.tests.customMetric import CustomMetric
|
|
39
40
|
from metadata.generated.schema.type.basic import FullyQualifiedEntityName
|
|
41
|
+
from metadata.ingestion.models.custom_pydantic import BaseModel
|
|
40
42
|
from metadata.ingestion.models.table_metadata import ColumnTag
|
|
41
43
|
from metadata.profiler.metrics.core import Metric, MetricTypes
|
|
42
44
|
from metadata.profiler.processor.models import ProfilerDef
|
|
@@ -104,6 +106,15 @@ class ProfilerProcessorConfig(ConfigModel):
|
|
|
104
106
|
databaseConfig: Optional[List[DatabaseAndSchemaConfig]] = []
|
|
105
107
|
|
|
106
108
|
|
|
109
|
+
class SampleData(BaseModel):
|
|
110
|
+
"""TableData wrapper to handle ephemeral SampleData"""
|
|
111
|
+
|
|
112
|
+
data: Annotated[TableData, Field(None, description="Table Sample Data")]
|
|
113
|
+
store: Annotated[
|
|
114
|
+
bool, Field(False, description="Is the sample data should be stored or not")
|
|
115
|
+
]
|
|
116
|
+
|
|
117
|
+
|
|
107
118
|
class ProfilerResponse(ConfigModel):
|
|
108
119
|
"""
|
|
109
120
|
ORM Profiler processor response.
|
|
@@ -114,7 +125,7 @@ class ProfilerResponse(ConfigModel):
|
|
|
114
125
|
|
|
115
126
|
table: Table
|
|
116
127
|
profile: CreateTableProfileRequest
|
|
117
|
-
sample_data: Optional[
|
|
128
|
+
sample_data: Optional[SampleData] = None
|
|
118
129
|
column_tags: Optional[List[ColumnTag]] = None
|
|
119
130
|
|
|
120
131
|
def __str__(self):
|
|
@@ -50,8 +50,9 @@ class NullRatio(ComposedMetric):
|
|
|
50
50
|
results of other Metrics
|
|
51
51
|
"""
|
|
52
52
|
|
|
53
|
-
count = res.get(Count.name())
|
|
54
|
-
null_count = res.get(NullCount.name())
|
|
55
|
-
|
|
53
|
+
count = res.get(Count.name(), 0)
|
|
54
|
+
null_count = res.get(NullCount.name(), 0)
|
|
55
|
+
total = count + null_count
|
|
56
|
+
if total == 0:
|
|
56
57
|
return None
|
|
57
|
-
return null_count /
|
|
58
|
+
return null_count / total
|
|
@@ -176,6 +176,8 @@ class SnowflakeTableMetricComputer(BaseTableMetricComputer):
|
|
|
176
176
|
)
|
|
177
177
|
|
|
178
178
|
rest = self._runner._session.execute(query).first()
|
|
179
|
+
if not rest:
|
|
180
|
+
return None
|
|
179
181
|
if rest.rowCount is None:
|
|
180
182
|
# if we don't have any row count, fallback to the base logic
|
|
181
183
|
return super().compute()
|
|
@@ -22,6 +22,7 @@ from sqlalchemy.sql.sqltypes import String, TypeDecorator
|
|
|
22
22
|
from metadata.utils.logger import ingestion_logger
|
|
23
23
|
|
|
24
24
|
logger = ingestion_logger()
|
|
25
|
+
NULL_BYTE = "\x00"
|
|
25
26
|
|
|
26
27
|
|
|
27
28
|
class HexByteString(TypeDecorator):
|
|
@@ -63,10 +64,22 @@ class HexByteString(TypeDecorator):
|
|
|
63
64
|
detected_encoding = chardet.detect(bytes_value).get("encoding")
|
|
64
65
|
if detected_encoding:
|
|
65
66
|
try:
|
|
66
|
-
value
|
|
67
|
-
|
|
67
|
+
# Decode the bytes value with the detected encoding and replace errors with "?"
|
|
68
|
+
# if bytes cannot be decoded e.g. b"\x66\x67\x67\x9c", if detected_encoding="utf-8"
|
|
69
|
+
# will result in 'foo�' (instead of failing)
|
|
70
|
+
str_value = bytes_value.decode(
|
|
71
|
+
encoding=detected_encoding, errors="replace"
|
|
72
|
+
)
|
|
73
|
+
# Replace NULL_BYTE with empty string to avoid errors with
|
|
74
|
+
# the database client (should be O(n))
|
|
75
|
+
str_value = (
|
|
76
|
+
str_value.replace(NULL_BYTE, "")
|
|
77
|
+
if NULL_BYTE in str_value
|
|
78
|
+
else str_value
|
|
79
|
+
)
|
|
80
|
+
return str_value
|
|
68
81
|
except Exception as exc:
|
|
69
|
-
logger.debug("Failed to parse bytes
|
|
82
|
+
logger.debug("Failed to parse bytes value as string: %s", exc)
|
|
70
83
|
logger.debug(traceback.format_exc())
|
|
71
84
|
|
|
72
85
|
return value.hex()
|
|
@@ -33,7 +33,6 @@ from metadata.generated.schema.entity.data.table import (
|
|
|
33
33
|
ColumnProfile,
|
|
34
34
|
ColumnProfilerConfig,
|
|
35
35
|
SystemProfile,
|
|
36
|
-
TableData,
|
|
37
36
|
TableProfile,
|
|
38
37
|
)
|
|
39
38
|
from metadata.generated.schema.settings.settings import Settings
|
|
@@ -41,7 +40,7 @@ from metadata.generated.schema.tests.customMetric import (
|
|
|
41
40
|
CustomMetric as CustomMetricEntity,
|
|
42
41
|
)
|
|
43
42
|
from metadata.generated.schema.type.basic import Timestamp
|
|
44
|
-
from metadata.profiler.api.models import ProfilerResponse, ThreadPoolMetrics
|
|
43
|
+
from metadata.profiler.api.models import ProfilerResponse, SampleData, ThreadPoolMetrics
|
|
45
44
|
from metadata.profiler.interface.profiler_interface import ProfilerInterface
|
|
46
45
|
from metadata.profiler.metrics.core import (
|
|
47
46
|
ComposedMetric,
|
|
@@ -492,7 +491,12 @@ class Profiler(Generic[TMetric]):
|
|
|
492
491
|
)
|
|
493
492
|
self.compute_metrics()
|
|
494
493
|
|
|
495
|
-
|
|
494
|
+
# We need the sample data for Sample Data or PII Sensitive processing.
|
|
495
|
+
# We'll nullify the Sample Data after the PII processing so that it's not stored.
|
|
496
|
+
if (
|
|
497
|
+
self.source_config.generateSampleData
|
|
498
|
+
or self.source_config.processPiiSensitive
|
|
499
|
+
):
|
|
496
500
|
sample_data = self.generate_sample_data()
|
|
497
501
|
else:
|
|
498
502
|
sample_data = None
|
|
@@ -510,7 +514,7 @@ class Profiler(Generic[TMetric]):
|
|
|
510
514
|
return table_profile
|
|
511
515
|
|
|
512
516
|
@calculate_execution_time(store=False)
|
|
513
|
-
def generate_sample_data(self) -> Optional[
|
|
517
|
+
def generate_sample_data(self) -> Optional[SampleData]:
|
|
514
518
|
"""Fetch and ingest sample data
|
|
515
519
|
|
|
516
520
|
Returns:
|
|
@@ -532,7 +536,10 @@ class Profiler(Generic[TMetric]):
|
|
|
532
536
|
SAMPLE_DATA_DEFAULT_COUNT, self.profiler_interface.sample_data_count
|
|
533
537
|
)
|
|
534
538
|
]
|
|
535
|
-
return
|
|
539
|
+
return SampleData(
|
|
540
|
+
data=table_data, store=self.source_config.generateSampleData
|
|
541
|
+
)
|
|
542
|
+
|
|
536
543
|
except Exception as err:
|
|
537
544
|
logger.debug(traceback.format_exc())
|
|
538
545
|
logger.warning(f"Error fetching sample data: {err}")
|
|
@@ -15,11 +15,28 @@ JSON workflows to the profiler
|
|
|
15
15
|
"""
|
|
16
16
|
from typing import List, Optional
|
|
17
17
|
|
|
18
|
-
from pydantic import BaseModel,
|
|
18
|
+
from pydantic import BaseModel, BeforeValidator
|
|
19
|
+
from typing_extensions import Annotated
|
|
19
20
|
|
|
20
21
|
from metadata.profiler.metrics.registry import Metrics
|
|
21
22
|
|
|
22
23
|
|
|
24
|
+
def valid_metric(value: str):
|
|
25
|
+
"""
|
|
26
|
+
Validate that the input metrics are correctly named
|
|
27
|
+
and can be found in the Registry
|
|
28
|
+
"""
|
|
29
|
+
if not Metrics.get(value.upper()):
|
|
30
|
+
raise ValueError(
|
|
31
|
+
f"Metric name {value} is not a proper metric name from the Registry"
|
|
32
|
+
)
|
|
33
|
+
|
|
34
|
+
return value.upper()
|
|
35
|
+
|
|
36
|
+
|
|
37
|
+
ValidMetric = Annotated[str, BeforeValidator(valid_metric)]
|
|
38
|
+
|
|
39
|
+
|
|
23
40
|
class ProfilerDef(BaseModel):
|
|
24
41
|
"""
|
|
25
42
|
Incoming profiler definition from the
|
|
@@ -30,26 +47,4 @@ class ProfilerDef(BaseModel):
|
|
|
30
47
|
timeout_seconds: Optional[
|
|
31
48
|
int
|
|
32
49
|
] = None # Stop running a query after X seconds and continue
|
|
33
|
-
metrics: Optional[
|
|
34
|
-
List[str]
|
|
35
|
-
] = None # names of currently supported Static and Composed metrics
|
|
36
|
-
# TBD:
|
|
37
|
-
# time_metrics: List[TimeMetricDef] = None
|
|
38
|
-
# custom_metrics: List[CustomMetricDef] = None
|
|
39
|
-
# rule_metrics: ...
|
|
40
|
-
|
|
41
|
-
# pylint: disable=no-self-argument
|
|
42
|
-
@validator("metrics", each_item=True)
|
|
43
|
-
def valid_metric(cls, value):
|
|
44
|
-
"""
|
|
45
|
-
We are using cls as per pydantic docs
|
|
46
|
-
|
|
47
|
-
Validate that the input metrics are correctly named
|
|
48
|
-
and can be found in the Registry
|
|
49
|
-
"""
|
|
50
|
-
if not Metrics.get(value.upper()):
|
|
51
|
-
raise ValueError(
|
|
52
|
-
f"Metric name {value} is not a proper metric name from the Registry"
|
|
53
|
-
)
|
|
54
|
-
|
|
55
|
-
return value.upper()
|
|
50
|
+
metrics: Optional[List[ValidMetric]] = None
|
metadata/workflow/base.py
CHANGED
|
@@ -289,6 +289,7 @@ class BaseWorkflow(ABC, WorkflowStatusMixin):
|
|
|
289
289
|
for step in self.workflow_steps():
|
|
290
290
|
logger.info(
|
|
291
291
|
f"{step.name}: Processed {len(step.status.records)} records,"
|
|
292
|
+
f" updated {len(step.status.updated_records)} records,"
|
|
292
293
|
f" filtered {len(step.status.filtered)} records,"
|
|
293
294
|
f" found {len(step.status.failures)} errors"
|
|
294
295
|
)
|
metadata/workflow/profiler.py
CHANGED
|
@@ -11,6 +11,11 @@
|
|
|
11
11
|
"""
|
|
12
12
|
Workflow definition for the profiler
|
|
13
13
|
"""
|
|
14
|
+
from typing import cast
|
|
15
|
+
|
|
16
|
+
from metadata.generated.schema.metadataIngestion.databaseServiceProfilerPipeline import (
|
|
17
|
+
DatabaseServiceProfilerPipeline,
|
|
18
|
+
)
|
|
14
19
|
from metadata.generated.schema.metadataIngestion.workflow import (
|
|
15
20
|
OpenMetadataWorkflowConfig,
|
|
16
21
|
)
|
|
@@ -58,9 +63,17 @@ class ProfilerWorkflow(IngestionWorkflow):
|
|
|
58
63
|
self.source = source_class.create(self.config.model_dump(), self.metadata)
|
|
59
64
|
|
|
60
65
|
profiler_processor = self._get_profiler_processor()
|
|
61
|
-
pii_processor = self._get_pii_processor()
|
|
62
66
|
sink = self._get_sink()
|
|
63
|
-
|
|
67
|
+
|
|
68
|
+
# Only instantiate the PII Processor on demand
|
|
69
|
+
source_config: DatabaseServiceProfilerPipeline = cast(
|
|
70
|
+
DatabaseServiceProfilerPipeline, self.config.source.sourceConfig.config
|
|
71
|
+
)
|
|
72
|
+
if source_config.processPiiSensitive:
|
|
73
|
+
pii_processor = self._get_pii_processor()
|
|
74
|
+
self.steps = (profiler_processor, pii_processor, sink)
|
|
75
|
+
else:
|
|
76
|
+
self.steps = (profiler_processor, sink)
|
|
64
77
|
|
|
65
78
|
def test_connection(self):
|
|
66
79
|
service_config = self.config.source.serviceConnection.root.config
|