validmind 2.7.9__tar.gz → 2.8.10__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {validmind-2.7.9 → validmind-2.8.10}/PKG-INFO +5 -4
- {validmind-2.7.9 → validmind-2.8.10}/README.pypi.md +2 -1
- {validmind-2.7.9 → validmind-2.8.10}/pyproject.toml +3 -4
- {validmind-2.7.9 → validmind-2.8.10}/validmind/__init__.py +58 -10
- validmind-2.8.10/validmind/__version__.py +1 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/ai/test_descriptions.py +17 -73
- {validmind-2.7.9 → validmind-2.8.10}/validmind/api_client.py +18 -1
- {validmind-2.7.9 → validmind-2.8.10}/validmind/errors.py +1 -1
- {validmind-2.7.9 → validmind-2.8.10}/validmind/models/r_model.py +5 -1
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/comparison.py +28 -2
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/FeatureTargetCorrelationPlot.py +4 -9
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/ContextualRecall.py +1 -1
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/MeteorScore.py +1 -1
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/ToxicityScore.py +1 -1
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/embeddings/StabilityAnalysisRandomNoise.py +1 -1
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/embeddings/StabilityAnalysisSynonyms.py +1 -1
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/embeddings/StabilityAnalysisTranslation.py +1 -1
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/embeddings/utils.py +6 -9
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/ragas/utils.py +8 -7
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/MinimumROCAUCScore.py +3 -7
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/statsmodels/RegressionModelSummary.py +7 -7
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/prompt_validation/ai_powered_test.py +5 -4
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/run.py +5 -1
- {validmind-2.7.9 → validmind-2.8.10}/validmind/utils.py +35 -5
- {validmind-2.7.9 → validmind-2.8.10}/validmind/vm_models/result/result.py +43 -2
- validmind-2.7.9/validmind/__version__.py +0 -1
- validmind-2.7.9/validmind/ai/test_result_description/config.yaml +0 -29
- validmind-2.7.9/validmind/ai/test_result_description/context.py +0 -73
- validmind-2.7.9/validmind/ai/test_result_description/image_processing.py +0 -124
- validmind-2.7.9/validmind/ai/test_result_description/system.jinja +0 -39
- validmind-2.7.9/validmind/ai/test_result_description/user.jinja +0 -30
- {validmind-2.7.9 → validmind-2.8.10}/LICENSE +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/ai/utils.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/client.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/client_config.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/classification/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/classification/customer_churn.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/classification/datasets/bank_customer_churn.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/classification/datasets/taiwan_credit.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/classification/taiwan_credit.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/cluster/digits.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/credit_risk/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/credit_risk/datasets/lending_club_biased.csv.gz +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/credit_risk/datasets/lending_club_loan_data_2007_2014_clean.csv.gz +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/credit_risk/lending_club.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/credit_risk/lending_club_bias.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/llm/rag/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/llm/rag/datasets/rfp_existing_questions_client_1.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/llm/rag/datasets/rfp_existing_questions_client_2.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/llm/rag/datasets/rfp_existing_questions_client_3.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/llm/rag/datasets/rfp_existing_questions_client_4.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/llm/rag/datasets/rfp_existing_questions_client_5.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/llm/rag/rfp.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/nlp/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/nlp/cnn_dailymail.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/nlp/datasets/Covid_19.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/nlp/datasets/cnn_dailymail_100_with_predictions.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/nlp/datasets/cnn_dailymail_500_with_predictions.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/nlp/datasets/sentiments_with_predictions.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/nlp/twitter_covid_19.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/california_housing.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/fred/CPIAUCSL.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/fred/CSUSHPISA.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/fred/DRSFRMACBS.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/fred/FEDFUNDS.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/fred/GDP.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/fred/GDPC1.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/fred/GS10.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/fred/GS3.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/fred/GS5.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/fred/MORTGAGE30US.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/fred/UNRATE.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/fred_loan_rates.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/fred_loan_rates_test_1.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/fred_loan_rates_test_2.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/fred_loan_rates_test_3.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/fred_loan_rates_test_4.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/fred_loan_rates_test_5.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/datasets/leanding_club_loan_rates.csv +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/fred.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/fred_timeseries.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/lending_club.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/models/fred_loan_rates_model_1.pkl +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/models/fred_loan_rates_model_2.pkl +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/models/fred_loan_rates_model_3.pkl +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/models/fred_loan_rates_model_4.pkl +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/datasets/regression/models/fred_loan_rates_model_5.pkl +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/html_templates/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/html_templates/content_blocks.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/input_registry.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/logging.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/models/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/models/foundation.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/models/function.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/models/huggingface.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/models/metadata.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/models/pipeline.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/models/pytorch.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/models/sklearn.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/template.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/test_suites/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/test_suites/classifier.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/test_suites/cluster.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/test_suites/embeddings.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/test_suites/llm.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/test_suites/nlp.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/test_suites/parameters_optimization.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/test_suites/regression.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/test_suites/statsmodels_timeseries.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/test_suites/summarization.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/test_suites/tabular_datasets.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/test_suites/text_data.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/test_suites/time_series.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/__types__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/_store.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/ACFandPACFPlot.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/ADF.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/AutoAR.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/AutoMA.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/AutoStationarity.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/BivariateScatterPlots.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/BoxPierce.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/ChiSquaredFeaturesTable.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/ClassImbalance.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/DatasetDescription.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/DatasetSplit.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/DescriptiveStatistics.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/DickeyFullerGLS.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/Duplicates.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/EngleGrangerCoint.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/HighCardinality.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/HighPearsonCorrelation.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/IQROutliersBarPlot.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/IQROutliersTable.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/IsolationForestOutliers.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/JarqueBera.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/KPSS.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/LJungBox.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/LaggedCorrelationHeatmap.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/MissingValues.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/MissingValuesBarPlot.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/MutualInformation.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/PearsonCorrelationMatrix.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/PhillipsPerronArch.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/ProtectedClassesCombination.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/ProtectedClassesDescription.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/ProtectedClassesDisparity.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/ProtectedClassesThresholdOptimizer.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/RollingStatsPlot.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/RunsTest.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/ScatterPlot.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/ScoreBandDefaultRates.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/SeasonalDecompose.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/ShapiroWilk.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/Skewness.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/SpreadPlot.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/TabularCategoricalBarPlots.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/TabularDateTimeHistograms.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/TabularDescriptionTables.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/TabularNumericalHistograms.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/TargetRateBarPlots.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/TimeSeriesDescription.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/TimeSeriesDescriptiveStatistics.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/TimeSeriesFrequency.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/TimeSeriesHistogram.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/TimeSeriesLinePlot.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/TimeSeriesMissingValues.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/TimeSeriesOutliers.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/TooManyZeroValues.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/UniqueRows.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/WOEBinPlots.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/WOEBinTable.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/ZivotAndrewsArch.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/nlp/CommonWords.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/nlp/Hashtags.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/nlp/LanguageDetection.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/nlp/Mentions.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/nlp/PolarityAndSubjectivity.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/nlp/Punctuations.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/nlp/Sentiment.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/nlp/StopWords.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/nlp/TextDescription.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/nlp/Toxicity.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/nlp/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/decorator.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/load.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/BertScore.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/BleuScore.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/ClusterSizeDistribution.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/FeaturesAUC.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/ModelMetadata.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/ModelPredictionResiduals.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/RegardScore.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/RegressionResidualsPlot.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/RougeScore.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/TimeSeriesPredictionWithCI.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/TimeSeriesPredictionsPlot.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/TimeSeriesR2SquareBySegments.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/TokenDisparity.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/embeddings/ClusterDistribution.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/embeddings/CosineSimilarityComparison.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/embeddings/CosineSimilarityDistribution.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/embeddings/CosineSimilarityHeatmap.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/embeddings/DescriptiveAnalytics.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/embeddings/EmbeddingsVisualization2D.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/embeddings/EuclideanDistanceComparison.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/embeddings/EuclideanDistanceHeatmap.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/embeddings/PCAComponentsPairwisePlots.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/embeddings/StabilityAnalysisKeyword.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/embeddings/TSNEComponentsPairwisePlots.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/ragas/AnswerCorrectness.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/ragas/AspectCritic.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/ragas/ContextEntityRecall.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/ragas/ContextPrecision.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/ragas/ContextPrecisionWithoutReference.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/ragas/ContextRecall.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/ragas/Faithfulness.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/ragas/NoiseSensitivity.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/ragas/ResponseRelevancy.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/ragas/SemanticSimilarity.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/AdjustedMutualInformation.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/AdjustedRandIndex.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/CalibrationCurve.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/ClassifierPerformance.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/ClassifierThresholdOptimization.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/ClusterCosineSimilarity.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/ClusterPerformanceMetrics.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/CompletenessScore.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/ConfusionMatrix.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/FeatureImportance.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/FowlkesMallowsScore.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/HomogeneityScore.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/HyperParametersTuning.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/KMeansClustersOptimization.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/MinimumAccuracy.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/MinimumF1Score.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/ModelParameters.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/ModelsPerformanceComparison.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/OverfitDiagnosis.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/PermutationFeatureImportance.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/PopulationStabilityIndex.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/PrecisionRecallCurve.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/ROCCurve.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/RegressionErrors.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/RegressionErrorsComparison.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/RegressionPerformance.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/RegressionR2Square.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/RegressionR2SquareComparison.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/RobustnessDiagnosis.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/SHAPGlobalImportance.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/ScoreProbabilityAlignment.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/SilhouettePlot.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/TrainingTestDegradation.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/VMeasure.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/WeakspotsDiagnosis.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/statsmodels/AutoARIMA.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/statsmodels/CumulativePredictionProbabilities.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/statsmodels/DurbinWatsonTest.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/statsmodels/GINITable.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/statsmodels/KolmogorovSmirnov.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/statsmodels/Lilliefors.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/statsmodels/PredictionProbabilitiesHistogram.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/statsmodels/RegressionCoeffs.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/statsmodels/RegressionFeatureSignificance.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/statsmodels/RegressionModelForecastPlot.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/statsmodels/RegressionModelForecastPlotLevels.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/statsmodels/RegressionModelSensitivityPlot.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/statsmodels/RegressionPermutationFeatureImportance.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/statsmodels/ScorecardHistogram.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/statsmodels/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/statsmodels/statsutils.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/ongoing_monitoring/CalibrationCurveDrift.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/ongoing_monitoring/ClassDiscriminationDrift.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/ongoing_monitoring/ClassImbalanceDrift.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/ongoing_monitoring/ClassificationAccuracyDrift.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/ongoing_monitoring/ConfusionMatrixDrift.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/ongoing_monitoring/CumulativePredictionProbabilitiesDrift.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/ongoing_monitoring/FeatureDrift.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/ongoing_monitoring/PredictionAcrossEachFeature.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/ongoing_monitoring/PredictionCorrelation.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/ongoing_monitoring/PredictionProbabilitiesHistogramDrift.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/ongoing_monitoring/PredictionQuantilesAcrossFeatures.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/ongoing_monitoring/ROCCurveDrift.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/ongoing_monitoring/ScoreBandsDrift.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/ongoing_monitoring/ScorecardHistogramDrift.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/ongoing_monitoring/TargetPredictionDistributionPlot.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/output.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/prompt_validation/Bias.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/prompt_validation/Clarity.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/prompt_validation/Conciseness.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/prompt_validation/Delimitation.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/prompt_validation/NegativeInstruction.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/prompt_validation/Robustness.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/prompt_validation/Specificity.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/prompt_validation/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/test_providers.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/tests/utils.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/unit_metrics/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/unit_metrics/classification/Accuracy.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/unit_metrics/classification/F1.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/unit_metrics/classification/Precision.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/unit_metrics/classification/ROC_AUC.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/unit_metrics/classification/Recall.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/unit_metrics/regression/AdjustedRSquaredScore.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/unit_metrics/regression/GiniCoefficient.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/unit_metrics/regression/HuberLoss.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/unit_metrics/regression/KolmogorovSmirnovStatistic.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/unit_metrics/regression/MeanAbsoluteError.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/unit_metrics/regression/MeanAbsolutePercentageError.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/unit_metrics/regression/MeanBiasDeviation.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/unit_metrics/regression/MeanSquaredError.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/unit_metrics/regression/QuantileLoss.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/unit_metrics/regression/RSquaredScore.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/unit_metrics/regression/RootMeanSquaredError.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/vm_models/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/vm_models/dataset/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/vm_models/dataset/dataset.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/vm_models/dataset/utils.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/vm_models/figure.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/vm_models/input.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/vm_models/model.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/vm_models/result/__init__.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/vm_models/result/result.jinja +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/vm_models/result/utils.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/vm_models/test_suite/runner.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/vm_models/test_suite/summary.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/vm_models/test_suite/test.py +0 -0
- {validmind-2.7.9 → validmind-2.8.10}/validmind/vm_models/test_suite/test_suite.py +0 -0
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.3
|
2
2
|
Name: validmind
|
3
|
-
Version: 2.7.9
|
3
|
+
Version: 2.8.10
|
4
4
|
Summary: ValidMind Library
|
5
5
|
License: Commercial License
|
6
6
|
Author: Andres Rodriguez
|
@@ -15,8 +15,8 @@ Provides-Extra: all
|
|
15
15
|
Provides-Extra: huggingface
|
16
16
|
Provides-Extra: llm
|
17
17
|
Provides-Extra: pytorch
|
18
|
-
Provides-Extra: r-support
|
19
18
|
Requires-Dist: aiohttp[speedups]
|
19
|
+
Requires-Dist: anywidget (>=0.9.13,<0.10.0)
|
20
20
|
Requires-Dist: arch
|
21
21
|
Requires-Dist: bert-score (>=0.3.13)
|
22
22
|
Requires-Dist: catboost
|
@@ -42,7 +42,6 @@ Requires-Dist: pycocoevalcap (>=1.2,<2.0) ; extra == "all" or extra == "llm"
|
|
42
42
|
Requires-Dist: python-dotenv
|
43
43
|
Requires-Dist: ragas (>=0.2.3) ; extra == "all" or extra == "llm"
|
44
44
|
Requires-Dist: rouge (>=1)
|
45
|
-
Requires-Dist: rpy2 (>=3.5.10,<4.0.0) ; extra == "all" or extra == "r-support"
|
46
45
|
Requires-Dist: scikit-learn (<1.6.0)
|
47
46
|
Requires-Dist: scipy
|
48
47
|
Requires-Dist: scorecardpy (>=0.1.9.6,<0.2.0.0)
|
@@ -53,6 +52,7 @@ Requires-Dist: shap (==0.44.1)
|
|
53
52
|
Requires-Dist: statsmodels
|
54
53
|
Requires-Dist: tabulate (>=0.8.9,<0.9.0)
|
55
54
|
Requires-Dist: textblob (>=0.18.0.post0,<0.19.0)
|
55
|
+
Requires-Dist: tiktoken
|
56
56
|
Requires-Dist: torch (>=1.10.0) ; extra == "all" or extra == "llm" or extra == "pytorch"
|
57
57
|
Requires-Dist: tqdm
|
58
58
|
Requires-Dist: transformers (>=4.32.0,<5.0.0) ; extra == "all" or extra == "huggingface" or extra == "llm"
|
@@ -131,6 +131,7 @@ The ValidMind Library has optional dependencies that can be installed separately
|
|
131
131
|
- **R Models**: To use R models with the ValidMind Library, install the `r` extra:
|
132
132
|
|
133
133
|
```bash
|
134
|
-
pip install validmind[r-support]
|
134
|
+
pip install validmind
|
135
|
+
pip install rpy2
|
135
136
|
```
|
136
137
|
|
@@ -68,5 +68,6 @@ The ValidMind Library has optional dependencies that can be installed separately
|
|
68
68
|
- **R Models**: To use R models with the ValidMind Library, install the `r` extra:
|
69
69
|
|
70
70
|
```bash
|
71
|
-
pip install validmind[r-support]
|
71
|
+
pip install validmind
|
72
|
+
pip install rpy2
|
72
73
|
```
|
@@ -10,10 +10,11 @@ description = "ValidMind Library"
|
|
10
10
|
license = "Commercial License"
|
11
11
|
name = "validmind"
|
12
12
|
readme = "README.pypi.md"
|
13
|
-
version = "2.7.9"
|
13
|
+
version = "2.8.10"
|
14
14
|
|
15
15
|
[tool.poetry.dependencies]
|
16
16
|
aiohttp = {extras = ["speedups"], version = "*"}
|
17
|
+
anywidget = "^0.9.13"
|
17
18
|
arch = "*"
|
18
19
|
bert-score = ">=0.3.13"
|
19
20
|
catboost = "*"
|
@@ -40,7 +41,6 @@ python = ">=3.8.1,<3.12"
|
|
40
41
|
python-dotenv = "*"
|
41
42
|
ragas = {version = ">=0.2.3", optional = true}
|
42
43
|
rouge = ">=1"
|
43
|
-
rpy2 = {version = "^3.5.10", optional = true}
|
44
44
|
scikit-learn = "*,<1.6.0"
|
45
45
|
scipy = "*"
|
46
46
|
scorecardpy = "^0.1.9.6"
|
@@ -51,6 +51,7 @@ shap = "0.44.1"
|
|
51
51
|
statsmodels = "*"
|
52
52
|
tabulate = "^0.8.9"
|
53
53
|
textblob = "^0.18.0.post0"
|
54
|
+
tiktoken = "*"
|
54
55
|
torch = {version = ">=1.10.0", optional = true}
|
55
56
|
tqdm = "*"
|
56
57
|
transformers = {version = "^4.32.0", optional = true}
|
@@ -76,7 +77,6 @@ twine = "^4.0.2"
|
|
76
77
|
|
77
78
|
[tool.poetry.extras]
|
78
79
|
all = [
|
79
|
-
"rpy2",
|
80
80
|
"torch",
|
81
81
|
"transformers",
|
82
82
|
"pycocoevalcap",
|
@@ -94,7 +94,6 @@ llm = [
|
|
94
94
|
"langchain-openai",
|
95
95
|
]
|
96
96
|
pytorch = ["torch"]
|
97
|
-
r-support = ["rpy2"]
|
98
97
|
|
99
98
|
[build-system]
|
100
99
|
build-backend = "poetry.core.masonry.api"
|
@@ -30,8 +30,12 @@ vm.init(
|
|
30
30
|
|
31
31
|
After you have pasted the code snippet into your development source code and executed the code, the Python Library API will register with ValidMind. You can now use the ValidMind Library to document and test your models, and to upload to the ValidMind Platform.
|
32
32
|
"""
|
33
|
+
import threading
|
33
34
|
import warnings
|
34
35
|
|
36
|
+
import pkg_resources
|
37
|
+
from IPython.display import HTML, display
|
38
|
+
|
35
39
|
# Ignore Numba warnings. We are not requiring this package directly
|
36
40
|
from numba.core.errors import NumbaDeprecationWarning, NumbaPendingDeprecationWarning
|
37
41
|
|
@@ -51,30 +55,74 @@ from .client import ( # noqa: E402
|
|
51
55
|
)
|
52
56
|
from .tests.decorator import tags, tasks, test
|
53
57
|
from .tests.run import print_env
|
58
|
+
from .utils import is_notebook, parse_version
|
54
59
|
from .vm_models.result import RawData
|
55
60
|
|
61
|
+
__shown = False
|
62
|
+
|
63
|
+
|
64
|
+
def show_warning(installed, running):
|
65
|
+
global __shown
|
66
|
+
|
67
|
+
if __shown:
|
68
|
+
return
|
69
|
+
__shown = True
|
70
|
+
|
71
|
+
message = (
|
72
|
+
f"⚠️ This kernel is running an older version of validmind ({running}) "
|
73
|
+
f"than the latest version installed on your system ({installed}).\n\n"
|
74
|
+
"You may need to restart the kernel if you are experiencing issues."
|
75
|
+
)
|
76
|
+
display(HTML(f"<div style='color: red;'>{message}</div>"))
|
77
|
+
|
78
|
+
|
79
|
+
def check_version():
|
80
|
+
# get the installed vs running version of validmind
|
81
|
+
# to make sure we are using the latest installed version
|
82
|
+
# in case user has updated the package but forgot to restart the kernel
|
83
|
+
installed = pkg_resources.get_distribution("validmind").version
|
84
|
+
running = __version__
|
85
|
+
|
86
|
+
if parse_version(installed) > parse_version(running):
|
87
|
+
show_warning(installed, running)
|
88
|
+
|
89
|
+
# Schedule the next check for 5 minutes from now
|
90
|
+
timer = threading.Timer(300, check_version)
|
91
|
+
timer.daemon = True
|
92
|
+
timer.start()
|
93
|
+
|
94
|
+
|
95
|
+
if is_notebook():
|
96
|
+
check_version()
|
97
|
+
|
56
98
|
__all__ = [ # noqa
|
57
99
|
"__version__",
|
58
|
-
#
|
59
|
-
"datasets",
|
60
|
-
"errors",
|
61
|
-
"get_test_suite",
|
100
|
+
# main library API
|
62
101
|
"init",
|
102
|
+
"reload",
|
63
103
|
"init_dataset",
|
64
104
|
"init_model",
|
65
105
|
"init_r_model",
|
66
106
|
"preview_template",
|
67
|
-
"print_env",
|
68
|
-
"RawData",
|
69
|
-
"reload",
|
70
107
|
"run_documentation_tests",
|
108
|
+
# log metric function (for direct/bulk/retroactive logging of metrics)
|
109
|
+
"log_metric",
|
110
|
+
# test suite functions (less common)
|
111
|
+
"get_test_suite",
|
71
112
|
"run_test_suite",
|
113
|
+
# helper functions (for troubleshooting)
|
114
|
+
"print_env",
|
115
|
+
# decorators (for building tests)
|
72
116
|
"tags",
|
73
117
|
"tasks",
|
74
118
|
"test",
|
75
|
-
|
76
|
-
"
|
119
|
+
# raw data (for post-processing test results and building tests)
|
120
|
+
"RawData",
|
121
|
+
# submodules
|
122
|
+
"datasets",
|
123
|
+
"errors",
|
77
124
|
"vm_models",
|
125
|
+
"tests",
|
78
126
|
"unit_metrics",
|
79
|
-
"
|
127
|
+
"test_suites",
|
80
128
|
]
|
@@ -0,0 +1 @@
|
|
1
|
+
__version__ = "2.8.10"
|
@@ -4,70 +4,24 @@
|
|
4
4
|
|
5
5
|
import json
|
6
6
|
import os
|
7
|
-
import re
|
8
7
|
from concurrent.futures import ThreadPoolExecutor
|
9
8
|
from typing import List, Optional, Union
|
10
9
|
|
11
10
|
import tiktoken
|
12
|
-
from jinja2 import Template
|
13
11
|
|
14
12
|
from ..client_config import client_config
|
15
13
|
from ..logging import get_logger
|
16
14
|
from ..utils import NumpyEncoder, md_to_html, test_id_to_name
|
17
15
|
from ..vm_models.figure import Figure
|
18
16
|
from ..vm_models.result import ResultTable
|
19
|
-
from .utils import DescriptionFuture
|
17
|
+
from .utils import DescriptionFuture
|
20
18
|
|
21
19
|
__executor = ThreadPoolExecutor()
|
22
|
-
__prompt = None
|
23
20
|
|
24
21
|
logger = get_logger(__name__)
|
25
22
|
|
26
23
|
|
27
|
-
def _load_prompt():
|
28
|
-
global __prompt
|
29
|
-
|
30
|
-
if not __prompt:
|
31
|
-
folder_path = os.path.join(os.path.dirname(__file__), "test_result_description")
|
32
|
-
with open(os.path.join(folder_path, "system.jinja"), "r") as f:
|
33
|
-
system_prompt = f.read()
|
34
|
-
with open(os.path.join(folder_path, "user.jinja"), "r") as f:
|
35
|
-
user_prompt = f.read()
|
36
|
-
|
37
|
-
__prompt = (Template(system_prompt), Template(user_prompt))
|
38
|
-
|
39
|
-
return __prompt
|
40
|
-
|
41
|
-
|
42
|
-
def prompt_to_message(role, prompt):
|
43
|
-
if "[[IMAGE:" not in prompt:
|
44
|
-
return {"role": role, "content": prompt}
|
45
|
-
|
46
|
-
content = []
|
47
|
-
|
48
|
-
# Regex pattern to find [[IMAGE:<b64-data>]] markers
|
49
|
-
pattern = re.compile(r"\[\[IMAGE:(.*?)\]\]", re.DOTALL)
|
50
|
-
|
51
|
-
last_index = 0
|
52
|
-
for match in pattern.finditer(prompt):
|
53
|
-
# Text before the image marker
|
54
|
-
start, end = match.span()
|
55
|
-
if start > last_index:
|
56
|
-
content.append({"type": "text", "text": prompt[last_index:start]})
|
57
|
-
|
58
|
-
content.append({"type": "image_url", "image_url": {"url": match.group(1)}})
|
59
|
-
|
60
|
-
last_index = end
|
61
|
-
|
62
|
-
# Text after the last image
|
63
|
-
if last_index < len(prompt):
|
64
|
-
content.append({"type": "text", "text": prompt[last_index:]})
|
65
|
-
|
66
|
-
return {"role": role, "content": content}
|
67
|
-
|
68
|
-
|
69
24
|
def _get_llm_global_context():
|
70
|
-
|
71
25
|
# Get the context from the environment variable
|
72
26
|
context = os.getenv("VALIDMIND_LLM_DESCRIPTIONS_CONTEXT", "")
|
73
27
|
|
@@ -115,13 +69,13 @@ def generate_description(
|
|
115
69
|
title: Optional[str] = None,
|
116
70
|
):
|
117
71
|
"""Generate the description for the test results"""
|
72
|
+
from validmind.api_client import generate_test_result_description
|
73
|
+
|
118
74
|
if not tables and not figures and not metric:
|
119
75
|
raise ValueError(
|
120
76
|
"No tables, unit metric or figures provided - cannot generate description"
|
121
77
|
)
|
122
78
|
|
123
|
-
client, model = get_client_and_model()
|
124
|
-
|
125
79
|
# get last part of test id
|
126
80
|
test_name = title or test_id.split(".")[-1]
|
127
81
|
|
@@ -145,29 +99,18 @@ def generate_description(
|
|
145
99
|
else:
|
146
100
|
summary = None
|
147
101
|
|
148
|
-
|
149
|
-
|
150
|
-
|
151
|
-
|
152
|
-
|
153
|
-
|
154
|
-
|
155
|
-
|
156
|
-
|
157
|
-
|
158
|
-
|
159
|
-
|
160
|
-
messages = [
|
161
|
-
prompt_to_message("system", system.render(input_data)),
|
162
|
-
prompt_to_message("user", user.render(input_data)),
|
163
|
-
]
|
164
|
-
response = client.chat.completions.create(
|
165
|
-
model=model,
|
166
|
-
temperature=0.0,
|
167
|
-
messages=messages,
|
168
|
-
)
|
169
|
-
|
170
|
-
return response.choices[0].message.content
|
102
|
+
return generate_test_result_description(
|
103
|
+
{
|
104
|
+
"test_name": test_name,
|
105
|
+
"test_description": test_description,
|
106
|
+
"title": title,
|
107
|
+
"summary": _truncate_summary(summary, test_id),
|
108
|
+
"figures": [
|
109
|
+
figure._get_b64_url() for figure in ([] if tables else figures)
|
110
|
+
],
|
111
|
+
"context": _get_llm_global_context(),
|
112
|
+
}
|
113
|
+
)["content"]
|
171
114
|
|
172
115
|
|
173
116
|
def background_generate_description(
|
@@ -238,7 +181,8 @@ def get_result_description(
|
|
238
181
|
# Check the feature flag first, then the environment variable
|
239
182
|
llm_descriptions_enabled = (
|
240
183
|
client_config.can_generate_llm_test_descriptions()
|
241
|
-
and os.getenv("VALIDMIND_LLM_DESCRIPTIONS_ENABLED", "1")
|
184
|
+
and os.getenv("VALIDMIND_LLM_DESCRIPTIONS_ENABLED", "1").lower()
|
185
|
+
not in ["0", "false"]
|
242
186
|
)
|
243
187
|
|
244
188
|
# TODO: fix circular import
|
@@ -194,6 +194,7 @@ def init(
|
|
194
194
|
api_host: Optional[str] = None,
|
195
195
|
model: Optional[str] = None,
|
196
196
|
monitoring: bool = False,
|
197
|
+
generate_descriptions: Optional[bool] = None,
|
197
198
|
):
|
198
199
|
"""
|
199
200
|
Initializes the API client instances and calls the /ping endpoint to ensure
|
@@ -209,7 +210,7 @@ def init(
|
|
209
210
|
api_secret (str, optional): The API secret. Defaults to None.
|
210
211
|
api_host (str, optional): The API host. Defaults to None.
|
211
212
|
monitoring (bool): The ongoing monitoring flag. Defaults to False.
|
212
|
-
|
213
|
+
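generate_descriptions (bool, optional): Whether to use GenAI to generate test result descriptions. Defaults to None, which leaves the current `VALIDMIND_LLM_DESCRIPTIONS_ENABLED` setting unchanged (descriptions stay enabled unless that variable is `0` or `false`).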
|
213
214
|
Raises:
|
214
215
|
ValueError: If the API key and secret are not provided
|
215
216
|
"""
|
@@ -235,6 +236,9 @@ def init(
|
|
235
236
|
|
236
237
|
_monitoring = monitoring
|
237
238
|
|
239
|
+
if generate_descriptions is not None:
|
240
|
+
os.environ["VALIDMIND_LLM_DESCRIPTIONS_ENABLED"] = str(generate_descriptions)
|
241
|
+
|
238
242
|
reload()
|
239
243
|
|
240
244
|
|
@@ -487,3 +491,16 @@ def get_ai_key() -> Dict[str, Any]:
|
|
487
491
|
raise_api_error(r.text)
|
488
492
|
|
489
493
|
return r.json()
|
494
|
+
|
495
|
+
|
496
|
+
def generate_test_result_description(test_result_data: Dict[str, Any]) -> str:
|
497
|
+
r = requests.post(
|
498
|
+
url=_get_url("ai/generate/test_result_description"),
|
499
|
+
headers=_get_api_headers(),
|
500
|
+
json=test_result_data,
|
501
|
+
)
|
502
|
+
|
503
|
+
if r.status_code != 200:
|
504
|
+
raise_api_error(r.text)
|
505
|
+
|
506
|
+
return r.json()
|
@@ -228,7 +228,7 @@ class MissingRExtrasError(BaseError):
|
|
228
228
|
def description(self, *args, **kwargs):
|
229
229
|
return (
|
230
230
|
self.message
|
231
|
-
or "
|
231
|
+
or "`rpy2` is required to use R models. Please install it with `pip install rpy2`"
|
232
232
|
)
|
233
233
|
|
234
234
|
|
@@ -5,6 +5,7 @@
|
|
5
5
|
import numpy as np
|
6
6
|
import pandas as pd
|
7
7
|
|
8
|
+
from validmind.errors import MissingRExtrasError
|
8
9
|
from validmind.logging import get_logger
|
9
10
|
from validmind.vm_models.model import VMModel
|
10
11
|
|
@@ -125,7 +126,10 @@ class RModel(VMModel):
|
|
125
126
|
"""
|
126
127
|
Converts the predicted probabilities to classes
|
127
128
|
"""
|
128
|
-
|
129
|
+
try:
|
130
|
+
from rpy2.robjects import pandas2ri
|
131
|
+
except ImportError:
|
132
|
+
raise MissingRExtrasError()
|
129
133
|
|
130
134
|
# Activate the pandas conversion for rpy2
|
131
135
|
pandas2ri.activate()
|
@@ -15,7 +15,7 @@ from validmind.vm_models.figure import (
|
|
15
15
|
is_png_image,
|
16
16
|
)
|
17
17
|
from validmind.vm_models.input import VMInput
|
18
|
-
from validmind.vm_models.result import ResultTable, TestResult
|
18
|
+
from validmind.vm_models.result import RawData, ResultTable, TestResult
|
19
19
|
|
20
20
|
logger = get_logger(__name__)
|
21
21
|
|
@@ -312,6 +312,25 @@ def get_comparison_test_configs(
|
|
312
312
|
return test_configs
|
313
313
|
|
314
314
|
|
315
|
+
def _combine_raw_data(results: List[TestResult]) -> RawData:
|
316
|
+
"""Combine RawData objects"""
|
317
|
+
attribute_names = results[0].raw_data.__dict__.keys()
|
318
|
+
|
319
|
+
# check that all the raw data objects have the same attributes
|
320
|
+
for result in results:
|
321
|
+
if not isinstance(result.raw_data, RawData):
|
322
|
+
raise ValueError("All raw data objects must be of type RawData")
|
323
|
+
if result.raw_data.__dict__.keys() != attribute_names:
|
324
|
+
raise ValueError("RawData objects must have the same attributes")
|
325
|
+
|
326
|
+
return RawData(
|
327
|
+
**{
|
328
|
+
key: [getattr(result.raw_data, key) for result in results]
|
329
|
+
for key in attribute_names
|
330
|
+
}
|
331
|
+
)
|
332
|
+
|
333
|
+
|
315
334
|
def combine_results(
|
316
335
|
results: List[TestResult],
|
317
336
|
) -> Tuple[List[Any], Dict[str, List[Any]], Dict[str, List[Any]]]:
|
@@ -338,6 +357,9 @@ def combine_results(
|
|
338
357
|
# handle threshold tests (i.e. tests that have pass/fail bool status)
|
339
358
|
if results[0].passed is not None:
|
340
359
|
combined_outputs.append(all(result.passed for result in results))
|
360
|
+
# handle raw data (if any)
|
361
|
+
if results[0].raw_data:
|
362
|
+
combined_outputs.append(_combine_raw_data(results))
|
341
363
|
|
342
364
|
# combine inputs and params
|
343
365
|
combined_inputs = {}
|
@@ -359,4 +381,8 @@ def combine_results(
|
|
359
381
|
combined_inputs = _combine_dict_values(combined_inputs)
|
360
382
|
combined_params = _combine_dict_values(combined_params)
|
361
383
|
|
362
|
-
return
|
384
|
+
return (
|
385
|
+
tuple(combined_outputs),
|
386
|
+
combined_inputs,
|
387
|
+
combined_params,
|
388
|
+
)
|
{validmind-2.7.9 → validmind-2.8.10}/validmind/tests/data_validation/FeatureTargetCorrelationPlot.py
RENAMED
@@ -52,16 +52,10 @@ def FeatureTargetCorrelationPlot(dataset, fig_height=600):
|
|
52
52
|
- Not apt for models that employ complex feature interactions, like Decision Trees or Neural Networks, as the test
|
53
53
|
may not accurately reflect their importance.
|
54
54
|
"""
|
55
|
-
|
56
|
-
# Filter DataFrame based on features and target_column
|
57
55
|
df = dataset.df[dataset.feature_columns + [dataset.target_column]]
|
58
56
|
|
59
|
-
fig = _visualize_feature_target_correlation(
|
60
|
-
|
61
|
-
correlations = (
|
62
|
-
df.corr(numeric_only=True)[dataset.target_column]
|
63
|
-
.drop(dataset.target_column)
|
64
|
-
.to_frame()
|
57
|
+
fig, correlations = _visualize_feature_target_correlation(
|
58
|
+
df, dataset.target_column, fig_height
|
65
59
|
)
|
66
60
|
|
67
61
|
return fig, RawData(correlation_data=correlations)
|
@@ -100,4 +94,5 @@ def _visualize_feature_target_correlation(df, target_column, fig_height):
|
|
100
94
|
yaxis_title="",
|
101
95
|
height=fig_height, # Adjust the height value as needed
|
102
96
|
)
|
103
|
-
|
97
|
+
|
98
|
+
return fig, correlations
|
@@ -118,4 +118,4 @@ def ContextualRecall(dataset, model):
|
|
118
118
|
# Create a DataFrame from all collected statistics
|
119
119
|
result_df = pd.DataFrame(stats_df).reset_index().rename(columns={"index": "Metric"})
|
120
120
|
|
121
|
-
return (result_df, *
|
121
|
+
return (result_df, *figures, RawData(contextual_recall_scores=metrics_df))
|
@@ -117,4 +117,4 @@ def MeteorScore(dataset, model):
|
|
117
117
|
# Create a DataFrame from all collected statistics
|
118
118
|
result_df = pd.DataFrame(stats_df).reset_index().rename(columns={"index": "Metric"})
|
119
119
|
|
120
|
-
return (result_df, *
|
120
|
+
return (result_df, *figures, RawData(meteor_scores=metrics_df))
|
@@ -3,7 +3,6 @@
|
|
3
3
|
# SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
|
4
4
|
|
5
5
|
import numpy as np
|
6
|
-
import pandas as pd
|
7
6
|
import plotly.express as px
|
8
7
|
from sklearn.metrics.pairwise import cosine_similarity
|
9
8
|
|
@@ -18,14 +17,12 @@ def create_stability_analysis_result(
|
|
18
17
|
original_embeddings, perturbed_embeddings
|
19
18
|
).diagonal()
|
20
19
|
|
21
|
-
#
|
22
|
-
raw_data =
|
23
|
-
|
24
|
-
|
25
|
-
|
26
|
-
|
27
|
-
}
|
28
|
-
)
|
20
|
+
# Store raw data in a dictionary
|
21
|
+
raw_data = {
|
22
|
+
"original_embeddings": original_embeddings,
|
23
|
+
"perturbed_embeddings": perturbed_embeddings,
|
24
|
+
"similarities": similarities,
|
25
|
+
}
|
29
26
|
|
30
27
|
mean = np.mean(similarities)
|
31
28
|
passed = mean > mean_similarity_threshold
|
@@ -4,24 +4,25 @@
|
|
4
4
|
|
5
5
|
import os
|
6
6
|
|
7
|
-
from validmind.ai.utils import get_client_and_model
|
8
|
-
from validmind.client_config import client_config
|
7
|
+
from validmind.ai.utils import get_client_and_model, is_configured
|
9
8
|
|
10
9
|
EMBEDDINGS_MODEL = "text-embedding-3-small"
|
11
10
|
|
12
11
|
|
13
12
|
def get_ragas_config():
|
14
|
-
if not client_config.can_generate_llm_test_descriptions():
|
15
|
-
raise ValueError(
|
16
|
-
"LLM based descriptions are not enabled in the current configuration."
|
17
|
-
)
|
18
|
-
|
19
13
|
# import here since its an optional dependency
|
20
14
|
try:
|
21
15
|
from langchain_openai import ChatOpenAI, OpenAIEmbeddings
|
22
16
|
except ImportError:
|
23
17
|
raise ImportError("Please run `pip install validmind[llm]` to use LLM tests")
|
24
18
|
|
19
|
+
if not is_configured():
|
20
|
+
raise ValueError(
|
21
|
+
"LLM is not configured. Please set an `OPENAI_API_KEY` environment variable "
|
22
|
+
"or ensure that you are connected to the ValidMind API and ValidMind AI is "
|
23
|
+
"enabled for your account."
|
24
|
+
)
|
25
|
+
|
25
26
|
client, model = get_client_and_model()
|
26
27
|
os.environ["OPENAI_API_BASE"] = str(client.base_url)
|
27
28
|
|
{validmind-2.7.9 → validmind-2.8.10}/validmind/tests/model_validation/sklearn/MinimumROCAUCScore.py
RENAMED
@@ -62,18 +62,14 @@ def MinimumROCAUCScore(dataset: VMDataset, model: VMModel, min_threshold: float
|
|
62
62
|
lb = LabelBinarizer()
|
63
63
|
lb.fit(y_true)
|
64
64
|
|
65
|
-
y_true_binarized = lb.transform(y_true)
|
66
|
-
y_score_binarized = lb.transform(dataset.y_pred(model))
|
67
|
-
|
68
65
|
roc_auc = roc_auc_score(
|
69
|
-
y_true=
|
70
|
-
y_score=
|
66
|
+
y_true=lb.transform(y_true),
|
67
|
+
y_score=lb.transform(dataset.y_pred(model)),
|
71
68
|
average="macro",
|
72
69
|
)
|
73
70
|
|
74
71
|
else:
|
75
|
-
|
76
|
-
roc_auc = roc_auc_score(y_true=y_true, y_score=y_score_prob)
|
72
|
+
roc_auc = roc_auc_score(y_true=y_true, y_score=dataset.y_prob(model))
|
77
73
|
|
78
74
|
return [
|
79
75
|
{
|
@@ -45,17 +45,17 @@ def RegressionModelSummary(dataset: VMDataset, model: VMModel):
|
|
45
45
|
- A high R-Squared or Adjusted R-Squared may not necessarily indicate a good model, especially in cases of
|
46
46
|
overfitting.
|
47
47
|
"""
|
48
|
+
y_true = dataset.y
|
49
|
+
y_pred = dataset.y_pred(model)
|
50
|
+
|
48
51
|
return [
|
49
52
|
{
|
50
53
|
"Independent Variables": dataset.feature_columns,
|
51
|
-
"R-Squared": r2_score(
|
54
|
+
"R-Squared": r2_score(y_true, y_pred),
|
52
55
|
"Adjusted R-Squared": adj_r2_score(
|
53
|
-
dataset.
|
54
|
-
dataset.y_pred(model),
|
55
|
-
len(dataset.y),
|
56
|
-
len(dataset.feature_columns),
|
56
|
+
y_true, y_pred, len(y_true), len(dataset.feature_columns)
|
57
57
|
),
|
58
|
-
"MSE": mean_squared_error(
|
59
|
-
"RMSE": mean_squared_error(
|
58
|
+
"MSE": mean_squared_error(y_true, y_pred, squared=True),
|
59
|
+
"RMSE": mean_squared_error(y_true, y_pred, squared=False),
|
60
60
|
}
|
61
61
|
]
|
@@ -4,8 +4,7 @@
|
|
4
4
|
|
5
5
|
import re
|
6
6
|
|
7
|
-
from validmind.ai.utils import get_client_and_model
|
8
|
-
from validmind.client_config import client_config
|
7
|
+
from validmind.ai.utils import get_client_and_model, is_configured
|
9
8
|
|
10
9
|
missing_prompt_message = """
|
11
10
|
Cannot run prompt validation tests on a model with no prompt.
|
@@ -25,9 +24,11 @@ def call_model(
|
|
25
24
|
system_prompt: str, user_prompt: str, temperature: float = 0.0, seed: int = 42
|
26
25
|
):
|
27
26
|
"""Call LLM with the given prompts and return the response"""
|
28
|
-
if not
|
27
|
+
if not is_configured():
|
29
28
|
raise ValueError(
|
30
|
-
"LLM
|
29
|
+
"LLM is not configured. Please set an `OPENAI_API_KEY` environment variable "
|
30
|
+
"or ensure that you are connected to the ValidMind API and ValidMind AI is "
|
31
|
+
"enabled for your account."
|
31
32
|
)
|
32
33
|
|
33
34
|
client, model = get_client_and_model()
|