semantic-link-labs 0.8.3-py3-none-any.whl → 0.8.5-py3-none-any.whl
This diff shows the content of two publicly released versions of the package, as they appear in their respective public registries. It is provided for informational purposes only.
- {semantic_link_labs-0.8.3.dist-info → semantic_link_labs-0.8.5.dist-info}/METADATA +38 -8
- {semantic_link_labs-0.8.3.dist-info → semantic_link_labs-0.8.5.dist-info}/RECORD +109 -104
- {semantic_link_labs-0.8.3.dist-info → semantic_link_labs-0.8.5.dist-info}/WHEEL +1 -1
- sempy_labs/__init__.py +53 -1
- sempy_labs/_bpa_translation/_model/_translations_am-ET.po +24 -5
- sempy_labs/_bpa_translation/_model/_translations_ar-AE.po +28 -4
- sempy_labs/_bpa_translation/_model/_translations_bg-BG.po +34 -4
- sempy_labs/_bpa_translation/_model/_translations_ca-ES.po +33 -4
- sempy_labs/_bpa_translation/_model/_translations_cs-CZ.po +31 -4
- sempy_labs/_bpa_translation/_model/_translations_da-DK.po +31 -4
- sempy_labs/_bpa_translation/_model/_translations_de-DE.po +34 -4
- sempy_labs/_bpa_translation/_model/_translations_el-GR.po +36 -4
- sempy_labs/_bpa_translation/_model/_translations_es-ES.po +90 -58
- sempy_labs/_bpa_translation/_model/_translations_fa-IR.po +31 -5
- sempy_labs/_bpa_translation/_model/_translations_fi-FI.po +31 -4
- sempy_labs/_bpa_translation/_model/_translations_fr-FR.po +34 -4
- sempy_labs/_bpa_translation/_model/_translations_ga-IE.po +34 -4
- sempy_labs/_bpa_translation/_model/_translations_he-IL.po +28 -4
- sempy_labs/_bpa_translation/_model/_translations_hi-IN.po +32 -4
- sempy_labs/_bpa_translation/_model/_translations_hu-HU.po +32 -4
- sempy_labs/_bpa_translation/_model/_translations_id-ID.po +32 -4
- sempy_labs/_bpa_translation/_model/_translations_is-IS.po +31 -4
- sempy_labs/_bpa_translation/_model/_translations_it-IT.po +34 -4
- sempy_labs/_bpa_translation/_model/_translations_ja-JP.po +24 -4
- sempy_labs/_bpa_translation/_model/_translations_ko-KR.po +72 -56
- sempy_labs/_bpa_translation/_model/_translations_mt-MT.po +34 -4
- sempy_labs/_bpa_translation/_model/_translations_nl-NL.po +34 -4
- sempy_labs/_bpa_translation/_model/_translations_pl-PL.po +95 -71
- sempy_labs/_bpa_translation/_model/_translations_pt-BR.po +32 -4
- sempy_labs/_bpa_translation/_model/_translations_pt-PT.po +32 -4
- sempy_labs/_bpa_translation/_model/_translations_ro-RO.po +33 -4
- sempy_labs/_bpa_translation/_model/_translations_ru-RU.po +34 -4
- sempy_labs/_bpa_translation/_model/_translations_sk-SK.po +31 -4
- sempy_labs/_bpa_translation/_model/_translations_sl-SL.po +32 -4
- sempy_labs/_bpa_translation/_model/_translations_sv-SE.po +32 -4
- sempy_labs/_bpa_translation/_model/_translations_ta-IN.po +32 -4
- sempy_labs/_bpa_translation/_model/_translations_te-IN.po +31 -4
- sempy_labs/_bpa_translation/_model/_translations_th-TH.po +31 -4
- sempy_labs/_bpa_translation/_model/_translations_tr-TR.po +32 -4
- sempy_labs/_bpa_translation/_model/_translations_uk-UA.po +100 -72
- sempy_labs/_bpa_translation/_model/_translations_zh-CN.po +23 -5
- sempy_labs/_bpa_translation/_model/_translations_zu-ZA.po +32 -4
- sempy_labs/_capacities.py +49 -14
- sempy_labs/_capacity_migration.py +1 -7
- sempy_labs/_data_pipelines.py +6 -0
- sempy_labs/_dataflows.py +118 -1
- sempy_labs/_dax.py +189 -3
- sempy_labs/_deployment_pipelines.py +13 -7
- sempy_labs/_environments.py +6 -0
- sempy_labs/_eventhouses.py +6 -0
- sempy_labs/_eventstreams.py +6 -0
- sempy_labs/_external_data_shares.py +6 -4
- sempy_labs/_generate_semantic_model.py +26 -3
- sempy_labs/_git.py +14 -14
- sempy_labs/_helper_functions.py +197 -1
- sempy_labs/_icons.py +55 -22
- sempy_labs/_kql_databases.py +6 -0
- sempy_labs/_kql_querysets.py +6 -0
- sempy_labs/_list_functions.py +1 -1
- sempy_labs/_managed_private_endpoints.py +166 -0
- sempy_labs/_mirrored_databases.py +428 -0
- sempy_labs/_mirrored_warehouses.py +2 -0
- sempy_labs/_ml_experiments.py +6 -0
- sempy_labs/_ml_models.py +7 -1
- sempy_labs/_model_bpa.py +215 -181
- sempy_labs/_model_bpa_bulk.py +46 -42
- sempy_labs/_model_bpa_rules.py +8 -3
- sempy_labs/_model_dependencies.py +41 -87
- sempy_labs/_notebooks.py +107 -12
- sempy_labs/_query_scale_out.py +8 -6
- sempy_labs/_refresh_semantic_model.py +299 -49
- sempy_labs/_spark.py +12 -5
- sempy_labs/_translations.py +2 -0
- sempy_labs/_vertipaq.py +89 -86
- sempy_labs/_warehouses.py +79 -0
- sempy_labs/_workloads.py +128 -0
- sempy_labs/_workspace_identity.py +4 -4
- sempy_labs/_workspaces.py +14 -1
- sempy_labs/admin/__init__.py +2 -0
- sempy_labs/admin/_basic_functions.py +131 -43
- sempy_labs/admin/_domains.py +18 -18
- sempy_labs/directlake/__init__.py +2 -0
- sempy_labs/directlake/_directlake_schema_sync.py +2 -1
- sempy_labs/directlake/_dl_helper.py +4 -1
- sempy_labs/directlake/_get_shared_expression.py +7 -1
- sempy_labs/directlake/_guardrails.py +2 -1
- sempy_labs/directlake/_show_unsupported_directlake_objects.py +1 -7
- sempy_labs/directlake/_update_directlake_model_lakehouse_connection.py +78 -0
- sempy_labs/directlake/_update_directlake_partition_entity.py +13 -32
- sempy_labs/directlake/_warm_cache.py +10 -9
- sempy_labs/lakehouse/_get_lakehouse_tables.py +6 -2
- sempy_labs/lakehouse/_shortcuts.py +4 -0
- sempy_labs/migration/_create_pqt_file.py +5 -2
- sempy_labs/migration/_migrate_calctables_to_lakehouse.py +3 -2
- sempy_labs/migration/_migrate_calctables_to_semantic_model.py +2 -0
- sempy_labs/migration/_migrate_model_objects_to_semantic_model.py +2 -8
- sempy_labs/migration/_migrate_tables_columns_to_semantic_model.py +17 -0
- sempy_labs/migration/_migration_validation.py +2 -0
- sempy_labs/migration/_refresh_calc_tables.py +1 -0
- sempy_labs/report/__init__.py +6 -1
- sempy_labs/report/_download_report.py +75 -0
- sempy_labs/report/_generate_report.py +6 -0
- sempy_labs/report/_paginated.py +74 -0
- sempy_labs/report/_report_functions.py +6 -0
- sempy_labs/report/_report_rebind.py +2 -0
- sempy_labs/report/_reportwrapper.py +4 -2
- sempy_labs/tom/_model.py +135 -68
- {semantic_link_labs-0.8.3.dist-info → semantic_link_labs-0.8.5.dist-info}/LICENSE +0 -0
- {semantic_link_labs-0.8.3.dist-info → semantic_link_labs-0.8.5.dist-info}/top_level.txt +0 -0
sempy_labs/_model_bpa.py
CHANGED
@@ -56,7 +56,7 @@ def run_model_bpa(
     extended : bool, default=False
         If True, runs the set_vertipaq_annotations function to collect Vertipaq Analyzer statistics to be used in the analysis of the semantic model.
     language : str, default=None
-        Specifying a language code (i.e. 'it-IT' for Italian) will auto-translate the Category, Rule Name and Description into the specified language.
+        Specifying a language name or code (i.e. 'it-IT' for Italian) will auto-translate the Category, Rule Name and Description into the specified language.
         Defaults to None which resolves to English.

     Returns
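For context, a minimal usage sketch of this parameter; the dataset and workspace names below are hypothetical placeholders, and 'it-IT' is the code from the docstring example:

    import sempy_labs as labs

    # Hypothetical dataset/workspace names. Passing language='it-IT'
    # auto-translates the Category, Rule Name and Description columns;
    # language=None (the default) keeps the English rule text.
    labs.run_model_bpa(
        dataset="Sales Model",
        workspace="Main Workspace",
        language="it-IT",
    )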
@@ -113,6 +113,7 @@ def run_model_bpa(
         )

     if extended:
+        icons.sll_tags.append("ModelBPAExtended")
         with connect_semantic_model(
             dataset=dataset, workspace=workspace, readonly=False
         ) as tom:
@@ -122,210 +123,239 @@ def run_model_bpa(
         dataset=dataset, workspace=workspace, readonly=True
     ) as tom:

-        translation_file = (
-            f"{current_dir}/_bpa_translation/_model/_translations_{language}.po"
+        # Do not run BPA for models with no tables
+        if tom.model.Tables.Count == 0:
+            print(
+                f"{icons.warning} The '{dataset}' semantic model within the '{workspace}' workspace has no tables and therefore there are no valid BPA results."
             )
+            finalDF = pd.DataFrame(
+                columns=[
+                    "Category",
+                    "Rule Name",
+                    "Severity",
+                    "Object Type",
+                    "Object Name",
+                    "Description",
+                    "URL",
+                ]
+            )
+        else:
+            dep = get_model_calc_dependencies(dataset=dataset, workspace=workspace)

+            def translate_using_po(rule_file):
+                current_dir = os.path.dirname(os.path.abspath(__file__))
+                translation_file = (
+                    f"{current_dir}/_bpa_translation/_model/_translations_{language}.po"
+                )
+                for c in ["Category", "Description", "Rule Name"]:
+                    po = polib.pofile(translation_file)
+                    for entry in po:
+                        if entry.tcomment == c.lower().replace(" ", "_"):
+                            rule_file.loc[rule_file["Rule Name"] == entry.msgid, c] = (
+                                entry.msgstr
+                            )

-        if language is not None and rules is None and language in language_list:
-            rules = model_bpa_rules(dependencies=dep)
-            translate_using_po(rules)
-            translated = True
-        if rules is None:
-            rules = model_bpa_rules(dependencies=dep)
-        if language is not None and not translated:
+            translated = False

+            # Translations
+            if language is not None and rules is None and language in language_list:
+                rules = model_bpa_rules(dependencies=dep)
+                translate_using_po(rules)
+                translated = True
+            if rules is None:
+                rules = model_bpa_rules(dependencies=dep)
+            if language is not None and not translated:

-            from pyspark.sql import SparkSession
+                def translate_using_spark(rule_file):

+                    from synapse.ml.services import Translate
+                    from pyspark.sql import SparkSession

-                    StructField("Rule Name", StringType(), True),
-                    StructField("Description", StringType(), True),
-                ]
-            )
+                    rules_temp = rule_file.copy()
+                    rules_temp = rules_temp.drop(
+                        ["Expression", "URL", "Severity"], axis=1
+                    )

-                .setTextCol(clm)
-                .setToLanguage(language)
-                .setOutputCol("translation")
-                .setConcurrency(5)
+                    schema = StructType(
+                        [
+                            StructField("Category", StringType(), True),
+                            StructField("Scope", StringType(), True),
+                            StructField("Rule Name", StringType(), True),
+                            StructField("Description", StringType(), True),
+                        ]
                     )

+                    spark = SparkSession.builder.getOrCreate()
+                    dfRules = spark.createDataFrame(rules_temp, schema)
+
+                    columns = ["Category", "Rule Name", "Description"]
+                    for clm in columns:
+                        translate = (
+                            Translate()
+                            .setTextCol(clm)
+                            .setToLanguage(language)
+                            .setOutputCol("translation")
+                            .setConcurrency(5)
                         )
+
+                        if clm == "Rule Name":
+                            transDF = (
+                                translate.transform(dfRules)
+                                .withColumn(
+                                    "translation",
+                                    flatten(col("translation.translations")),
+                                )
+                                .withColumn("translation", col("translation.text"))
+                                .select(clm, "translation")
+                            )
+                        else:
+                            transDF = (
+                                translate.transform(dfRules)
+                                .withColumn(
+                                    "translation",
+                                    flatten(col("translation.translations")),
+                                )
+                                .withColumn("translation", col("translation.text"))
+                                .select("Rule Name", clm, "translation")
                             )
-                .withColumn("translation", col("translation.text"))
-                .select("Rule Name", clm, "translation")
-            )

+                        df_panda = transDF.toPandas()
+                        rule_file = pd.merge(
+                            rule_file,
+                            df_panda[["Rule Name", "translation"]],
+                            on="Rule Name",
+                            how="left",
+                        )

+                        rule_file = rule_file.rename(
+                            columns={"translation": f"{clm}Translated"}
+                        )
+                        rule_file[f"{clm}Translated"] = rule_file[
+                            f"{clm}Translated"
+                        ].apply(lambda x: x[0] if x is not None else None)

+                    for clm in columns:
+                        rule_file = rule_file.drop([clm], axis=1)
+                        rule_file = rule_file.rename(columns={f"{clm}Translated": clm})

+                    return rule_file

+                rules = translate_using_spark(rules)

+            rules.loc[rules["Severity"] == "Warning", "Severity"] = icons.warning
+            rules.loc[rules["Severity"] == "Error", "Severity"] = icons.error
+            rules.loc[rules["Severity"] == "Info", "Severity"] = icons.info

+            pd.set_option("display.max_colwidth", 1000)

+            violations = pd.DataFrame(columns=["Object Name", "Scope", "Rule Name"])

+            scope_to_dataframe = {
+                "Relationship": (
+                    tom.model.Relationships,
+                    lambda obj: create_relationship_name(
+                        obj.FromTable.Name,
+                        obj.FromColumn.Name,
+                        obj.ToTable.Name,
+                        obj.ToColumn.Name,
+                    ),
                 ),
+                "Column": (
+                    tom.all_columns(),
+                    lambda obj: format_dax_object_name(obj.Parent.Name, obj.Name),
+                ),
+                "Measure": (tom.all_measures(), lambda obj: obj.Name),
+                "Hierarchy": (
+                    tom.all_hierarchies(),
+                    lambda obj: format_dax_object_name(obj.Parent.Name, obj.Name),
+                ),
+                "Table": (tom.model.Tables, lambda obj: obj.Name),
+                "Role": (tom.model.Roles, lambda obj: obj.Name),
+                "Model": (tom.model, lambda obj: obj.Model.Name),
+                "Calculation Item": (
+                    tom.all_calculation_items(),
+                    lambda obj: format_dax_object_name(obj.Parent.Table.Name, obj.Name),
+                ),
+                "Row Level Security": (
+                    tom.all_rls(),
+                    lambda obj: format_dax_object_name(obj.Parent.Name, obj.Name),
+                ),
+                "Partition": (
+                    tom.all_partitions(),
+                    lambda obj: format_dax_object_name(obj.Parent.Name, obj.Name),
+                ),
+            }
+
+            for i, r in rules.iterrows():
+                ruleName = r["Rule Name"]
+                expr = r["Expression"]
+                scopes = r["Scope"]
+
+                if isinstance(scopes, str):
+                    scopes = [scopes]
+
+                for scope in scopes:
+                    func = scope_to_dataframe[scope][0]
+                    nm = scope_to_dataframe[scope][1]
+
+                    if scope == "Model":
+                        x = []
+                        if expr(func, tom):
+                            x = ["Model"]
+                    elif scope == "Measure":
+                        x = [nm(obj) for obj in tom.all_measures() if expr(obj, tom)]
+                    elif scope == "Column":
+                        x = [nm(obj) for obj in tom.all_columns() if expr(obj, tom)]
+                    elif scope == "Partition":
+                        x = [nm(obj) for obj in tom.all_partitions() if expr(obj, tom)]
+                    elif scope == "Hierarchy":
+                        x = [nm(obj) for obj in tom.all_hierarchies() if expr(obj, tom)]
+                    elif scope == "Table":
+                        x = [nm(obj) for obj in tom.model.Tables if expr(obj, tom)]
+                    elif scope == "Relationship":
+                        x = [
+                            nm(obj) for obj in tom.model.Relationships if expr(obj, tom)
+                        ]
+                    elif scope == "Role":
+                        x = [nm(obj) for obj in tom.model.Roles if expr(obj, tom)]
+                    elif scope == "Row Level Security":
+                        x = [nm(obj) for obj in tom.all_rls() if expr(obj, tom)]
+                    elif scope == "Calculation Item":
+                        x = [
+                            nm(obj)
+                            for obj in tom.all_calculation_items()
+                            if expr(obj, tom)
+                        ]
+
+                    if len(x) > 0:
+                        new_data = {
+                            "Object Name": x,
+                            "Scope": scope,
+                            "Rule Name": ruleName,
+                        }
+                        violations = pd.concat(
+                            [violations, pd.DataFrame(new_data)], ignore_index=True
+                        )

+            prepDF = pd.merge(
+                violations,
+                rules[["Rule Name", "Category", "Severity", "Description", "URL"]],
+                left_on="Rule Name",
+                right_on="Rule Name",
+                how="left",
+            )
+            prepDF.rename(columns={"Scope": "Object Type"}, inplace=True)
+            finalDF = prepDF[
+                [
+                    "Category",
+                    "Rule Name",
+                    "Severity",
+                    "Object Type",
+                    "Object Name",
+                    "Description",
+                    "URL",
+                ]
             ]
-        ]

     if export:
         if not lakehouse_attached():
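The new translate_using_po helper resolves translations by matching each .po entry's translator comment (tcomment) against the column being translated, and its msgid against the English rule name. A self-contained sketch of that lookup with polib, using a tiny in-memory catalog instead of the shipped _translations_<language>.po files; the rule name and Italian text here are illustrative only:

    import pandas as pd
    import polib

    # In-memory stand-in for one of the shipped .po translation files.
    po = polib.POFile()
    po.append(
        polib.POEntry(
            msgid="Remove unnecessary columns",         # English rule name (illustrative)
            msgstr="Rimuovere le colonne non necessarie",
            tcomment="rule_name",                       # column key: "Rule Name" -> "rule_name"
        )
    )

    rules = pd.DataFrame({"Rule Name": ["Remove unnecessary columns"]})

    # Same matching logic as translate_using_po: tcomment picks the column,
    # msgid locates the row, msgstr supplies the translated value.
    for c in ["Rule Name"]:
        for entry in po:
            if entry.tcomment == c.lower().replace(" ", "_"):
                rules.loc[rules["Rule Name"] == entry.msgid, c] = entry.msgstr

    print(rules)  # the Rule Name column now holds the Italian text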
@@ -387,10 +417,14 @@ def run_model_bpa(
         dfExport.insert(5, colName, dfExport.pop(colName))

         dfExport.columns = dfExport.columns.str.replace(" ", "_")
+        schema = {
+            key.replace(" ", "_"): value for key, value in icons.bpa_schema.items()
+        }
         save_as_delta_table(
             dataframe=dfExport,
             delta_table_name=delta_table_name,
             write_mode="append",
+            schema=schema,
             merge_schema=True,
         )
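Because the export first rewrites the dataframe's column names with str.replace(" ", "_"), the schema passed to save_as_delta_table must be keyed the same way. A small sketch of that normalization, with a hypothetical stand-in for icons.bpa_schema (the real value types are not shown in this diff):

    # Hypothetical subset of icons.bpa_schema (column name -> column type).
    bpa_schema = {"Rule Name": "string", "Object Type": "string", "RunId": "long"}

    # Keys must match the underscored dataframe columns produced above.
    schema = {key.replace(" ", "_"): value for key, value in bpa_schema.items()}

    print(schema)  # {'Rule_Name': 'string', 'Object_Type': 'string', 'RunId': 'long'}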
sempy_labs/_model_bpa_bulk.py
CHANGED
@@ -25,6 +25,7 @@ def run_model_bpa_bulk(
     language: Optional[str] = None,
     workspace: Optional[str | List[str]] = None,
     skip_models: Optional[str | List[str]] = ["ModelBPA", "Fabric Capacity Metrics"],
+    skip_models_in_workspace: Optional[dict] = None,
 ):
     """
     Runs the semantic model Best Practice Analyzer across all semantic models in a workspace (or all accessible workspaces).
@@ -33,8 +34,6 @@ def run_model_bpa_bulk(

     Parameters
     ----------
-    dataset : str
-        Name of the semantic model.
     rules : pandas.DataFrame, default=None
         A pandas dataframe containing rules to be evaluated. Based on the format of the dataframe produced by the model_bpa_rules function.
     extended : bool, default=False
@@ -47,6 +46,12 @@ def run_model_bpa_bulk(
         Defaults to None which scans all accessible workspaces.
     skip_models : str | List[str], default=['ModelBPA', 'Fabric Capacity Metrics']
         The semantic models to always skip when running this analysis.
+    skip_models_in_workspace : dict, default=None
+        A dictionary showing specific semantic models within specific workspaces to skip. See the example below:
+        {
+            "Workspace A": ["Dataset1", "Dataset2"],
+            "Workspace B": ["Dataset5", "Dataset 8"],
+        }
     """

     if not lakehouse_attached():
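A usage sketch of the new parameter, reusing the placeholder workspace and dataset names from the docstring example above:

    import sempy_labs as labs

    # Skip Dataset1/Dataset2 only when scanning Workspace A, and
    # Dataset5/'Dataset 8' only in Workspace B; skip_models still
    # applies globally across every workspace scanned.
    labs.run_model_bpa_bulk(
        workspace=["Workspace A", "Workspace B"],
        skip_models_in_workspace={
            "Workspace A": ["Dataset1", "Dataset2"],
            "Workspace B": ["Dataset5", "Dataset 8"],
        },
    )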
@@ -59,24 +64,6 @@ def run_model_bpa_bulk(

     skip_models.extend(["ModelBPA", "Fabric Capacity Metrics"])

-    cols = [
-        "Capacity Name",
-        "Capacity Id",
-        "Workspace Name",
-        "Workspace Id",
-        "Dataset Name",
-        "Dataset Id",
-        "Configured By",
-        "Rule Name",
-        "Category",
-        "Severity",
-        "Object Type",
-        "Object Name",
-        "Description",
-        "URL",
-        "RunId",
-        "Timestamp",
-    ]
     now = datetime.datetime.now()
     output_table = "modelbparesults"
     lakehouse_workspace = fabric.resolve_workspace_name()
@@ -86,7 +73,6 @@ def run_model_bpa_bulk(
     )
     lakeT = get_lakehouse_tables(lakehouse=lakehouse, workspace=lakehouse_workspace)
     lakeT_filt = lakeT[lakeT["Table Name"] == output_table]
-    # query = f"SELECT MAX(RunId) FROM {lakehouse}.{output_table}"
     if len(lakeT_filt) == 0:
         runId = 1
     else:
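The removed comment was a leftover from an earlier SQL-based way of finding the last run number; the surrounding code (unchanged here) keeps numbering runs from the existing modelbparesults table. A minimal sketch of that run-numbering pattern, with a hypothetical pandas dataframe standing in for the lakehouse table:

    import pandas as pd

    # Hypothetical stand-in for rows already saved to modelbparesults.
    existing = pd.DataFrame({"RunId": [1, 2, 3]})

    # First run ever -> 1; otherwise one past the highest stored RunId.
    runId = 1 if existing.empty else int(existing["RunId"].max()) + 1
    print(runId)  # 4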
@@ -102,13 +88,22 @@ def run_model_bpa_bulk(
     else:
         dfW_filt = dfW[dfW["Name"].isin(workspace)]

+    if len(dfW_filt) == 0:
+        raise ValueError(
+            f"{icons.red_dot} There are no valid workspaces to assess. This is likely due to not having proper permissions to the workspace(s) entered in the 'workspace' parameter."
+        )
+
     for i, r in dfW_filt.iterrows():
         wksp = r["Name"]
         wksp_id = r["Id"]
         capacity_id, capacity_name = resolve_workspace_capacity(workspace=wksp)
-        df = pd.DataFrame(columns=
+        df = pd.DataFrame(columns=list(icons.bpa_schema.keys()))
         dfD = fabric.list_datasets(workspace=wksp, mode="rest")

+        # Skip models in workspace
+        skip_models_wkspc = skip_models_in_workspace.get(wksp)
+        dfD = dfD[~dfD["Dataset Name"].isin(skip_models_wkspc)]
+
         # Exclude default semantic models
         if len(dfD) > 0:
             dfI = fabric.list_items(workspace=wksp)
@@ -137,8 +132,8 @@ def run_model_bpa_bulk(
                     rules=rules,
                     extended=extended,
                 )
-                bpa_df["Capacity Id"] = capacity_id
                 bpa_df["Capacity Name"] = capacity_name
+                bpa_df["Capacity Id"] = capacity_id
                 bpa_df["Workspace Name"] = wksp
                 bpa_df["Workspace Id"] = wksp_id
                 bpa_df["Dataset Name"] = dataset_name
@@ -146,7 +141,7 @@ def run_model_bpa_bulk(
                 bpa_df["Configured By"] = config_by
                 bpa_df["Timestamp"] = now
                 bpa_df["RunId"] = runId
-                bpa_df = bpa_df[
+                bpa_df = bpa_df[list(icons.bpa_schema.keys())]

                 bpa_df["RunId"] = bpa_df["RunId"].astype("int")

@@ -160,21 +155,33 @@ def run_model_bpa_bulk(
             )
             print(e)

-        df
+        if len(df) == 0:
+            print(
+                f"{icons.yellow_dot} No BPA results to save for the '{wksp}' workspace."
+            )
+        else:
+            df["Severity"].replace(icons.severity_mapping)

+            # Append save results individually for each workspace (so as not to create a giant dataframe)
+            print(
+                f"{icons.in_progress} Saving the Model BPA results of the '{wksp}' workspace to the '{output_table}' within the '{lakehouse}' lakehouse within the '{lakehouse_workspace}' workspace..."
+            )
+
+            schema = {
+                key.replace(" ", "_"): value
+                for key, value in icons.bpa_schema.items()
+            }
+
+            save_as_delta_table(
+                dataframe=df,
+                delta_table_name=output_table,
+                write_mode="append",
+                schema=schema,
+                merge_schema=True,
+            )
+            print(
+                f"{icons.green_dot} Saved BPA results to the '{output_table}' delta table."
+            )

     print(f"{icons.green_dot} Bulk BPA scan complete.")
|
|
|
203
210
|
The workspace in which the lakehouse resides.
|
|
204
211
|
Defaults to None which resolves to the workspace of the attached lakehouse
|
|
205
212
|
or if no lakehouse attached, resolves to the workspace of the notebook.
|
|
206
|
-
|
|
207
|
-
Returns
|
|
208
|
-
-------
|
|
209
213
|
"""
|
|
210
214
|
|
|
211
215
|
from sempy_labs._helper_functions import resolve_lakehouse_name
|
|
@@ -244,7 +248,7 @@ def create_model_bpa_semantic_model(
|
|
|
244
248
|
tom.model
|
|
245
249
|
|
|
246
250
|
dyn_connect()
|
|
247
|
-
|
|
251
|
+
icons.sll_tags.append("ModelBPABulk")
|
|
248
252
|
table_exists = False
|
|
249
253
|
with connect_semantic_model(
|
|
250
254
|
dataset=dataset, readonly=False, workspace=lakehouse_workspace
|