semantic-link-labs 0.12.8 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (243)
  1. semantic_link_labs-0.12.8.dist-info/METADATA +354 -0
  2. semantic_link_labs-0.12.8.dist-info/RECORD +243 -0
  3. semantic_link_labs-0.12.8.dist-info/WHEEL +5 -0
  4. semantic_link_labs-0.12.8.dist-info/licenses/LICENSE +21 -0
  5. semantic_link_labs-0.12.8.dist-info/top_level.txt +1 -0
  6. sempy_labs/__init__.py +606 -0
  7. sempy_labs/_a_lib_info.py +2 -0
  8. sempy_labs/_ai.py +437 -0
  9. sempy_labs/_authentication.py +264 -0
  10. sempy_labs/_bpa_translation/_model/_translations_am-ET.po +869 -0
  11. sempy_labs/_bpa_translation/_model/_translations_ar-AE.po +908 -0
  12. sempy_labs/_bpa_translation/_model/_translations_bg-BG.po +968 -0
  13. sempy_labs/_bpa_translation/_model/_translations_ca-ES.po +963 -0
  14. sempy_labs/_bpa_translation/_model/_translations_cs-CZ.po +943 -0
  15. sempy_labs/_bpa_translation/_model/_translations_da-DK.po +945 -0
  16. sempy_labs/_bpa_translation/_model/_translations_de-DE.po +988 -0
  17. sempy_labs/_bpa_translation/_model/_translations_el-GR.po +993 -0
  18. sempy_labs/_bpa_translation/_model/_translations_es-ES.po +971 -0
  19. sempy_labs/_bpa_translation/_model/_translations_fa-IR.po +933 -0
  20. sempy_labs/_bpa_translation/_model/_translations_fi-FI.po +942 -0
  21. sempy_labs/_bpa_translation/_model/_translations_fr-FR.po +994 -0
  22. sempy_labs/_bpa_translation/_model/_translations_ga-IE.po +967 -0
  23. sempy_labs/_bpa_translation/_model/_translations_he-IL.po +902 -0
  24. sempy_labs/_bpa_translation/_model/_translations_hi-IN.po +944 -0
  25. sempy_labs/_bpa_translation/_model/_translations_hu-HU.po +963 -0
  26. sempy_labs/_bpa_translation/_model/_translations_id-ID.po +946 -0
  27. sempy_labs/_bpa_translation/_model/_translations_is-IS.po +939 -0
  28. sempy_labs/_bpa_translation/_model/_translations_it-IT.po +986 -0
  29. sempy_labs/_bpa_translation/_model/_translations_ja-JP.po +846 -0
  30. sempy_labs/_bpa_translation/_model/_translations_ko-KR.po +839 -0
  31. sempy_labs/_bpa_translation/_model/_translations_mt-MT.po +967 -0
  32. sempy_labs/_bpa_translation/_model/_translations_nl-NL.po +978 -0
  33. sempy_labs/_bpa_translation/_model/_translations_pl-PL.po +962 -0
  34. sempy_labs/_bpa_translation/_model/_translations_pt-BR.po +962 -0
  35. sempy_labs/_bpa_translation/_model/_translations_pt-PT.po +957 -0
  36. sempy_labs/_bpa_translation/_model/_translations_ro-RO.po +968 -0
  37. sempy_labs/_bpa_translation/_model/_translations_ru-RU.po +964 -0
  38. sempy_labs/_bpa_translation/_model/_translations_sk-SK.po +952 -0
  39. sempy_labs/_bpa_translation/_model/_translations_sl-SL.po +950 -0
  40. sempy_labs/_bpa_translation/_model/_translations_sv-SE.po +942 -0
  41. sempy_labs/_bpa_translation/_model/_translations_ta-IN.po +976 -0
  42. sempy_labs/_bpa_translation/_model/_translations_te-IN.po +947 -0
  43. sempy_labs/_bpa_translation/_model/_translations_th-TH.po +924 -0
  44. sempy_labs/_bpa_translation/_model/_translations_tr-TR.po +953 -0
  45. sempy_labs/_bpa_translation/_model/_translations_uk-UA.po +961 -0
  46. sempy_labs/_bpa_translation/_model/_translations_zh-CN.po +804 -0
  47. sempy_labs/_bpa_translation/_model/_translations_zu-ZA.po +969 -0
  48. sempy_labs/_capacities.py +1198 -0
  49. sempy_labs/_capacity_migration.py +660 -0
  50. sempy_labs/_clear_cache.py +351 -0
  51. sempy_labs/_connections.py +610 -0
  52. sempy_labs/_dashboards.py +69 -0
  53. sempy_labs/_data_access_security.py +98 -0
  54. sempy_labs/_data_pipelines.py +162 -0
  55. sempy_labs/_dataflows.py +668 -0
  56. sempy_labs/_dax.py +501 -0
  57. sempy_labs/_daxformatter.py +80 -0
  58. sempy_labs/_delta_analyzer.py +467 -0
  59. sempy_labs/_delta_analyzer_history.py +301 -0
  60. sempy_labs/_dictionary_diffs.py +221 -0
  61. sempy_labs/_documentation.py +147 -0
  62. sempy_labs/_domains.py +51 -0
  63. sempy_labs/_eventhouses.py +182 -0
  64. sempy_labs/_external_data_shares.py +230 -0
  65. sempy_labs/_gateways.py +521 -0
  66. sempy_labs/_generate_semantic_model.py +521 -0
  67. sempy_labs/_get_connection_string.py +84 -0
  68. sempy_labs/_git.py +543 -0
  69. sempy_labs/_graphQL.py +90 -0
  70. sempy_labs/_helper_functions.py +2833 -0
  71. sempy_labs/_icons.py +149 -0
  72. sempy_labs/_job_scheduler.py +609 -0
  73. sempy_labs/_kql_databases.py +149 -0
  74. sempy_labs/_kql_querysets.py +124 -0
  75. sempy_labs/_kusto.py +137 -0
  76. sempy_labs/_labels.py +124 -0
  77. sempy_labs/_list_functions.py +1720 -0
  78. sempy_labs/_managed_private_endpoints.py +253 -0
  79. sempy_labs/_mirrored_databases.py +416 -0
  80. sempy_labs/_mirrored_warehouses.py +60 -0
  81. sempy_labs/_ml_experiments.py +113 -0
  82. sempy_labs/_model_auto_build.py +140 -0
  83. sempy_labs/_model_bpa.py +557 -0
  84. sempy_labs/_model_bpa_bulk.py +378 -0
  85. sempy_labs/_model_bpa_rules.py +859 -0
  86. sempy_labs/_model_dependencies.py +343 -0
  87. sempy_labs/_mounted_data_factories.py +123 -0
  88. sempy_labs/_notebooks.py +441 -0
  89. sempy_labs/_one_lake_integration.py +151 -0
  90. sempy_labs/_onelake.py +131 -0
  91. sempy_labs/_query_scale_out.py +433 -0
  92. sempy_labs/_refresh_semantic_model.py +435 -0
  93. sempy_labs/_semantic_models.py +468 -0
  94. sempy_labs/_spark.py +455 -0
  95. sempy_labs/_sql.py +241 -0
  96. sempy_labs/_sql_audit_settings.py +207 -0
  97. sempy_labs/_sql_endpoints.py +214 -0
  98. sempy_labs/_tags.py +201 -0
  99. sempy_labs/_translations.py +43 -0
  100. sempy_labs/_user_delegation_key.py +44 -0
  101. sempy_labs/_utils.py +79 -0
  102. sempy_labs/_vertipaq.py +1021 -0
  103. sempy_labs/_vpax.py +388 -0
  104. sempy_labs/_warehouses.py +234 -0
  105. sempy_labs/_workloads.py +140 -0
  106. sempy_labs/_workspace_identity.py +72 -0
  107. sempy_labs/_workspaces.py +595 -0
  108. sempy_labs/admin/__init__.py +170 -0
  109. sempy_labs/admin/_activities.py +167 -0
  110. sempy_labs/admin/_apps.py +145 -0
  111. sempy_labs/admin/_artifacts.py +65 -0
  112. sempy_labs/admin/_basic_functions.py +463 -0
  113. sempy_labs/admin/_capacities.py +508 -0
  114. sempy_labs/admin/_dataflows.py +45 -0
  115. sempy_labs/admin/_datasets.py +186 -0
  116. sempy_labs/admin/_domains.py +522 -0
  117. sempy_labs/admin/_external_data_share.py +100 -0
  118. sempy_labs/admin/_git.py +72 -0
  119. sempy_labs/admin/_items.py +265 -0
  120. sempy_labs/admin/_labels.py +211 -0
  121. sempy_labs/admin/_reports.py +241 -0
  122. sempy_labs/admin/_scanner.py +118 -0
  123. sempy_labs/admin/_shared.py +82 -0
  124. sempy_labs/admin/_sharing_links.py +110 -0
  125. sempy_labs/admin/_tags.py +131 -0
  126. sempy_labs/admin/_tenant.py +503 -0
  127. sempy_labs/admin/_tenant_keys.py +89 -0
  128. sempy_labs/admin/_users.py +140 -0
  129. sempy_labs/admin/_workspaces.py +236 -0
  130. sempy_labs/deployment_pipeline/__init__.py +23 -0
  131. sempy_labs/deployment_pipeline/_items.py +580 -0
  132. sempy_labs/directlake/__init__.py +57 -0
  133. sempy_labs/directlake/_autosync.py +58 -0
  134. sempy_labs/directlake/_directlake_schema_compare.py +120 -0
  135. sempy_labs/directlake/_directlake_schema_sync.py +161 -0
  136. sempy_labs/directlake/_dl_helper.py +274 -0
  137. sempy_labs/directlake/_generate_shared_expression.py +94 -0
  138. sempy_labs/directlake/_get_directlake_lakehouse.py +62 -0
  139. sempy_labs/directlake/_get_shared_expression.py +34 -0
  140. sempy_labs/directlake/_guardrails.py +96 -0
  141. sempy_labs/directlake/_list_directlake_model_calc_tables.py +70 -0
  142. sempy_labs/directlake/_show_unsupported_directlake_objects.py +90 -0
  143. sempy_labs/directlake/_update_directlake_model_lakehouse_connection.py +239 -0
  144. sempy_labs/directlake/_update_directlake_partition_entity.py +259 -0
  145. sempy_labs/directlake/_warm_cache.py +236 -0
  146. sempy_labs/dotnet_lib/dotnet.runtime.config.json +10 -0
  147. sempy_labs/environment/__init__.py +23 -0
  148. sempy_labs/environment/_items.py +212 -0
  149. sempy_labs/environment/_pubstage.py +223 -0
  150. sempy_labs/eventstream/__init__.py +37 -0
  151. sempy_labs/eventstream/_items.py +263 -0
  152. sempy_labs/eventstream/_topology.py +652 -0
  153. sempy_labs/graph/__init__.py +59 -0
  154. sempy_labs/graph/_groups.py +651 -0
  155. sempy_labs/graph/_sensitivity_labels.py +120 -0
  156. sempy_labs/graph/_teams.py +125 -0
  157. sempy_labs/graph/_user_licenses.py +96 -0
  158. sempy_labs/graph/_users.py +516 -0
  159. sempy_labs/graph_model/__init__.py +15 -0
  160. sempy_labs/graph_model/_background_jobs.py +63 -0
  161. sempy_labs/graph_model/_items.py +149 -0
  162. sempy_labs/lakehouse/__init__.py +67 -0
  163. sempy_labs/lakehouse/_blobs.py +247 -0
  164. sempy_labs/lakehouse/_get_lakehouse_columns.py +102 -0
  165. sempy_labs/lakehouse/_get_lakehouse_tables.py +274 -0
  166. sempy_labs/lakehouse/_helper.py +250 -0
  167. sempy_labs/lakehouse/_lakehouse.py +351 -0
  168. sempy_labs/lakehouse/_livy_sessions.py +143 -0
  169. sempy_labs/lakehouse/_materialized_lake_views.py +157 -0
  170. sempy_labs/lakehouse/_partitioning.py +165 -0
  171. sempy_labs/lakehouse/_schemas.py +217 -0
  172. sempy_labs/lakehouse/_shortcuts.py +440 -0
  173. sempy_labs/migration/__init__.py +35 -0
  174. sempy_labs/migration/_create_pqt_file.py +238 -0
  175. sempy_labs/migration/_direct_lake_to_import.py +105 -0
  176. sempy_labs/migration/_migrate_calctables_to_lakehouse.py +398 -0
  177. sempy_labs/migration/_migrate_calctables_to_semantic_model.py +148 -0
  178. sempy_labs/migration/_migrate_model_objects_to_semantic_model.py +533 -0
  179. sempy_labs/migration/_migrate_tables_columns_to_semantic_model.py +172 -0
  180. sempy_labs/migration/_migration_validation.py +71 -0
  181. sempy_labs/migration/_refresh_calc_tables.py +131 -0
  182. sempy_labs/mirrored_azure_databricks_catalog/__init__.py +15 -0
  183. sempy_labs/mirrored_azure_databricks_catalog/_discover.py +213 -0
  184. sempy_labs/mirrored_azure_databricks_catalog/_refresh_catalog_metadata.py +45 -0
  185. sempy_labs/ml_model/__init__.py +23 -0
  186. sempy_labs/ml_model/_functions.py +427 -0
  187. sempy_labs/report/_BPAReportTemplate.json +232 -0
  188. sempy_labs/report/__init__.py +55 -0
  189. sempy_labs/report/_bpareporttemplate/.pbi/localSettings.json +9 -0
  190. sempy_labs/report/_bpareporttemplate/.platform +11 -0
  191. sempy_labs/report/_bpareporttemplate/StaticResources/SharedResources/BaseThemes/CY24SU06.json +710 -0
  192. sempy_labs/report/_bpareporttemplate/definition/pages/01d72098bda5055bd500/page.json +11 -0
  193. sempy_labs/report/_bpareporttemplate/definition/pages/01d72098bda5055bd500/visuals/1b08bce3bebabb0a27a8/visual.json +191 -0
  194. sempy_labs/report/_bpareporttemplate/definition/pages/01d72098bda5055bd500/visuals/2f22ddb70c301693c165/visual.json +438 -0
  195. sempy_labs/report/_bpareporttemplate/definition/pages/01d72098bda5055bd500/visuals/3b1182230aa6c600b43a/visual.json +127 -0
  196. sempy_labs/report/_bpareporttemplate/definition/pages/01d72098bda5055bd500/visuals/58577ba6380c69891500/visual.json +576 -0
  197. sempy_labs/report/_bpareporttemplate/definition/pages/01d72098bda5055bd500/visuals/a2a8fa5028b3b776c96c/visual.json +207 -0
  198. sempy_labs/report/_bpareporttemplate/definition/pages/01d72098bda5055bd500/visuals/adfd47ef30652707b987/visual.json +506 -0
  199. sempy_labs/report/_bpareporttemplate/definition/pages/01d72098bda5055bd500/visuals/b6a80ee459e716e170b1/visual.json +127 -0
  200. sempy_labs/report/_bpareporttemplate/definition/pages/01d72098bda5055bd500/visuals/ce3130a721c020cc3d81/visual.json +513 -0
  201. sempy_labs/report/_bpareporttemplate/definition/pages/92735ae19b31712208ad/page.json +8 -0
  202. sempy_labs/report/_bpareporttemplate/definition/pages/92735ae19b31712208ad/visuals/66e60dfb526437cd78d1/visual.json +112 -0
  203. sempy_labs/report/_bpareporttemplate/definition/pages/c597da16dc7e63222a82/page.json +11 -0
  204. sempy_labs/report/_bpareporttemplate/definition/pages/c597da16dc7e63222a82/visuals/07deb8bce824e1be37d7/visual.json +513 -0
  205. sempy_labs/report/_bpareporttemplate/definition/pages/c597da16dc7e63222a82/visuals/0b1c68838818b32ad03b/visual.json +352 -0
  206. sempy_labs/report/_bpareporttemplate/definition/pages/c597da16dc7e63222a82/visuals/0c171de9d2683d10b930/visual.json +37 -0
  207. sempy_labs/report/_bpareporttemplate/definition/pages/c597da16dc7e63222a82/visuals/0efa01be0510e40a645e/visual.json +542 -0
  208. sempy_labs/report/_bpareporttemplate/definition/pages/c597da16dc7e63222a82/visuals/6bf2f0eb830ab53cc668/visual.json +221 -0
  209. sempy_labs/report/_bpareporttemplate/definition/pages/c597da16dc7e63222a82/visuals/88d8141cb8500b60030c/visual.json +127 -0
  210. sempy_labs/report/_bpareporttemplate/definition/pages/c597da16dc7e63222a82/visuals/a753273590beed656a03/visual.json +576 -0
  211. sempy_labs/report/_bpareporttemplate/definition/pages/c597da16dc7e63222a82/visuals/b8fdc82cddd61ac447bc/visual.json +127 -0
  212. sempy_labs/report/_bpareporttemplate/definition/pages/d37dce724a0ccc30044b/page.json +9 -0
  213. sempy_labs/report/_bpareporttemplate/definition/pages/d37dce724a0ccc30044b/visuals/ce8532a7e25020271077/visual.json +38 -0
  214. sempy_labs/report/_bpareporttemplate/definition/pages/pages.json +10 -0
  215. sempy_labs/report/_bpareporttemplate/definition/report.json +176 -0
  216. sempy_labs/report/_bpareporttemplate/definition/version.json +4 -0
  217. sempy_labs/report/_bpareporttemplate/definition.pbir +14 -0
  218. sempy_labs/report/_download_report.py +76 -0
  219. sempy_labs/report/_export_report.py +257 -0
  220. sempy_labs/report/_generate_report.py +427 -0
  221. sempy_labs/report/_paginated.py +76 -0
  222. sempy_labs/report/_report_bpa.py +354 -0
  223. sempy_labs/report/_report_bpa_rules.py +115 -0
  224. sempy_labs/report/_report_functions.py +581 -0
  225. sempy_labs/report/_report_helper.py +227 -0
  226. sempy_labs/report/_report_list_functions.py +110 -0
  227. sempy_labs/report/_report_rebind.py +149 -0
  228. sempy_labs/report/_reportwrapper.py +3100 -0
  229. sempy_labs/report/_save_report.py +147 -0
  230. sempy_labs/snowflake_database/__init__.py +10 -0
  231. sempy_labs/snowflake_database/_items.py +105 -0
  232. sempy_labs/sql_database/__init__.py +21 -0
  233. sempy_labs/sql_database/_items.py +201 -0
  234. sempy_labs/sql_database/_mirroring.py +79 -0
  235. sempy_labs/theme/__init__.py +12 -0
  236. sempy_labs/theme/_org_themes.py +129 -0
  237. sempy_labs/tom/__init__.py +3 -0
  238. sempy_labs/tom/_model.py +5977 -0
  239. sempy_labs/variable_library/__init__.py +19 -0
  240. sempy_labs/variable_library/_functions.py +403 -0
  241. sempy_labs/warehouse/__init__.py +28 -0
  242. sempy_labs/warehouse/_items.py +234 -0
  243. sempy_labs/warehouse/_restore_points.py +309 -0
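For orientation, the wheel ships a single top-level package, sempy_labs (see top_level.txt), with subpackages such as sempy_labs.admin, sempy_labs.lakehouse, sempy_labs.report and sempy_labs.tom. A minimal, illustrative sketch of installing and importing it in a Microsoft Fabric notebook follows; the model and workspace names are placeholders, and run_model_bpa is assumed to be re-exported at the package root from sempy_labs/_model_bpa.py listed above.

# In a Fabric notebook cell; the PyPI project name is semantic-link-labs.
# %pip install semantic-link-labs==0.12.8

import sempy_labs as labs
from sempy_labs import admin, lakehouse, report  # subpackages listed above

# Placeholder names; assumes run_model_bpa is exported at the package root.
labs.run_model_bpa(dataset="Sales Model", workspace="My Workspace")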
sempy_labs/_ai.py ADDED
@@ -0,0 +1,437 @@
import sempy
import sempy.fabric as fabric
import pandas as pd
from typing import List, Optional, Union
from IPython.display import display
import sempy_labs._icons as icons
from .._helper_functions import (
    _read_delta_table,
    _run_spark_sql_query,
)


def optimize_semantic_model(dataset: str, workspace: Optional[str] = None):

    from ._model_bpa import run_model_bpa
    from .directlake._dl_helper import check_fallback_reason
    from ._helper_functions import format_dax_object_name

    modelBPA = run_model_bpa(
        dataset=dataset, workspace=workspace, return_dataframe=True
    )
    dfC = fabric.list_columns(dataset=dataset, workspace=workspace, extended=True)
    dfC["Column Object"] = format_dax_object_name(dfC["Table Name"], dfC["Column Name"])
    dfC["Total Size"] = dfC["Total Size"].astype("int")
    dfP = fabric.list_partitions(dataset=dataset, workspace=workspace)

    modelBPA_col = modelBPA[modelBPA["Object Type"] == "Column"]
    modelBPA_col = pd.merge(
        modelBPA_col,
        dfC[["Column Object", "Total Size"]],
        left_on="Object Name",
        right_on="Column Object",
        how="left",
    )

    isDirectLake = any(r["Mode"] == "DirectLake" for i, r in dfP.iterrows())

    if isDirectLake:
        fallback = check_fallback_reason(dataset=dataset, workspace=workspace)
        fallback_filt = fallback[fallback["FallbackReasonID"] == 2]

        if len(fallback_filt) > 0:
            print(
                f"{icons.yellow_dot} The '{dataset}' semantic model is a Direct Lake semantic model which contains views. "
                "Since views always fall back to DirectQuery, it is recommended to only use lakehouse tables and not views."
            )

    # Potential model reduction estimate
    ruleNames = [
        "Remove unnecessary columns",
        "Set IsAvailableInMdx to false on non-attribute columns",
    ]

    for rule in ruleNames:
        df = modelBPA_col[modelBPA_col["Rule Name"] == rule]
        df_filt = df[["Object Name", "Total Size"]].sort_values(
            by="Total Size", ascending=False
        )
        totSize = df["Total Size"].sum()
        if len(df_filt) > 0:
            print(
                f"{icons.yellow_dot} Potential savings of {totSize} bytes from following the '{rule}' rule."
            )
            display(df_filt)
        else:
            print(f"{icons.green_dot} The '{rule}' rule has been followed.")


def generate_aggs(
    dataset: str,
    table_name: str,
    columns: Union[str, List[str]],
    workspace: Optional[str] = None,
    lakehouse_workspace: Optional[str] = None,
):

    from ._helper_functions import (
        get_direct_lake_sql_endpoint,
        create_abfss_path,
        format_dax_object_name,
        resolve_lakehouse_id,
    )

    sempy.fabric._client._utils._init_analysis_services()
    import Microsoft.AnalysisServices.Tabular as TOM
    import System

    # columns = {
    #     'SalesAmount': 'Sum',
    #     'ProductKey': 'GroupBy',
    #     'OrderDateKey': 'GroupBy'
    # }

    if workspace is None:
        workspace_id = fabric.get_workspace_id()
        workspace = fabric.resolve_workspace_name(workspace_id)

    if lakehouse_workspace is None:
        lakehouse_workspace = workspace
        lakehouse_workspace_id = workspace_id
    else:
        lakehouse_workspace_id = fabric.resolve_workspace_id(lakehouse_workspace)

    if isinstance(columns, str):
        columns = [columns]

    columnValues = columns.keys()

    aggTypes = ["Sum", "Count", "Min", "Max", "GroupBy"]
    aggTypesAggregate = ["Sum", "Count", "Min", "Max"]
    numericTypes = ["Int64", "Double", "Decimal"]

    if any(value not in aggTypes for value in columns.values()):
        raise ValueError(
            f"{icons.red_dot} Invalid aggregation type(s) have been specified in the 'columns' parameter. Valid aggregation types: {aggTypes}."
        )

    dfC = fabric.list_columns(dataset=dataset, workspace=workspace)
    dfP = fabric.list_partitions(dataset=dataset, workspace=workspace)
    dfM = fabric.list_measures(dataset=dataset, workspace=workspace)
    dfR = fabric.list_relationships(dataset=dataset, workspace=workspace)
    if not any(r["Mode"] == "DirectLake" for i, r in dfP.iterrows()):
        raise ValueError(
            f"{icons.red_dot} The '{dataset}' semantic model within the '{workspace}' workspace is not in Direct Lake mode. This function is only relevant for Direct Lake semantic models."
        )

    dfC_filtT = dfC[dfC["Table Name"] == table_name]

    if len(dfC_filtT) == 0:
        raise ValueError(
            f"{icons.red_dot} The '{table_name}' table does not exist in the '{dataset}' semantic model within the '{workspace}' workspace."
        )

    dfC_filt = dfC[
        (dfC["Table Name"] == table_name) & (dfC["Column Name"].isin(columnValues))
    ]

    if len(columns) != len(dfC_filt):
        raise ValueError(
            f"{icons.red_dot} Columns listed in '{columnValues}' do not exist in the '{table_name}' table in the '{dataset}' semantic model within the '{workspace}' workspace."
        )

    # Check if doing sum/count/min/max etc. on a non-number column
    for cm, agg in columns.items():
        dfC_col = dfC_filt[dfC_filt["Column Name"] == cm]
        dataType = dfC_col["Data Type"].iloc[0]
        if agg in aggTypesAggregate and dataType not in numericTypes:
            raise ValueError(
                f"{icons.red_dot} The '{cm}' column in the '{table_name}' table is of '{dataType}' data type. Only columns of '{numericTypes}' data types"
                f" can be aggregated as '{aggTypesAggregate}' aggregation types."
            )

    # Create/update lakehouse delta agg table
    aggSuffix = "_agg"
    aggTableName = f"{table_name}{aggSuffix}"
    aggLakeTName = aggTableName.lower().replace(" ", "_")
    dfP = fabric.list_partitions(dataset=dataset, workspace=workspace)
    dfP_filt = dfP[dfP["Table Name"] == table_name]
    lakeTName = dfP_filt["Query"].iloc[0]

    sqlEndpointId = get_direct_lake_sql_endpoint(dataset=dataset, workspace=workspace)

    dfI = fabric.list_items(workspace=lakehouse_workspace, type="SQLEndpoint")
    dfI_filt = dfI[(dfI["Id"] == sqlEndpointId)]

    if len(dfI_filt) == 0:
        raise ValueError(
            f"{icons.red_dot} The lakehouse (SQL Endpoint) used by the '{dataset}' semantic model does not reside in"
            f" the '{lakehouse_workspace}' workspace. Please update the lakehouse_workspace parameter."
        )

    lakehouseName = dfI_filt["Display Name"].iloc[0]
    lakehouse_id = resolve_lakehouse_id(
        lakehouse=lakehouseName, workspace=lakehouse_workspace
    )

    # Generate SQL query
    query = "SELECT"
    groupBy = "\nGROUP BY"
    for cm, agg in columns.items():
        colFilt = dfC_filt[dfC_filt["Column Name"] == cm]
        sourceCol = colFilt["Source"].iloc[0]

        if agg == "GroupBy":
            query = f"{query}\n{sourceCol},"
            groupBy = f"{groupBy}\n{sourceCol},"
        else:
            query = f"{query}\n{agg}({sourceCol}) AS {sourceCol},"

    query = query[:-1]

    fromTablePath = create_abfss_path(
        lakehouse_id=lakehouse_id,
        lakehouse_workspace_id=lakehouse_workspace_id,
        delta_table_name=lakeTName,
    )

    df = _read_delta_table(fromTablePath)
    tempTableName = f"delta_table_{lakeTName}"
    df.createOrReplaceTempView(tempTableName)
    sqlQuery = f"{query} \n FROM {tempTableName} {groupBy}"

    sqlQuery = sqlQuery[:-1]
    print(sqlQuery)

    # Save query to spark dataframe
    spark_df = _run_spark_sql_query(sqlQuery)
    f"\nCreating/updating the '{aggLakeTName}' table in the lakehouse..."
    # Write spark dataframe to delta table
    aggFilePath = create_abfss_path(
        lakehouse_id=lakehouse_id,
        lakehouse_workspace_id=lakehouse_workspace_id,
        delta_table_name=aggLakeTName,
    )
    spark_df.write.mode("overwrite").format("delta").save(aggFilePath)
    f"{icons.green_dot} The '{aggLakeTName}' table has been created/updated in the lakehouse."

    # Create/update semantic model agg table
    tom_server = fabric.create_tom_server(
        dataset=dataset, readonly=False, workspace=workspace
    )
    m = tom_server.Databases.GetByName(dataset).Model
    print(f"\n{icons.in_progress} Updating the '{dataset}' semantic model...")
    dfC_agg = dfC[dfC["Table Name"] == aggTableName]

    if len(dfC_agg) == 0:
        print(f"{icons.in_progress} Creating the '{aggTableName}' table...")
        exp = m.Expressions["DatabaseQuery"]
        tbl = TOM.Table()
        tbl.Name = aggTableName
        tbl.IsHidden = True

        ep = TOM.EntityPartitionSource()
        ep.Name = aggTableName
        ep.EntityName = aggLakeTName
        ep.ExpressionSource = exp

        part = TOM.Partition()
        part.Name = aggTableName
        part.Source = ep
        part.Mode = TOM.ModeType.DirectLake

        tbl.Partitions.Add(part)

        for i, r in dfC_filt.iterrows():
            scName = r["Source"]
            cName = r["Column Name"]
            dType = r["Data Type"]

            col = TOM.DataColumn()
            col.Name = cName
            col.IsHidden = True
            col.SourceColumn = scName
            col.DataType = System.Enum.Parse(TOM.DataType, dType)

            tbl.Columns.Add(col)
            print(
                f"{icons.green_dot} The '{aggTableName}'[{cName}] column has been added to the '{dataset}' semantic model."
            )

        m.Tables.Add(tbl)
        print(
            f"{icons.green_dot} The '{aggTableName}' table has been added to the '{dataset}' semantic model."
        )
    else:
+ print(f"{icons.in_progress} Updating the '{aggTableName}' table's columns...")
267
+ # Remove existing columns
268
+ for t in m.Tables:
269
+ tName = t.Name
270
+ for c in t.Columns:
271
+ cName = c.Name
272
+ if t.Name == aggTableName:
273
+ m.Tables[tName].Columns.Remove(cName)
274
+ # Add columns
275
+ for i, r in dfC_filt.iterrows():
276
+ scName = r["Source"]
277
+ cName = r["Column Name"]
278
+ dType = r["Data Type"]
279
+
280
+ col = TOM.DataColumn()
281
+ col.Name = cName
282
+ col.IsHidden = True
283
+ col.SourceColumn = scName
284
+ col.DataType = System.Enum.Parse(TOM.DataType, dType)
285
+
286
+ m.Tables[aggTableName].Columns.Add(col)
287
+ print(
288
+ f"{icons.green_dot} The '{aggTableName}'[{cName}] column has been added."
289
+ )
290
+
291
+ # Create relationships
292
+ relMap = {"m": "Many", "1": "One", "0": "None"}
293
+
294
+ print(f"\n{icons.in_progress} Generating necessary relationships...")
295
+ for i, r in dfR.iterrows():
296
+ fromTable = r["From Table"]
297
+ fromColumn = r["From Column"]
298
+ toTable = r["To Table"]
299
+ toColumn = r["To Column"]
300
+ cfb = r["Cross Filtering Behavior"]
301
+ sfb = r["Security Filtering Behavior"]
302
+ mult = r["Multiplicity"]
303
+
304
+ crossFB = System.Enum.Parse(TOM.CrossFilteringBehavior, cfb)
305
+ secFB = System.Enum.Parse(TOM.SecurityFilteringBehavior, sfb)
306
+ fromCardinality = System.Enum.Parse(
307
+ TOM.RelationshipEndCardinality, relMap.get(mult[0])
308
+ )
309
+ toCardinality = System.Enum.Parse(
310
+ TOM.RelationshipEndCardinality, relMap.get(mult[-1])
311
+ )
312
+
313
+ rel = TOM.SingleColumnRelationship()
314
+ rel.FromCardinality = fromCardinality
315
+ rel.ToCardinality = toCardinality
316
+ rel.IsActive = r["Active"]
317
+ rel.CrossFilteringBehavior = crossFB
318
+ rel.SecurityFilteringBehavior = secFB
319
+ rel.RelyOnReferentialIntegrity = r["Rely On Referential Integrity"]
320
+
321
+ if fromTable == table_name:
322
+ try:
323
+ rel.FromColumn = m.Tables[aggTableName].Columns[fromColumn]
324
+ m.Relationships.Add(rel)
325
+ print(
326
+ f"{icons.green_dot} '{aggTableName}'[{fromColumn}] -> '{toTable}'[{toColumn}] relationship has been added."
327
+ )
328
+ except Exception as e:
329
+ print(
330
+ f"{icons.red_dot} '{aggTableName}'[{fromColumn}] -> '{toTable}'[{toColumn}] relationship has not been created."
331
+ )
332
+ print(f"Exception occured: {e}")
333
+ elif toTable == table_name:
334
+ try:
335
+ rel.ToColumn = m.Tables[aggTableName].Columns[toColumn]
336
+ m.Relationships.Add(rel)
337
+ print(
338
+ f"{icons.green_dot} '{fromTable}'[{fromColumn}] -> '{aggTableName}'[{toColumn}] relationship has been added."
339
+ )
340
+ except Exception as e:
341
+ print(
342
+ f"{icons.red_dot} '{fromTable}'[{fromColumn}] -> '{aggTableName}'[{toColumn}] relationship has not been created."
343
+ )
344
+ print(f"Exception occured: {e}")
345
+ "Relationship creation is complete."
346
+
347
+ # Create IF measure
348
+ f"\n{icons.in_progress} Creating measure to check if the agg table can be used..."
349
+ aggChecker = "IF("
350
+ dfR_filt = dfR[
351
+ (dfR["From Table"] == table_name) & (~dfR["From Column"].isin(columnValues))
352
+ ]
353
+
354
+ for i, r in dfR_filt.iterrows():
355
+ toTable = r["To Table"]
356
+ aggChecker = f"{aggChecker}\nISCROSSFILTERED('{toTable}') ||"
357
+
358
+ aggChecker = aggChecker[:-3]
359
+ aggChecker = f"{aggChecker},1,0)"
360
    print(aggChecker)

    # Todo: add IFISFILTERED clause for columns
    f"\n{icons.in_progress} Creating the base measures in the agg table..."
    # Create base agg measures
    dep = fabric.evaluate_dax(
        dataset=dataset,
        workspace=workspace,
        dax_string="""
        SELECT
        [TABLE] AS [Table Name]
        ,[OBJECT] AS [Object Name]
        ,[OBJECT_TYPE] AS [Object Type]
        ,[REFERENCED_TABLE] AS [Referenced Table]
        ,[REFERENCED_OBJECT] AS [Referenced Object]
        ,[REFERENCED_OBJECT_TYPE] AS [Referenced Object Type]
        FROM $SYSTEM.DISCOVER_CALC_DEPENDENCY
        WHERE [OBJECT_TYPE] = 'MEASURE'
        """,
    )

    baseMeasures = dep[
        (dep["Referenced Object Type"] == "COLUMN")
        & (dep["Referenced Table"] == table_name)
        & (dep["Referenced Object"].isin(columnValues))
    ]
    for i, r in baseMeasures.iterrows():
        tName = r["Table Name"]
        mName = r["Object Name"]
        cName = r["Referenced Object"]
        dfM_filt = dfM[dfM["Measure Name"] == mName]
        expr = dfM_filt["Measure Expression"].iloc[0]

        colFQNonAgg = format_dax_object_name(tName, cName)
        colFQAgg = format_dax_object_name(aggTableName, cName)
        colNQNonAgg = f"{tName}[{cName}]"

        if " " in tName:
            newExpr = expr.replace(colFQNonAgg, colFQAgg)
        else:
            newExpr = expr.replace(colFQNonAgg, colFQAgg).replace(colNQNonAgg, colFQAgg)
        print(expr)
        print(newExpr)

        aggMName = f"{mName}{aggSuffix}"
        measure = TOM.Measure()
        measure.Name = aggMName
        measure.IsHidden = True
        measure.Expression = newExpr
        m.Tables[aggTableName].Measures.Add(measure)
        f"The '{aggMName}' measure has been created in the '{aggTableName}' table."

    # Update base detail measures

    # m.SaveChanges()


# Identify views used within Direct Lake model
# workspace = 'MK Demo 6'
# lakehouse = 'MyLakehouse'
# dataset = 'MigrationTest'
# lakehouse_workspace = workspace

# dfView = pd.DataFrame(columns=['Workspace Name', 'Lakehouse Name', 'View Name'])
# dfP = fabric.list_partitions(dataset = dataset, workspace = workspace)
# isDirectLake = any(r['Mode'] == 'DirectLake' for i, r in dfP.iterrows())

# spark = _create_spark_session()
# views = spark.sql(f"SHOW VIEWS IN {lakehouse}").collect()
# for view in views:
# viewName = view['viewName']
# isTemporary = view['isTemporary']
# new_data = {'Workspace Name': workspace, 'Lakehouse Name': lakehouse, 'View Name': viewName}
# dfView = pd.concat([dfView, pd.DataFrame(new_data, index=[0])], ignore_index=True)
# dfView
# lakeT = get_lakehouse_tables(lakehouse, lakehouse_workspace)
# if not dfP['Query'].isin(lakeT['Table Name'].values):
# if
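For context, here is a minimal usage sketch of the two functions this module adds. The import path and signatures come from the code above; the dataset, workspace, table and column names are placeholders. Note that although the signature annotates columns as Union[str, List[str]], the function body iterates over columns.values() and columns.items(), so it expects a mapping of column name to aggregation type, as in the commented example inside generate_aggs.

from sempy_labs._ai import optimize_semantic_model, generate_aggs

# Report Best Practice Analyzer findings plus per-rule size estimates (placeholder names).
optimize_semantic_model(dataset="Sales Model", workspace="My Workspace")

# Build an '_agg' delta table and a matching hidden table for a Direct Lake model.
generate_aggs(
    dataset="Sales Model",
    table_name="FactInternetSales",
    columns={
        "SalesAmount": "Sum",
        "ProductKey": "GroupBy",
        "OrderDateKey": "GroupBy",
    },
    workspace="My Workspace",
)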
sempy_labs/_authentication.py ADDED
@@ -0,0 +1,264 @@
from typing import Dict, Literal, Optional
from azure.core.credentials import AccessToken, TokenCredential
from azure.identity import ClientSecretCredential
from sempy._utils._log import log
from contextlib import contextmanager
import contextvars


class ServicePrincipalTokenProvider(TokenCredential):
    """
    A class to acquire authentication token with Service Principal.

    For more information on Service Principal see: `Application and service principal objects in Microsoft Entra ID <https://learn.microsoft.com/en-us/entra/identity-platform/app-objects-and-service-principals?tabs=browser#service-principal-object>`_
    """

    _shorthand_scopes: Dict[str, str] = {
        "pbi": "https://analysis.windows.net/powerbi/api/.default",
        "storage": "https://storage.azure.com/.default",
        "azure": "https://management.azure.com/.default",
        "graph": "https://graph.microsoft.com/.default",
        "asazure": "https://{region}.asazure.windows.net/.default",
        "keyvault": "https://vault.azure.net/.default",
    }

    def __init__(self, credential: ClientSecretCredential):

        self.credential = credential

    @classmethod
    def from_aad_application_key_authentication(
        cls, tenant_id: str, client_id: str, client_secret: str
    ) -> "ServicePrincipalTokenProvider":
        """
        Generates the ServicePrincipalTokenProvider, providing the Service Principal information.

        ***USE THIS ONE ONLY FOR TEST PURPOSES. FOR PRODUCTION WE RECOMMEND CALLING ServicePrincipalTokenProvider.from_azure_key_vault()***

        Parameters
        ----------
        tenant_id : str
            The Fabric Tenant ID.
        client_id : str
            The Service Principal Application Client ID.
        client_secret : str
            The Service Principal Client Secret.

        Returns
        -------
        ServicePrincipalTokenProvider
            Token provider to be used with FabricRestClient or PowerBIRestClient.
        """
        credential = ClientSecretCredential(
            tenant_id=tenant_id, client_id=client_id, client_secret=client_secret
        )

        cls.tenant_id = tenant_id
        cls.client_id = client_id
        cls.client_secret = client_secret

        return cls(credential)

    @classmethod
    def from_azure_key_vault(
        cls,
        key_vault_uri: str,
        key_vault_tenant_id: str,
        key_vault_client_id: str,
        key_vault_client_secret: str,
    ) -> "ServicePrincipalTokenProvider":
        """
        Generates the ServicePrincipalTokenProvider, providing the Azure Key Vault details.

        For more information on Azure Key Vault, `click here <https://learn.microsoft.com/en-us/azure/key-vault/general/overview>`_.

        Parameters
        ----------
        key_vault_uri : str
            Azure Key Vault URI.
        key_vault_tenant_id : str
            Name of the secret in the Key Vault with the Fabric Tenant ID.
        key_vault_client_id : str
            Name of the secret in the Key Vault with the Service Principal Client ID.
        key_vault_client_secret : str
            Name of the secret in the Key Vault with the Service Principal Client Secret.

        Returns
        -------
        ServicePrincipalTokenProvider
            Token provider to be used with FabricRestClient or PowerBIRestClient.
        """

        import notebookutils

        tenant_id = notebookutils.credentials.getSecret(
            key_vault_uri, key_vault_tenant_id
        )
        client_id = notebookutils.credentials.getSecret(
            key_vault_uri, key_vault_client_id
        )
        client_secret = notebookutils.credentials.getSecret(
            key_vault_uri, key_vault_client_secret
        )

        credential = ClientSecretCredential(
            tenant_id=tenant_id, client_id=client_id, client_secret=client_secret
        )

        cls.tenant_id = tenant_id
        cls.client_id = client_id
        cls.client_secret = client_secret

        return cls(credential)

    def __call__(
        self,
        audience: Literal[
            "pbi", "storage", "azure", "graph", "asazure", "keyvault"
        ] = "pbi",
        region: Optional[str] = None,
    ) -> str:
        """
        Parameters
        ----------
        audience : Literal["pbi", "storage", "azure", "graph", "asazure", "keyvault"], default="pbi"
            The audience for the requested token, for example a PBI/Fabric API call ('pbi') or a OneLake/Storage Account call ('storage').
        region : str, default=None
            The region of the Azure Analysis Services. For example: 'westus2'.
        """
        # Check if audience is supported
        if audience not in self._shorthand_scopes:
            raise NotImplementedError

        return self.get_token(audience, region=region).token

    def get_token(self, *scopes, **kwargs) -> AccessToken:
        """
        Gets a token for the specified scopes.

        Parameters
        ----------
        *scopes : str
            The scopes for which to obtain a token.
        **kwargs : dict
            Additional parameters to pass to the token request.

        Returns
        -------
        AccessToken
            The access token.
        """
        if len(scopes) == 0:
            scopes = ("pbi",)

        region = kwargs.pop("region", None)
        scopes = [
            self._get_fully_qualified_scope(scope, region=region) for scope in scopes
        ]
        return self.credential.get_token(*scopes, **kwargs)

    def _get_fully_qualified_scope(
        self, scope: str, region: Optional[str] = None
    ) -> str:
        """
        Resolve to fully qualified scope if Fabric short-handed scope is given.
        Otherwise, return the original scope.

        Parameters
        ----------
        scope : str
            The scope to resolve.
        region : str, default=None
            The specific region to use to resolve scope.
            Required if scope is "asazure".

        Returns
        -------
        str
            The resolved scope.
        """
        fully_qualified_scope = self._shorthand_scopes.get(scope, scope)

        if scope == "asazure":
            if region is None:
                raise ValueError("Region is required for 'asazure' scope")
            return fully_qualified_scope.format(region=region)

        return fully_qualified_scope


def _get_headers(
    token_provider: TokenCredential,
    audience: Literal[
        "pbi", "storage", "azure", "graph", "asazure", "keyvault"
    ] = "azure",
):
    """
    Generates headers for an API request.
    """

    token = token_provider.get_token(audience).token

    headers = {"Authorization": f"Bearer {token}"}

    if audience == "graph":
        headers["ConsistencyLevel"] = "eventual"
    else:
        headers["Content-Type"] = "application/json"

    return headers


token_provider = contextvars.ContextVar("token_provider", default=None)


@log
@contextmanager
def service_principal_authentication(
    key_vault_uri: str,
    key_vault_tenant_id: str,
    key_vault_client_id: str,
    key_vault_client_secret: str,
):
    """
    Establishes an authentication via Service Principal.

    Parameters
    ----------
    key_vault_uri : str
        Azure Key Vault URI.
    key_vault_tenant_id : str
        Name of the secret in the Key Vault with the Fabric Tenant ID.
    key_vault_client_id : str
        Name of the secret in the Key Vault with the Service Principal Client ID.
    key_vault_client_secret : str
        Name of the secret in the Key Vault with the Service Principal Client Secret.
    """

    # Save the prior state
    prior_token = token_provider.get()

    # Set the new token_provider in a thread-safe manner
    token_provider.set(
        ServicePrincipalTokenProvider.from_azure_key_vault(
            key_vault_uri=key_vault_uri,
            key_vault_tenant_id=key_vault_tenant_id,
            key_vault_client_id=key_vault_client_id,
            key_vault_client_secret=key_vault_client_secret,
        )
    )
    try:
        from sempy.fabric import set_service_principal

        with set_service_principal(
            (key_vault_uri, key_vault_tenant_id),
            (key_vault_uri, key_vault_client_id),
            client_secret=(key_vault_uri, key_vault_client_secret),
        ):
            yield
    finally:
        # Restore the prior state
        if prior_token is None:
            token_provider.set(None)
        else:
            token_provider.set(prior_token)
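To close, a minimal usage sketch of the authentication helpers defined above. The Key Vault URI and secret names are placeholders; from_azure_key_vault resolves the secrets through notebookutils, so it assumes a Microsoft Fabric notebook session, and the resulting provider is intended for FabricRestClient or PowerBIRestClient per the docstrings.

from sempy_labs._authentication import (
    ServicePrincipalTokenProvider,
    service_principal_authentication,
)

# Placeholder Key Vault URI and secret names.
provider = ServicePrincipalTokenProvider.from_azure_key_vault(
    key_vault_uri="https://mykeyvault.vault.azure.net/",
    key_vault_tenant_id="tenant-id-secret-name",
    key_vault_client_id="client-id-secret-name",
    key_vault_client_secret="client-secret-secret-name",
)
# Shorthand scopes are resolved via _shorthand_scopes; .token holds the bearer string.
access_token = provider.get_token("storage")

# Run a block of sempy_labs calls under the service principal, then restore the prior state.
with service_principal_authentication(
    key_vault_uri="https://mykeyvault.vault.azure.net/",
    key_vault_tenant_id="tenant-id-secret-name",
    key_vault_client_id="client-id-secret-name",
    key_vault_client_secret="client-secret-secret-name",
):
    ...  # calls issued here authenticate as the service principal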