PyPI - flwr-nightly - Versions diffs - 1.8.0.dev20240314__py3-none-any.whl → 1.11.0.dev20240813__py3-none-any.whl - Mend

flwr-nightly 1.8.0.dev20240314__py3-none-any.whl → 1.11.0.dev20240813__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of flwr-nightly might be problematic. Click here for more details.

Files changed (237)

flwr/cli/app.py +7 -0
flwr/cli/build.py +150 -0
flwr/cli/config_utils.py +219 -0
flwr/cli/example.py +3 -1
flwr/cli/install.py +227 -0
flwr/cli/new/new.py +179 -48
flwr/cli/new/templates/app/.gitignore.tpl +160 -0
flwr/cli/new/templates/app/README.flowertune.md.tpl +56 -0
flwr/cli/new/templates/app/README.md.tpl +1 -5
flwr/cli/new/templates/app/code/__init__.py.tpl +1 -1
flwr/cli/new/templates/app/code/client.huggingface.py.tpl +65 -0
flwr/cli/new/templates/app/code/client.jax.py.tpl +56 -0
flwr/cli/new/templates/app/code/client.mlx.py.tpl +93 -0
flwr/cli/new/templates/app/code/client.numpy.py.tpl +3 -2
flwr/cli/new/templates/app/code/client.pytorch.py.tpl +23 -11
flwr/cli/new/templates/app/code/client.sklearn.py.tpl +97 -0
flwr/cli/new/templates/app/code/client.tensorflow.py.tpl +60 -1
flwr/cli/new/templates/app/code/flwr_tune/__init__.py +15 -0
flwr/cli/new/templates/app/code/flwr_tune/app.py.tpl +89 -0
flwr/cli/new/templates/app/code/flwr_tune/client.py.tpl +126 -0
flwr/cli/new/templates/app/code/flwr_tune/config.yaml.tpl +34 -0
flwr/cli/new/templates/app/code/flwr_tune/dataset.py.tpl +57 -0
flwr/cli/new/templates/app/code/flwr_tune/models.py.tpl +59 -0
flwr/cli/new/templates/app/code/flwr_tune/server.py.tpl +48 -0
flwr/cli/new/templates/app/code/flwr_tune/static_config.yaml.tpl +11 -0
flwr/cli/new/templates/app/code/server.huggingface.py.tpl +23 -0
flwr/cli/new/templates/app/code/server.jax.py.tpl +20 -0
flwr/cli/new/templates/app/code/server.mlx.py.tpl +20 -0
flwr/cli/new/templates/app/code/server.numpy.py.tpl +17 -9
flwr/cli/new/templates/app/code/server.pytorch.py.tpl +21 -18
flwr/cli/new/templates/app/code/server.sklearn.py.tpl +24 -0
flwr/cli/new/templates/app/code/server.tensorflow.py.tpl +29 -1
flwr/cli/new/templates/app/code/task.huggingface.py.tpl +99 -0
flwr/cli/new/templates/app/code/task.jax.py.tpl +57 -0
flwr/cli/new/templates/app/code/task.mlx.py.tpl +102 -0
flwr/cli/new/templates/app/code/task.pytorch.py.tpl +28 -23
flwr/cli/new/templates/app/code/task.tensorflow.py.tpl +53 -0
flwr/cli/new/templates/app/pyproject.flowertune.toml.tpl +39 -0
flwr/cli/new/templates/app/pyproject.huggingface.toml.tpl +38 -0
flwr/cli/new/templates/app/pyproject.jax.toml.tpl +34 -0
flwr/cli/new/templates/app/pyproject.mlx.toml.tpl +39 -0
flwr/cli/new/templates/app/pyproject.numpy.toml.tpl +25 -12
flwr/cli/new/templates/app/pyproject.pytorch.toml.tpl +29 -14
flwr/cli/new/templates/app/pyproject.sklearn.toml.tpl +33 -0
flwr/cli/new/templates/app/pyproject.tensorflow.toml.tpl +29 -14
flwr/cli/run/run.py +168 -17
flwr/cli/utils.py +75 -4
flwr/client/__init__.py +6 -1
flwr/client/app.py +239 -248
flwr/client/client_app.py +70 -9
flwr/client/dpfedavg_numpy_client.py +1 -1
flwr/client/grpc_adapter_client/__init__.py +15 -0
flwr/client/grpc_adapter_client/connection.py +97 -0
flwr/client/grpc_client/connection.py +18 -5
flwr/client/grpc_rere_client/__init__.py +1 -1
flwr/client/grpc_rere_client/client_interceptor.py +158 -0
flwr/client/grpc_rere_client/connection.py +127 -33
flwr/client/grpc_rere_client/grpc_adapter.py +140 -0
flwr/client/heartbeat.py +74 -0
flwr/client/message_handler/__init__.py +1 -1
flwr/client/message_handler/message_handler.py +7 -7
flwr/client/mod/__init__.py +5 -5
flwr/client/mod/centraldp_mods.py +4 -2
flwr/client/mod/comms_mods.py +4 -4
flwr/client/mod/localdp_mod.py +9 -4
flwr/client/mod/secure_aggregation/__init__.py +1 -1
flwr/client/mod/secure_aggregation/secaggplus_mod.py +1 -1
flwr/client/mod/utils.py +1 -1
flwr/client/node_state.py +60 -10
flwr/client/node_state_tests.py +4 -3
flwr/client/rest_client/__init__.py +1 -1
flwr/client/rest_client/connection.py +177 -157
flwr/client/supernode/__init__.py +26 -0
flwr/client/supernode/app.py +464 -0
flwr/client/typing.py +1 -0
flwr/common/__init__.py +13 -11
flwr/common/address.py +1 -1
flwr/common/config.py +193 -0
flwr/common/constant.py +42 -1
flwr/common/context.py +26 -1
flwr/common/date.py +1 -1
flwr/common/dp.py +1 -1
flwr/common/grpc.py +6 -2
flwr/common/logger.py +79 -8
flwr/common/message.py +167 -105
flwr/common/object_ref.py +126 -25
flwr/common/record/__init__.py +1 -1
flwr/common/record/parametersrecord.py +0 -1
flwr/common/record/recordset.py +78 -27
flwr/common/recordset_compat.py +8 -1
flwr/common/retry_invoker.py +25 -13
flwr/common/secure_aggregation/__init__.py +1 -1
flwr/common/secure_aggregation/crypto/__init__.py +1 -1
flwr/common/secure_aggregation/crypto/shamir.py +1 -1
flwr/common/secure_aggregation/crypto/symmetric_encryption.py +21 -2
flwr/common/secure_aggregation/ndarrays_arithmetic.py +1 -1
flwr/common/secure_aggregation/quantization.py +1 -1
flwr/common/secure_aggregation/secaggplus_constants.py +1 -1
flwr/common/secure_aggregation/secaggplus_utils.py +1 -1
flwr/common/serde.py +209 -3
flwr/common/telemetry.py +25 -0
flwr/common/typing.py +38 -0
flwr/common/version.py +14 -0
flwr/proto/clientappio_pb2.py +41 -0
flwr/proto/clientappio_pb2.pyi +110 -0
flwr/proto/clientappio_pb2_grpc.py +101 -0
flwr/proto/clientappio_pb2_grpc.pyi +40 -0
flwr/proto/common_pb2.py +36 -0
flwr/proto/common_pb2.pyi +121 -0
flwr/proto/common_pb2_grpc.py +4 -0
flwr/proto/common_pb2_grpc.pyi +4 -0
flwr/proto/driver_pb2.py +26 -19
flwr/proto/driver_pb2.pyi +34 -0
flwr/proto/driver_pb2_grpc.py +70 -0
flwr/proto/driver_pb2_grpc.pyi +28 -0
flwr/proto/exec_pb2.py +43 -0
flwr/proto/exec_pb2.pyi +95 -0
flwr/proto/exec_pb2_grpc.py +101 -0
flwr/proto/exec_pb2_grpc.pyi +41 -0
flwr/proto/fab_pb2.py +30 -0
flwr/proto/fab_pb2.pyi +56 -0
flwr/proto/fab_pb2_grpc.py +4 -0
flwr/proto/fab_pb2_grpc.pyi +4 -0
flwr/proto/fleet_pb2.py +29 -23
flwr/proto/fleet_pb2.pyi +33 -0
flwr/proto/fleet_pb2_grpc.py +102 -0
flwr/proto/fleet_pb2_grpc.pyi +35 -0
flwr/proto/grpcadapter_pb2.py +32 -0
flwr/proto/grpcadapter_pb2.pyi +43 -0
flwr/proto/grpcadapter_pb2_grpc.py +66 -0
flwr/proto/grpcadapter_pb2_grpc.pyi +24 -0
flwr/proto/message_pb2.py +41 -0
flwr/proto/message_pb2.pyi +122 -0
flwr/proto/message_pb2_grpc.py +4 -0
flwr/proto/message_pb2_grpc.pyi +4 -0
flwr/proto/run_pb2.py +35 -0
flwr/proto/run_pb2.pyi +76 -0
flwr/proto/run_pb2_grpc.py +4 -0
flwr/proto/run_pb2_grpc.pyi +4 -0
flwr/proto/task_pb2.py +7 -8
flwr/proto/task_pb2.pyi +8 -5
flwr/server/__init__.py +4 -8
flwr/server/app.py +298 -350
flwr/server/compat/app.py +6 -57
flwr/server/compat/app_utils.py +5 -4
flwr/server/compat/driver_client_proxy.py +29 -48
flwr/server/compat/legacy_context.py +5 -4
flwr/server/driver/__init__.py +2 -0
flwr/server/driver/driver.py +22 -132
flwr/server/driver/grpc_driver.py +224 -74
flwr/server/driver/inmemory_driver.py +183 -0
flwr/server/history.py +20 -20
flwr/server/run_serverapp.py +121 -34
flwr/server/server.py +11 -7
flwr/server/server_app.py +59 -10
flwr/server/serverapp_components.py +52 -0
flwr/server/strategy/__init__.py +2 -2
flwr/server/strategy/bulyan.py +1 -1
flwr/server/strategy/dp_adaptive_clipping.py +3 -3
flwr/server/strategy/dp_fixed_clipping.py +4 -3
flwr/server/strategy/dpfedavg_adaptive.py +1 -1
flwr/server/strategy/dpfedavg_fixed.py +1 -1
flwr/server/strategy/fedadagrad.py +1 -1
flwr/server/strategy/fedadam.py +1 -1
flwr/server/strategy/fedavg_android.py +1 -1
flwr/server/strategy/fedavgm.py +1 -1
flwr/server/strategy/fedmedian.py +1 -1
flwr/server/strategy/fedopt.py +1 -1
flwr/server/strategy/fedprox.py +1 -1
flwr/server/strategy/fedxgb_bagging.py +1 -1
flwr/server/strategy/fedxgb_cyclic.py +1 -1
flwr/server/strategy/fedxgb_nn_avg.py +1 -1
flwr/server/strategy/fedyogi.py +1 -1
flwr/server/strategy/krum.py +1 -1
flwr/server/strategy/qfedavg.py +1 -1
flwr/server/superlink/driver/__init__.py +1 -1
flwr/server/superlink/driver/driver_grpc.py +1 -1
flwr/server/superlink/driver/driver_servicer.py +51 -4
flwr/server/superlink/ffs/__init__.py +24 -0
flwr/server/superlink/ffs/disk_ffs.py +104 -0
flwr/server/superlink/ffs/ffs.py +79 -0
flwr/server/superlink/fleet/__init__.py +1 -1
flwr/server/superlink/fleet/grpc_adapter/__init__.py +15 -0
flwr/server/superlink/fleet/grpc_adapter/grpc_adapter_servicer.py +131 -0
flwr/server/superlink/fleet/grpc_bidi/__init__.py +1 -1
flwr/server/superlink/fleet/grpc_bidi/flower_service_servicer.py +1 -1
flwr/server/superlink/fleet/grpc_bidi/grpc_bridge.py +1 -1
flwr/server/superlink/fleet/grpc_bidi/grpc_client_proxy.py +1 -1
flwr/server/superlink/fleet/grpc_bidi/grpc_server.py +8 -2
flwr/server/superlink/fleet/grpc_rere/__init__.py +1 -1
flwr/server/superlink/fleet/grpc_rere/fleet_servicer.py +30 -2
flwr/server/superlink/fleet/grpc_rere/server_interceptor.py +214 -0
flwr/server/superlink/fleet/message_handler/__init__.py +1 -1
flwr/server/superlink/fleet/message_handler/message_handler.py +42 -2
flwr/server/superlink/fleet/rest_rere/__init__.py +1 -1
flwr/server/superlink/fleet/rest_rere/rest_api.py +59 -1
flwr/server/superlink/fleet/vce/backend/__init__.py +1 -1
flwr/server/superlink/fleet/vce/backend/backend.py +5 -5
flwr/server/superlink/fleet/vce/backend/raybackend.py +53 -56
flwr/server/superlink/fleet/vce/vce_api.py +190 -127
flwr/server/superlink/state/__init__.py +1 -1
flwr/server/superlink/state/in_memory_state.py +159 -42
flwr/server/superlink/state/sqlite_state.py +243 -39
flwr/server/superlink/state/state.py +81 -6
flwr/server/superlink/state/state_factory.py +11 -2
flwr/server/superlink/state/utils.py +62 -0
flwr/server/typing.py +2 -0
flwr/server/utils/__init__.py +1 -1
flwr/server/utils/tensorboard.py +1 -1
flwr/server/utils/validator.py +23 -9
flwr/server/workflow/default_workflows.py +67 -25
flwr/server/workflow/secure_aggregation/secaggplus_workflow.py +18 -6
flwr/simulation/__init__.py +7 -4
flwr/simulation/app.py +67 -36
flwr/simulation/ray_transport/__init__.py +1 -1
flwr/simulation/ray_transport/ray_actor.py +20 -46
flwr/simulation/ray_transport/ray_client_proxy.py +36 -16
flwr/simulation/run_simulation.py +308 -92
flwr/superexec/__init__.py +21 -0
flwr/superexec/app.py +184 -0
flwr/superexec/deployment.py +185 -0
flwr/superexec/exec_grpc.py +55 -0
flwr/superexec/exec_servicer.py +70 -0
flwr/superexec/executor.py +75 -0
flwr/superexec/simulation.py +193 -0
{flwr_nightly-1.8.0.dev20240314.dist-info → flwr_nightly-1.11.0.dev20240813.dist-info}/METADATA +10 -6
flwr_nightly-1.11.0.dev20240813.dist-info/RECORD +288 -0
flwr_nightly-1.11.0.dev20240813.dist-info/entry_points.txt +10 -0
flwr/cli/flower_toml.py +0 -140
flwr/cli/new/templates/app/flower.toml.tpl +0 -13
flwr/cli/new/templates/app/requirements.numpy.txt.tpl +0 -2
flwr/cli/new/templates/app/requirements.pytorch.txt.tpl +0 -4
flwr/cli/new/templates/app/requirements.tensorflow.txt.tpl +0 -4
flwr_nightly-1.8.0.dev20240314.dist-info/RECORD +0 -211
flwr_nightly-1.8.0.dev20240314.dist-info/entry_points.txt +0 -9
{flwr_nightly-1.8.0.dev20240314.dist-info → flwr_nightly-1.11.0.dev20240813.dist-info}/LICENSE +0 -0
{flwr_nightly-1.8.0.dev20240314.dist-info → flwr_nightly-1.11.0.dev20240813.dist-info}/WHEEL +0 -0

flwr/simulation/run_simulation.py CHANGED Viewed

@@ -18,46 +18,169 @@ import argparse
 import asyncio
 import json
 import logging
+import sys
 import threading
 import traceback
+from argparse import Namespace
 from logging import DEBUG, ERROR, INFO, WARNING
+from pathlib import Path
 from time import sleep
-from typing import Dict, Optional
-import grpc
+from typing import List, Optional
+from flwr.cli.config_utils import load_and_validate
 from flwr.client import ClientApp
 from flwr.common import EventType, event, log
-from flwr.common.typing import ConfigsRecordValues
-from flwr.server.driver.driver import Driver
-from flwr.server.run_serverapp import run
+from flwr.common.config import get_fused_config_from_dir, parse_config_args
+from flwr.common.constant import RUN_ID_NUM_BYTES
+from flwr.common.logger import (
+    set_logger_propagation,
+    update_console_handler,
+    warn_deprecated_feature_with_example,
+)
+from flwr.common.typing import Run, UserConfig
+from flwr.server.driver import Driver, InMemoryDriver
+from flwr.server.run_serverapp import run as run_server_app
 from flwr.server.server_app import ServerApp
-from flwr.server.superlink.driver.driver_grpc import run_driver_api_grpc
 from flwr.server.superlink.fleet import vce
+from flwr.server.superlink.fleet.vce.backend.backend import BackendConfig
 from flwr.server.superlink.state import StateFactory
+from flwr.server.superlink.state.utils import generate_rand_int_from_bytes
 from flwr.simulation.ray_transport.utils import (
     enable_tf_gpu_growth as enable_gpu_growth,
 )
+def _check_args_do_not_interfere(args: Namespace) -> bool:
+    """Ensure decoupling of flags for different ways to start the simulation."""
+    mode_one_args = ["app", "run_config"]
+    mode_two_args = ["client_app", "server_app"]
+    def _resolve_message(conflict_keys: List[str]) -> str:
+        return ",".join([f"`--{key}`".replace("_", "-") for key in conflict_keys])
+    # When passing `--app`, `--app-dir` is ignored
+    if args.app and args.app_dir:
+        log(ERROR, "Either `--app` or `--app-dir` can be set, but not both.")
+        return False
+    if any(getattr(args, key) for key in mode_one_args):
+        if any(getattr(args, key) for key in mode_two_args):
+            log(
+                ERROR,
+                "Passing any of {%s} alongside with any of {%s}",
+                _resolve_message(mode_one_args),
+                _resolve_message(mode_two_args),
+            )
+            return False
+        if not args.app:
+            log(ERROR, "You need to pass --app")
+            return False
+        return True
+    # Ensure all args are set (required for the non-FAB mode of execution)
+    if not all(getattr(args, key) for key in mode_two_args):
+        log(
+            ERROR,
+            "Passing all of %s keys are required.",
+            _resolve_message(mode_two_args),
+        )
+        return False
+    return True
 # Entry point from CLI
+# pylint: disable=too-many-locals
 def run_simulation_from_cli() -> None:
     """Run Simulation Engine from the CLI."""
     args = _parse_args_run_simulation().parse_args()
+    if args.enable_tf_gpu_growth:
+        warn_deprecated_feature_with_example(
+            "Passing `--enable-tf-gpu-growth` is deprecated.",
+            example_message="Instead, set the `TF_FORCE_GPU_ALLOW_GROWTH` environmnet "
+            "variable to true.",
+            code_example='TF_FORCE_GPU_ALLOW_GROWTH="true" flower-simulation <...>',
+        )
+    # We are supporting two modes for the CLI entrypoint:
+    # 1) Running an app dir containing a `pyproject.toml`
+    # 2) Running any ClientApp and SeverApp w/o pyproject.toml being present
+    # For 2), some CLI args are compulsory, but they are not required for 1)
+    # We first do these checks
+    args_check_pass = _check_args_do_not_interfere(args)
+    if not args_check_pass:
+        sys.exit("Simulation Engine cannot start.")
+    run_id = (
+        generate_rand_int_from_bytes(RUN_ID_NUM_BYTES)
+        if args.run_id is None
+        else args.run_id
+    )
+    if args.app:
+        # Mode 1
+        app_path = Path(args.app)
+        if not app_path.is_dir():
+            log(ERROR, "--app is not a directory")
+            sys.exit("Simulation Engine cannot start.")
+        # Load pyproject.toml
+        config, errors, warnings = load_and_validate(
+            app_path / "pyproject.toml", check_module=False
+        )
+        if errors:
+            raise ValueError(errors)
+        if warnings:
+            log(WARNING, warnings)
+        if config is None:
+            raise ValueError("Config extracted from FAB's pyproject.toml is not valid")
+        # Get ClientApp and SeverApp components
+        app_components = config["tool"]["flwr"]["app"]["components"]
+        client_app_attr = app_components["clientapp"]
+        server_app_attr = app_components["serverapp"]
+        override_config = parse_config_args([args.run_config])
+        fused_config = get_fused_config_from_dir(app_path, override_config)
+        app_dir = args.app
+        is_app = True
+    else:
+        # Mode 2
+        client_app_attr = args.client_app
+        server_app_attr = args.server_app
+        override_config = {}
+        fused_config = None
+        app_dir = args.app_dir
+        is_app = False
+    # Create run
+    run = Run(
+        run_id=run_id,
+        fab_id="",
+        fab_version="",
+        override_config=override_config,
+    )
     # Load JSON config
     backend_config_dict = json.loads(args.backend_config)
     _run_simulation(
-        server_app_attr=args.server_app,
-        client_app_attr=args.client_app,
+        server_app_attr=server_app_attr,
+        client_app_attr=client_app_attr,
         num_supernodes=args.num_supernodes,
         backend_name=args.backend,
         backend_config=backend_config_dict,
-        app_dir=args.app_dir,
-        driver_api_address=args.driver_api_address,
+        app_dir=app_dir,
+        run=run,
         enable_tf_gpu_growth=args.enable_tf_gpu_growth,
         verbose_logging=args.verbose,
+        server_app_run_config=fused_config,
+        is_app=is_app,
     )
@@ -68,7 +191,7 @@ def run_simulation(
     client_app: ClientApp,
     num_supernodes: int,
     backend_name: str = "ray",
-    backend_config: Optional[Dict[str, ConfigsRecordValues]] = None,
+    backend_config: Optional[BackendConfig] = None,
     enable_tf_gpu_growth: bool = False,
     verbose_logging: bool = False,
 ) -> None:
@@ -92,9 +215,12 @@ def run_simulation(
     backend_name : str (default: ray)
         A simulation backend that runs `ClientApp`s.
-    backend_config : Optional[Dict[str, ConfigsRecordValues]]
-        'A dictionary, e.g {"<keyA>": <value>, "<keyB>": <value>} to configure a
-        backend. Values supported in <value> are those included by
+    backend_config : Optional[BackendConfig]
+        'A dictionary to configure a backend. Separate dictionaries to configure
+        different elements of backend. Supported top-level keys are `init_args`
+        for values parsed to initialisation of backend, `client_resources`
+        to define the resources for clients, and `actor` to define the actor
+        parameters. Values supported in <value> are those included by
         `flwr.common.typing.ConfigsRecordValues`.
     enable_tf_gpu_growth : bool (default: False)
@@ -106,9 +232,18 @@ def run_simulation(
         works in the TensorFlow documentation: https://www.tensorflow.org/api/stable.
     verbose_logging : bool (default: False)
-        When diabled, only INFO, WARNING and ERROR log messages will be shown. If
+        When disabled, only INFO, WARNING and ERROR log messages will be shown. If
         enabled, DEBUG-level logs will be displayed.
     """
+    if enable_tf_gpu_growth:
+        warn_deprecated_feature_with_example(
+            "Passing `enable_tf_gpu_growth=True` is deprecated.",
+            example_message="Instead, set the `TF_FORCE_GPU_ALLOW_GROWTH` environmnet "
+            "variable to true.",
+            code_example='import os;os.environ["TF_FORCE_GPU_ALLOW_GROWTH"]="true"'
+            "\n\tflwr.simulation.run_simulationt(...)",
+        )
     _run_simulation(
         num_supernodes=num_supernodes,
         client_app=client_app,
@@ -124,47 +259,67 @@ def run_simulation(
 def run_serverapp_th(
     server_app_attr: Optional[str],
     server_app: Optional[ServerApp],
+    server_app_run_config: UserConfig,
     driver: Driver,
     app_dir: str,
-    f_stop: asyncio.Event,
+    f_stop: threading.Event,
+    has_exception: threading.Event,
     enable_tf_gpu_growth: bool,
     delay_launch: int = 3,
 ) -> threading.Thread:
     """Run SeverApp in a thread."""
-    def server_th_with_start_checks(  # type: ignore
-        tf_gpu_growth: bool, stop_event: asyncio.Event, **kwargs
+    def server_th_with_start_checks(
+        tf_gpu_growth: bool,
+        stop_event: threading.Event,
+        exception_event: threading.Event,
+        _driver: Driver,
+        _server_app_dir: str,
+        _server_app_run_config: UserConfig,
+        _server_app_attr: Optional[str],
+        _server_app: Optional[ServerApp],
     ) -> None:
-        """Run SeverApp, after check if GPU memory grouwth has to be set.
+        """Run SeverApp, after check if GPU memory growth has to be set.
         Upon exception, trigger stop event for Simulation Engine.
         """
         try:
             if tf_gpu_growth:
-                log(INFO, "Enabling GPU growth for Tensorflow on the main thread.")
+                log(INFO, "Enabling GPU growth for Tensorflow on the server thread.")
                 enable_gpu_growth()
             # Run ServerApp
-            run(**kwargs)
+            run_server_app(
+                driver=_driver,
+                server_app_dir=_server_app_dir,
+                server_app_run_config=_server_app_run_config,
+                server_app_attr=_server_app_attr,
+                loaded_server_app=_server_app,
+            )
         except Exception as ex:  # pylint: disable=broad-exception-caught
             log(ERROR, "ServerApp thread raised an exception: %s", ex)
             log(ERROR, traceback.format_exc())
+            exception_event.set()
+            raise
         finally:
             log(DEBUG, "ServerApp finished running.")
             # Upon completion, trigger stop event if one was passed
             if stop_event is not None:
                 stop_event.set()
-                log(WARNING, "Triggered stop event for Simulation Engine.")
+                log(DEBUG, "Triggered stop event for Simulation Engine.")
     serverapp_th = threading.Thread(
         target=server_th_with_start_checks,
-        args=(enable_tf_gpu_growth, f_stop),
-        kwargs={
-            "server_app_attr": server_app_attr,
-            "loaded_server_app": server_app,
-            "driver": driver,
-            "server_app_dir": app_dir,
-        },
+        args=(
+            enable_tf_gpu_growth,
+            f_stop,
+            has_exception,
+            driver,
+            app_dir,
+            server_app_run_config,
+            server_app_attr,
+            server_app,
+        ),
     )
     sleep(delay_launch)
     serverapp_th.start()
@@ -176,46 +331,45 @@ def _main_loop(
     num_supernodes: int,
     backend_name: str,
     backend_config_stream: str,
-    driver_api_address: str,
     app_dir: str,
+    is_app: bool,
     enable_tf_gpu_growth: bool,
+    run: Run,
+    flwr_dir: Optional[str] = None,
     client_app: Optional[ClientApp] = None,
     client_app_attr: Optional[str] = None,
     server_app: Optional[ServerApp] = None,
     server_app_attr: Optional[str] = None,
+    server_app_run_config: Optional[UserConfig] = None,
 ) -> None:
-    """Launch SuperLink with Simulation Engine, then ServerApp on a separate thread.
-    Everything runs on the main thread or a separate one, depening on whether the main
-    thread already contains a running Asyncio event loop. This is the case if running
-    the Simulation Engine on a Jupyter/Colab notebook.
-    """
+    """Launch SuperLink with Simulation Engine, then ServerApp on a separate thread."""
     # Initialize StateFactory
     state_factory = StateFactory(":flwr-in-memory-state:")
-    # Start Driver API
-    driver_server: grpc.Server = run_driver_api_grpc(
-        address=driver_api_address,
-        state_factory=state_factory,
-        certificates=None,
-    )
-    f_stop = asyncio.Event()
+    f_stop = threading.Event()
+    # A Threading event to indicate if an exception was raised in the ServerApp thread
+    server_app_thread_has_exception = threading.Event()
     serverapp_th = None
     try:
+        # Register run
+        log(DEBUG, "Pre-registering run with id %s", run.run_id)
+        state_factory.state().run_ids[run.run_id] = run  # type: ignore
+        if server_app_run_config is None:
+            server_app_run_config = {}
         # Initialize Driver
-        driver = Driver(
-            driver_service_address=driver_api_address,
-            root_certificates=None,
-        )
+        driver = InMemoryDriver(run_id=run.run_id, state_factory=state_factory)
         # Get and run ServerApp thread
         serverapp_th = run_serverapp_th(
             server_app_attr=server_app_attr,
             server_app=server_app,
+            server_app_run_config=server_app_run_config,
             driver=driver,
             app_dir=app_dir,
             f_stop=f_stop,
+            has_exception=server_app_thread_has_exception,
             enable_tf_gpu_growth=enable_tf_gpu_growth,
         )
@@ -228,8 +382,11 @@ def _main_loop(
             backend_name=backend_name,
             backend_config_json_stream=backend_config_stream,
             app_dir=app_dir,
+            is_app=is_app,
             state_factory=state_factory,
             f_stop=f_stop,
+            run=run,
+            flwr_dir=flwr_dir,
         )
     except Exception as ex:
@@ -238,17 +395,16 @@ def _main_loop(
         raise RuntimeError("An error was encountered. Ending simulation.") from ex
     finally:
-        # Stop Driver
-        driver_server.stop(grace=0)
-        driver.close()
         # Trigger stop event
         f_stop.set()
         event(EventType.RUN_SUPERLINK_LEAVE)
         if serverapp_th:
             serverapp_th.join()
+            if server_app_thread_has_exception.is_set():
+                raise RuntimeError("Exception in ServerApp thread")
-    log(INFO, "Stopping Simulation Engine now.")
+    log(DEBUG, "Stopping Simulation Engine now.")
 # pylint: disable=too-many-arguments,too-many-locals
@@ -257,13 +413,16 @@ def _run_simulation(
     client_app: Optional[ClientApp] = None,
     server_app: Optional[ServerApp] = None,
     backend_name: str = "ray",
-    backend_config: Optional[Dict[str, ConfigsRecordValues]] = None,
+    backend_config: Optional[BackendConfig] = None,
     client_app_attr: Optional[str] = None,
     server_app_attr: Optional[str] = None,
+    server_app_run_config: Optional[UserConfig] = None,
     app_dir: str = "",
-    driver_api_address: str = "0.0.0.0:9091",
+    flwr_dir: Optional[str] = None,
+    run: Optional[Run] = None,
     enable_tf_gpu_growth: bool = False,
     verbose_logging: bool = False,
+    is_app: bool = False,
 ) -> None:
     r"""Launch the Simulation Engine.
@@ -284,93 +443,130 @@ def _run_simulation(
     backend_name : str (default: ray)
         A simulation backend that runs `ClientApp`s.
-    backend_config : Optional[Dict[str, ConfigsRecordValues]]
-        'A dictionary, e.g {"<keyA>":<value>, "<keyB>":<value>} to configure a
-        backend. Values supported in <value> are those included by
+    backend_config : Optional[BackendConfig]
+        'A dictionary to configure a backend. Separate dictionaries to configure
+        different elements of backend. Supported top-level keys are `init_args`
+        for values parsed to initialisation of backend, `client_resources`
+        to define the resources for clients, and `actor` to define the actor
+        parameters. Values supported in <value> are those included by
         `flwr.common.typing.ConfigsRecordValues`.
-    client_app_attr : str
+    client_app_attr : Optional[str]
         A path to a `ClientApp` module to be loaded: For example: `client:app` or
         `project.package.module:wrapper.app`."
-    server_app_attr : str
+    server_app_attr : Optional[str]
         A path to a `ServerApp` module to be loaded: For example: `server:app` or
         `project.package.module:wrapper.app`."
+    server_app_run_config : Optional[UserConfig]
+        Config dictionary that parameterizes the run config. It will be made accesible
+        to the ServerApp.
     app_dir : str
         Add specified directory to the PYTHONPATH and load `ClientApp` from there.
         (Default: current working directory.)
-    driver_api_address : str (default: "0.0.0.0:9091")
-        Driver API (gRPC) server address (IPv4, IPv6, or a domain name)
+    flwr_dir : Optional[str]
+        The path containing installed Flower Apps.
+    run : Optional[Run]
+        An object carrying details about the run.
     enable_tf_gpu_growth : bool (default: False)
         A boolean to indicate whether to enable GPU growth on the main thread. This is
         desirable if you make use of a TensorFlow model on your `ServerApp` while
         having your `ClientApp` running on the same GPU. Without enabling this, you
-        might encounter an out-of-memory error becasue TensorFlow by default allocates
+        might encounter an out-of-memory error because TensorFlow by default allocates
         all GPU memory. Read mor about how `tf.config.experimental.set_memory_growth()`
         works in the TensorFlow documentation: https://www.tensorflow.org/api/stable.
     verbose_logging : bool (default: False)
-        When diabled, only INFO, WARNING and ERROR log messages will be shown. If
+        When disabled, only INFO, WARNING and ERROR log messages will be shown. If
         enabled, DEBUG-level logs will be displayed.
-    """
-    # Set logging level
-    if not verbose_logging:
-        logger = logging.getLogger("flwr")
-        logger.setLevel(INFO)
+    is_app : bool (default: False)
+        A flag that indicates whether the simulation is running an app or not. This is
+        needed in order to attempt loading an app's pyproject.toml when nodes register
+        a context object.
+    """
     if backend_config is None:
         backend_config = {}
+    if "init_args" not in backend_config:
+        backend_config["init_args"] = {}
+    # Set default client_resources if not passed
+    if "client_resources" not in backend_config:
+        backend_config["client_resources"] = {"num_cpus": 2, "num_gpus": 0}
+    # Initialization of backend config to enable GPU growth globally when set
+    if "actor" not in backend_config:
+        backend_config["actor"] = {"tensorflow": 0}
+    # Set logging level
+    logger = logging.getLogger("flwr")
+    if verbose_logging:
+        update_console_handler(level=DEBUG, timestamps=True, colored=True)
+    else:
+        backend_config["init_args"]["logging_level"] = backend_config["init_args"].get(
+            "logging_level", WARNING
+        )
+        backend_config["init_args"]["log_to_driver"] = backend_config["init_args"].get(
+            "log_to_driver", True
+        )
     if enable_tf_gpu_growth:
         # Check that Backend config has also enabled using GPU growth
-        use_tf = backend_config.get("tensorflow", False)
+        use_tf = backend_config.get("actor", {}).get("tensorflow", False)
         if not use_tf:
             log(WARNING, "Enabling GPU growth for your backend.")
-            backend_config["tensorflow"] = True
+            backend_config["actor"]["tensorflow"] = True
     # Convert config to original JSON-stream format
     backend_config_stream = json.dumps(backend_config)
-    simulation_engine_th = None
+    # If no `Run` object is set, create one
+    if run is None:
+        run_id = generate_rand_int_from_bytes(RUN_ID_NUM_BYTES)
+        run = Run(run_id=run_id, fab_id="", fab_version="", override_config={})
     args = (
         num_supernodes,
         backend_name,
         backend_config_stream,
-        driver_api_address,
         app_dir,
+        is_app,
         enable_tf_gpu_growth,
+        run,
+        flwr_dir,
         client_app,
         client_app_attr,
         server_app,
         server_app_attr,
+        server_app_run_config,
     )
     # Detect if there is an Asyncio event loop already running.
-    # If yes, run everything on a separate thread. In environmnets
-    # like Jupyter/Colab notebooks, there is an event loop present.
-    run_in_thread = False
+    # If yes, disable logger propagation. In environmnets
+    # like Jupyter/Colab notebooks, it's often better to do this.
+    asyncio_loop_running = False
     try:
         _ = (
             asyncio.get_running_loop()
         )  # Raises RuntimeError if no event loop is present
         log(DEBUG, "Asyncio event loop already running.")
-        run_in_thread = True
+        asyncio_loop_running = True
     except RuntimeError:
-        log(DEBUG, "No asyncio event loop runnig")
+        pass
     finally:
-        if run_in_thread:
-            log(DEBUG, "Starting Simulation Engine on a new thread.")
-            simulation_engine_th = threading.Thread(target=_main_loop, args=args)
-            simulation_engine_th.start()
-            simulation_engine_th.join()
-        else:
-            log(DEBUG, "Starting Simulation Engine on the main thread.")
-            _main_loop(*args)
+        if asyncio_loop_running:
+            # Set logger propagation to False to prevent duplicated log output in Colab.
+            logger = set_logger_propagation(logger, False)
+        _main_loop(*args)
 def _parse_args_run_simulation() -> argparse.ArgumentParser:
@@ -380,12 +576,10 @@ def _parse_args_run_simulation() -> argparse.ArgumentParser:
     )
     parser.add_argument(
         "--server-app",
-        required=True,
         help="For example: `server:app` or `project.package.module:wrapper.app`",
     )
     parser.add_argument(
         "--client-app",
-        required=True,
         help="For example: `client:app` or `project.package.module:wrapper.app`",
     )
     parser.add_argument(
@@ -395,10 +589,16 @@ def _parse_args_run_simulation() -> argparse.ArgumentParser:
         help="Number of simulated SuperNodes.",
     )
     parser.add_argument(
-        "--driver-api-address",
-        default="0.0.0.0:9091",
+        "--app",
         type=str,
-        help="For example: `server:app` or `project.package.module:wrapper.app`",
+        default=None,
+        help="Path to a directory containing a FAB-like structure with a "
+        "pyproject.toml.",
+    )
+    parser.add_argument(
+        "--run-config",
+        default=None,
+        help="Override configuration key-value pairs.",
     )
     parser.add_argument(
         "--backend",
@@ -409,7 +609,7 @@ def _parse_args_run_simulation() -> argparse.ArgumentParser:
     parser.add_argument(
         "--backend-config",
         type=str,
-        default='{"client_resources": {"num_cpus":2, "num_gpus":0.0}, "tensorflow": 0}',
+        default="{}",
         help='A JSON formatted stream, e.g \'{"<keyA>":<value>, "<keyB>":<value>}\' to '
         "configure a backend. Values supported in <value> are those included by "
         "`flwr.common.typing.ConfigsRecordValues`. ",
@@ -437,5 +637,21 @@ def _parse_args_run_simulation() -> argparse.ArgumentParser:
         "ClientApp and ServerApp from there."
         " Default: current working directory.",
     )
+    parser.add_argument(
+        "--flwr-dir",
+        default=None,
+        help="""The path containing installed Flower Apps.
+    By default, this value is equal to:
+        - `$FLWR_HOME/` if `$FLWR_HOME` is defined
+        - `$XDG_DATA_HOME/.flwr/` if `$XDG_DATA_HOME` is defined
+        - `$HOME/.flwr/` in all other cases
+    """,
+    )
+    parser.add_argument(
+        "--run-id",
+        type=int,
+        help="Sets the ID of the run started by the Simulation Engine.",
+    )
     return parser

flwr/superexec/__init__.py ADDED Viewed

@@ -0,0 +1,21 @@
+# Copyright 2024 Flower Labs GmbH. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+"""Flower SuperExec service."""
+from .app import run_superexec as run_superexec
+__all__ = [
+    "run_superexec",
+]

flwr-nightly 1.8.0.dev20240314__py3-none-any.whl → 1.11.0.dev20240813__py3-none-any.whl

Potentially problematic release.

flwr-nightly 1.8.0.dev20240314__py3-none-any.whl → 1.11.0.dev20240813__py3-none-any.whl