flwr-nightly 1.8.0.dev20240303__py3-none-any.whl → 1.8.0.dev20240305__py3-none-any.whl

@@ -219,16 +219,23 @@ async def run(
 
 # pylint: disable=too-many-arguments,unused-argument,too-many-locals
 def start_vce(
-    client_app_module_name: str,
     backend_name: str,
     backend_config_json_stream: str,
-    working_dir: str,
+    app_dir: str,
     f_stop: asyncio.Event,
+    client_app: Optional[ClientApp] = None,
+    client_app_attr: Optional[str] = None,
     num_supernodes: Optional[int] = None,
     state_factory: Optional[StateFactory] = None,
     existing_nodes_mapping: Optional[NodeToPartitionMapping] = None,
 ) -> None:
     """Start Fleet API with the Simulation Engine."""
+    if client_app_attr is not None and client_app is not None:
+        raise ValueError(
+            "Both `client_app_attr` and `client_app` are provided, "
+            "but only one is allowed."
+        )
+
     if num_supernodes is not None and existing_nodes_mapping is not None:
         raise ValueError(
             "Both `num_supernodes` and `existing_nodes_mapping` are provided, "
@@ -290,12 +297,17 @@ def start_vce
 
     def backend_fn() -> Backend:
         """Instantiate a Backend."""
-        return backend_type(backend_config, work_dir=working_dir)
+        return backend_type(backend_config, work_dir=app_dir)
 
-    log(INFO, "client_app_module_name = %s", client_app_module_name)
+    log(INFO, "client_app_attr = %s", client_app_attr)
 
+    # Load ClientApp if needed
     def _load() -> ClientApp:
-        app: ClientApp = load_client_app(client_app_module_name)
+
+        if client_app_attr:
+            app: ClientApp = load_client_app(client_app_attr)
+        if client_app:
+            app = client_app
         return app
 
     app_fn = _load
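The `_load` closure keeps `ClientApp` construction lazy: the backend receives a zero-argument callable and resolves the app only when a worker needs it. A toy sketch of that contract (the `handle_message` wiring is illustrative, not the actual backend code):

    from typing import Callable

    from flwr.client import ClientApp

    def handle_message(app_fn: Callable[[], ClientApp]) -> None:
        # Cheap if a loaded `ClientApp` was captured by the closure;
        # an import plus attribute lookup if only `client_app_attr` was given.
        app = app_fn()
        # ... hand `app` the incoming Message (omitted) ...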
@@ -17,7 +17,7 @@
 
 import importlib
 
-from flwr.simulation.run_simulation import run_simulation
+from flwr.simulation.run_simulation import run_simulation, run_simulation_from_cli
 
 is_ray_installed = importlib.util.find_spec("ray") is not None
 
@@ -36,7 +36,4 @@ To install the necessary dependencies, install `flwr` with the `simulation` extr
     raise ImportError(RAY_IMPORT_ERROR)
 
 
-__all__ = [
-    "start_simulation",
-    "run_simulation",
-]
+__all__ = ["start_simulation", "run_simulation_from_cli", "run_simulation"]
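After this change, all three entry points resolve from the package root:

    from flwr.simulation import (
        run_simulation,           # programmatic entry point (new)
        run_simulation_from_cli,  # `flower-simulation` CLI entry point (new)
        start_simulation,         # pre-existing entry point
    )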
@@ -17,39 +17,153 @@
 import argparse
 import asyncio
 import json
+import logging
 import threading
 import traceback
-from logging import ERROR, INFO, WARNING
+from logging import DEBUG, ERROR, INFO, WARNING
 from time import sleep
-from typing import Any, Callable
+from typing import Dict, Optional
 
 import grpc
 
+from flwr.client import ClientApp
 from flwr.common import EventType, event, log
+from flwr.common.typing import ConfigsRecordValues
 from flwr.server.driver.driver import Driver
 from flwr.server.run_serverapp import run
+from flwr.server.server_app import ServerApp
 from flwr.server.superlink.driver.driver_grpc import run_driver_api_grpc
 from flwr.server.superlink.fleet import vce
 from flwr.server.superlink.state import StateFactory
-from flwr.simulation.ray_transport.utils import enable_tf_gpu_growth
+from flwr.simulation.ray_transport.utils import (
+    enable_tf_gpu_growth as enable_gpu_growth,
+)
 
 
+# Entry point from CLI
+def run_simulation_from_cli() -> None:
+    """Run Simulation Engine from the CLI."""
+    args = _parse_args_run_simulation().parse_args()
+
+    # Load JSON config
+    backend_config_dict = json.loads(args.backend_config)
+
+    _run_simulation(
+        server_app_attr=args.server_app,
+        client_app_attr=args.client_app,
+        num_supernodes=args.num_supernodes,
+        backend_name=args.backend,
+        backend_config=backend_config_dict,
+        app_dir=args.app_dir,
+        driver_api_address=args.driver_api_address,
+        enable_tf_gpu_growth=args.enable_tf_gpu_growth,
+        verbose_logging=args.verbose,
+    )
+
+
+# Entry point from Python session (script or notebook)
+# pylint: disable=too-many-arguments
+def run_simulation(
+    server_app: ServerApp,
+    client_app: ClientApp,
+    num_supernodes: int,
+    backend_name: str = "ray",
+    backend_config: Optional[Dict[str, ConfigsRecordValues]] = None,
+    enable_tf_gpu_growth: bool = False,
+    verbose_logging: bool = False,
+) -> None:
+    r"""Run a Flower App using the Simulation Engine.
+
+    Parameters
+    ----------
+    server_app : ServerApp
+        The `ServerApp` to be executed. It will send messages to different `ClientApp`
+        instances running on different (virtual) SuperNodes.
+
+    client_app : ClientApp
+        The `ClientApp` to be executed by each of the SuperNodes. It will receive
+        messages sent by the `ServerApp`.
+
+    num_supernodes : int
+        Number of nodes that run a ClientApp. They can be sampled by a
+        Driver in the ServerApp and receive a Message describing what the ClientApp
+        should perform.
+
+    backend_name : str (default: ray)
+        A simulation backend that runs `ClientApp`s.
+
+    backend_config : Optional[Dict[str, ConfigsRecordValues]]
+        A dictionary, e.g. {"<keyA>": <value>, "<keyB>": <value>}, to configure a
+        backend. Values supported in <value> are those included by
+        `flwr.common.typing.ConfigsRecordValues`.
+
+    enable_tf_gpu_growth : bool (default: False)
+        A boolean to indicate whether to enable GPU growth on the main thread. This is
+        desirable if you make use of a TensorFlow model on your `ServerApp` while
+        having your `ClientApp` running on the same GPU. Without enabling this, you
+        might encounter an out-of-memory error because TensorFlow, by default, allocates
+        all GPU memory. Read more about how `tf.config.experimental.set_memory_growth()`
+        works in the TensorFlow documentation: https://www.tensorflow.org/api/stable.
+
+    verbose_logging : bool (default: False)
+        When disabled, only INFO, WARNING and ERROR log messages will be shown. If
+        enabled, DEBUG-level logs will be displayed.
+    """
+    _run_simulation(
+        num_supernodes=num_supernodes,
+        client_app=client_app,
+        server_app=server_app,
+        backend_name=backend_name,
+        backend_config=backend_config,
+        enable_tf_gpu_growth=enable_tf_gpu_growth,
+        verbose_logging=verbose_logging,
+    )
+
+
+# pylint: disable=too-many-arguments
 def run_serverapp_th(
-    server_app_attr: str,
+    server_app_attr: Optional[str],
+    server_app: Optional[ServerApp],
     driver: Driver,
-    server_app_dir: str,
+    app_dir: str,
     f_stop: asyncio.Event,
+    enable_tf_gpu_growth: bool,
     delay_launch: int = 3,
 ) -> threading.Thread:
     """Run ServerApp in a thread."""
+
+    def server_th_with_start_checks(  # type: ignore
+        tf_gpu_growth: bool, stop_event: asyncio.Event, **kwargs
+    ) -> None:
+        """Run ServerApp, after checking whether GPU memory growth has to be set.
+
+        Upon exception, trigger stop event for Simulation Engine.
+        """
+        try:
+            if tf_gpu_growth:
+                log(INFO, "Enabling GPU growth for Tensorflow on the main thread.")
+                enable_gpu_growth()
+
+            # Run ServerApp
+            run(**kwargs)
+        except Exception as ex:  # pylint: disable=broad-exception-caught
+            log(ERROR, "ServerApp thread raised an exception: %s", ex)
+            log(ERROR, traceback.format_exc())
+        finally:
+            log(DEBUG, "ServerApp finished running.")
+            # Upon completion, trigger stop event if one was passed
+            if stop_event is not None:
+                stop_event.set()
+                log(WARNING, "Triggered stop event for Simulation Engine.")
+
     serverapp_th = threading.Thread(
-        target=run,
+        target=server_th_with_start_checks,
+        args=(enable_tf_gpu_growth, f_stop),
         kwargs={
             "server_app_attr": server_app_attr,
+            "loaded_server_app": server_app,
             "driver": driver,
-            "server_app_dir": server_app_dir,
-            "stop_event": f_stop,  # will be set when `run()` finishes
-            # will trigger the shutdown of the Simulation Engine
+            "server_app_dir": app_dir,
         },
     )
     sleep(delay_launch)
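Taken together, this gives `run_simulation` the notebook/script-friendly signature its docstring describes. A minimal usage sketch, assuming `server_app` and `client_app` are existing `ServerApp`/`ClientApp` instances built elsewhere:

    from flwr.simulation import run_simulation

    # `server_app` and `client_app` are assumed to be pre-built
    # flwr.server.ServerApp / flwr.client.ClientApp instances.
    run_simulation(
        server_app=server_app,
        client_app=client_app,
        num_supernodes=100,
        backend_config={"client_resources": {"num_cpus": 2, "num_gpus": 0.0}},
    )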
@@ -57,52 +171,31 @@ def run_serverapp_th
     return serverapp_th
 
 
-def get_thread_exception_hook(stop_event: asyncio.Event) -> Callable[[Any], None]:
-    """Return a callback for when the ServerApp thread raises an exception."""
-
-    def execepthook(args: Any) -> None:
-        """Upon exception raised, log exception and trigger stop event."""
-        # log
-        log(
-            ERROR,
-            "The ServerApp thread triggered exception (%s): %s",
-            args.exc_type,
-            args.exc_value,
-        )
-        log(ERROR, traceback.format_exc())
-        # Set stop event
-        stop_event.set()
-        log(WARNING, "Triggered stop event for Simulation Engine.")
-
-    return execepthook
-
-
-def run_simulation() -> None:
-    """Run Simulation Engine."""
-    args = _parse_args_run_simulation().parse_args()
-
-    # Load JSON config
-    backend_config_dict = json.loads(args.backend_config)
-
-    # Enable GPU memory growth (relevant only for TF)
-    if args.enable_tf_gpu_growth:
-        log(INFO, "Enabling GPU growth for Tensorflow on the main thread.")
-        enable_tf_gpu_growth()
-        # Check that Backend config has also enabled using GPU growth
-        use_tf = backend_config_dict.get("tensorflow", False)
-        if not use_tf:
-            log(WARNING, "Enabling GPU growth for your backend.")
-            backend_config_dict["tensorflow"] = True
-
-    # Convert back to JSON stream
-    backend_config = json.dumps(backend_config_dict)
+# pylint: disable=too-many-locals
+def _main_loop(
+    num_supernodes: int,
+    backend_name: str,
+    backend_config_stream: str,
+    driver_api_address: str,
+    app_dir: str,
+    enable_tf_gpu_growth: bool,
+    client_app: Optional[ClientApp] = None,
+    client_app_attr: Optional[str] = None,
+    server_app: Optional[ServerApp] = None,
+    server_app_attr: Optional[str] = None,
+) -> None:
+    """Launch SuperLink with Simulation Engine, then ServerApp on a separate thread.
 
+    Everything runs on the main thread or a separate one, depending on whether the main
+    thread already contains a running Asyncio event loop. This is the case if running
+    the Simulation Engine on a Jupyter/Colab notebook.
+    """
     # Initialize StateFactory
     state_factory = StateFactory(":flwr-in-memory-state:")
 
     # Start Driver API
     driver_server: grpc.Server = run_driver_api_grpc(
-        address=args.driver_api_address,
+        address=driver_api_address,
         state_factory=state_factory,
         certificates=None,
     )
@@ -112,35 +205,39 @@ def run_simulation() -> None:
     try:
         # Initialize Driver
         driver = Driver(
-            driver_service_address=args.driver_api_address,
+            driver_service_address=driver_api_address,
             root_certificates=None,
         )
 
         # Get and run ServerApp thread
-        serverapp_th = run_serverapp_th(args.server_app, driver, args.dir, f_stop)
-        # Setup an exception hook
-        threading.excepthook = get_thread_exception_hook(f_stop)
+        serverapp_th = run_serverapp_th(
+            server_app_attr=server_app_attr,
+            server_app=server_app,
+            driver=driver,
+            app_dir=app_dir,
+            f_stop=f_stop,
+            enable_tf_gpu_growth=enable_tf_gpu_growth,
+        )
 
         # SuperLink with Simulation Engine
         event(EventType.RUN_SUPERLINK_ENTER)
         vce.start_vce(
-            num_supernodes=args.num_supernodes,
-            client_app_module_name=args.client_app,
-            backend_name=args.backend,
-            backend_config_json_stream=backend_config,
-            working_dir=args.dir,
+            num_supernodes=num_supernodes,
+            client_app_attr=client_app_attr,
+            client_app=client_app,
+            backend_name=backend_name,
+            backend_config_json_stream=backend_config_stream,
+            app_dir=app_dir,
             state_factory=state_factory,
             f_stop=f_stop,
         )
 
     except Exception as ex:
-
-        log(ERROR, "An exception occurred: %s", ex)
+        log(ERROR, "An exception occurred !! %s", ex)
         log(ERROR, traceback.format_exc())
         raise RuntimeError("An error was encountered. Ending simulation.") from ex
 
     finally:
-
         # Stop Driver
         driver_server.stop(grace=0)
         del driver
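The `f_stop` event is the only coordination channel here: the ServerApp thread sets it in its `finally` block, and the Simulation Engine shuts down once it fires. The pattern in isolation (generic names, no Flower wiring):

    import asyncio
    import threading

    def worker(stop_event: asyncio.Event) -> None:
        try:
            pass  # ... run the ServerApp ...
        finally:
            stop_event.set()  # always signal, on success or failure

    f_stop = asyncio.Event()
    th = threading.Thread(target=worker, args=(f_stop,))
    th.start()
    # The engine side watches `f_stop` (e.g. `await f_stop.wait()`) and tears down.
    th.join()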
@@ -154,20 +251,148 @@ def run_simulation() -> None:
     log(INFO, "Stopping Simulation Engine now.")
 
 
+# pylint: disable=too-many-arguments,too-many-locals
+def _run_simulation(
+    num_supernodes: int,
+    client_app: Optional[ClientApp] = None,
+    server_app: Optional[ServerApp] = None,
+    backend_name: str = "ray",
+    backend_config: Optional[Dict[str, ConfigsRecordValues]] = None,
+    client_app_attr: Optional[str] = None,
+    server_app_attr: Optional[str] = None,
+    app_dir: str = "",
+    driver_api_address: str = "0.0.0.0:9091",
+    enable_tf_gpu_growth: bool = False,
+    verbose_logging: bool = False,
+) -> None:
+    r"""Launch the Simulation Engine.
+
+    Parameters
+    ----------
+    num_supernodes : int
+        Number of nodes that run a ClientApp. They can be sampled by a
+        Driver in the ServerApp and receive a Message describing what the ClientApp
+        should perform.
+
+    client_app : Optional[ClientApp]
+        The `ClientApp` to be executed by each of the `SuperNodes`. It will receive
+        messages sent by the `ServerApp`.
+
+    server_app : Optional[ServerApp]
+        The `ServerApp` to be executed.
+
+    backend_name : str (default: ray)
+        A simulation backend that runs `ClientApp`s.
+
+    backend_config : Optional[Dict[str, ConfigsRecordValues]]
+        A dictionary, e.g. {"<keyA>":<value>, "<keyB>":<value>}, to configure a
+        backend. Values supported in <value> are those included by
+        `flwr.common.typing.ConfigsRecordValues`.
+
+    client_app_attr : str
+        A path to a `ClientApp` module to be loaded. For example: `client:app` or
+        `project.package.module:wrapper.app`.
+
+    server_app_attr : str
+        A path to a `ServerApp` module to be loaded. For example: `server:app` or
+        `project.package.module:wrapper.app`.
+
+    app_dir : str
+        Add specified directory to the PYTHONPATH and load `ClientApp` from there.
+        (Default: current working directory.)
+
+    driver_api_address : str (default: "0.0.0.0:9091")
+        Driver API (gRPC) server address (IPv4, IPv6, or a domain name)
+
+    enable_tf_gpu_growth : bool (default: False)
+        A boolean to indicate whether to enable GPU growth on the main thread. This is
+        desirable if you make use of a TensorFlow model on your `ServerApp` while
+        having your `ClientApp` running on the same GPU. Without enabling this, you
+        might encounter an out-of-memory error because TensorFlow, by default, allocates
+        all GPU memory. Read more about how `tf.config.experimental.set_memory_growth()`
+        works in the TensorFlow documentation: https://www.tensorflow.org/api/stable.
+
+    verbose_logging : bool (default: False)
+        When disabled, only INFO, WARNING and ERROR log messages will be shown. If
+        enabled, DEBUG-level logs will be displayed.
+    """
+    # Set logging level
+    if not verbose_logging:
+        logger = logging.getLogger("flwr")
+        logger.setLevel(INFO)
+
+    if backend_config is None:
+        backend_config = {}
+
+    if enable_tf_gpu_growth:
+        # Check that Backend config has also enabled using GPU growth
+        use_tf = backend_config.get("tensorflow", False)
+        if not use_tf:
+            log(WARNING, "Enabling GPU growth for your backend.")
+            backend_config["tensorflow"] = True
+
+    # Convert config to original JSON-stream format
+    backend_config_stream = json.dumps(backend_config)
+
+    simulation_engine_th = None
+    args = (
+        num_supernodes,
+        backend_name,
+        backend_config_stream,
+        driver_api_address,
+        app_dir,
+        enable_tf_gpu_growth,
+        client_app,
+        client_app_attr,
+        server_app,
+        server_app_attr,
+    )
+    # Detect if there is an Asyncio event loop already running.
+    # If yes, run everything on a separate thread. In environments
+    # like Jupyter/Colab notebooks, there is an event loop present.
+    run_in_thread = False
+    try:
+        _ = (
+            asyncio.get_running_loop()
+        )  # Raises RuntimeError if no event loop is present
+        log(DEBUG, "Asyncio event loop already running.")
+
+        run_in_thread = True
+
+    except RuntimeError:
+        log(DEBUG, "No asyncio event loop running")
+
+    finally:
+        if run_in_thread:
+            log(DEBUG, "Starting Simulation Engine on a new thread.")
+            simulation_engine_th = threading.Thread(target=_main_loop, args=args)
+            simulation_engine_th.start()
+            simulation_engine_th.join()
+        else:
+            log(DEBUG, "Starting Simulation Engine on the main thread.")
+            _main_loop(*args)
+
+
 def _parse_args_run_simulation() -> argparse.ArgumentParser:
     """Parse flower-simulation command line arguments."""
     parser = argparse.ArgumentParser(
         description="Start a Flower simulation",
     )
+    parser.add_argument(
+        "--server-app",
+        required=True,
+        help="For example: `server:app` or `project.package.module:wrapper.app`",
+    )
     parser.add_argument(
         "--client-app",
         required=True,
         help="For example: `client:app` or `project.package.module:wrapper.app`",
     )
     parser.add_argument(
-        "--server-app",
+        "--num-supernodes",
+        type=int,
         required=True,
-        help="For example: `server:app` or `project.package.module:wrapper.app`",
+        help="Number of simulated SuperNodes.",
     )
     parser.add_argument(
         "--driver-api-address",
@@ -175,18 +400,20 @@ def _parse_args_run_simulation() -> argparse.ArgumentParser:
         type=str,
         help="Driver API (gRPC) server address (IPv4, IPv6, or a domain name).",
     )
-    parser.add_argument(
-        "--num-supernodes",
-        type=int,
-        required=True,
-        help="Number of simulated SuperNodes.",
-    )
     parser.add_argument(
         "--backend",
         default="ray",
         type=str,
         help="Simulation backend that executes the ClientApp.",
     )
+    parser.add_argument(
+        "--backend-config",
+        type=str,
+        default='{"client_resources": {"num_cpus":2, "num_gpus":0.0}, "tensorflow": 0}',
+        help='A JSON formatted stream, e.g. \'{"<keyA>":<value>, "<keyB>":<value>}\' to '
+        "configure a backend. Values supported in <value> are those included by "
+        "`flwr.common.typing.ConfigsRecordValues`.",
+    )
     parser.add_argument(
         "--enable-tf-gpu-growth",
         action="store_true",
@@ -198,15 +425,13 @@ def _parse_args_run_simulation() -> argparse.ArgumentParser:
         "the TensorFlow documentation: https://www.tensorflow.org/api/stable.",
     )
     parser.add_argument(
-        "--backend-config",
-        type=str,
-        default='{"client_resources": {"num_cpus":2, "num_gpus":0.0}, "tensorflow": 0}',
-        help='A JSON formatted stream, e.g \'{"<keyA>":<value>, "<keyB>":<value>}\' to '
-        "configure a backend. Values supported in <value> are those included by "
-        "`flwr.common.typing.ConfigsRecordValues`. ",
+        "--verbose",
+        action="store_true",
+        help="When unset, only INFO, WARNING and ERROR log messages will be shown. "
+        "If set, DEBUG-level logs will be displayed.",
     )
     parser.add_argument(
-        "--dir",
+        "--app-dir",
         default="",
         help="Add specified directory to the PYTHONPATH and load "
         "ClientApp and ServerApp from there."
@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: flwr-nightly
-Version: 1.8.0.dev20240303
+Version: 1.8.0.dev20240305
 Summary: Flower: A Friendly Federated Learning Framework
 Home-page: https://flower.ai
 License: Apache-2.0