flwr-nightly 1.8.0.dev20240315__py3-none-any.whl → 1.15.0.dev20250115__py3-none-any.whl
Sign up to get free protection for your applications and to get access to all the features.
- flwr/cli/app.py +16 -2
- flwr/cli/build.py +181 -0
- flwr/cli/cli_user_auth_interceptor.py +90 -0
- flwr/cli/config_utils.py +343 -0
- flwr/cli/example.py +4 -1
- flwr/cli/install.py +253 -0
- flwr/cli/log.py +182 -0
- flwr/{server/superlink/state → cli/login}/__init__.py +4 -10
- flwr/cli/login/login.py +88 -0
- flwr/cli/ls.py +327 -0
- flwr/cli/new/__init__.py +1 -0
- flwr/cli/new/new.py +210 -66
- flwr/cli/new/templates/app/.gitignore.tpl +163 -0
- flwr/cli/new/templates/app/LICENSE.tpl +202 -0
- flwr/cli/new/templates/app/README.baseline.md.tpl +127 -0
- flwr/cli/new/templates/app/README.flowertune.md.tpl +66 -0
- flwr/cli/new/templates/app/README.md.tpl +16 -32
- flwr/cli/new/templates/app/code/__init__.baseline.py.tpl +1 -0
- flwr/cli/new/templates/app/code/__init__.py.tpl +1 -1
- flwr/cli/new/templates/app/code/client.baseline.py.tpl +58 -0
- flwr/cli/new/templates/app/code/client.huggingface.py.tpl +55 -0
- flwr/cli/new/templates/app/code/client.jax.py.tpl +50 -0
- flwr/cli/new/templates/app/code/client.mlx.py.tpl +73 -0
- flwr/cli/new/templates/app/code/client.numpy.py.tpl +7 -7
- flwr/cli/new/templates/app/code/client.pytorch.py.tpl +30 -21
- flwr/cli/new/templates/app/code/client.sklearn.py.tpl +63 -0
- flwr/cli/new/templates/app/code/client.tensorflow.py.tpl +57 -1
- flwr/cli/new/templates/app/code/dataset.baseline.py.tpl +36 -0
- flwr/cli/new/templates/app/code/flwr_tune/__init__.py +15 -0
- flwr/cli/new/templates/app/code/flwr_tune/client_app.py.tpl +126 -0
- flwr/cli/new/templates/app/code/flwr_tune/dataset.py.tpl +87 -0
- flwr/cli/new/templates/app/code/flwr_tune/models.py.tpl +78 -0
- flwr/cli/new/templates/app/code/flwr_tune/server_app.py.tpl +94 -0
- flwr/cli/new/templates/app/code/flwr_tune/strategy.py.tpl +83 -0
- flwr/cli/new/templates/app/code/model.baseline.py.tpl +80 -0
- flwr/cli/new/templates/app/code/server.baseline.py.tpl +46 -0
- flwr/cli/new/templates/app/code/server.huggingface.py.tpl +38 -0
- flwr/cli/new/templates/app/code/server.jax.py.tpl +26 -0
- flwr/cli/new/templates/app/code/server.mlx.py.tpl +31 -0
- flwr/cli/new/templates/app/code/server.numpy.py.tpl +22 -9
- flwr/cli/new/templates/app/code/server.pytorch.py.tpl +21 -18
- flwr/cli/new/templates/app/code/server.sklearn.py.tpl +36 -0
- flwr/cli/new/templates/app/code/server.tensorflow.py.tpl +29 -1
- flwr/cli/new/templates/app/code/strategy.baseline.py.tpl +1 -0
- flwr/cli/new/templates/app/code/task.huggingface.py.tpl +102 -0
- flwr/cli/new/templates/app/code/task.jax.py.tpl +57 -0
- flwr/cli/new/templates/app/code/task.mlx.py.tpl +102 -0
- flwr/cli/new/templates/app/code/task.numpy.py.tpl +7 -0
- flwr/cli/new/templates/app/code/task.pytorch.py.tpl +29 -24
- flwr/cli/new/templates/app/code/task.sklearn.py.tpl +67 -0
- flwr/cli/new/templates/app/code/task.tensorflow.py.tpl +53 -0
- flwr/cli/new/templates/app/code/utils.baseline.py.tpl +1 -0
- flwr/cli/new/templates/app/pyproject.baseline.toml.tpl +138 -0
- flwr/cli/new/templates/app/pyproject.flowertune.toml.tpl +68 -0
- flwr/cli/new/templates/app/pyproject.huggingface.toml.tpl +46 -0
- flwr/cli/new/templates/app/pyproject.jax.toml.tpl +35 -0
- flwr/cli/new/templates/app/pyproject.mlx.toml.tpl +39 -0
- flwr/cli/new/templates/app/pyproject.numpy.toml.tpl +25 -12
- flwr/cli/new/templates/app/pyproject.pytorch.toml.tpl +29 -14
- flwr/cli/new/templates/app/pyproject.sklearn.toml.tpl +35 -0
- flwr/cli/new/templates/app/pyproject.tensorflow.toml.tpl +29 -14
- flwr/cli/run/__init__.py +1 -0
- flwr/cli/run/run.py +212 -34
- flwr/cli/stop.py +130 -0
- flwr/cli/utils.py +240 -5
- flwr/client/__init__.py +3 -2
- flwr/client/app.py +432 -255
- flwr/client/client.py +1 -11
- flwr/client/client_app.py +74 -13
- flwr/client/clientapp/__init__.py +22 -0
- flwr/client/clientapp/app.py +259 -0
- flwr/client/clientapp/clientappio_servicer.py +244 -0
- flwr/client/clientapp/utils.py +115 -0
- flwr/client/dpfedavg_numpy_client.py +7 -8
- flwr/client/grpc_adapter_client/__init__.py +15 -0
- flwr/client/grpc_adapter_client/connection.py +98 -0
- flwr/client/grpc_client/connection.py +21 -7
- flwr/client/grpc_rere_client/__init__.py +1 -1
- flwr/client/grpc_rere_client/client_interceptor.py +176 -0
- flwr/client/grpc_rere_client/connection.py +163 -56
- flwr/client/grpc_rere_client/grpc_adapter.py +167 -0
- flwr/client/heartbeat.py +74 -0
- flwr/client/message_handler/__init__.py +1 -1
- flwr/client/message_handler/message_handler.py +10 -11
- flwr/client/mod/__init__.py +5 -5
- flwr/client/mod/centraldp_mods.py +4 -2
- flwr/client/mod/comms_mods.py +5 -4
- flwr/client/mod/localdp_mod.py +10 -5
- flwr/client/mod/secure_aggregation/__init__.py +1 -1
- flwr/client/mod/secure_aggregation/secaggplus_mod.py +26 -26
- flwr/client/mod/utils.py +2 -4
- flwr/client/nodestate/__init__.py +26 -0
- flwr/client/nodestate/in_memory_nodestate.py +38 -0
- flwr/client/nodestate/nodestate.py +31 -0
- flwr/client/nodestate/nodestate_factory.py +38 -0
- flwr/client/numpy_client.py +8 -31
- flwr/client/rest_client/__init__.py +1 -1
- flwr/client/rest_client/connection.py +199 -176
- flwr/client/run_info_store.py +112 -0
- flwr/client/supernode/__init__.py +24 -0
- flwr/client/supernode/app.py +321 -0
- flwr/client/typing.py +1 -0
- flwr/common/__init__.py +17 -11
- flwr/common/address.py +47 -3
- flwr/common/args.py +153 -0
- flwr/common/auth_plugin/__init__.py +24 -0
- flwr/common/auth_plugin/auth_plugin.py +121 -0
- flwr/common/config.py +243 -0
- flwr/common/constant.py +135 -1
- flwr/common/context.py +32 -2
- flwr/common/date.py +22 -4
- flwr/common/differential_privacy.py +2 -2
- flwr/common/dp.py +2 -4
- flwr/common/exit_handlers.py +3 -3
- flwr/common/grpc.py +164 -5
- flwr/common/logger.py +230 -12
- flwr/common/message.py +191 -106
- flwr/common/object_ref.py +179 -44
- flwr/common/pyproject.py +1 -0
- flwr/common/record/__init__.py +2 -1
- flwr/common/record/configsrecord.py +58 -18
- flwr/common/record/metricsrecord.py +57 -17
- flwr/common/record/parametersrecord.py +88 -20
- flwr/common/record/recordset.py +153 -30
- flwr/common/record/typeddict.py +30 -55
- flwr/common/recordset_compat.py +31 -12
- flwr/common/retry_invoker.py +123 -30
- flwr/common/secure_aggregation/__init__.py +1 -1
- flwr/common/secure_aggregation/crypto/__init__.py +1 -1
- flwr/common/secure_aggregation/crypto/shamir.py +11 -11
- flwr/common/secure_aggregation/crypto/symmetric_encryption.py +68 -4
- flwr/common/secure_aggregation/ndarrays_arithmetic.py +17 -17
- flwr/common/secure_aggregation/quantization.py +8 -8
- flwr/common/secure_aggregation/secaggplus_constants.py +1 -1
- flwr/common/secure_aggregation/secaggplus_utils.py +10 -12
- flwr/common/serde.py +304 -23
- flwr/common/telemetry.py +65 -29
- flwr/common/typing.py +120 -19
- flwr/common/version.py +17 -3
- flwr/proto/clientappio_pb2.py +45 -0
- flwr/proto/clientappio_pb2.pyi +132 -0
- flwr/proto/clientappio_pb2_grpc.py +135 -0
- flwr/proto/clientappio_pb2_grpc.pyi +53 -0
- flwr/proto/exec_pb2.py +62 -0
- flwr/proto/exec_pb2.pyi +212 -0
- flwr/proto/exec_pb2_grpc.py +237 -0
- flwr/proto/exec_pb2_grpc.pyi +93 -0
- flwr/proto/fab_pb2.py +31 -0
- flwr/proto/fab_pb2.pyi +65 -0
- flwr/proto/fab_pb2_grpc.py +4 -0
- flwr/proto/fab_pb2_grpc.pyi +4 -0
- flwr/proto/fleet_pb2.py +42 -23
- flwr/proto/fleet_pb2.pyi +123 -1
- flwr/proto/fleet_pb2_grpc.py +170 -0
- flwr/proto/fleet_pb2_grpc.pyi +61 -0
- flwr/proto/grpcadapter_pb2.py +32 -0
- flwr/proto/grpcadapter_pb2.pyi +43 -0
- flwr/proto/grpcadapter_pb2_grpc.py +66 -0
- flwr/proto/grpcadapter_pb2_grpc.pyi +24 -0
- flwr/proto/log_pb2.py +29 -0
- flwr/proto/log_pb2.pyi +39 -0
- flwr/proto/log_pb2_grpc.py +4 -0
- flwr/proto/log_pb2_grpc.pyi +4 -0
- flwr/proto/message_pb2.py +41 -0
- flwr/proto/message_pb2.pyi +128 -0
- flwr/proto/message_pb2_grpc.py +4 -0
- flwr/proto/message_pb2_grpc.pyi +4 -0
- flwr/proto/node_pb2.py +2 -2
- flwr/proto/node_pb2.pyi +1 -4
- flwr/proto/recordset_pb2.py +35 -33
- flwr/proto/recordset_pb2.pyi +40 -14
- flwr/proto/run_pb2.py +64 -0
- flwr/proto/run_pb2.pyi +268 -0
- flwr/proto/run_pb2_grpc.py +4 -0
- flwr/proto/run_pb2_grpc.pyi +4 -0
- flwr/proto/serverappio_pb2.py +52 -0
- flwr/proto/{driver_pb2.pyi → serverappio_pb2.pyi} +62 -20
- flwr/proto/serverappio_pb2_grpc.py +410 -0
- flwr/proto/serverappio_pb2_grpc.pyi +160 -0
- flwr/proto/simulationio_pb2.py +38 -0
- flwr/proto/simulationio_pb2.pyi +65 -0
- flwr/proto/simulationio_pb2_grpc.py +239 -0
- flwr/proto/simulationio_pb2_grpc.pyi +94 -0
- flwr/proto/task_pb2.py +7 -8
- flwr/proto/task_pb2.pyi +8 -5
- flwr/proto/transport_pb2.py +8 -8
- flwr/proto/transport_pb2.pyi +9 -6
- flwr/server/__init__.py +2 -10
- flwr/server/app.py +579 -402
- flwr/server/client_manager.py +8 -6
- flwr/server/compat/app.py +6 -62
- flwr/server/compat/app_utils.py +14 -9
- flwr/server/compat/driver_client_proxy.py +25 -59
- flwr/server/compat/legacy_context.py +5 -4
- flwr/server/driver/__init__.py +2 -0
- flwr/server/driver/driver.py +36 -131
- flwr/server/driver/grpc_driver.py +220 -81
- flwr/server/driver/inmemory_driver.py +183 -0
- flwr/server/history.py +28 -29
- flwr/server/run_serverapp.py +15 -126
- flwr/server/server.py +50 -44
- flwr/server/server_app.py +59 -10
- flwr/server/serverapp/__init__.py +22 -0
- flwr/server/serverapp/app.py +256 -0
- flwr/server/serverapp_components.py +52 -0
- flwr/server/strategy/__init__.py +2 -2
- flwr/server/strategy/aggregate.py +37 -23
- flwr/server/strategy/bulyan.py +9 -9
- flwr/server/strategy/dp_adaptive_clipping.py +25 -25
- flwr/server/strategy/dp_fixed_clipping.py +23 -22
- flwr/server/strategy/dpfedavg_adaptive.py +8 -8
- flwr/server/strategy/dpfedavg_fixed.py +13 -12
- flwr/server/strategy/fault_tolerant_fedavg.py +11 -11
- flwr/server/strategy/fedadagrad.py +9 -9
- flwr/server/strategy/fedadam.py +20 -10
- flwr/server/strategy/fedavg.py +16 -16
- flwr/server/strategy/fedavg_android.py +17 -17
- flwr/server/strategy/fedavgm.py +9 -9
- flwr/server/strategy/fedmedian.py +5 -5
- flwr/server/strategy/fedopt.py +6 -6
- flwr/server/strategy/fedprox.py +7 -7
- flwr/server/strategy/fedtrimmedavg.py +8 -8
- flwr/server/strategy/fedxgb_bagging.py +12 -12
- flwr/server/strategy/fedxgb_cyclic.py +10 -10
- flwr/server/strategy/fedxgb_nn_avg.py +6 -6
- flwr/server/strategy/fedyogi.py +9 -9
- flwr/server/strategy/krum.py +9 -9
- flwr/server/strategy/qfedavg.py +16 -16
- flwr/server/strategy/strategy.py +10 -10
- flwr/server/superlink/driver/__init__.py +2 -2
- flwr/server/superlink/driver/serverappio_grpc.py +61 -0
- flwr/server/superlink/driver/serverappio_servicer.py +361 -0
- flwr/server/superlink/ffs/__init__.py +24 -0
- flwr/server/superlink/ffs/disk_ffs.py +108 -0
- flwr/server/superlink/ffs/ffs.py +79 -0
- flwr/server/superlink/ffs/ffs_factory.py +47 -0
- flwr/server/superlink/fleet/__init__.py +1 -1
- flwr/server/superlink/fleet/grpc_adapter/__init__.py +15 -0
- flwr/server/superlink/fleet/grpc_adapter/grpc_adapter_servicer.py +162 -0
- flwr/server/superlink/fleet/grpc_bidi/__init__.py +1 -1
- flwr/server/superlink/fleet/grpc_bidi/flower_service_servicer.py +4 -2
- flwr/server/superlink/fleet/grpc_bidi/grpc_bridge.py +3 -2
- flwr/server/superlink/fleet/grpc_bidi/grpc_client_proxy.py +1 -1
- flwr/server/superlink/fleet/grpc_bidi/grpc_server.py +5 -154
- flwr/server/superlink/fleet/grpc_rere/__init__.py +1 -1
- flwr/server/superlink/fleet/grpc_rere/fleet_servicer.py +120 -13
- flwr/server/superlink/fleet/grpc_rere/server_interceptor.py +228 -0
- flwr/server/superlink/fleet/message_handler/__init__.py +1 -1
- flwr/server/superlink/fleet/message_handler/message_handler.py +156 -13
- flwr/server/superlink/fleet/rest_rere/__init__.py +1 -1
- flwr/server/superlink/fleet/rest_rere/rest_api.py +119 -81
- flwr/server/superlink/fleet/vce/__init__.py +1 -0
- flwr/server/superlink/fleet/vce/backend/__init__.py +4 -4
- flwr/server/superlink/fleet/vce/backend/backend.py +8 -9
- flwr/server/superlink/fleet/vce/backend/raybackend.py +87 -68
- flwr/server/superlink/fleet/vce/vce_api.py +208 -146
- flwr/server/superlink/linkstate/__init__.py +28 -0
- flwr/server/superlink/linkstate/in_memory_linkstate.py +569 -0
- flwr/server/superlink/linkstate/linkstate.py +376 -0
- flwr/server/superlink/{state/state_factory.py → linkstate/linkstate_factory.py} +19 -10
- flwr/server/superlink/linkstate/sqlite_linkstate.py +1196 -0
- flwr/server/superlink/linkstate/utils.py +399 -0
- flwr/server/superlink/simulation/__init__.py +15 -0
- flwr/server/superlink/simulation/simulationio_grpc.py +65 -0
- flwr/server/superlink/simulation/simulationio_servicer.py +186 -0
- flwr/server/superlink/utils.py +65 -0
- flwr/server/typing.py +2 -0
- flwr/server/utils/__init__.py +1 -1
- flwr/server/utils/tensorboard.py +5 -5
- flwr/server/utils/validator.py +40 -45
- flwr/server/workflow/default_workflows.py +70 -26
- flwr/server/workflow/secure_aggregation/secagg_workflow.py +1 -0
- flwr/server/workflow/secure_aggregation/secaggplus_workflow.py +40 -27
- flwr/simulation/__init__.py +12 -5
- flwr/simulation/app.py +247 -315
- flwr/simulation/legacy_app.py +404 -0
- flwr/simulation/ray_transport/__init__.py +1 -1
- flwr/simulation/ray_transport/ray_actor.py +42 -67
- flwr/simulation/ray_transport/ray_client_proxy.py +37 -17
- flwr/simulation/ray_transport/utils.py +1 -0
- flwr/simulation/run_simulation.py +306 -163
- flwr/simulation/simulationio_connection.py +89 -0
- flwr/superexec/__init__.py +15 -0
- flwr/superexec/app.py +59 -0
- flwr/superexec/deployment.py +188 -0
- flwr/superexec/exec_grpc.py +80 -0
- flwr/superexec/exec_servicer.py +231 -0
- flwr/superexec/exec_user_auth_interceptor.py +101 -0
- flwr/superexec/executor.py +96 -0
- flwr/superexec/simulation.py +124 -0
- {flwr_nightly-1.8.0.dev20240315.dist-info → flwr_nightly-1.15.0.dev20250115.dist-info}/METADATA +33 -26
- flwr_nightly-1.15.0.dev20250115.dist-info/RECORD +328 -0
- flwr_nightly-1.15.0.dev20250115.dist-info/entry_points.txt +12 -0
- flwr/cli/flower_toml.py +0 -140
- flwr/cli/new/templates/app/flower.toml.tpl +0 -13
- flwr/cli/new/templates/app/requirements.numpy.txt.tpl +0 -2
- flwr/cli/new/templates/app/requirements.pytorch.txt.tpl +0 -4
- flwr/cli/new/templates/app/requirements.tensorflow.txt.tpl +0 -4
- flwr/client/node_state.py +0 -48
- flwr/client/node_state_tests.py +0 -65
- flwr/proto/driver_pb2.py +0 -44
- flwr/proto/driver_pb2_grpc.py +0 -169
- flwr/proto/driver_pb2_grpc.pyi +0 -66
- flwr/server/superlink/driver/driver_grpc.py +0 -54
- flwr/server/superlink/driver/driver_servicer.py +0 -129
- flwr/server/superlink/state/in_memory_state.py +0 -230
- flwr/server/superlink/state/sqlite_state.py +0 -630
- flwr/server/superlink/state/state.py +0 -154
- flwr_nightly-1.8.0.dev20240315.dist-info/RECORD +0 -211
- flwr_nightly-1.8.0.dev20240315.dist-info/entry_points.txt +0 -9
- {flwr_nightly-1.8.0.dev20240315.dist-info → flwr_nightly-1.15.0.dev20250115.dist-info}/LICENSE +0 -0
- {flwr_nightly-1.8.0.dev20240315.dist-info → flwr_nightly-1.15.0.dev20250115.dist-info}/WHEEL +0 -0
@@ -0,0 +1,399 @@
|
|
1
|
+
# Copyright 2024 Flower Labs GmbH. All Rights Reserved.
|
2
|
+
#
|
3
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
4
|
+
# you may not use this file except in compliance with the License.
|
5
|
+
# You may obtain a copy of the License at
|
6
|
+
#
|
7
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
8
|
+
#
|
9
|
+
# Unless required by applicable law or agreed to in writing, software
|
10
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
11
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
12
|
+
# See the License for the specific language governing permissions and
|
13
|
+
# limitations under the License.
|
14
|
+
# ==============================================================================
|
15
|
+
"""Utility functions for State."""
|
16
|
+
|
17
|
+
|
18
|
+
from logging import ERROR
|
19
|
+
from os import urandom
|
20
|
+
from typing import Optional, Union
|
21
|
+
from uuid import UUID, uuid4
|
22
|
+
|
23
|
+
from flwr.common import ConfigsRecord, Context, log, now, serde
|
24
|
+
from flwr.common.constant import SUPERLINK_NODE_ID, ErrorCode, Status, SubStatus
|
25
|
+
from flwr.common.typing import RunStatus
|
26
|
+
|
27
|
+
# pylint: disable=E0611
|
28
|
+
from flwr.proto.error_pb2 import Error
|
29
|
+
from flwr.proto.message_pb2 import Context as ProtoContext
|
30
|
+
from flwr.proto.node_pb2 import Node
|
31
|
+
from flwr.proto.recordset_pb2 import ConfigsRecord as ProtoConfigsRecord
|
32
|
+
from flwr.proto.task_pb2 import Task, TaskIns, TaskRes
|
33
|
+
|
34
|
+
# pylint: enable=E0611
|
35
|
+
|
36
|
+
# Human-readable reason text describing an unavailable destination node.
NODE_UNAVAILABLE_ERROR_REASON = (
    "Error: Node Unavailable - "
    "The destination node is currently unavailable. "
    "It exceeds the time limit specified in its last ping."
)
|
40
|
+
|
41
|
+
# Allowed (current, new) pairs of run statuses.
VALID_RUN_STATUS_TRANSITIONS = {
    # Regular life cycle: PENDING -> STARTING -> RUNNING -> FINISHED
    (Status.PENDING, Status.STARTING),
    (Status.STARTING, Status.RUNNING),
    (Status.RUNNING, Status.FINISHED),
    # Any non-FINISHED status can transition to FINISHED
    (Status.PENDING, Status.FINISHED),
    (Status.STARTING, Status.FINISHED),
}

# Sub-statuses listed as valid for a run (checked for FINISHED runs).
VALID_RUN_SUB_STATUSES = {
    SubStatus.COMPLETED,
    SubStatus.FAILED,
    SubStatus.STOPPED,
}
|
54
|
+
# Reason text used when a requested message cannot be found.
MESSAGE_UNAVAILABLE_ERROR_REASON = (
    "Error: Message Unavailable - "
    "The requested message could not be found in the database. "
    "It may have expired due to its TTL or never existed."
)

# Reason text used when a reply message has expired.
REPLY_MESSAGE_UNAVAILABLE_ERROR_REASON = (
    "Error: Reply Message Unavailable - " "The reply message has expired."
)
|
61
|
+
|
62
|
+
|
63
|
+
def generate_rand_int_from_bytes(
    num_bytes: int, exclude: Optional[list[int]] = None
) -> int:
    """Draw a random unsigned integer built from `num_bytes` random bytes.

    Parameters
    ----------
    num_bytes : int
        Number of bytes to read from `os.urandom` for each draw.
    exclude : Optional[list[int]] (default: None)
        Values that must not be returned. `None` or an empty list disables
        the check.

    Returns
    -------
    int
        A non-negative integer decoded (little-endian) from the random bytes
        that is not contained in `exclude`.
    """
    # An empty/absent exclusion list means every draw is acceptable
    forbidden = exclude if exclude else ()

    # Redraw until the candidate is not one of the forbidden values
    while True:
        candidate = int.from_bytes(urandom(num_bytes), "little", signed=False)
        if candidate not in forbidden:
            return candidate
|
76
|
+
|
77
|
+
|
78
|
+
def convert_uint64_to_sint64(u: int) -> int:
    """Reinterpret a uint64 value as the sint64 value with the same bits.

    Parameters
    ----------
    u : int
        The unsigned 64-bit integer to convert.

    Returns
    -------
    int
        The signed 64-bit integer sharing the bit pattern of `u`.

    Notes
    -----
    Values in [0, 2^63 - 1] are returned unchanged. Values of 2^63 and above
    have their top bit set, so 2^64 is subtracted and the result is negative.
    """
    sign_bit_set = u >= (1 << 63)
    return u - (1 << 64) if sign_bit_set else u
|
102
|
+
|
103
|
+
|
104
|
+
def convert_sint64_to_uint64(s: int) -> int:
    """Reinterpret a sint64 value as the uint64 value with the same bits.

    Parameters
    ----------
    s : int
        The signed 64-bit integer to convert.

    Returns
    -------
    int
        The unsigned 64-bit integer sharing the bit pattern of `s`.

    Notes
    -----
    Non-negative inputs are returned unchanged. Negative inputs are shifted
    up by 2^64 to obtain the equivalent unsigned value.
    """
    return s + (1 << 64) if s < 0 else s
|
128
|
+
|
129
|
+
|
130
|
+
def convert_uint64_values_in_dict_to_sint64(
    data_dict: dict[str, int], keys: list[str]
) -> None:
    """Rewrite selected uint64 values of a dictionary as sint64, in place.

    Parameters
    ----------
    data_dict : dict[str, int]
        Dictionary whose integer values are converted. It is modified in place.
    keys : list[str]
        Keys whose values should be converted. Keys that are not present in
        `data_dict` are ignored.
    """
    # The generator is lazy, so membership is tested right before each update
    for name in (k for k in keys if k in data_dict):
        data_dict[name] = convert_uint64_to_sint64(data_dict[name])
|
145
|
+
|
146
|
+
|
147
|
+
def convert_sint64_values_in_dict_to_uint64(
    data_dict: dict[str, int], keys: list[str]
) -> None:
    """Rewrite selected sint64 values of a dictionary as uint64, in place.

    Parameters
    ----------
    data_dict : dict[str, int]
        Dictionary whose integer values are converted. It is modified in place.
    keys : list[str]
        Keys whose values should be converted. Keys that are not present in
        `data_dict` are ignored.
    """
    # The generator is lazy, so membership is tested right before each update
    for name in (k for k in keys if k in data_dict):
        data_dict[name] = convert_sint64_to_uint64(data_dict[name])
|
162
|
+
|
163
|
+
|
164
|
+
def context_to_bytes(context: Context) -> bytes:
    """Serialize a `Context` to bytes via its protobuf representation."""
    proto_context = serde.context_to_proto(context)
    return proto_context.SerializeToString()
|
167
|
+
|
168
|
+
|
169
|
+
def context_from_bytes(context_bytes: bytes) -> Context:
    """Rebuild a `Context` from bytes holding its protobuf representation."""
    proto_context = ProtoContext.FromString(context_bytes)
    return serde.context_from_proto(proto_context)
|
172
|
+
|
173
|
+
|
174
|
+
def configsrecord_to_bytes(configs_record: ConfigsRecord) -> bytes:
    """Serialize a `ConfigsRecord` to bytes via its protobuf representation."""
    proto_record = serde.configs_record_to_proto(configs_record)
    return proto_record.SerializeToString()
|
177
|
+
|
178
|
+
|
179
|
+
def configsrecord_from_bytes(configsrecord_bytes: bytes) -> ConfigsRecord:
    """Rebuild a `ConfigsRecord` from bytes holding its protobuf representation."""
    proto_record = ProtoConfigsRecord.FromString(configsrecord_bytes)
    return serde.configs_record_from_proto(proto_record)
|
184
|
+
|
185
|
+
|
186
|
+
def is_valid_transition(current_status: RunStatus, new_status: RunStatus) -> bool:
    """Tell whether a run may move from `current_status` to `new_status`.

    Parameters
    ----------
    current_status : RunStatus
        The current status of the run.
    new_status : RunStatus
        The status the run should transition to.

    Returns
    -------
    bool
        True if the transition is valid, False otherwise.
    """
    source, target = current_status.status, new_status.status

    # A run that finishes before it ever reached RUNNING cannot have
    # completed, so only a non-COMPLETED sub-status is accepted here
    if source in [Status.PENDING, Status.STARTING] and target == Status.FINISHED:
        return new_status.sub_status != SubStatus.COMPLETED

    # Every other case is decided by the table of allowed status pairs
    return (source, target) in VALID_RUN_STATUS_TRANSITIONS
|
213
|
+
|
214
|
+
|
215
|
+
def has_valid_sub_status(status: RunStatus) -> bool:
    """Tell whether the `sub_status` of `status` fits its `status` field.

    Parameters
    ----------
    status : RunStatus
        The status object to be checked.

    Returns
    -------
    bool
        True if the status object has a valid sub-status, False otherwise.

    Notes
    -----
    A non-finished status must carry an empty sub-status (i.e., ""). A
    finished status must carry one of `VALID_RUN_SUB_STATUSES`.
    """
    if status.status != Status.FINISHED:
        return status.sub_status == ""
    return status.sub_status in VALID_RUN_SUB_STATUSES
|
236
|
+
|
237
|
+
|
238
|
+
def create_taskres_for_unavailable_taskins(taskins_id: Union[str, UUID]) -> TaskRes:
    """Build an error TaskRes reporting that a TaskIns is unavailable.

    Parameters
    ----------
    taskins_id : Union[str, UUID]
        The ID of the unavailable TaskIns.

    Returns
    -------
    TaskRes
        A TaskRes carrying the error code MESSAGE_UNAVAILABLE, whose ancestry
        holds the inquired TaskIns ID. Group ID, run ID and task type are
        left at their "unknown" placeholder values.
    """
    created_at = now().timestamp()
    unavailable = Error(
        code=ErrorCode.MESSAGE_UNAVAILABLE,
        reason=MESSAGE_UNAVAILABLE_ERROR_REASON,
    )
    error_task = Task(
        # This function is only called by SuperLink, and thus it's the producer.
        producer=Node(node_id=SUPERLINK_NODE_ID),
        consumer=Node(node_id=SUPERLINK_NODE_ID),
        created_at=created_at,
        ttl=0,
        ancestry=[str(taskins_id)],
        task_type="",  # Unknown message type
        error=unavailable,
    )
    return TaskRes(
        task_id=str(uuid4()),
        group_id="",  # Unknown group ID
        run_id=0,  # Unknown run ID
        task=error_task,
    )
|
271
|
+
|
272
|
+
|
273
|
+
def create_taskres_for_unavailable_taskres(ref_taskins: TaskIns) -> TaskRes:
    """Build an error TaskRes reporting that the reply to a TaskIns is unavailable.

    Parameters
    ----------
    ref_taskins : TaskIns
        The TaskIns whose reply is unavailable. Its group ID, run ID, task ID
        and task type are copied into the generated TaskRes.

    Returns
    -------
    TaskRes
        A TaskRes carrying the error code REPLY_MESSAGE_UNAVAILABLE, indicating
        that the original TaskRes has expired.
    """
    ref_task = ref_taskins.task
    created_at = now().timestamp()

    # Remaining lifetime of the referenced TaskIns, clamped at zero
    remaining_ttl = ref_task.ttl - (created_at - ref_task.created_at)
    if remaining_ttl < 0:
        log(ERROR, "Creating TaskRes for TaskIns that exceeds its TTL.")
        remaining_ttl = 0

    expired_reply = Error(
        code=ErrorCode.REPLY_MESSAGE_UNAVAILABLE,
        reason=REPLY_MESSAGE_UNAVAILABLE_ERROR_REASON,
    )
    error_task = Task(
        # This function is only called by SuperLink, and thus it's the producer.
        producer=Node(node_id=SUPERLINK_NODE_ID),
        consumer=Node(node_id=SUPERLINK_NODE_ID),
        created_at=created_at,
        ttl=remaining_ttl,
        ancestry=[ref_taskins.task_id],
        task_type=ref_task.task_type,
        error=expired_reply,
    )
    return TaskRes(
        task_id=str(uuid4()),
        group_id=ref_taskins.group_id,
        run_id=ref_taskins.run_id,
        task=error_task,
    )
|
310
|
+
|
311
|
+
|
312
|
+
def has_expired(task_ins_or_res: Union[TaskIns, TaskRes], current_time: float) -> bool:
    """Tell whether a TaskIns/TaskRes is past its time-to-live.

    The message counts as expired once `created_at + ttl` of its task lies
    strictly before `current_time`.
    """
    task = task_ins_or_res.task
    expires_at = task.ttl + task.created_at
    return expires_at < current_time
|
315
|
+
|
316
|
+
|
317
|
+
def verify_taskins_ids(
    inquired_taskins_ids: set[UUID],
    found_taskins_dict: dict[UUID, TaskIns],
    current_time: Optional[float] = None,
    update_set: bool = True,
) -> dict[UUID, TaskRes]:
    """Verify found TaskIns and generate error TaskRes for invalid ones.

    Parameters
    ----------
    inquired_taskins_ids : set[UUID]
        Set of TaskIns IDs for which to generate error TaskRes if invalid.
    found_taskins_dict : dict[UUID, TaskIns]
        Dictionary containing all found TaskIns indexed by their IDs.
    current_time : Optional[float] (default: None)
        The current time to check for expiration. If set to `None`, the current time
        will automatically be set to the current timestamp using `now().timestamp()`.
        Any explicit value, including `0.0`, is used as given.
    update_set : bool (default: True)
        If True, the `inquired_taskins_ids` will be updated to remove invalid ones,
        by default True.

    Returns
    -------
    dict[UUID, TaskRes]
        A dictionary of error TaskRes indexed by the corresponding TaskIns ID.
    """
    ret_dict: dict[UUID, TaskRes] = {}
    # Compare against None explicitly: a timestamp of 0.0 is falsy but valid
    current = now().timestamp() if current_time is None else current_time
    # Iterate over a snapshot because the set may be mutated inside the loop
    for taskins_id in list(inquired_taskins_ids):
        # Generate error TaskRes if the task_ins doesn't exist or has expired
        taskins = found_taskins_dict.get(taskins_id)
        if taskins is None or has_expired(taskins, current):
            if update_set:
                inquired_taskins_ids.remove(taskins_id)
            ret_dict[taskins_id] = create_taskres_for_unavailable_taskins(taskins_id)
    return ret_dict
|
354
|
+
|
355
|
+
|
356
|
+
def verify_found_taskres(
    inquired_taskins_ids: set[UUID],
    found_taskins_dict: dict[UUID, TaskIns],
    found_taskres_list: list[TaskRes],
    current_time: Optional[float] = None,
    update_set: bool = True,
) -> dict[UUID, TaskRes]:
    """Verify found TaskRes and generate error TaskRes for invalid ones.

    Parameters
    ----------
    inquired_taskins_ids : set[UUID]
        Set of TaskIns IDs for which to generate error TaskRes if invalid.
    found_taskins_dict : dict[UUID, TaskIns]
        Dictionary containing all found TaskIns indexed by their IDs.
    found_taskres_list : list[TaskRes]
        List of found TaskRes to be verified.
    current_time : Optional[float] (default: None)
        The current time to check for expiration. If set to `None`, the current time
        will automatically be set to the current timestamp using `now().timestamp()`.
        Any explicit value, including `0.0`, is used as given.
    update_set : bool (default: True)
        If True, the `inquired_taskins_ids` will be updated to remove ones
        that have a TaskRes, by default True.

    Returns
    -------
    dict[UUID, TaskRes]
        A dictionary of TaskRes indexed by the corresponding TaskIns ID.
    """
    ret_dict: dict[UUID, TaskRes] = {}
    # Compare against None explicitly: a timestamp of 0.0 is falsy but valid
    current = now().timestamp() if current_time is None else current_time
    for taskres in found_taskres_list:
        # The first ancestry entry is the ID of the TaskIns being answered
        taskins_id = UUID(taskres.task.ancestry[0])
        if update_set:
            inquired_taskins_ids.remove(taskins_id)
        # Check if the TaskRes has expired
        if has_expired(taskres, current):
            # No need to insert the error TaskRes
            taskres = create_taskres_for_unavailable_taskres(
                found_taskins_dict[taskins_id]
            )
            taskres.task.delivered_at = now().isoformat()
        ret_dict[taskins_id] = taskres
    return ret_dict
|
@@ -0,0 +1,15 @@
|
|
1
|
+
# Copyright 2024 Flower Labs GmbH. All Rights Reserved.
|
2
|
+
#
|
3
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
4
|
+
# you may not use this file except in compliance with the License.
|
5
|
+
# You may obtain a copy of the License at
|
6
|
+
#
|
7
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
8
|
+
#
|
9
|
+
# Unless required by applicable law or agreed to in writing, software
|
10
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
11
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
12
|
+
# See the License for the specific language governing permissions and
|
13
|
+
# limitations under the License.
|
14
|
+
# ==============================================================================
|
15
|
+
"""Flower SimulationIo service."""
|
@@ -0,0 +1,65 @@
|
|
1
|
+
# Copyright 2024 Flower Labs GmbH. All Rights Reserved.
|
2
|
+
#
|
3
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
4
|
+
# you may not use this file except in compliance with the License.
|
5
|
+
# You may obtain a copy of the License at
|
6
|
+
#
|
7
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
8
|
+
#
|
9
|
+
# Unless required by applicable law or agreed to in writing, software
|
10
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
11
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
12
|
+
# See the License for the specific language governing permissions and
|
13
|
+
# limitations under the License.
|
14
|
+
# ==============================================================================
|
15
|
+
"""SimulationIo gRPC API."""
|
16
|
+
|
17
|
+
|
18
|
+
from logging import INFO
|
19
|
+
from typing import Optional
|
20
|
+
|
21
|
+
import grpc
|
22
|
+
|
23
|
+
from flwr.common import GRPC_MAX_MESSAGE_LENGTH
|
24
|
+
from flwr.common.grpc import generic_create_grpc_server
|
25
|
+
from flwr.common.logger import log
|
26
|
+
from flwr.proto.simulationio_pb2_grpc import ( # pylint: disable=E0611
|
27
|
+
add_SimulationIoServicer_to_server,
|
28
|
+
)
|
29
|
+
from flwr.server.superlink.ffs.ffs_factory import FfsFactory
|
30
|
+
from flwr.server.superlink.linkstate import LinkStateFactory
|
31
|
+
|
32
|
+
from .simulationio_servicer import SimulationIoServicer
|
33
|
+
|
34
|
+
|
35
|
+
def run_simulationio_api_grpc(
    address: str,
    state_factory: LinkStateFactory,
    ffs_factory: FfsFactory,
    certificates: Optional[tuple[bytes, bytes, bytes]],
) -> grpc.Server:
    """Create and start the SimulationIo API gRPC server (request-response).

    Parameters
    ----------
    address : str
        Address handed to `generic_create_grpc_server` as `server_address`
        and reported in the startup log line.
    state_factory : LinkStateFactory
        Factory passed to the `SimulationIoServicer`.
    ffs_factory : FfsFactory
        Factory passed to the `SimulationIoServicer`.
    certificates : Optional[tuple[bytes, bytes, bytes]]
        Forwarded unchanged to `generic_create_grpc_server`.
        NOTE(review): presumably TLS material, with `None` meaning an
        insecure server -- confirm against `generic_create_grpc_server`.

    Returns
    -------
    grpc.Server
        The server object, on which `start()` has already been called.
    """
    # The servicer implements the RPC handlers; it is not itself a grpc.Server,
    # so it is annotated with its real type.
    simulationio_servicer: SimulationIoServicer = SimulationIoServicer(
        state_factory=state_factory,
        ffs_factory=ffs_factory,
    )

    # Build the gRPC server and register the servicer on it
    simulationio_grpc_server = generic_create_grpc_server(
        servicer_and_add_fn=(
            simulationio_servicer,
            add_SimulationIoServicer_to_server,
        ),
        server_address=address,
        max_message_length=GRPC_MAX_MESSAGE_LENGTH,
        certificates=certificates,
    )

    log(
        INFO,
        "Flower Simulation Engine: Starting SimulationIo API on %s",
        address,
    )
    simulationio_grpc_server.start()

    return simulationio_grpc_server
|
@@ -0,0 +1,186 @@
|
|
1
|
+
# Copyright 2024 Flower Labs GmbH. All Rights Reserved.
|
2
|
+
#
|
3
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
4
|
+
# you may not use this file except in compliance with the License.
|
5
|
+
# You may obtain a copy of the License at
|
6
|
+
#
|
7
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
8
|
+
#
|
9
|
+
# Unless required by applicable law or agreed to in writing, software
|
10
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
11
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
12
|
+
# See the License for the specific language governing permissions and
|
13
|
+
# limitations under the License.
|
14
|
+
# ==============================================================================
|
15
|
+
"""SimulationIo API servicer."""
|
16
|
+
|
17
|
+
|
18
|
+
import threading
|
19
|
+
from logging import DEBUG, INFO
|
20
|
+
|
21
|
+
import grpc
|
22
|
+
from grpc import ServicerContext
|
23
|
+
|
24
|
+
from flwr.common.constant import Status
|
25
|
+
from flwr.common.logger import log
|
26
|
+
from flwr.common.serde import (
|
27
|
+
configs_record_to_proto,
|
28
|
+
context_from_proto,
|
29
|
+
context_to_proto,
|
30
|
+
fab_to_proto,
|
31
|
+
run_status_from_proto,
|
32
|
+
run_status_to_proto,
|
33
|
+
run_to_proto,
|
34
|
+
)
|
35
|
+
from flwr.common.typing import Fab, RunStatus
|
36
|
+
from flwr.proto import simulationio_pb2_grpc
|
37
|
+
from flwr.proto.log_pb2 import ( # pylint: disable=E0611
|
38
|
+
PushLogsRequest,
|
39
|
+
PushLogsResponse,
|
40
|
+
)
|
41
|
+
from flwr.proto.run_pb2 import ( # pylint: disable=E0611
|
42
|
+
GetFederationOptionsRequest,
|
43
|
+
GetFederationOptionsResponse,
|
44
|
+
GetRunStatusRequest,
|
45
|
+
GetRunStatusResponse,
|
46
|
+
UpdateRunStatusRequest,
|
47
|
+
UpdateRunStatusResponse,
|
48
|
+
)
|
49
|
+
from flwr.proto.simulationio_pb2 import ( # pylint: disable=E0611
|
50
|
+
PullSimulationInputsRequest,
|
51
|
+
PullSimulationInputsResponse,
|
52
|
+
PushSimulationOutputsRequest,
|
53
|
+
PushSimulationOutputsResponse,
|
54
|
+
)
|
55
|
+
from flwr.server.superlink.ffs.ffs_factory import FfsFactory
|
56
|
+
from flwr.server.superlink.linkstate import LinkStateFactory
|
57
|
+
from flwr.server.superlink.utils import abort_if
|
58
|
+
|
59
|
+
|
60
|
+
class SimulationIoServicer(simulationio_pb2_grpc.SimulationIoServicer):
    """SimulationIo API servicer.

    Implements the SimulationIo RPC handlers on top of a `LinkState`
    (obtained from `state_factory`) and an `Ffs` (obtained from
    `ffs_factory`).
    """

    def __init__(
        self, state_factory: LinkStateFactory, ffs_factory: FfsFactory
    ) -> None:
        """Store the factories and create the lock used when claiming runs."""
        self.state_factory = state_factory
        self.ffs_factory = ffs_factory
        # Held while a pending run is looked up and moved to STARTING
        self.lock = threading.RLock()

    def PullSimulationInputs(
        self, request: PullSimulationInputsRequest, context: ServicerContext
    ) -> PullSimulationInputsResponse:
        """Pull SimulationIo process inputs.

        Returns
        -------
        PullSimulationInputsResponse
            An empty response if there is no pending run; otherwise a
            response carrying the context, run and FAB of the pending run.

        Raises
        ------
        RuntimeError
            If the run, its FAB or its ServerApp context cannot be retrieved,
            or if the run status cannot be updated to STARTING.
        """
        log(DEBUG, "SimulationIoServicer.PullSimulationInputs")
        # Init access to LinkState and Ffs
        state = self.state_factory.state()
        ffs = self.ffs_factory.ffs()

        # Lock access to LinkState, preventing obtaining the same pending run_id
        with self.lock:
            # Attempt getting the run_id of a pending run
            run_id = state.get_pending_run_id()
            # If there's no pending run, return an empty response
            if run_id is None:
                return PullSimulationInputsResponse()

            # Retrieve Context, Run and Fab for the run_id
            serverapp_ctxt = state.get_serverapp_context(run_id)
            run = state.get_run(run_id)
            fab = None
            if run and run.fab_hash:
                if result := ffs.get(run.fab_hash):
                    # Only the first element of the Ffs result is used
                    fab = Fab(run.fab_hash, result[0])
            if run and fab and serverapp_ctxt:
                # Update run status to STARTING
                if state.update_run_status(run_id, RunStatus(Status.STARTING, "", "")):
                    log(INFO, "Starting run %d", run_id)
                    return PullSimulationInputsResponse(
                        context=context_to_proto(serverapp_ctxt),
                        run=run_to_proto(run),
                        fab=fab_to_proto(fab),
                    )

        # Raise an exception if the Run or Fab is not found,
        # or if the status cannot be updated to STARTING
        raise RuntimeError(f"Failed to start run {run_id}")

    def PushSimulationOutputs(
        self, request: PushSimulationOutputsRequest, context: ServicerContext
    ) -> PushSimulationOutputsResponse:
        """Push Simulation process outputs.

        Stores the context carried by the request as the ServerApp context of
        `request.run_id` and returns an empty response.
        """
        log(DEBUG, "SimulationIoServicer.PushSimulationOutputs")
        state = self.state_factory.state()

        # Abort if the run is not running
        abort_if(
            request.run_id,
            [Status.PENDING, Status.STARTING, Status.FINISHED],
            state,
            context,
        )

        state.set_serverapp_context(request.run_id, context_from_proto(request.context))
        return PushSimulationOutputsResponse()

    def UpdateRunStatus(
        self, request: UpdateRunStatusRequest, context: grpc.ServicerContext
    ) -> UpdateRunStatusResponse:
        """Update the status of a run.

        Applies `request.run_status` to `request.run_id` and returns an empty
        response. The result of the status update is not inspected here.
        """
        log(DEBUG, "SimulationIoServicer.UpdateRunStatus")
        state = self.state_factory.state()

        # Abort if the run is finished
        abort_if(request.run_id, [Status.FINISHED], state, context)

        # Update the run status
        state.update_run_status(
            run_id=request.run_id, new_status=run_status_from_proto(request.run_status)
        )
        return UpdateRunStatusResponse()

    def GetRunStatus(
        self, request: GetRunStatusRequest, context: ServicerContext
    ) -> GetRunStatusResponse:
        """Get status of requested runs.

        Returns
        -------
        GetRunStatusResponse
            Response whose `run_status_dict` maps each run ID returned by the
            LinkState to its status in proto form.
        """
        log(DEBUG, "SimulationIoServicer.GetRunStatus")
        state = self.state_factory.state()

        # Duplicate run IDs in the request are collapsed by the set
        statuses = state.get_run_status(set(request.run_ids))

        return GetRunStatusResponse(
            run_status_dict={
                run_id: run_status_to_proto(status)
                for run_id, status in statuses.items()
            }
        )

    def PushLogs(
        self, request: PushLogsRequest, context: grpc.ServicerContext
    ) -> PushLogsResponse:
        """Push logs.

        Concatenates the log entries of the request (no separator is added)
        and appends them to the ServerApp log of `request.run_id`.
        """
        log(DEBUG, "SimulationIoServicer.PushLogs")
        state = self.state_factory.state()

        # Add logs to LinkState
        merged_logs = "".join(request.logs)
        state.add_serverapp_log(request.run_id, merged_logs)
        return PushLogsResponse()

    def GetFederationOptions(
        self, request: GetFederationOptionsRequest, context: ServicerContext
    ) -> GetFederationOptionsResponse:
        """Get Federation Options associated with a run.

        Aborts the RPC with `FAILED_PRECONDITION` if no federation options
        are stored for `request.run_id`; otherwise returns them in proto form.
        """
        log(DEBUG, "SimulationIoServicer.GetFederationOptions")
        state = self.state_factory.state()

        federation_options = state.get_federation_options(request.run_id)
        if federation_options is None:
            context.abort(
                grpc.StatusCode.FAILED_PRECONDITION,
                "Expected federation options to be set, but none available.",
            )
            # Fallback return in case `abort` hands control back to the caller
            return GetFederationOptionsResponse()
        return GetFederationOptionsResponse(
            federation_options=configs_record_to_proto(federation_options)
        )
|