PyPI - langfun - Versions diffs - 0.1.2.dev202510230805__py3-none-any.whl → 0.1.2.dev202511160804__py3-none-any.whl - Mend

langfun 0.1.2.dev202510230805__py3-none-any.whl → 0.1.2.dev202511160804__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of langfun might be problematic. Click here for more details.

Files changed (146) hide show

langfun/core/__init__.py +1 -0
langfun/core/agentic/action.py +107 -12
langfun/core/agentic/action_eval.py +9 -2
langfun/core/agentic/action_test.py +25 -0
langfun/core/async_support.py +32 -3
langfun/core/coding/python/correction.py +19 -9
langfun/core/coding/python/execution.py +14 -12
langfun/core/coding/python/generation.py +21 -16
langfun/core/coding/python/sandboxing.py +23 -3
langfun/core/component.py +42 -3
langfun/core/concurrent.py +70 -6
langfun/core/concurrent_test.py +1 -0
langfun/core/console.py +1 -1
langfun/core/data/conversion/anthropic.py +12 -3
langfun/core/data/conversion/anthropic_test.py +8 -6
langfun/core/data/conversion/gemini.py +9 -2
langfun/core/data/conversion/gemini_test.py +12 -9
langfun/core/data/conversion/openai.py +145 -31
langfun/core/data/conversion/openai_test.py +161 -17
langfun/core/eval/base.py +47 -43
langfun/core/eval/base_test.py +4 -4
langfun/core/eval/matching.py +5 -2
langfun/core/eval/patching.py +3 -3
langfun/core/eval/scoring.py +4 -3
langfun/core/eval/v2/__init__.py +1 -0
langfun/core/eval/v2/checkpointing.py +39 -5
langfun/core/eval/v2/checkpointing_test.py +1 -1
langfun/core/eval/v2/eval_test_helper.py +96 -0
langfun/core/eval/v2/evaluation.py +87 -15
langfun/core/eval/v2/evaluation_test.py +9 -3
langfun/core/eval/v2/example.py +45 -39
langfun/core/eval/v2/example_test.py +3 -3
langfun/core/eval/v2/experiment.py +51 -8
langfun/core/eval/v2/metric_values.py +31 -3
langfun/core/eval/v2/metric_values_test.py +32 -0
langfun/core/eval/v2/metrics.py +157 -44
langfun/core/eval/v2/metrics_test.py +39 -18
langfun/core/eval/v2/progress.py +30 -1
langfun/core/eval/v2/progress_test.py +27 -0
langfun/core/eval/v2/progress_tracking_test.py +3 -0
langfun/core/eval/v2/reporting.py +90 -71
langfun/core/eval/v2/reporting_test.py +20 -6
langfun/core/eval/v2/runners/__init__.py +26 -0
langfun/core/eval/v2/{runners.py → runners/base.py} +22 -124
langfun/core/eval/v2/runners/debug.py +40 -0
langfun/core/eval/v2/runners/debug_test.py +79 -0
langfun/core/eval/v2/runners/parallel.py +100 -0
langfun/core/eval/v2/runners/parallel_test.py +98 -0
langfun/core/eval/v2/runners/sequential.py +47 -0
langfun/core/eval/v2/runners/sequential_test.py +175 -0
langfun/core/langfunc.py +45 -130
langfun/core/langfunc_test.py +6 -4
langfun/core/language_model.py +103 -16
langfun/core/language_model_test.py +9 -3
langfun/core/llms/__init__.py +7 -1
langfun/core/llms/anthropic.py +157 -2
langfun/core/llms/azure_openai.py +29 -17
langfun/core/llms/cache/base.py +25 -3
langfun/core/llms/cache/in_memory.py +48 -7
langfun/core/llms/cache/in_memory_test.py +14 -4
langfun/core/llms/compositional.py +25 -1
langfun/core/llms/deepseek.py +30 -2
langfun/core/llms/fake.py +32 -1
langfun/core/llms/gemini.py +14 -9
langfun/core/llms/google_genai.py +29 -1
langfun/core/llms/groq.py +28 -3
langfun/core/llms/llama_cpp.py +23 -4
langfun/core/llms/openai.py +36 -3
langfun/core/llms/openai_compatible.py +148 -27
langfun/core/llms/openai_compatible_test.py +207 -20
langfun/core/llms/openai_test.py +0 -2
langfun/core/llms/rest.py +12 -1
langfun/core/llms/vertexai.py +51 -8
langfun/core/logging.py +1 -1
langfun/core/mcp/client.py +77 -22
langfun/core/mcp/client_test.py +8 -35
langfun/core/mcp/session.py +94 -29
langfun/core/mcp/session_test.py +54 -0
langfun/core/mcp/tool.py +151 -22
langfun/core/mcp/tool_test.py +197 -0
langfun/core/memory.py +1 -0
langfun/core/message.py +160 -55
langfun/core/message_test.py +65 -81
langfun/core/modalities/__init__.py +8 -0
langfun/core/modalities/audio.py +21 -1
langfun/core/modalities/image.py +19 -1
langfun/core/modalities/mime.py +62 -3
langfun/core/modalities/pdf.py +19 -1
langfun/core/modalities/video.py +21 -1
langfun/core/modality.py +167 -29
langfun/core/modality_test.py +42 -12
langfun/core/natural_language.py +1 -1
langfun/core/sampling.py +4 -4
langfun/core/sampling_test.py +20 -4
langfun/core/structured/__init__.py +2 -24
langfun/core/structured/completion.py +34 -44
langfun/core/structured/completion_test.py +23 -43
langfun/core/structured/description.py +54 -50
langfun/core/structured/function_generation.py +29 -12
langfun/core/structured/mapping.py +81 -37
langfun/core/structured/parsing.py +95 -79
langfun/core/structured/parsing_test.py +0 -3
langfun/core/structured/querying.py +215 -142
langfun/core/structured/querying_test.py +65 -29
langfun/core/structured/schema/__init__.py +48 -0
langfun/core/structured/schema/base.py +664 -0
langfun/core/structured/schema/base_test.py +531 -0
langfun/core/structured/schema/json.py +174 -0
langfun/core/structured/schema/json_test.py +121 -0
langfun/core/structured/schema/python.py +316 -0
langfun/core/structured/schema/python_test.py +410 -0
langfun/core/structured/schema_generation.py +33 -14
langfun/core/structured/scoring.py +47 -36
langfun/core/structured/tokenization.py +26 -11
langfun/core/subscription.py +2 -2
langfun/core/template.py +174 -49
langfun/core/template_test.py +123 -17
langfun/env/__init__.py +8 -2
langfun/env/base_environment.py +320 -128
langfun/env/base_environment_test.py +473 -0
langfun/env/base_feature.py +92 -15
langfun/env/base_feature_test.py +228 -0
langfun/env/base_sandbox.py +84 -361
langfun/env/base_sandbox_test.py +1235 -0
langfun/env/event_handlers/__init__.py +1 -1
langfun/env/event_handlers/chain.py +233 -0
langfun/env/event_handlers/chain_test.py +253 -0
langfun/env/event_handlers/event_logger.py +95 -98
langfun/env/event_handlers/event_logger_test.py +21 -21
langfun/env/event_handlers/metric_writer.py +225 -140
langfun/env/event_handlers/metric_writer_test.py +23 -6
langfun/env/interface.py +854 -40
langfun/env/interface_test.py +112 -2
langfun/env/load_balancers_test.py +23 -2
langfun/env/test_utils.py +126 -84
{langfun-0.1.2.dev202510230805.dist-info → langfun-0.1.2.dev202511160804.dist-info}/METADATA +1 -1
langfun-0.1.2.dev202511160804.dist-info/RECORD +211 -0
langfun/core/eval/v2/runners_test.py +0 -343
langfun/core/structured/schema.py +0 -987
langfun/core/structured/schema_test.py +0 -982
langfun/env/base_test.py +0 -1481
langfun/env/event_handlers/base.py +0 -350
langfun-0.1.2.dev202510230805.dist-info/RECORD +0 -195
{langfun-0.1.2.dev202510230805.dist-info → langfun-0.1.2.dev202511160804.dist-info}/WHEEL +0 -0
{langfun-0.1.2.dev202510230805.dist-info → langfun-0.1.2.dev202511160804.dist-info}/licenses/LICENSE +0 -0
{langfun-0.1.2.dev202510230805.dist-info → langfun-0.1.2.dev202511160804.dist-info}/top_level.txt +0 -0

langfun/env/base_environment.py CHANGED Viewed

@@ -23,8 +23,10 @@ Note that:
 """
 import abc
+import collections
 import functools
 import random
+import re
 import threading
 import time
 from typing import Annotated, Any
@@ -34,7 +36,6 @@ import langfun.core as lf
 from langfun.env import base_sandbox
 from langfun.env import interface
 from langfun.env import load_balancers
-from langfun.env.event_handlers import base as event_handler_base
 import pyglove as pg
@@ -46,6 +47,23 @@ class BaseEnvironment(interface.Environment):
   maintenance.
   """
+  image_ids: Annotated[
+      list[str],
+      (
+          'A list of static image IDs served by the environment. '
+      )
+  ]
+  supports_dynamic_image_loading: Annotated[
+      bool,
+      (
+          'Whether the environment supports dynamic loading of images which is '
+          'not included in the `image_ids`. `image_ids` could coexist with '
+          'dynamic image loading, which allows users to specify an image id '
+          'that is not included in the `image_ids`.'
+      )
+  ] = False
   root_dir: Annotated[
       str | None,
       (
@@ -55,11 +73,15 @@ class BaseEnvironment(interface.Environment):
   ] = None
   pool_size: Annotated[
-      int | tuple[int, int],
+      int | tuple[int, int] | dict[str, int | tuple[int, int]],
       (
           'The (min_size, max_size) of the sandbox pool. If an integer, it '
-          'will be used as both min and max size. If 0, sandboxes will be '
-          'created on demand and shutdown when user session ends.'
+          'will be used as both min and max size. If 0, all sandboxes will be '
+          'created on demand and shutdown when user session ends. If a dict, '
+          'users could configure the pool size based on image IDs. The keys '
+          'are regular expressions for image IDs, and the values are '
+          '(min_size, max_size) tuples. For dynamic image IDs, min_size will '
+          'ignored while max_size will be honored.'
       )
   ] = (0, 256)
@@ -90,12 +112,13 @@ class BaseEnvironment(interface.Environment):
       )
   ] = True
-  event_handlers: Annotated[
-      list[event_handler_base.EventHandler],
+  event_handler: Annotated[
+      interface.EventHandler,
       (
           'User handler for the environment events.'
+          'By default, the no-op event handler is used.'
       )
-  ] = []
+  ] = interface.EventHandler()
   outage_grace_period: Annotated[
       float,
@@ -146,14 +169,39 @@ class BaseEnvironment(interface.Environment):
     self._status = self.Status.CREATED
     self._start_time = None
-    self._sandbox_pool = []
-    self._next_pooled_sandbox_id = 0
+    self._sandbox_pool: dict[str, list[base_sandbox.BaseSandbox]] = (
+        collections.defaultdict(list)
+    )
+    self._next_sandbox_id: dict[str, int] = collections.defaultdict(int)
     self._random = (
         random if self.random_seed is None else random.Random(self.random_seed)
     )
     self._housekeep_thread = None
     self._offline_start_time = None
+    self._non_sandbox_based_features_with_setup_called = set()
+    # Check image IDs and feature requirements.
+    self._check_image_ids()
+    self._check_feature_requirements()
+  def _check_image_ids(self) -> None:
+    """Checks image ids. Subclass could override this method."""
+  def _check_feature_requirements(self) -> None:
+    """Checks if the image ID is supported by the feature."""
+    if self.supports_dynamic_image_loading:
+      return
+    for name, feature in self.features.items():
+      if not feature.is_sandbox_based or any(
+          feature.is_applicable(image_id) for image_id in self.image_ids
+      ):
+        continue
+      raise ValueError(
+          f'Feature {name!r} is not applicable to all available images: '
+          f'{self.image_ids!r}. '
+          f'Applicable images: {feature.applicable_images}.'
+      )
   #
   # Subclasses must implement:
@@ -162,6 +210,7 @@ class BaseEnvironment(interface.Environment):
   @abc.abstractmethod
   def _create_sandbox(
       self,
+      image_id: str,
       sandbox_id: str,
       reusable: bool,
       proactive_session_setup: bool,
@@ -170,6 +219,7 @@ class BaseEnvironment(interface.Environment):
     """Creates a sandbox with the given identifier.
     Args:
+      image_id: The image ID to use for the sandbox.
       sandbox_id: The identifier for the sandbox.
       reusable: Whether the sandbox is reusable across user sessions.
       proactive_session_setup: Whether the sandbox performs session setup work
@@ -185,13 +235,13 @@ class BaseEnvironment(interface.Environment):
       interface.SandboxStateError: If sandbox cannot be started.
     """
-  def new_session_id(self) -> str:
+  def new_session_id(self, feature_hint: str | None = None) -> str:
     """Generates a random session ID."""
     suffix = uuid.UUID(
         bytes=bytes(bytes(self._random.getrandbits(8) for _ in range(16))),
         version=4
     ).hex[:7]
-    return f'session-{suffix}'
+    return f'{feature_hint or "unknown"}-session-{suffix}'
   @property
   def housekeep_counter(self) -> int:
@@ -204,42 +254,66 @@ class BaseEnvironment(interface.Environment):
   def stats(self) -> dict[str, Any]:
     """Returns the stats of the environment."""
-    stats_dict = {
-        status.value: 0
-        for status in interface.Sandbox.Status
-    }
-    for sandbox in self._sandbox_pool:
-      stats_dict[sandbox.status.value] += 1
+    stats_by_image_id = {}
+    for image_id, sandboxes in self._sandbox_pool.items():
+      stats_dict = {
+          status.value: 0
+          for status in interface.Sandbox.Status
+      }
+      for sandbox in sandboxes:
+        stats_dict[sandbox.status.value] += 1
+      stats_by_image_id[image_id] = stats_dict
     return {
-        'sandbox': stats_dict,
+        'sandbox': stats_by_image_id,
     }
   def _start(self) -> None:
     """Implementation of starting the environment."""
-    if self.min_pool_size > 0:
-      # Pre-allocate the sandbox pool before usage.
-      self._sandbox_pool = [None] * self.min_pool_size
-      for i, sandbox, _ in lf.concurrent_map(
-          lambda i: self._bring_up_sandbox_with_retry(
-              sandbox_id=f'{i}:0', shutdown_env_upon_outage=False
-          ),
-          range(self.min_pool_size),
-          silence_on_errors=None,
-          max_workers=min(
-              self.pool_operation_max_parallelism,
-              self.min_pool_size
-          ),
-      ):
-        self._sandbox_pool[i] = sandbox
-    self._next_sandbox_id = len(self._sandbox_pool)
+    sandbox_startup_infos = []
+    self._non_sandbox_based_features_with_setup_called.clear()
+    # Setup all non-sandbox-based features.
+    for feature in self.non_sandbox_based_features():
+      self._non_sandbox_based_features_with_setup_called.add(feature.name)
+      feature.setup(sandbox=None)
+    # Setup sandbox pools.
+    for image_id in self.image_ids:
+      next_sandbox_id = 0
+      if self.enable_pooling(image_id):
+        min_pool_size = self.min_pool_size(image_id)
+        for i in range(min_pool_size):
+          sandbox_startup_infos.append((image_id, i))
+        self._sandbox_pool[image_id] = [None] * min_pool_size
+        next_sandbox_id = min_pool_size
+      self._next_sandbox_id[image_id] = next_sandbox_id
+    def _start_sandbox(sandbox_startup_info) -> None:
+      image_id, index = sandbox_startup_info
+      self._sandbox_pool[image_id][index] = self._bring_up_sandbox_with_retry(
+          image_id=image_id,
+          sandbox_id=f'{index}:0',
+          shutdown_env_upon_outage=False
+      )
-    if self.enable_pooling:
-      self._housekeep_thread = threading.Thread(
-          target=self._housekeep_loop, daemon=True
+    if sandbox_startup_infos:
+      # Pre-allocate the sandbox pool before usage.
+      _ = list(
+          lf.concurrent_map(
+              _start_sandbox,
+              sandbox_startup_infos,
+              silence_on_errors=None,
+              max_workers=min(
+                  self.pool_operation_max_parallelism,
+                  len(sandbox_startup_infos)
+              ),
+          )
       )
-      self._housekeep_counter = 0
-      self._housekeep_thread.start()
+    self._housekeep_thread = threading.Thread(
+        target=self._housekeep_loop, daemon=True
+    )
+    self._housekeep_counter = 0
+    self._housekeep_thread.start()
   def _shutdown(self) -> None:
     """Implementation of shutting down the environment."""
@@ -248,30 +322,44 @@ class BaseEnvironment(interface.Environment):
       self._housekeep_thread.join()
       self._housekeep_thread = None
-    def _shutdown_sandbox(sandbox: base_sandbox.BaseSandbox) -> None:
-      if sandbox is not None:
-        sandbox.shutdown()
+    # Teardown all non-sandbox-based features.
+    for feature in self.non_sandbox_based_features():
+      if feature.name in self._non_sandbox_based_features_with_setup_called:
+        try:
+          feature.teardown()
+        except BaseException:   # pylint: disable=broad-except
+          pass
+    # Shutdown sandbox pools.
     if self._sandbox_pool:
-      _ = list(
-          lf.concurrent_map(
-              _shutdown_sandbox,
-              self._sandbox_pool,
-              silence_on_errors=None,
-              max_workers=min(
-                  self.pool_operation_max_parallelism,
-                  len(self._sandbox_pool)
-              ),
-          )
-      )
-      self._sandbox_pool = []
+      sandboxes = []
+      for sandbox in self._sandbox_pool.values():
+        sandboxes.extend(sandbox)
+      self._sandbox_pool = {}
+      if sandboxes:
+        def _shutdown_sandbox(sandbox: base_sandbox.BaseSandbox) -> None:
+          if sandbox is not None:
+            sandbox.shutdown()
+        _ = list(
+            lf.concurrent_map(
+                _shutdown_sandbox,
+                sandboxes,
+                silence_on_errors=None,
+                max_workers=min(
+                    self.pool_operation_max_parallelism,
+                    len(sandboxes)
+                ),
+            )
+        )
   #
   # Environment basics.
   #
   @property
-  def sandbox_pool(self) -> list[base_sandbox.BaseSandbox]:
+  def sandbox_pool(self) -> dict[str, list[base_sandbox.BaseSandbox]]:
     """Returns the sandbox pool."""
     return self._sandbox_pool
@@ -280,11 +368,6 @@ class BaseEnvironment(interface.Environment):
     """Returns the working directory for the environment."""
     return self.id.working_dir(self.root_dir)
-  @property
-  def enable_pooling(self) -> bool:
-    """Returns whether the environment enables pooling."""
-    return self.max_pool_size > 0
   @property
   def status(self) -> interface.Environment.Status:
     """Returns whether the environment is online."""
@@ -294,19 +377,39 @@ class BaseEnvironment(interface.Environment):
     """Sets the status of the environment."""
     self._status = status
-  @property
-  def min_pool_size(self) -> int:
+  def enable_pooling(self, image_id: str) -> bool:
+    """Returns whether the environment enables pooling."""
+    return self.max_pool_size(image_id) > 0
+  def min_pool_size(self, image_id: str) -> int:
     """Returns the minimum size of the sandbox pool."""
-    if isinstance(self.pool_size, int):
-      return self.pool_size
-    return self.pool_size[0]
+    return self._pool_size(image_id)[0]
-  @property
-  def max_pool_size(self) -> int:
+  def max_pool_size(self, image_id: str) -> int:
     """Returns the maximum size of the sandbox pool."""
-    if isinstance(self.pool_size, int):
-      return self.pool_size
-    return self.pool_size[1]
+    return self._pool_size(image_id)[1]
+  def _pool_size(self, image_id: str) -> tuple[int, int]:
+    """Returns the minimum and maximum size of the sandbox pool."""
+    if isinstance(self.pool_size, dict):
+      if image_id in self.pool_size:
+        pool_size = self.pool_size[image_id]
+      else:
+        for k, v in self.pool_size.items():
+          if re.match(k, image_id):
+            pool_size = v
+            break
+        else:
+          # Default pool size is 0 and 256.
+          pool_size = (0, 256)
+    else:
+      pool_size = self.pool_size
+    if isinstance(pool_size, int):
+      return pool_size, pool_size
+    else:
+      assert isinstance(pool_size, tuple) and len(pool_size) == 2
+      return pool_size
   @property
   def start_time(self) -> float | None:
@@ -373,9 +476,16 @@ class BaseEnvironment(interface.Environment):
   # Environment operations.
   #
-  def acquire(self) -> base_sandbox.BaseSandbox:
+  def acquire(
+      self,
+      image_id: str | None = None
+  ) -> base_sandbox.BaseSandbox:
     """Acquires a sandbox from the environment.
+    Args:
+      image_id: The image ID to use for the sandbox. If None, it will be
+        automatically determined by the environment.
     Returns:
       The acquired sandbox.
@@ -385,28 +495,50 @@ class BaseEnvironment(interface.Environment):
       interface.EnvironmentOverloadError: If the max pool size is reached and
         the grace period has passed.
     """
     if not self.is_online:
       raise interface.EnvironmentOutageError(
           f'Environment {self.id} is not alive.',
           environment=self,
           offline_duration=self.offline_duration,
       )
+    if image_id is None:
+      if not self.image_ids:
+        raise ValueError(
+            f'Environment {self.id} does not have a default image ID. '
+            'Please specify the image ID explicitly.'
+        )
+      image_id = self.image_ids[0]
+    elif (image_id not in self.image_ids
+          and not self.supports_dynamic_image_loading):
+      raise ValueError(
+          f'Environment {self.id} does not serve image ID {image_id!r}. '
+          f'Please use one of the following image IDs: {self.image_ids!r} or '
+          f'set `{self.__class__.__name__}.supports_dynamic_image_loading` '
+          'to True if dynamic image loading is supported.'
+      )
+    return self._acquire(image_id)
-    if not self.enable_pooling:
+  def _acquire(
+      self,
+      image_id: str | None = None
+  ) -> base_sandbox.BaseSandbox:
+    """Acquires a sandbox from the environment."""
+    if not self.enable_pooling(image_id):
       return self._bring_up_sandbox_with_retry(
-          sandbox_id=str(self._increment_sandbox_id()),
+          image_id=image_id,
+          sandbox_id=str(self._increment_sandbox_id(image_id)),
           set_acquired=True,
       )
     allocation_start_time = time.time()
+    sandbox_pool = self._sandbox_pool[image_id]
     while True:
       try:
         # We only append or replace items in the sandbox pool, therefore
         # there is no need to lock the pool.
-        return self.load_balancer.acquire(self._sandbox_pool)
+        return self.load_balancer.acquire(sandbox_pool)
       except IndexError:
-        if len(self._sandbox_pool) == self.max_pool_size:
+        if len(sandbox_pool) == self.max_pool_size(image_id):
           if time.time() - allocation_start_time > self.outage_grace_period:
             raise interface.EnvironmentOverloadError(  # pylint: disable=raise-missing-from
                 environment=self
@@ -415,11 +547,12 @@ class BaseEnvironment(interface.Environment):
         else:
           try:
             sandbox = self._bring_up_sandbox(
-                sandbox_id=f'{self._increment_sandbox_id()}:0',
+                image_id=image_id,
+                sandbox_id=f'{self._increment_sandbox_id(image_id)}:0',
                 set_acquired=True,
             )
             # Append is atomic and does not require locking.
-            self._sandbox_pool.append(sandbox)
+            sandbox_pool.append(sandbox)
             return sandbox
           except (
               interface.EnvironmentError, interface.SandboxStateError
@@ -428,6 +561,7 @@ class BaseEnvironment(interface.Environment):
   def _bring_up_sandbox(
       self,
+      image_id: str,
       sandbox_id: str,
       set_acquired: bool = False,
   ) -> base_sandbox.BaseSandbox:
@@ -435,13 +569,12 @@ class BaseEnvironment(interface.Environment):
     env_error = None
     try:
       sandbox = self._create_sandbox(
+          image_id=image_id,
           sandbox_id=sandbox_id,
-          reusable=self.enable_pooling,
+          reusable=self.enable_pooling(image_id),
           proactive_session_setup=self.proactive_session_setup,
           keepalive_interval=self.sandbox_keepalive_interval,
       )
-      for handler in self.event_handlers:
-        sandbox.add_event_handler(handler)
       sandbox.start()
       if set_acquired:
         sandbox.set_acquired()
@@ -457,6 +590,7 @@ class BaseEnvironment(interface.Environment):
   def _bring_up_sandbox_with_retry(
       self,
+      image_id: str,
       sandbox_id: str,
       set_acquired: bool = False,
       shutdown_env_upon_outage: bool = True,
@@ -464,6 +598,7 @@ class BaseEnvironment(interface.Environment):
     """Brings up a new sandbox with retry until grace period is passed.
     Args:
+      image_id: The image ID to use for the sandbox.
       sandbox_id: The ID of the sandbox to bring up.
       set_acquired: If True, the sandbox will be marked as acquired.
       shutdown_env_upon_outage: Whether to shutdown the environment when the
@@ -479,15 +614,15 @@ class BaseEnvironment(interface.Environment):
     while True:
       try:
         return self._bring_up_sandbox(
-            sandbox_id=sandbox_id, set_acquired=set_acquired
+            image_id=image_id, sandbox_id=sandbox_id, set_acquired=set_acquired
         )
       except (interface.EnvironmentError, interface.SandboxStateError) as e:
         self._report_outage_or_wait(e, shutdown_env_upon_outage)
-  def _increment_sandbox_id(self) -> int:
+  def _increment_sandbox_id(self, image_id: str) -> int:
     """Returns the next pooled sandbox ID."""
-    x = self._next_sandbox_id
-    self._next_sandbox_id += 1
+    x = self._next_sandbox_id[image_id]
+    self._next_sandbox_id[image_id] += 1
     return x
   def _report_outage_or_wait(
@@ -511,33 +646,83 @@ class BaseEnvironment(interface.Environment):
   def _housekeep_loop(self) -> None:
     """Housekeeping loop for the environment."""
+    def _indices_by_image_id(
+        entries: list[tuple[str, int, Any]]
+    ) -> dict[str, list[int]]:
+      indices_by_image_id = collections.defaultdict(list)
+      for image_id, i, _ in entries:
+        indices_by_image_id[image_id].append(i)
+      return indices_by_image_id
+    last_housekeep_time = {
+        f.name: time.time() for f in self.non_sandbox_based_features()
+    }
     while self._status not in (self.Status.SHUTTING_DOWN, self.Status.OFFLINE):
       housekeep_start_time = time.time()
+      feature_housekeep_successes = []
+      feature_housekeep_failures = []
+      # Housekeeping non-sandbox-based features.
+      for feature in self.non_sandbox_based_features():
+        if feature.housekeep_interval is None:
+          continue
+        if (last_housekeep_time[feature.name]
+            + feature.housekeep_interval < time.time()):
+          try:
+            feature.housekeep()
+            last_housekeep_time[feature.name] = time.time()
+            feature_housekeep_successes.append(feature.name)
+          except BaseException as e:  # pylint: disable=broad-except
+            pg.logging.error(
+                '[%s/%s]: Feature housekeeping failed with error: %s.'
+                'Shutting down environment...',
+                self.id,
+                feature.name,
+                e,
+            )
+            feature_housekeep_failures.append(feature.name)
+            self._housekeep_counter += 1
+            self.on_housekeep(
+                duration=time.time() - housekeep_start_time,
+                error=e,
+                feature_housekeep_successes=feature_housekeep_successes,
+                feature_housekeep_failures=feature_housekeep_failures,
+            )
+            self.shutdown()
+            return
+      # Replace dead sandboxes.
       is_online = True
-      dead_pool_indices = [
-          i for i, s in enumerate(self._sandbox_pool)
-          if s.status == interface.Sandbox.Status.OFFLINE
-      ]
-      replaced_indices = []
-      if dead_pool_indices:
-        replaced_indices = self._replace_dead_sandboxes(dead_pool_indices)
-        if not replaced_indices:
+      dead_sandbox_entries = []
+      for image_id, sandboxes in self._sandbox_pool.items():
+        for i, sandbox in enumerate(sandboxes):
+          if sandbox.status == interface.Sandbox.Status.OFFLINE:
+            dead_sandbox_entries.append((image_id, i, sandbox))
+      replaced_indices_by_image_id = {}
+      if dead_sandbox_entries:
+        replaced_indices_by_image_id = self._replace_dead_sandboxes(
+            dead_sandbox_entries
+        )
+        if not replaced_indices_by_image_id:
           is_online = self.offline_duration < self.outage_grace_period
       self._housekeep_counter += 1
       duration = time.time() - housekeep_start_time
       kwargs = dict(
-          dead_pool_indices=dead_pool_indices,
-          replaced_indices=replaced_indices,
+          feature_housekeep_successes=feature_housekeep_successes,
+          feature_housekeep_failures=feature_housekeep_failures,
+          dead_sandboxes=_indices_by_image_id(dead_sandbox_entries),
+          replaced_sandboxes=replaced_indices_by_image_id,
           offline_duration=self.offline_duration,
       )
       if is_online:
         self.on_housekeep(duration, **kwargs)
         time.sleep(self.housekeep_interval)
       else:
-        self.shutdown()
         self.on_housekeep(
             duration,
             interface.EnvironmentOutageError(
@@ -545,50 +730,63 @@ class BaseEnvironment(interface.Environment):
             ),
             **kwargs
         )
+        self.shutdown()
-  def _replace_dead_sandboxes(self, dead_pool_indices: list[int]) -> list[int]:
+  def _replace_dead_sandboxes(
+      self,
+      dead_sandbox_entries: list[tuple[str, int, base_sandbox.BaseSandbox]]
+  ) -> dict[str, list[int]]:
     """Replaces a dead sandbox with a new one.
     Args:
-      dead_pool_indices: The indices of the dead sandboxes to replace.
+      dead_sandbox_entries: A list of tuples (image_id, index, sandbox) of
+        dead sandboxes to replace.
     Returns:
-      Successfully replaced indices.
+      Successfully replaced sandboxes in a dict of image ID to a list of
+        indices.
     """
     pg.logging.warning(
         '[%s]: %s maintenance: '
         'Replacing %d dead sandbox(es) with new ones...',
         self.id,
         self.__class__.__name__,
-        len(dead_pool_indices),
+        len(dead_sandbox_entries),
     )
-    def _replace(i: int):
-      generation = int(self._sandbox_pool[i].id.sandbox_id.split(':')[1])
-      self._sandbox_pool[i] = self._bring_up_sandbox(f'{i}:{generation + 1}')
+    def _replace(sandbox_entry: tuple[str, int, base_sandbox.BaseSandbox]):
+      image_id, i, sandbox = sandbox_entry
+      generation = int(sandbox.id.sandbox_id.split(':')[-1])
+      replaced_sandbox = self._bring_up_sandbox(
+          image_id=image_id,
+          sandbox_id=f'{i}:{generation + 1}'
+      )
+      self._sandbox_pool[image_id][i] = replaced_sandbox
     # TODO(daiyip): Consider to loose the condition to allow some dead
     # sandboxes to be replaced successfully.
-    replaced_indices = []
-    for index, _, error in lf.concurrent_map(
-        _replace, dead_pool_indices,
+    replaced_indices_by_image_id = collections.defaultdict(list)
+    num_replaced = 0
+    for (image_id, index, _), _, error in lf.concurrent_map(
+        _replace, dead_sandbox_entries,
         max_workers=min(
             self.pool_operation_max_parallelism,
-            len(dead_pool_indices)
+            len(dead_sandbox_entries)
         ),
     ):
       if error is None:
-        replaced_indices.append(index)
+        replaced_indices_by_image_id[image_id].append(index)
+        num_replaced += 1
     pg.logging.warning(
         '[%s]: %s maintenance: '
         '%d/%d dead sandbox(es) have been replaced with new ones. (slots=%s)',
         self.id,
         self.__class__.__name__,
-        len(replaced_indices),
-        len(dead_pool_indices),
-        replaced_indices
+        num_replaced,
+        len(dead_sandbox_entries),
+        replaced_indices_by_image_id,
     )
-    return replaced_indices
+    return replaced_indices_by_image_id
   #
   # Event handlers subclasses can override.
@@ -596,16 +794,14 @@ class BaseEnvironment(interface.Environment):
   def on_starting(self) -> None:
     """Called when the environment is getting started."""
-    for handler in self.event_handlers:
-      handler.on_environment_starting(self)
+    self.event_handler.on_environment_starting(self)
   def on_start(
       self,
       duration: float, error: BaseException | None = None
   ) -> None:
     """Called when the environment is started."""
-    for handler in self.event_handlers:
-      handler.on_environment_start(self, duration, error)
+    self.event_handler.on_environment_start(self, duration, error)
   def on_housekeep(
       self,
@@ -614,16 +810,13 @@ class BaseEnvironment(interface.Environment):
       **kwargs
   ) -> None:
     """Called when the environment finishes a round of housekeeping."""
-    housekeep_counter = self.housekeep_counter
-    for handler in self.event_handlers:
-      handler.on_environment_housekeep(
-          self, housekeep_counter, duration, error, **kwargs
-      )
+    self.event_handler.on_environment_housekeep(
+        self, self.housekeep_counter, duration, error, **kwargs
+    )
   def on_shutting_down(self) -> None:
     """Called when the environment is shutting down."""
-    for handler in self.event_handlers:
-      handler.on_environment_shutting_down(self, self.offline_duration)
+    self.event_handler.on_environment_shutting_down(self, self.offline_duration)
   def on_shutdown(
       self,
@@ -631,5 +824,4 @@ class BaseEnvironment(interface.Environment):
       error: BaseException | None = None) -> None:
     """Called when the environment is shutdown."""
     lifetime = (time.time() - self.start_time) if self.start_time else 0.0
-    for handler in self.event_handlers:
-      handler.on_environment_shutdown(self, duration, lifetime, error)
+    self.event_handler.on_environment_shutdown(self, duration, lifetime, error)

langfun 0.1.2.dev202510230805__py3-none-any.whl → 0.1.2.dev202511160804__py3-none-any.whl

Potentially problematic release.

langfun 0.1.2.dev202510230805__py3-none-any.whl → 0.1.2.dev202511160804__py3-none-any.whl