langfun-0.1.2.dev202509020804-py3-none-any.whl → langfun-0.1.2.dev202511110805-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- langfun/__init__.py +1 -1
- langfun/core/__init__.py +6 -1
- langfun/core/agentic/__init__.py +4 -0
- langfun/core/agentic/action.py +412 -103
- langfun/core/agentic/action_eval.py +9 -2
- langfun/core/agentic/action_test.py +68 -6
- langfun/core/async_support.py +104 -5
- langfun/core/async_support_test.py +23 -0
- langfun/core/coding/python/correction.py +19 -9
- langfun/core/coding/python/execution.py +14 -12
- langfun/core/coding/python/generation.py +21 -16
- langfun/core/coding/python/sandboxing.py +23 -3
- langfun/core/component.py +42 -3
- langfun/core/concurrent.py +70 -6
- langfun/core/concurrent_test.py +9 -2
- langfun/core/console.py +1 -1
- langfun/core/data/conversion/anthropic.py +12 -3
- langfun/core/data/conversion/anthropic_test.py +8 -6
- langfun/core/data/conversion/gemini.py +9 -2
- langfun/core/data/conversion/gemini_test.py +12 -9
- langfun/core/data/conversion/openai.py +145 -31
- langfun/core/data/conversion/openai_test.py +161 -17
- langfun/core/eval/base.py +47 -43
- langfun/core/eval/base_test.py +4 -4
- langfun/core/eval/matching.py +5 -2
- langfun/core/eval/patching.py +3 -3
- langfun/core/eval/scoring.py +4 -3
- langfun/core/eval/v2/__init__.py +1 -0
- langfun/core/eval/v2/checkpointing.py +30 -4
- langfun/core/eval/v2/eval_test_helper.py +1 -1
- langfun/core/eval/v2/evaluation.py +60 -14
- langfun/core/eval/v2/example.py +22 -11
- langfun/core/eval/v2/experiment.py +51 -8
- langfun/core/eval/v2/metric_values.py +31 -3
- langfun/core/eval/v2/metric_values_test.py +32 -0
- langfun/core/eval/v2/metrics.py +39 -4
- langfun/core/eval/v2/metrics_test.py +14 -0
- langfun/core/eval/v2/progress.py +30 -1
- langfun/core/eval/v2/progress_test.py +27 -0
- langfun/core/eval/v2/progress_tracking_test.py +6 -0
- langfun/core/eval/v2/reporting.py +90 -71
- langfun/core/eval/v2/reporting_test.py +20 -6
- langfun/core/eval/v2/runners.py +27 -7
- langfun/core/eval/v2/runners_test.py +3 -0
- langfun/core/langfunc.py +45 -130
- langfun/core/langfunc_test.py +6 -4
- langfun/core/language_model.py +151 -31
- langfun/core/language_model_test.py +9 -3
- langfun/core/llms/__init__.py +12 -1
- langfun/core/llms/anthropic.py +157 -2
- langfun/core/llms/azure_openai.py +29 -17
- langfun/core/llms/cache/base.py +25 -3
- langfun/core/llms/cache/in_memory.py +48 -7
- langfun/core/llms/cache/in_memory_test.py +14 -4
- langfun/core/llms/compositional.py +25 -1
- langfun/core/llms/deepseek.py +30 -2
- langfun/core/llms/fake.py +39 -1
- langfun/core/llms/fake_test.py +9 -0
- langfun/core/llms/gemini.py +43 -7
- langfun/core/llms/google_genai.py +34 -1
- langfun/core/llms/groq.py +28 -3
- langfun/core/llms/llama_cpp.py +23 -4
- langfun/core/llms/openai.py +93 -3
- langfun/core/llms/openai_compatible.py +148 -27
- langfun/core/llms/openai_compatible_test.py +207 -20
- langfun/core/llms/openai_test.py +0 -2
- langfun/core/llms/rest.py +16 -1
- langfun/core/llms/vertexai.py +59 -8
- langfun/core/logging.py +1 -1
- langfun/core/mcp/__init__.py +10 -0
- langfun/core/mcp/client.py +177 -0
- langfun/core/mcp/client_test.py +71 -0
- langfun/core/mcp/session.py +241 -0
- langfun/core/mcp/session_test.py +54 -0
- langfun/core/mcp/testing/simple_mcp_client.py +33 -0
- langfun/core/mcp/testing/simple_mcp_server.py +33 -0
- langfun/core/mcp/tool.py +256 -0
- langfun/core/mcp/tool_test.py +197 -0
- langfun/core/memory.py +1 -0
- langfun/core/message.py +160 -55
- langfun/core/message_test.py +65 -81
- langfun/core/modalities/__init__.py +8 -0
- langfun/core/modalities/audio.py +21 -1
- langfun/core/modalities/image.py +19 -1
- langfun/core/modalities/mime.py +62 -3
- langfun/core/modalities/pdf.py +19 -1
- langfun/core/modalities/video.py +21 -1
- langfun/core/modality.py +167 -29
- langfun/core/modality_test.py +42 -12
- langfun/core/natural_language.py +1 -1
- langfun/core/sampling.py +4 -4
- langfun/core/sampling_test.py +20 -4
- langfun/core/structured/completion.py +34 -44
- langfun/core/structured/completion_test.py +23 -43
- langfun/core/structured/description.py +54 -50
- langfun/core/structured/function_generation.py +29 -12
- langfun/core/structured/mapping.py +74 -28
- langfun/core/structured/parsing.py +90 -74
- langfun/core/structured/parsing_test.py +0 -3
- langfun/core/structured/querying.py +242 -156
- langfun/core/structured/querying_test.py +95 -64
- langfun/core/structured/schema.py +70 -10
- langfun/core/structured/schema_generation.py +33 -14
- langfun/core/structured/scoring.py +45 -34
- langfun/core/structured/tokenization.py +24 -9
- langfun/core/subscription.py +2 -2
- langfun/core/template.py +175 -50
- langfun/core/template_test.py +123 -17
- langfun/env/__init__.py +43 -0
- langfun/env/base_environment.py +827 -0
- langfun/env/base_environment_test.py +473 -0
- langfun/env/base_feature.py +304 -0
- langfun/env/base_feature_test.py +228 -0
- langfun/env/base_sandbox.py +842 -0
- langfun/env/base_sandbox_test.py +1235 -0
- langfun/env/event_handlers/__init__.py +14 -0
- langfun/env/event_handlers/chain.py +233 -0
- langfun/env/event_handlers/chain_test.py +253 -0
- langfun/env/event_handlers/event_logger.py +472 -0
- langfun/env/event_handlers/event_logger_test.py +304 -0
- langfun/env/event_handlers/metric_writer.py +726 -0
- langfun/env/event_handlers/metric_writer_test.py +214 -0
- langfun/env/interface.py +1640 -0
- langfun/env/interface_test.py +151 -0
- langfun/env/load_balancers.py +59 -0
- langfun/env/load_balancers_test.py +139 -0
- langfun/env/test_utils.py +497 -0
- {langfun-0.1.2.dev202509020804.dist-info → langfun-0.1.2.dev202511110805.dist-info}/METADATA +7 -3
- langfun-0.1.2.dev202511110805.dist-info/RECORD +200 -0
- langfun-0.1.2.dev202509020804.dist-info/RECORD +0 -172
- {langfun-0.1.2.dev202509020804.dist-info → langfun-0.1.2.dev202511110805.dist-info}/WHEEL +0 -0
- {langfun-0.1.2.dev202509020804.dist-info → langfun-0.1.2.dev202511110805.dist-info}/licenses/LICENSE +0 -0
- {langfun-0.1.2.dev202509020804.dist-info → langfun-0.1.2.dev202511110805.dist-info}/top_level.txt +0 -0
langfun/core/llms/cache/in_memory.py
CHANGED

@@ -24,7 +24,32 @@ import pyglove as pg
 
 @pg.use_init_args(['filename', 'ttl', 'key'])
 class InMemory(base.LMCacheBase):
-  """
+  """An in-memory cache for language model lookups.
+
+  `InMemory` stores LM prompts and their corresponding responses in memory,
+  providing a simple and fast caching mechanism for a single session.
+  Optionally, it can persist the cache to a JSON file on disk, allowing
+  results to be reused across sessions.
+
+  When a filename is provided, the cache will be loaded from the file upon
+  initialization and saved to the file when `save()` is called. This is
+  useful for caching results in interactive environments like Colab or
+  when running batch jobs.
+
+  Example:
+
+  ```python
+  import langfun as lf
+  # Using in-memory cache without persistence
+  lm = lf.llms.GeminiPro(cache=lf.llms.cache.InMemory())
+  r = lm.query('hello')
+
+  # Using in-memory cache with persistence
+  lm = lf.llms.GeminiPro(cache=lf.llms.cache.InMemory('cache.json'))
+  r = lm.query('hello')
+  lm.cache.save()
+  ```
+  """
 
   filename: Annotated[
       str | None,
@@ -144,17 +169,33 @@ class InMemory(base.LMCacheBase):
 
 @contextlib.contextmanager
 def lm_cache(filename: str | None = None) -> Iterator[InMemory]:
-  """Context manager to enable cache for LMs
+  """Context manager to enable in-memory cache for LMs in the current context.
+
+  This context manager sets an `InMemory` cache as the default cache for
+  any Langfun language model instantiated within its scope, unless a model
+  is explicitly configured with a different cache.
+
+  If a `filename` is provided, the cache will be loaded from the specified
+  file at the beginning of the context and automatically saved back to the
+  file upon exiting the context. This is a convenient way to manage
+  persistent caching for a block of code.
+
+  Example:
 
-
-
-
+  ```python
+  import langfun as lf
+  with lf.lm_cache('my_cache.json'):
+    # LMs created here will use 'my_cache.json' for caching.
+    lm = lf.llms.GeminiPro()
+    print(lm.query('hello'))
+  ```
 
   Args:
-    filename: If
+    filename: If provided, specifies the JSON file for loading and saving
+      the cache.
 
   Yields:
-
+    The `InMemory` cache instance created for this context.
   """
   cache = InMemory(filename)
   try:
langfun/core/llms/cache/in_memory_test.py
CHANGED

@@ -175,18 +175,28 @@ class InMemoryLMCacheTest(unittest.TestCase):
 
     cache = in_memory.InMemory()
     lm = fake.StaticSequence(['1', '2', '3', '4', '5', '6'], cache=cache)
-
-
+    image_foo = CustomModality('foo')
+    image_bar = CustomModality('bar')
+    lm(
+        lf.UserMessage(
+            f'hi <<[[{image_foo.id}]]>>', referred_modalities=[image_foo]
+        )
+    )
+    lm(
+        lf.UserMessage(
+            f'hi <<[[{image_bar.id}]]>>', referred_modalities=[image_bar]
+        )
+    )
     self.assertEqual(
         list(cache.keys()),
         [
            (
-                'hi <<[[
+                f'hi <<[[{image_foo.id}]]>>',
                (None, None, 1, 40, None, None),
                0,
            ),
            (
-                'hi <<[[
+                f'hi <<[[{image_bar.id}]]>>',
                (None, None, 1, 40, None, None),
                0,
            ),
langfun/core/llms/compositional.py
CHANGED

@@ -21,7 +21,31 @@ import pyglove as pg
 
 @pg.use_init_args(['candidates', 'seed'])
 class RandomChoice(lf.LanguageModel):
-  """
+  """A composite language model that randomly selects from a list of candidates.
+
+  `RandomChoice` acts as a proxy that forwards each request (`sample`, `score`,
+  `tokenize`, or `__call__`) to one of the `candidates` selected randomly.
+  This can be useful for load balancing across multiple LLM endpoints,
+  for A/B testing different models, or for ensembling model outputs
+  by calling it multiple times.
+
+  The selection is determined by the provided `seed`, ensuring reproducibility
+  if needed.
+
+  Example:
+
+  ```python
+  import langfun as lf
+
+  lm = lf.llms.RandomChoice([
+      lf.llms.GeminiPro(),
+      lf.llms.GPT4(),
+  ])
+
+  # This call will be handled by either GeminiPro or GPT4, chosen randomly.
+  r = lm.sample('hello')
+  ```
+  """
 
   candidates: Annotated[
       list[lf.LanguageModel],
langfun/core/llms/deepseek.py
CHANGED

@@ -93,8 +93,36 @@ _SUPPORTED_MODELS_BY_ID = {m.model_id: m for m in SUPPORTED_MODELS}
 # DeepSeek API uses an API format compatible with OpenAI.
 # Reference: https://api-docs.deepseek.com/
 @lf.use_init_args(['model'])
-class DeepSeek(openai_compatible.
-  """DeepSeek
+class DeepSeek(openai_compatible.OpenAIChatCompletionAPI):
+  """DeepSeek models.
+
+  **Quick Start:**
+
+  ```python
+  import langfun as lf
+
+  # Call DeepSeek-V3 using API key from environment variable
+  # 'DEEPSEEK_API_KEY'.
+  lm = lf.llms.DeepSeekV3()
+  r = lm('Who are you?')
+  print(r)
+  ```
+
+  **Setting up API key:**
+
+  The DeepSeek API key can be specified in following ways:
+
+  1. At model instantiation:
+
+     ```python
+     lm = lf.llms.DeepSeekV3(api_key='MY_API_KEY')
+     ```
+  2. via environment variable `DEEPSEEK_API_KEY`.
+
+  **References:**
+
+  * https://api-docs.deepseek.com/
+  """
 
   model: pg.typing.Annotated[
       pg.typing.Enum(
|
langfun/core/llms/fake.py
CHANGED
|
@@ -20,7 +20,38 @@ import langfun.core as lf
|
|
|
20
20
|
|
|
21
21
|
|
|
22
22
|
class Fake(lf.LanguageModel):
|
|
23
|
-
"""
|
|
23
|
+
"""Base class for fake language models, used for testing.
|
|
24
|
+
|
|
25
|
+
Fake models simulate the behavior of real language models but return
|
|
26
|
+
pre-defined responses, making them useful for testing prompts,
|
|
27
|
+
data processing logic, and agent behavior without incurring API costs
|
|
28
|
+
or relying on external services.
|
|
29
|
+
|
|
30
|
+
Langfun provides several fake models:
|
|
31
|
+
* `lf.llms.Echo`: Echoes the prompt back as the response.
|
|
32
|
+
* `lf.llms.StaticResponse`: Returns a fixed, pre-defined response for
|
|
33
|
+
any prompt.
|
|
34
|
+
* `lf.llms.StaticMapping`: Returns responses based on a prompt-to-response
|
|
35
|
+
dictionary.
|
|
36
|
+
* `lf.llms.StaticSequence`: Returns responses from a pre-defined sequence
|
|
37
|
+
in order.
|
|
38
|
+
|
|
39
|
+
**Example:**
|
|
40
|
+
|
|
41
|
+
```python
|
|
42
|
+
import langfun as lf
|
|
43
|
+
|
|
44
|
+
# Use Echo model for testing
|
|
45
|
+
lm = lf.llms.Echo()
|
|
46
|
+
response = lm('hello')
|
|
47
|
+
assert response.text == 'hello'
|
|
48
|
+
|
|
49
|
+
# Use StaticResponse model
|
|
50
|
+
lm = lf.llms.StaticResponse('world')
|
|
51
|
+
response = lm('hello')
|
|
52
|
+
assert response.text == 'world'
|
|
53
|
+
```
|
|
54
|
+
"""
|
|
24
55
|
|
|
25
56
|
def _score(self, prompt: lf.Message| list[lf.Message],
|
|
26
57
|
completions: list[lf.Message]):
|
|
@@ -62,6 +93,13 @@ class Echo(Fake):
|
|
|
62
93
|
return lf.AIMessage(prompt.text)
|
|
63
94
|
|
|
64
95
|
|
|
96
|
+
class Pseudo(Fake):
|
|
97
|
+
"""A pseudo language model that should never be called."""
|
|
98
|
+
|
|
99
|
+
def _response_from(self, prompt: lf.Message) -> lf.Message:
|
|
100
|
+
raise ValueError('Pseudo language model should never be called.')
|
|
101
|
+
|
|
102
|
+
|
|
65
103
|
@lf.use_init_args(['response'])
|
|
66
104
|
class StaticResponse(Fake):
|
|
67
105
|
"""Language model that always gives the same canned response."""
|
langfun/core/llms/fake_test.py
CHANGED

@@ -20,6 +20,15 @@ import langfun.core as lf
 from langfun.core.llms import fake as fakelm
 
 
+class PseudoTest(unittest.TestCase):
+
+  def test_sample(self):
+    lm = fakelm.Pseudo()
+    self.assertEqual(lm.model_id, 'Pseudo')
+    with self.assertRaises(ValueError):
+      _ = lm.sample(['hi'])
+
+
 class EchoTest(unittest.TestCase):
 
   def test_sample(self):
langfun/core/llms/gemini.py
CHANGED

@@ -195,7 +195,7 @@ SUPPORTED_MODELS = [
         rate_limits=lf.ModelInfo.RateLimits(
             max_requests_per_minute=2000,
             max_tokens_per_minute=4_000_000,
-        )
+        ),
     ),
     # Gemini 2.5 Pro 0605
     GeminiModelInfo(

@@ -218,7 +218,7 @@ SUPPORTED_MODELS = [
         rate_limits=lf.ModelInfo.RateLimits(
             max_requests_per_minute=2000,
             max_tokens_per_minute=4_000_000,
-        )
+        ),
     ),
     # Gemini 2.5 Flash Preview 0520
     GeminiModelInfo(

@@ -264,7 +264,7 @@ SUPPORTED_MODELS = [
         rate_limits=lf.ModelInfo.RateLimits(
            max_requests_per_minute=2000,
            max_tokens_per_minute=4_000_000,
-        )
+        ),
     ),
     # Gemini 2.5 Flash Preview
     GeminiModelInfo(

@@ -614,6 +614,21 @@ SUPPORTED_MODELS = [
     #
     # Experimental models.
     #
+    GeminiModelInfo(
+        model_id='gemini-2.5-flash-image-preview',
+        in_service=True,
+        experimental=True,
+        provider=pg.oneof(['Google GenAI', 'VertexAI']),
+        model_type='instruction-tuned',
+        description='Gemini 2.5 Flash Image Preview model.',
+        release_date=datetime.datetime(2025, 8, 17),
+        input_modalities=GeminiModelInfo.INPUT_IMAGE_TYPES
+        + GeminiModelInfo.INPUT_DOC_TYPES,
+        context_length=lf.ModelInfo.ContextLength(
+            max_input_tokens=32_768,
+            max_output_tokens=32_768,
+        ),
+    ),
     GeminiModelInfo(
         model_id='gemini-2.0-pro-exp-02-05',
         in_service=True,

@@ -681,7 +696,15 @@ _SUPPORTED_MODELS_BY_ID = {m.model_id: m for m in SUPPORTED_MODELS}
 
 @pg.use_init_args(['model'])
 class Gemini(rest.REST):
-  """
+  """Base class for Gemini models served on Google GenAI and Vertex AI.
+
+  This class implements the Gemini API protocol, shared by
+  `lf.llms.GoogleGenAI` and `lf.llms.VertexAI`, providing common request
+  formatting and response parsing for Gemini models.
+
+  It is not intended to be used directly. Please use `lf.llms.GoogleGenAI` or
+  `lf.llms.VertexAI` instead.
+  """
 
   model: pg.typing.Annotated[
       pg.typing.Enum(

@@ -690,6 +713,12 @@ class Gemini(rest.REST):
       'The name of the model to use.',
   ]
 
+  response_modalities: pg.typing.Annotated[
+      list[str] | None,
+      'Response modalities. It is needed for models whose response modalities '
+      + 'are more than plain text.',
+  ] = None
+
   @functools.cached_property
   def model_info(self) -> GeminiModelInfo:
     return _SUPPORTED_MODELS_BY_ID[self.model]

@@ -731,6 +760,8 @@ class Gemini(rest.REST):
         prompt.as_format('gemini', chunk_preprocessor=modality_conversion)
     )
     request['contents'] = contents
+    if sampling_options.extras:
+      request.update(sampling_options.extras)
     return request
 
   def _generation_config(

@@ -768,6 +799,11 @@ class Gemini(rest.REST):
           'thinkingBudget': options.max_thinking_tokens,
       }
 
+    if self.response_modalities:
+      config['responseModalities'] = self.response_modalities
+      if 'IMAGE' in self.response_modalities:
+        config.pop('responseLogprobs', None)
+        config.pop('logprobs', None)
     return config
 
   def result(self, json: dict[str, Any]) -> lf.LMSamplingResult:

@@ -802,9 +838,9 @@ class Gemini(rest.REST):
     )
 
   def _error(self, status_code: int, content: str) -> lf.LMError:
-    if (
-
-
+    if status_code == 400 and (
+        b'exceeds the maximum number of tokens' in content
+        or b'Reduce the input token count and try again.' in content
     ):
       return lf.ContextLimitError(f'{status_code}: {content}')
     return super()._error(status_code, content)
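The `request.update(sampling_options.extras)` change above gives Gemini the same extras passthrough this release uses for OpenAI's `store: False` default (see the openai.py hunk below). A sketch of supplying a provider-specific request field through `extras`; the `labels` key is a hypothetical example, not a field this diff confirms, and the `lf.llms.Gemini25Pro` export path is assumed from sibling classes:

```python
import langfun as lf

# Extra keys are merged verbatim into the outgoing request JSON by
# `request.update(sampling_options.extras)`.
lm = lf.llms.Gemini25Pro(  # assuming the class is exported under lf.llms
    sampling_options=lf.LMSamplingOptions(
        extras={'labels': {'team': 'research'}}  # hypothetical request field
    )
)
```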
langfun/core/llms/google_genai.py
CHANGED

@@ -25,7 +25,35 @@ import pyglove as pg
 @lf.use_init_args(['model'])
 @pg.members([('api_endpoint', pg.typing.Str().freeze(''))])
 class GenAI(gemini.Gemini):
-  """
+  """Google GenAI models.
+
+  **Quick Start:**
+
+  ```python
+  import langfun as lf
+
+  # Call Gemini 1.5 Flash using API key from environment variable
+  # 'GOOGLE_API_KEY'.
+  lm = lf.llms.Gemini15Flash()
+  r = lm('Who are you?')
+  print(r)
+  ```
+
+  **Setting up API key:**
+
+  The Google API key can be specified in following ways:
+
+  1. At model instantiation:
+
+     ```python
+     lm = lf.llms.Gemini15Flash(api_key='MY_API_KEY')
+     ```
+  2. via environment variable `GOOGLE_API_KEY`.
+
+  **References:**
+
+  * https://ai.google.dev/docs
+  """
 
   model: pg.typing.Annotated[
       pg.typing.Enum(

@@ -92,6 +120,11 @@ class GenAI(gemini.Gemini):
 #
 
 
+class Gemini25FlashImagePreview(GenAI):
+  """Gemini 2.5 Flash Image Preview model."""
+  model = 'gemini-2.5-flash-image-preview'
+
+
 class Gemini25Pro(GenAI):
   """Gemini 2.5 Pro GA model."""
 
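Putting the new model class together with the `response_modalities` field added in gemini.py: a sketch of requesting image output. The modality strings follow the `'IMAGE'` check in `_generation_config`; the exported name `lf.llms.Gemini25FlashImagePreview` is an assumption based on how sibling classes are referenced:

```python
import langfun as lf

# 'IMAGE' in response_modalities also drops logprobs from the generation
# config, per the gemini.py hunk above.
lm = lf.llms.Gemini25FlashImagePreview(
    response_modalities=['TEXT', 'IMAGE'],
)
r = lm('Generate a picture of a lighthouse at dusk.')
```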
langfun/core/llms/groq.py
CHANGED

@@ -259,10 +259,35 @@ _SUPPORTED_MODELS_BY_ID = {m.model_id: m for m in SUPPORTED_MODELS}
 
 
 @lf.use_init_args(['model'])
-class Groq(openai_compatible.
-  """Groq
+class Groq(openai_compatible.OpenAIChatCompletionAPI):
+  """Groq models.
 
-
+  **Quick Start:**
+
+  ```python
+  import langfun as lf
+
+  # Call Llama 3.3 70B on Groq using API key from environment variable
+  # 'GROQ_API_KEY'.
+  lm = lf.llms.GroqLlama33_70B_Versatile()
+  r = lm('Who are you?')
+  print(r)
+  ```
+
+  **Setting up API key:**
+
+  The Groq API key can be specified in following ways:
+
+  1. At model instantiation:
+
+     ```python
+     lm = lf.llms.GroqLlama33_70B_Versatile(api_key='MY_API_KEY')
+     ```
+  2. via environment variable `GROQ_API_KEY`.
+
+  **References:**
+
+  * https://console.groq.com/docs
   """
 
   model: pg.typing.Annotated[
langfun/core/llms/llama_cpp.py
CHANGED

@@ -20,11 +20,30 @@ import pyglove as pg
 
 @pg.use_init_args(['url', 'model'])
 @pg.members([('api_endpoint', pg.typing.Str().freeze(''))])
-class LlamaCppRemote(openai_compatible.
-  """
+class LlamaCppRemote(openai_compatible.OpenAIChatCompletionAPI):
+  """LLaMA C++ models served via a remote server.
 
-
-
+  This class provides an interface to interact with language models
+  hosted on a LLaMA C++ server, which is compatible with the OpenAI
+  Chat Completions API format.
+
+  **Quick Start:**
+
+  Assuming a LLaMA C++ server is running at `http://localhost:8080`,
+  you can interact with it as follows:
+
+  ```python
+  import langfun as lf
+
+  # If model name is not specified, it will use server's default.
+  lm = lf.llms.LlamaCppRemote(url='http://localhost:8080')
+  r = lm('Who are you?')
+  print(r)
+  ```
+
+  **References:**
+
+  * https://github.com/ggerganov/llama.cpp/tree/master/examples/server
   """
   url: Annotated[
       str,
langfun/core/llms/openai.py
CHANGED

@@ -49,6 +49,53 @@ class OpenAIModelInfo(lf.ModelInfo):
 #
 
 SUPPORTED_MODELS = [
+    # GPT-5 models
+    OpenAIModelInfo(
+        model_id='gpt-5',
+        alias_for='gpt-5-2025-08-07',
+        in_service=True,
+        model_type='instruction-tuned',
+        description='GPT 5 model (latest stable).',
+        url='https://platform.openai.com/docs/models/gpt-5',
+        input_modalities=OpenAIModelInfo.INPUT_IMAGE_TYPES,
+        context_length=lf.ModelInfo.ContextLength(
+            max_input_tokens=400_000,
+            max_output_tokens=128_000,
+        ),
+        pricing=lf.ModelInfo.Pricing(
+            cost_per_1m_cached_input_tokens=0.125,
+            cost_per_1m_input_tokens=1.25,
+            cost_per_1m_output_tokens=10.0,
+        ),
+        # Tier 5 rate limits.
+        rate_limits=lf.ModelInfo.RateLimits(
+            max_requests_per_minute=15_000,
+            max_tokens_per_minute=40_000_000,
+        ),
+    ),
+    OpenAIModelInfo(
+        model_id='gpt-5-mini',
+        alias_for='gpt-5-mini-2025-08-07',
+        in_service=True,
+        model_type='instruction-tuned',
+        description='GPT 5 mini model (latest stable).',
+        url='https://platform.openai.com/docs/models/gpt-5-mini',
+        input_modalities=OpenAIModelInfo.INPUT_IMAGE_TYPES,
+        context_length=lf.ModelInfo.ContextLength(
+            max_input_tokens=400_000,
+            max_output_tokens=128_000,
+        ),
+        pricing=lf.ModelInfo.Pricing(
+            cost_per_1m_cached_input_tokens=0.025,
+            cost_per_1m_input_tokens=0.25,
+            cost_per_1m_output_tokens=2.0,
+        ),
+        # Tier 5 rate limits.
+        rate_limits=lf.ModelInfo.RateLimits(
+            max_requests_per_minute=180_000_000,
+            max_tokens_per_minute=30_000_000,
+        ),
+    ),
     # GPT-4.1 models
     OpenAIModelInfo(
         model_id='gpt-4.1',
@@ -984,8 +1031,36 @@ _SUPPORTED_MODELS_BY_MODEL_ID = {m.model_id: m for m in SUPPORTED_MODELS}
 
 
 @lf.use_init_args(['model'])
-class OpenAI(openai_compatible.OpenAICompatible):
-  """OpenAI
+class OpenAI(openai_compatible.OpenAIResponsesAPI):
+  """OpenAI models.
+
+  **Quick Start:**
+
+  ```python
+  import langfun as lf
+
+  # Call GPT-4o using API key from environment variable 'OPENAI_API_KEY'.
+  lm = lf.llms.Gpt4o()
+  r = lm('Who are you?')
+  print(r)
+  ```
+
+  **Setting up API key:**
+
+  The OpenAI API key can be specified in following ways:
+
+  1. At model instantiation:
+
+     ```python
+     lm = lf.llms.Gpt4o(api_key='MY_API_KEY')
+     ```
+  2. via environment variable `OPENAI_API_KEY`.
+
+  **References:**
+
+  * https://platform.openai.com/docs/models
+  * https://platform.openai.com/docs/api-reference
+  """
 
   model: pg.typing.Annotated[
       pg.typing.Enum(
@@ -994,7 +1069,12 @@ class OpenAI(openai_compatible.OpenAICompatible):
       'The name of the model to use.',
   ]
 
-
+  # Disable message storage by default.
+  sampling_options = lf.LMSamplingOptions(
+      extras={'store': False}
+  )
+
+  api_endpoint: str = 'https://api.openai.com/v1/responses'
 
   api_key: Annotated[
       str | None,
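Since `store: False` now ships as the class-level default `sampling_options`, callers who want OpenAI to retain responses server-side must override the extras explicitly; a minimal sketch:

```python
import langfun as lf

# Opt back into server-side response storage (the new default disables it).
lm = lf.llms.Gpt4o(
    sampling_options=lf.LMSamplingOptions(extras={'store': True})
)
```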
@@ -1069,6 +1149,16 @@ class OpenAI(openai_compatible.OpenAICompatible):
     return super()._request_args(options)
 
 
+class Gpt5(OpenAI):
+  """GPT-5."""
+  model = 'gpt-5'
+
+
+class Gpt5Mini(OpenAI):
+  """GPT-5 mini."""
+  model = 'gpt-5-mini'
+
+
 class Gpt41(OpenAI):
   """GPT-4.1."""
   model = 'gpt-4.1'