PyPI - langfun - Versions diffs - 0.1.2.dev202509120804__py3-none-any.whl → 0.1.2.dev202512040805__py3-none-any.whl - Mend

langfun 0.1.2.dev202509120804__py3-none-any.whl → 0.1.2.dev202512040805__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (162) hide show

langfun/__init__.py +1 -1
langfun/core/__init__.py +7 -1
langfun/core/agentic/__init__.py +8 -1
langfun/core/agentic/action.py +740 -112
langfun/core/agentic/action_eval.py +9 -2
langfun/core/agentic/action_test.py +189 -24
langfun/core/async_support.py +104 -5
langfun/core/async_support_test.py +23 -0
langfun/core/coding/python/correction.py +19 -9
langfun/core/coding/python/execution.py +14 -12
langfun/core/coding/python/generation.py +21 -16
langfun/core/coding/python/sandboxing.py +23 -3
langfun/core/component.py +42 -3
langfun/core/concurrent.py +70 -6
langfun/core/concurrent_test.py +9 -2
langfun/core/console.py +1 -1
langfun/core/data/conversion/anthropic.py +12 -3
langfun/core/data/conversion/anthropic_test.py +8 -6
langfun/core/data/conversion/gemini.py +11 -2
langfun/core/data/conversion/gemini_test.py +48 -9
langfun/core/data/conversion/openai.py +145 -31
langfun/core/data/conversion/openai_test.py +161 -17
langfun/core/eval/base.py +48 -44
langfun/core/eval/base_test.py +5 -5
langfun/core/eval/matching.py +5 -2
langfun/core/eval/patching.py +3 -3
langfun/core/eval/scoring.py +4 -3
langfun/core/eval/v2/__init__.py +2 -0
langfun/core/eval/v2/checkpointing.py +76 -7
langfun/core/eval/v2/checkpointing_test.py +9 -2
langfun/core/eval/v2/config_saver.py +37 -0
langfun/core/eval/v2/config_saver_test.py +36 -0
langfun/core/eval/v2/eval_test_helper.py +104 -3
langfun/core/eval/v2/evaluation.py +92 -17
langfun/core/eval/v2/evaluation_test.py +9 -3
langfun/core/eval/v2/example.py +50 -40
langfun/core/eval/v2/example_test.py +16 -8
langfun/core/eval/v2/experiment.py +84 -15
langfun/core/eval/v2/experiment_test.py +19 -0
langfun/core/eval/v2/metric_values.py +31 -3
langfun/core/eval/v2/metric_values_test.py +32 -0
langfun/core/eval/v2/metrics.py +157 -44
langfun/core/eval/v2/metrics_test.py +39 -18
langfun/core/eval/v2/progress.py +31 -1
langfun/core/eval/v2/progress_test.py +27 -0
langfun/core/eval/v2/progress_tracking.py +13 -5
langfun/core/eval/v2/progress_tracking_test.py +9 -1
langfun/core/eval/v2/reporting.py +90 -71
langfun/core/eval/v2/reporting_test.py +24 -6
langfun/core/eval/v2/runners/__init__.py +30 -0
langfun/core/eval/v2/{runners.py → runners/base.py} +72 -180
langfun/core/eval/v2/runners/beam.py +354 -0
langfun/core/eval/v2/runners/beam_test.py +153 -0
langfun/core/eval/v2/runners/ckpt_monitor.py +294 -0
langfun/core/eval/v2/runners/ckpt_monitor_test.py +162 -0
langfun/core/eval/v2/runners/debug.py +40 -0
langfun/core/eval/v2/runners/debug_test.py +76 -0
langfun/core/eval/v2/runners/parallel.py +243 -0
langfun/core/eval/v2/runners/parallel_test.py +182 -0
langfun/core/eval/v2/runners/sequential.py +47 -0
langfun/core/eval/v2/runners/sequential_test.py +169 -0
langfun/core/langfunc.py +45 -130
langfun/core/langfunc_test.py +7 -5
langfun/core/language_model.py +189 -36
langfun/core/language_model_test.py +54 -3
langfun/core/llms/__init__.py +12 -1
langfun/core/llms/anthropic.py +157 -2
langfun/core/llms/azure_openai.py +29 -17
langfun/core/llms/cache/base.py +25 -3
langfun/core/llms/cache/in_memory.py +48 -7
langfun/core/llms/cache/in_memory_test.py +14 -4
langfun/core/llms/compositional.py +25 -1
langfun/core/llms/deepseek.py +30 -2
langfun/core/llms/fake.py +32 -1
langfun/core/llms/gemini.py +64 -12
langfun/core/llms/gemini_test.py +110 -0
langfun/core/llms/google_genai.py +34 -1
langfun/core/llms/groq.py +28 -3
langfun/core/llms/llama_cpp.py +23 -4
langfun/core/llms/openai.py +120 -3
langfun/core/llms/openai_compatible.py +148 -27
langfun/core/llms/openai_compatible_test.py +207 -20
langfun/core/llms/openai_test.py +0 -2
langfun/core/llms/rest.py +16 -1
langfun/core/llms/vertexai.py +58 -8
langfun/core/logging.py +1 -1
langfun/core/mcp/__init__.py +10 -0
langfun/core/mcp/client.py +177 -0
langfun/core/mcp/client_test.py +71 -0
langfun/core/mcp/session.py +241 -0
langfun/core/mcp/session_test.py +54 -0
langfun/core/mcp/testing/simple_mcp_client.py +33 -0
langfun/core/mcp/testing/simple_mcp_server.py +33 -0
langfun/core/mcp/tool.py +254 -0
langfun/core/mcp/tool_test.py +197 -0
langfun/core/memory.py +1 -0
langfun/core/message.py +160 -55
langfun/core/message_test.py +65 -81
langfun/core/modalities/__init__.py +8 -0
langfun/core/modalities/audio.py +21 -1
langfun/core/modalities/image.py +73 -3
langfun/core/modalities/image_test.py +116 -0
langfun/core/modalities/mime.py +64 -3
langfun/core/modalities/mime_test.py +11 -0
langfun/core/modalities/pdf.py +19 -1
langfun/core/modalities/video.py +21 -1
langfun/core/modality.py +167 -29
langfun/core/modality_test.py +42 -12
langfun/core/natural_language.py +1 -1
langfun/core/sampling.py +4 -4
langfun/core/sampling_test.py +20 -4
langfun/core/structured/__init__.py +2 -24
langfun/core/structured/completion.py +34 -44
langfun/core/structured/completion_test.py +23 -43
langfun/core/structured/description.py +54 -50
langfun/core/structured/function_generation.py +29 -12
langfun/core/structured/mapping.py +81 -37
langfun/core/structured/parsing.py +95 -79
langfun/core/structured/parsing_test.py +0 -3
langfun/core/structured/querying.py +230 -154
langfun/core/structured/querying_test.py +69 -33
langfun/core/structured/schema/__init__.py +49 -0
langfun/core/structured/schema/base.py +664 -0
langfun/core/structured/schema/base_test.py +531 -0
langfun/core/structured/schema/json.py +174 -0
langfun/core/structured/schema/json_test.py +121 -0
langfun/core/structured/schema/python.py +316 -0
langfun/core/structured/schema/python_test.py +410 -0
langfun/core/structured/schema_generation.py +33 -14
langfun/core/structured/scoring.py +47 -36
langfun/core/structured/tokenization.py +26 -11
langfun/core/subscription.py +2 -2
langfun/core/template.py +175 -50
langfun/core/template_test.py +123 -17
langfun/env/__init__.py +43 -0
langfun/env/base_environment.py +827 -0
langfun/env/base_environment_test.py +473 -0
langfun/env/base_feature.py +304 -0
langfun/env/base_feature_test.py +228 -0
langfun/env/base_sandbox.py +842 -0
langfun/env/base_sandbox_test.py +1235 -0
langfun/env/event_handlers/__init__.py +14 -0
langfun/env/event_handlers/chain.py +233 -0
langfun/env/event_handlers/chain_test.py +253 -0
langfun/env/event_handlers/event_logger.py +472 -0
langfun/env/event_handlers/event_logger_test.py +304 -0
langfun/env/event_handlers/metric_writer.py +726 -0
langfun/env/event_handlers/metric_writer_test.py +214 -0
langfun/env/interface.py +1640 -0
langfun/env/interface_test.py +153 -0
langfun/env/load_balancers.py +59 -0
langfun/env/load_balancers_test.py +141 -0
langfun/env/test_utils.py +507 -0
{langfun-0.1.2.dev202509120804.dist-info → langfun-0.1.2.dev202512040805.dist-info}/METADATA +7 -3
langfun-0.1.2.dev202512040805.dist-info/RECORD +217 -0
langfun/core/eval/v2/runners_test.py +0 -343
langfun/core/structured/schema.py +0 -987
langfun/core/structured/schema_test.py +0 -982
langfun-0.1.2.dev202509120804.dist-info/RECORD +0 -172
{langfun-0.1.2.dev202509120804.dist-info → langfun-0.1.2.dev202512040805.dist-info}/WHEEL +0 -0
{langfun-0.1.2.dev202509120804.dist-info → langfun-0.1.2.dev202512040805.dist-info}/licenses/LICENSE +0 -0
{langfun-0.1.2.dev202509120804.dist-info → langfun-0.1.2.dev202512040805.dist-info}/top_level.txt +0 -0

langfun/core/structured/schema/python_test.py ADDED Viewed

@@ -0,0 +1,410 @@
+# Copyright 2025 The Langfun Authors
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import dataclasses
+import inspect
+import typing
+import unittest
+import langfun.core as lf
+from langfun.core.llms import fake
+from langfun.core.structured.schema import base
+from langfun.core.structured.schema import python
+import pyglove as pg
+class Activity(pg.Object):
+  description: str
+class Itinerary(pg.Object):
+  """A travel itinerary for a day."""
+  day: pg.typing.Int[1, None]
+  type: pg.typing.Enum['daytime', 'nighttime']
+  activities: list[Activity]
+  hotel: pg.typing.Annotated[
+      pg.typing.Str['.*Hotel'] | None,
+      'Hotel to stay if applicable.'
+  ]
+class PlaceOfInterest(pg.Object):
+  """The name of a place of interest.
+  A place of interest is a place that people ususally visit during their
+  travels.
+  """
+  name: str
+Itinerary.__serialization_key__ = 'Itinerary'
+class Node(pg.Object):
+  children: list['Node']
+class SchemaReprTest(unittest.TestCase):
+  def test_class_definition(self):
+    self.assertEqual(
+        python.class_definition(Activity, allowed_dependencies=set()),
+        'class Activity:\n  description: str\n',
+    )
+    self.assertEqual(
+        python.class_definition(Itinerary),
+        inspect.cleandoc("""
+            class Itinerary(Object):
+              \"\"\"A travel itinerary for a day.\"\"\"
+              day: int(min=1)
+              type: Literal['daytime', 'nighttime']
+              activities: list[Activity]
+              # Hotel to stay if applicable.
+              hotel: str(regex='.*Hotel') | None
+            """) + '\n',
+    )
+    self.assertEqual(
+        python.class_definition(
+            PlaceOfInterest, allowed_dependencies=set()
+        ),
+        inspect.cleandoc("""
+            class PlaceOfInterest:
+              \"\"\"The name of a place of interest.
+              A place of interest is a place that people ususally visit during their
+              travels.
+              \"\"\"
+              name: str
+            """) + '\n',
+    )
+    class A(pg.Object):
+      pass
+    self.assertEqual(
+        python.class_definition(A, allowed_dependencies=set()),
+        'class A:\n  pass\n',
+    )
+    self.assertEqual(
+        python.class_definition(A),
+        'class A(Object):\n  pass\n',
+    )
+    class C(pg.Object):
+      x: str
+      __kwargs__: typing.Any
+    self.assertEqual(
+        python.class_definition(C), 'class C(Object):\n  x: str\n'
+    )
+    class D(pg.Object):
+      x: str
+      @python.include_method_in_prompt
+      def __call__(self, y: int) -> int:
+        return len(self.x) + y
+    self.assertEqual(
+        python.class_definition(D),
+        inspect.cleandoc(
+            """
+            class D(Object):
+              x: str
+              def __call__(self, y: int) -> int:
+                return len(self.x) + y
+            """) + '\n'
+    )
+    class E(pg.Object):
+      x: str
+      y: typing.Annotated[int, 'y', dict(exclude_from_prompt=True)]
+    self.assertEqual(
+        python.class_definition(E),
+        inspect.cleandoc(
+            """
+            class E(Object):
+              x: str
+            """) + '\n'
+    )
+  def test_repr(self):
+    class Foo(pg.Object):
+      x: int
+    @dataclasses.dataclass(frozen=True)
+    class Bar:
+      """Class Bar."""
+      y: str
+    @dataclasses.dataclass(frozen=True)
+    class Baz(Bar):  # pylint: disable=unused-variable
+      pass
+    class A(pg.Object):
+      foo: Foo
+      @python.include_method_in_prompt
+      def foo_value(self) -> int:
+        return self.foo.x
+      def baz_value(self) -> str:
+        return 'baz'
+    class B(A):
+      bar: Bar
+      foo2: Foo
+      @python.include_method_in_prompt
+      def bar_value(self) -> str:
+        return self.bar.y
+    schema = base.Schema([B])
+    self.assertEqual(
+        python.PythonPromptingProtocol().class_definitions(schema),
+        inspect.cleandoc('''
+            class Foo:
+              x: int
+            class Bar:
+              """Class Bar."""
+              y: str
+            class Baz(Bar):
+              """Baz(y: str)"""
+              y: str
+            class B:
+              foo: Foo
+              bar: Bar
+              foo2: Foo
+              def bar_value(self) -> str:
+                return self.bar.y
+              def foo_value(self) -> int:
+                return self.foo.x
+            ''') + '\n',
+    )
+    self.assertEqual(
+        python.PythonPromptingProtocol().result_definition(schema), 'list[B]'
+    )
+    self.assertEqual(
+        base.schema_repr(schema),
+        inspect.cleandoc('''
+            list[B]
+            ```python
+            class Foo:
+              x: int
+            class Bar:
+              """Class Bar."""
+              y: str
+            class Baz(Bar):
+              """Baz(y: str)"""
+              y: str
+            class B:
+              foo: Foo
+              bar: Bar
+              foo2: Foo
+              def bar_value(self) -> str:
+                return self.bar.y
+              def foo_value(self) -> int:
+                return self.foo.x
+            ```
+            '''),
+    )
+    self.assertEqual(
+        python.PythonPromptingProtocol().schema_repr(
+            schema,
+            include_result_definition=False,
+            markdown=False,
+        ),
+        inspect.cleandoc('''
+            class Foo:
+              x: int
+            class Bar:
+              """Class Bar."""
+              y: str
+            class Baz(Bar):
+              """Baz(y: str)"""
+              y: str
+            class B:
+              foo: Foo
+              bar: Bar
+              foo2: Foo
+              def bar_value(self) -> str:
+                return self.bar.y
+              def foo_value(self) -> int:
+                return self.foo.x
+            '''),
+    )
+class ValuePythonReprTest(unittest.TestCase):
+  def test_repr(self):
+    class Foo(pg.Object):
+      x: int
+    class A(pg.Object):
+      foo: list[Foo]
+      y: str | None
+    self.assertEqual(
+        base.value_repr(1, base.Schema(int)),
+        '```python\n1\n```'
+    )
+    self.assertEqual(
+        base.value_repr(lf.Template('hi, {{a}}', a='foo')),
+        'hi, foo'
+    )
+    self.assertEqual(
+        base.value_repr(
+            A([Foo(1), Foo(2)], 'bar'), base.Schema(A), markdown=False,
+        ),
+        "A(foo=[Foo(x=1), Foo(x=2)], y='bar')",
+    )
+    self.assertEqual(
+        base.value_repr(
+            A([Foo(1), Foo(2)], 'bar'),
+            base.Schema(A),
+            markdown=True,
+            compact=False,
+            assign_to_var='output',
+        ),
+        inspect.cleandoc("""
+            ```python
+            output = A(
+              foo=[
+                Foo(
+                  x=1
+                ),
+                Foo(
+                  x=2
+                )
+              ],
+              y='bar'
+            )
+            ```
+            """),
+    )
+    self.assertEqual(
+        base.value_repr(A),
+        inspect.cleandoc("""
+            ```python
+            class Foo(Object):
+              x: int
+            class A(Object):
+              foo: list[Foo]
+              y: str | None
+            ```
+            """),
+    )
+    self.assertEqual(python.source_form(int), 'int')
+  def test_parse(self):
+    class Foo(pg.Object):
+      x: int
+    class A(pg.Object):
+      foo: list[Foo]
+      y: str | None
+    self.assertEqual(
+        base.parse_value(
+            "A(foo=[Foo(x=1), Foo(x=2)], y='bar')", base.Schema(A)
+        ),
+        A([Foo(1), Foo(2)], y='bar'),
+    )
+  def test_parse_with_correction(self):
+    class Foo(pg.Object):
+      x: int
+    class A(pg.Object):
+      foo: list[Foo]
+      y: str | None
+    self.assertEqual(
+        base.parse_value(
+            "A(foo=[Foo(x=1), Foo(x=2)], y='bar'",
+            base.Schema(A),
+            autofix=1,
+            autofix_lm=fake.StaticResponse(
+                inspect.cleandoc(
+                    """
+                    CorrectedCode(
+                        corrected_code='A(foo=[Foo(x=1), Foo(x=2)], y=\\\'bar\\\')',
+                    )
+                    """
+                )
+            ),
+        ),
+        A([Foo(1), Foo(2)], y='bar'),
+    )
+  def test_parse_class_def(self):
+    self.assertTrue(
+        inspect.isclass(
+            base.parse_value(
+                """
+                class A:
+                  x: Dict[str, Any]
+                  y: Optional[Sequence[str]]
+                  z: Union[int, List[int], Tuple[int]]
+                """,
+                permission=pg.coding.CodePermission.ALL,
+            )
+        )
+    )
+class StructureFromPythonTest(unittest.TestCase):
+  def test_parse_class_def(self):
+    class B:
+      pass
+    schema = base.Schema([B])
+    v = python.structure_from_python(
+        """
+        class C(B):
+          pass
+        """,
+        global_vars=dict(B=B),
+        permission=pg.coding.CodePermission.ALL,
+    )
+    self.assertEqual(v.__module__, 'builtins')
+    self.assertEqual(schema.class_dependencies(), [B])
+if __name__ == '__main__':
+  unittest.main()

langfun/core/structured/schema_generation.py CHANGED Viewed

@@ -90,16 +90,35 @@ def generate_class(
     skip_lm: bool = False,
     **kwargs,
 ) -> Type[Any] | lf.Message:
-  """Generate a class with specified name based on the prompt.
-  Example:
-    ```
-    trip_cls = lf.classgen(
-        'Trip',
-        'A trip plan to visit {{ city }}, city='San Francisco',
-        lm=lf.llms.GeminiPro()
-    )
-    ```
+  """Generates a Python class dynamically from a prompt using an LLM.
+  `lf.structured.generate_class` takes a class name and a natural language
+  description (prompt) and uses a language model to generate a Python class
+  (inheriting from `pg.Object`) that matches the description.
+  This is useful for creating structured data types on-the-fly based on
+  dynamic requirements.
+  **Example:**
+  ```python
+  import langfun as lf
+  import pyglove as pg
+  trip_plan_cls = lf.structured.generate_class(
+      'TripPlan',
+      'A trip plan to visit San Francisco, including a list of destinations, '
+      'start date, end date, and total budget.',
+      lm=lf.llms.Gemini25Flash())
+  # This might generate a class like:
+  # class TripPlan(pg.Object):
+  #   destinations: list[str]
+  #   start_date: str
+  #   end_date: str
+  #   total_budget: float
+  print(lf.Schema.from_value(trip_plan_cls).schema_str('python'))
+  ```
   Args:
     name: Class name to be generated.
@@ -108,17 +127,17 @@ def generate_class(
     lm: The language model to use. If not specified, the language model from
       `lf.context` context manager will be used.
     examples: An optional list of fewshot examples for helping class generation.
-      If None, a default single shot example will be used. Use
-      `lf.structured.classgen_example` to generate example.
+      If None, a default single-shot example will be used. Use
+      `lf.structured.classgen_example` to generate examples.
     returns_message: If True, returns `lf.Message` as the output, instead of
       returning the structured `message.result`.
     skip_lm: If True, returns the rendered prompt as a UserMessage object.
-      otherwise return the LLM response based on the rendered prompt.
+      Otherwise returns the LLM response based on the rendered prompt.
     **kwargs: Template variables passed to `prompt` and keyword arguments passed
       to `lf.structured.GenerateClass`.
   Returns:
-    Generated class.
+    The generated Python class, or `lf.Message` if `returns_message` is True.
   Raises:
     CodeError: if generation failed.

langfun/core/structured/scoring.py CHANGED Viewed

@@ -31,42 +31,54 @@ def score(
     *,
     lm: lf.LanguageModel | None = None,
     examples: list[mapping.MappingExample] | None = None,
-    protocol: schema_lib.SchemaProtocol = 'python',
+    protocol: str = 'python',
     return_scoring_results: bool = False,
     **kwargs,
 ) -> list[float] | list[lf.LMScoringResult]:
-  """Scores the outputs based on the prompt.
-  Examples:
-    ```
-    # Example 1: Scoring text output based on the user prompt.
-    scores = lf.score('{{x}} + {{y}} =', ['1', '2', '3'], lm=lm, x=1, y=2)
-    assert len(scores) == 3
-    # Example 2: Scoring int output based on the formulated OOP prompt.
-    scores = lf.score('1 + 1 =', [1, 2, 3], lm=lm)
-    assert len(scores) == 3
-    class Answer(pg.Object):
-      result: int
-    # Example 3: Scoring object output based on the formulated OOP prompt.
-    scores = lf.score('1 + 1 =', [Answer(1), Answer(2), Answer(3)], lm=lm)
-    assert len(scores) == 3
-    # Example 4: Scoring object field value based on the formulated OOP prompt
-    # and the generated tokens before the first `pg.oneof`.
-    scores = lf.score('1 + 1 =', [Answer(pg.oneof([1, 2, 3]))], lm=lm)
-    assert len(scores) == 3
-    # Example 5: Scoring multiple prompt/completion pairs.
-    scores = lf.score(
-        ['1 + 1=', '2 + 3='],
-        ['2', '4'],
-        lm=lm
-    )
-    assert len(scores) == 2
-    ```
+  """Scores completions based on a prompt using a language model.
+  `lf.score` computes the likelihood of each completion being generated given
+  a prompt, according to the specified language model. It can score text
+  completions or structured objects. If `schema` is provided, Langfun
+  formats the prompt and completions appropriately before scoring.
+  **Example 1: Score text completions**
+  ```python
+  import langfun as lf
+  scores = lf.score(
+      '1 + 1 =',
+      ['2', '3', '4'],
+      lm=lf.llms.Gemini25Flash())
+  print([f'{s:.3f}' for s in scores])
+  # Output: ['-0.001', '-2.345', '-3.456']
+  ```
+  **Example 2: Score structured completions**
+  ```python
+  import langfun as lf
+  import pyglove as pg
+  class Answer(pg.Object):
+    result: int
+  scores = lf.score(
+      '1 + 1 =',
+      [Answer(result=2), Answer(result=3), Answer(result=4)],
+      lm=lf.llms.Gemini25Flash())
+  print([f'{s:.3f}' for s in scores])
+  # Output: ['-0.001', '-2.345', '-3.456']
+  ```
+  **Example 3: Score multiple prompt/completion pairs**
+  ```python
+  import langfun as lf
+  scores = lf.score(
+      ['1 + 1 =', '2 + 2 ='],
+      ['2', '4'],
+      lm=lf.llms.Gemini25Flash())
+  print([f'{s:.3f}' for s in scores])
+  # Output: ['-0.001', '-0.002']
+  ```
   Args:
     prompt: The prompt(s) based on which each completion will be scored.
@@ -74,8 +86,7 @@ def score(
     schema: The schema as the output type. If None, it will be inferred from
       the completions.
     lm: The language model used for scoring.
-    examples: Fewshot exemplars used together with the prompt in getting the
-      completions.
+    examples: Few-shot examples used to construct the prompt for scoring.
     protocol: The protocol for formulating the prompt based on objects.
     return_scoring_results: If True, returns a list of `lf.LMScoringResult`,
       otherwise returns a list of floats as the scores of each completion.
@@ -190,7 +201,7 @@ async def ascore(
     *,
     lm: lf.LanguageModel | None = None,
     examples: list[mapping.MappingExample] | None = None,
-    protocol: schema_lib.SchemaProtocol = 'python',
+    protocol: str = 'python',
     return_scoring_results: bool = False,
     **kwargs,
 ) -> list[float] | list[lf.LMScoringResult]:

langfun/core/structured/tokenization.py CHANGED Viewed

@@ -23,30 +23,45 @@ import pyglove as pg
 def tokenize(
-    prompt: Union[str, pg.Symbolic] | list[str | pg.Symbolic],
+    prompt: Union[str, pg.Symbolic, list[str | pg.Symbolic]],
     schema: Union[
         schema_lib.Schema, Type[Any], list[Type[Any]], dict[str, Any], None
     ] = None,
     *,
     lm: lf.LanguageModel | None = None,
     examples: list[mapping.MappingExample] | None = None,
-    protocol: schema_lib.SchemaProtocol = 'python',
+    protocol: str = 'python',
     **kwargs,
 ) -> list[tuple[str | bytes, int]]:
-  """Tokenize the prompt for `lf.query`.
+  """Renders a prompt and tokenizes it using a language model.
+  `lf.tokenize` first renders a prompt based on the provided `prompt`,
+  `schema`, and `examples`, similar to `lf.query`, and then uses the
+  specified language model (`lm`) to tokenize the resulting message.
+  This is useful for understanding how a prompt is seen by the model or
+  for estimating token counts before sending requests.
+  **Example:**
+  ```python
+  import langfun as lf
+  tokens = lf.tokenize('Hello world!', lm=lf.llms.Gpt4())
+  print(tokens)
+  # Output might look like: [('Hello', 15339), (' world', 1917), ('!', 0)]
+  ```
   Args:
-    prompt: The prompt(s) based on which each completion will be scored.
-    schema: The schema as the output type. If None, it will be inferred from
-      the completions.
-    lm: The language model used for scoring.
-    examples: Fewshot exemplars used together with the prompt in getting the
-      completions.
+    prompt: The prompt to render and tokenize. Can be a string, `pg.Symbolic`,
+      or `lf.Template`.
+    schema: The schema for formatting the prompt, if `prompt` is structured or
+      if schema-based formatting is needed.
+    lm: The language model to use for tokenization.
+    examples: Few-shot examples to include in the rendered prompt.
     protocol: The protocol for formulating the prompt based on objects.
     **kwargs: Keyword arguments that are referred by the prompt.
   Returns:
-    A list of (text, token_id) tuples.
+    A list of (token_str, token_id) tuples representing the tokenized prompt.
   """
   input_message = querying.query_prompt(
       prompt,
@@ -72,7 +87,7 @@ async def atokenize(
     *,
     lm: lf.LanguageModel | None = None,
     examples: list[mapping.MappingExample] | None = None,
-    protocol: schema_lib.SchemaProtocol = 'python',
+    protocol: str = 'python',
     **kwargs,
 ) -> list[tuple[str | bytes, int]]:
   """Async version of `lf.tokenize`."""

langfun/core/subscription.py CHANGED Viewed

@@ -35,7 +35,7 @@ EventType = TypeVar('EventType')
 class EventHandler(Generic[EventType], metaclass=abc.ABCMeta):
-  """Interface for event subscriber."""
+  """Interface for event handler."""
   @classmethod
   @functools.cache
@@ -51,7 +51,7 @@ class EventHandler(Generic[EventType], metaclass=abc.ABCMeta):
   @classmethod
   def accepts(cls, event: Event[Any]) -> bool:
-    """Returns True if current event handler class can accepts an event."""
+    """Returns True if current event handler class can accept an event."""
     return isinstance(event, cls.event_type())
   @abc.abstractmethod

langfun 0.1.2.dev202509120804__py3-none-any.whl → 0.1.2.dev202512040805__py3-none-any.whl

langfun 0.1.2.dev202509120804__py3-none-any.whl → 0.1.2.dev202512040805__py3-none-any.whl