PyPI - langfun - Versions diffs - 0.0.2.dev20240429__py3-none-any.whl → 0.1.2.dev202501150804__py3-none-any.whl - Mend

langfun 0.0.2.dev20240429__py3-none-any.whl → 0.1.2.dev202501150804__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (144)

langfun/__init__.py +20 -2
langfun/core/__init__.py +16 -5
langfun/core/agentic/__init__.py +30 -0
langfun/core/agentic/action.py +854 -0
langfun/core/agentic/action_eval.py +150 -0
langfun/core/agentic/action_eval_test.py +109 -0
langfun/core/agentic/action_test.py +136 -0
langfun/core/coding/python/__init__.py +5 -11
langfun/core/coding/python/correction.py +37 -21
langfun/core/coding/python/correction_test.py +29 -3
langfun/core/coding/python/execution.py +40 -216
langfun/core/coding/python/execution_test.py +29 -89
langfun/core/coding/python/generation.py +21 -11
langfun/core/coding/python/generation_test.py +2 -2
langfun/core/coding/python/parsing.py +108 -193
langfun/core/coding/python/parsing_test.py +2 -105
langfun/core/component.py +63 -2
langfun/core/component_test.py +53 -0
langfun/core/concurrent.py +414 -117
langfun/core/concurrent_test.py +111 -24
langfun/core/console.py +17 -5
langfun/core/console_test.py +17 -0
langfun/core/eval/__init__.py +16 -1
langfun/core/eval/base.py +622 -174
langfun/core/eval/base_test.py +200 -54
langfun/core/eval/matching.py +63 -76
langfun/core/eval/matching_test.py +17 -8
langfun/core/eval/patching.py +130 -0
langfun/core/eval/patching_test.py +170 -0
langfun/core/eval/scoring.py +26 -26
langfun/core/eval/scoring_test.py +19 -2
langfun/core/eval/v2/__init__.py +42 -0
langfun/core/eval/v2/checkpointing.py +380 -0
langfun/core/eval/v2/checkpointing_test.py +228 -0
langfun/core/eval/v2/eval_test_helper.py +136 -0
langfun/core/eval/v2/evaluation.py +725 -0
langfun/core/eval/v2/evaluation_test.py +180 -0
langfun/core/eval/v2/example.py +305 -0
langfun/core/eval/v2/example_test.py +128 -0
langfun/core/eval/v2/experiment.py +1048 -0
langfun/core/eval/v2/experiment_test.py +433 -0
langfun/core/eval/v2/metric_values.py +156 -0
langfun/core/eval/v2/metric_values_test.py +80 -0
langfun/core/eval/v2/metrics.py +357 -0
langfun/core/eval/v2/metrics_test.py +203 -0
langfun/core/eval/v2/progress.py +348 -0
langfun/core/eval/v2/progress_test.py +82 -0
langfun/core/eval/v2/progress_tracking.py +210 -0
langfun/core/eval/v2/progress_tracking_test.py +66 -0
langfun/core/eval/v2/reporting.py +270 -0
langfun/core/eval/v2/reporting_test.py +158 -0
langfun/core/eval/v2/runners.py +488 -0
langfun/core/eval/v2/runners_test.py +334 -0
langfun/core/langfunc.py +4 -17
langfun/core/langfunc_test.py +22 -6
langfun/core/language_model.py +577 -39
langfun/core/language_model_test.py +470 -56
langfun/core/llms/__init__.py +87 -16
langfun/core/llms/anthropic.py +312 -87
langfun/core/llms/anthropic_test.py +71 -3
langfun/core/llms/cache/base.py +21 -2
langfun/core/llms/cache/in_memory.py +13 -0
langfun/core/llms/cache/in_memory_test.py +53 -2
langfun/core/llms/compositional.py +101 -0
langfun/core/llms/compositional_test.py +73 -0
langfun/core/llms/deepseek.py +117 -0
langfun/core/llms/deepseek_test.py +61 -0
langfun/core/llms/fake.py +11 -7
langfun/core/llms/fake_test.py +14 -0
langfun/core/llms/gemini.py +507 -0
langfun/core/llms/gemini_test.py +195 -0
langfun/core/llms/google_genai.py +62 -218
langfun/core/llms/google_genai_test.py +9 -202
langfun/core/llms/groq.py +160 -144
langfun/core/llms/groq_test.py +31 -137
langfun/core/llms/llama_cpp.py +15 -42
langfun/core/llms/llama_cpp_test.py +4 -30
langfun/core/llms/openai.py +395 -203
langfun/core/llms/openai_compatible.py +179 -0
langfun/core/llms/openai_compatible_test.py +495 -0
langfun/core/llms/openai_test.py +30 -395
langfun/core/llms/rest.py +113 -0
langfun/core/llms/rest_test.py +111 -0
langfun/core/llms/vertexai.py +192 -0
langfun/core/llms/vertexai_test.py +52 -0
langfun/core/logging.py +284 -0
langfun/core/logging_test.py +125 -0
langfun/core/message.py +319 -9
langfun/core/message_test.py +190 -13
langfun/core/modalities/__init__.py +6 -2
langfun/core/modalities/audio.py +30 -0
langfun/core/modalities/audio_test.py +63 -0
langfun/core/modalities/image.py +39 -20
langfun/core/modalities/image_test.py +52 -9
langfun/core/modalities/mime.py +206 -29
langfun/core/modalities/mime_test.py +90 -9
langfun/core/modalities/ms_office.py +117 -0
langfun/core/modalities/ms_office_test.py +389 -0
langfun/core/modalities/pdf.py +22 -0
langfun/core/modalities/pdf_test.py +57 -0
langfun/core/modalities/video.py +9 -26
langfun/core/modalities/video_test.py +3 -3
langfun/core/modality.py +26 -3
langfun/core/modality_test.py +2 -2
langfun/core/sampling.py +11 -11
langfun/core/structured/__init__.py +12 -16
langfun/core/structured/completion.py +32 -5
langfun/core/structured/completion_test.py +7 -6
langfun/core/structured/description.py +2 -2
langfun/core/structured/description_test.py +3 -3
langfun/core/structured/function_generation.py +60 -27
langfun/core/structured/function_generation_test.py +72 -2
langfun/core/structured/mapping.py +97 -47
langfun/core/structured/mapping_test.py +90 -2
langfun/core/structured/parsing.py +33 -21
langfun/core/structured/parsing_test.py +53 -9
langfun/core/structured/querying.py +746 -0
langfun/core/structured/{prompting_test.py → querying_test.py} +469 -51
langfun/core/structured/schema.py +204 -97
langfun/core/structured/schema_generation.py +1 -1
langfun/core/structured/schema_test.py +130 -29
langfun/core/structured/scoring.py +125 -19
langfun/core/structured/scoring_test.py +30 -0
langfun/core/structured/tokenization.py +64 -0
langfun/core/structured/tokenization_test.py +48 -0
langfun/core/template.py +115 -1
langfun/core/template_test.py +71 -1
langfun/core/templates/conversation.py +9 -0
langfun/core/templates/conversation_test.py +4 -3
langfun/core/templates/selfplay_test.py +10 -2
langfun-0.1.2.dev202501150804.dist-info/METADATA +225 -0
langfun-0.1.2.dev202501150804.dist-info/RECORD +153 -0
{langfun-0.0.2.dev20240429.dist-info → langfun-0.1.2.dev202501150804.dist-info}/WHEEL +1 -1
langfun/core/coding/python/errors.py +0 -108
langfun/core/coding/python/errors_test.py +0 -99
langfun/core/coding/python/permissions.py +0 -90
langfun/core/coding/python/permissions_test.py +0 -86
langfun/core/structured/prompting.py +0 -238
langfun/core/text_formatting.py +0 -162
langfun/core/text_formatting_test.py +0 -47
langfun-0.0.2.dev20240429.dist-info/METADATA +0 -100
langfun-0.0.2.dev20240429.dist-info/RECORD +0 -108
{langfun-0.0.2.dev20240429.dist-info → langfun-0.1.2.dev202501150804.dist-info}/LICENSE +0 -0
{langfun-0.0.2.dev20240429.dist-info → langfun-0.1.2.dev202501150804.dist-info}/top_level.txt +0 -0

langfun/core/llms/anthropic_test.py CHANGED Viewed

@@ -18,6 +18,10 @@ import os
 from typing import Any
 import unittest
 from unittest import mock
+from google.auth import exceptions
+from langfun.core import language_model
+from langfun.core import message as lf_message
 from langfun.core import modalities as lf_modalities
 from langfun.core.llms import anthropic
 import pyglove as pg
@@ -59,18 +63,30 @@ image_content = (
     b'\xdao\xd0|\x00\x00\x00\x00IEND\xaeB`\x82'
 )
+pdf_content = (
+    b'%PDF-1.4\n1 0 obj\n<< /Type /Catalog /Pages 2 0 R >>\nendobj\n2 0 obj\n<<'
+    b' /Type /Pages /Count 1 /Kids [3 0 R] >>\nendobj\n3 0 obj\n<< /Type /Page'
+    b' /Parent 2 0 R /MediaBox [0 0 612 792] /Contents 4 0 R >>\nendobj\n4 0'
+    b' obj\n<< /Length 44 >>\nstream\nBT /F1 24 Tf 100 700 Td (Hello, PDF'
+    b' content!) Tj ET\nendstream\nendobj\n5 0 obj\n<< /Type /Font /Subtype'
+    b' /Type1 /BaseFont /Helvetica >>\nendobj\nxref\n0 6\n0000000000 65535 f'
+    b' \n0000000010 00000 n \n0000000079 00000 n \n0000000178 00000 n'
+    b' \n0000000278 00000 n \n0000000407 00000 n \ntrailer\n<< /Size 6 /Root 1'
+    b' 0 R >>\nstartxref\n517\n%%EOF'
+)
 def mock_mm_requests_post(url: str, json: dict[str, Any], **kwargs):
   del url, kwargs
   v = json['messages'][0]['content'][0]
-  image = lf_modalities.Image.from_bytes(base64.b64decode(v['source']['data']))
+  content = lf_modalities.Mime.from_bytes(base64.b64decode(v['source']['data']))
   response = requests.Response()
   response.status_code = 200
   response._content = pg.to_json_str({
       'content': [{
           'type': 'text',
-          'text': f'{v["type"]}: {image.mime_type}',
+          'text': f'{v["type"]}: {content.mime_type}',
       }],
       'usage': {
           'input_tokens': 2,
@@ -146,6 +162,13 @@ class AnthropicTest(unittest.TestCase):
       response = lm(lf_modalities.Image.from_bytes(image_content), lm=lm)
       self.assertEqual(response.text, 'image: image/png')
+  def test_pdf_call(self):
+    with mock.patch('requests.Session.post') as mock_mm_request:
+      mock_mm_request.side_effect = mock_mm_requests_post
+      lm = anthropic.Claude3Haiku(api_key='fake_key')
+      response = lm(lf_modalities.PDF.from_bytes(pdf_content), lm=lm)
+      self.assertEqual(response.text, 'document: application/pdf')
   def test_call_errors(self):
     for status_code, error_type, error_message in [
         (429, 'rate_limit', 'Rate limit exceeded.'),
@@ -160,7 +183,52 @@ class AnthropicTest(unittest.TestCase):
         with self.assertRaisesRegex(
             Exception, f'.*{status_code}: .*{error_message}'
         ):
-          lm('hello', lm=lm, max_attempts=1)
+          lm('hello', max_attempts=1)
+class VertexAIAnthropicTest(unittest.TestCase):
+  """Tests for VertexAI Anthropic models."""
+  def test_basics(self):
+    with self.assertRaisesRegex(ValueError, 'Please specify `project`'):
+      lm = anthropic.VertexAIClaude3_5_Sonnet_20241022()
+      lm('hi')
+    model = anthropic.VertexAIClaude3_5_Sonnet_20241022(project='langfun')
+    # NOTE(daiyip): For OSS users, default credentials are not available unless
+    # users have already set up their GCP project. Therefore we ignore the
+    # exception here.
+    try:
+      model._initialize()
+    except exceptions.DefaultCredentialsError:
+      pass
+    self.assertEqual(
+        model.api_endpoint,
+        (
+            'https://us-east5-aiplatform.googleapis.com/v1/projects/'
+            'langfun/locations/us-east5/publishers/anthropic/'
+            'models/claude-3-5-sonnet-v2@20241022:streamRawPredict'
+        )
+    )
+    request = model.request(
+        lf_message.UserMessage('hi'),
+        language_model.LMSamplingOptions(temperature=0.0),
+    )
+    self.assertEqual(
+        request,
+        {
+            'anthropic_version': 'vertex-2023-10-16',
+            'max_tokens': 8192,
+            'messages': [
+                {'content': [{'text': 'hi', 'type': 'text'}], 'role': 'user'}
+            ],
+            'stream': False,
+            'temperature': 0.0,
+            'top_k': 40,
+        },
+    )
 if __name__ == '__main__':

langfun/core/llms/cache/base.py CHANGED Viewed

@@ -60,13 +60,16 @@ class LMCacheBase(lf.LMCache):
       self, lm: lf.LanguageModel, prompt: lf.Message, seed: int
   ) -> lf.LMSamplingResult | None:
     """Gets the cached result of a prompt generated by a language model."""
-    entry = self._get(lm.model_id, self._key(lm, prompt, seed))
+    key = self._key(lm, prompt, seed)
+    entry = self._get(lm.model_id, key)
     self._stats.num_queries += 1
     if entry is None:
       self._stats.num_misses += 1
       return None
     if entry.expire is not None and entry.expire < datetime.datetime.now():
       self._stats.num_hit_expires += 1
+      self._stats.num_deletes += 1
+      assert self._delete(lm.model_id, key)
       return None
     self._stats.num_hits += 1
     return entry.result
@@ -86,6 +89,18 @@ class LMCacheBase(lf.LMCache):
     self._put(lm.model_id, self._key(lm, prompt, seed), entry)
     self._stats.num_updates += 1
+  def delete(
+      self,
+      lm: lf.LanguageModel,
+      prompt: lf.Message,
+      seed: int,
+  ) -> bool:
+    """Deletes the result of a prompt generated by a language model in cache."""
+    deleted = self._delete(lm.model_id, self._key(lm, prompt, seed))
+    if deleted:
+      self._stats.num_deletes += 1
+    return deleted
   @abc.abstractmethod
   def _get(self, model_id: str, key: str) -> LMCacheEntry | None:
     """Returns a LM cache entry associated with the key."""
@@ -94,6 +109,10 @@ class LMCacheBase(lf.LMCache):
   def _put(self, model_id: str, key: str, entry: LMCacheEntry) -> None:
     """Puts a LM cache entry associated with the key."""
+  @abc.abstractmethod
+  def _delete(self, model_id: str, key: str) -> bool:
+    """Deletes a LM cache entry associated with the key."""
   def _sym_clone(self, deep: bool, memo: Any = None) -> 'LMCacheBase':
     v = super()._sym_clone(deep, memo)
     v._stats = self._stats  # pylint: disable=protected-access
@@ -102,4 +121,4 @@ class LMCacheBase(lf.LMCache):
 def default_key(lm: lf.LanguageModel, prompt: lf.Message, seed: int) -> Any:
   """Default key for LM cache."""
-  return (prompt.text, lm.sampling_options.cache_key(), seed)
+  return (prompt.text_with_modality_hash, lm.sampling_options.cache_key(), seed)

langfun/core/llms/cache/in_memory.py CHANGED Viewed

@@ -15,6 +15,7 @@
 import collections
 import contextlib
+import json
 from typing import Annotated, Any, Iterator
 import langfun.core as lf
 from langfun.core.llms.cache import base
@@ -49,6 +50,11 @@ class InMemory(base.LMCacheBase):
             "Creating a new cache as cache file '%s' does not exist.",
             self.filename,
         )
+      except json.JSONDecodeError:
+        pg.logging.warning(
+            "Creating a new cache as cache file '%s' is corrupted.",
+            self.filename,
+        )
   def model_ids(self) -> list[str]:
     """Returns the model ids of cached queires."""
@@ -99,6 +105,13 @@ class InMemory(base.LMCacheBase):
     """Puts a LM cache entry associated with the key."""
     self._cache[model_id][key] = entry
+  def _delete(self, model_id: str, key: str) -> bool:
+    """Deletes a LM cache entry associated with the key."""
+    model_cache = self._cache.get(model_id, None)
+    if model_cache is None:
+      return False
+    return model_cache.pop(key, None) is not None
   def reset(self, model_id: str | None = None) -> None:
     """Resets the cache."""
     if model_id is not None:

langfun/core/llms/cache/in_memory_test.py CHANGED Viewed

@@ -66,14 +66,15 @@ class InMemoryLMCacheTest(unittest.TestCase):
               [
                   lf.LMSample(
                       lf.AIMessage(response_text, cache_seed=cache_seed),
-                      score=1.0
+                      score=1.0,
                   )
               ],
               usage=lf.LMSamplingUsage(
                   1,
                   len(response_text),
                   len(response_text) + 1,
-              )
+              ),
+              is_cached=True,
           )
       )
@@ -148,6 +149,50 @@ class InMemoryLMCacheTest(unittest.TestCase):
     self.assertIs(copy.deepcopy(cache)._cache, cache._cache)
     self.assertIs(copy.deepcopy(cache)._stats, cache._stats)
+    self.assertFalse(
+        cache.delete(fake.StaticResponse('hi'), lf.UserMessage('c'), seed=0)
+    )
+    self.assertFalse(cache.delete(lm, lf.UserMessage('c'), seed=1))
+    self.assertFalse(cache.delete(lm, lf.UserMessage('d'), seed=0))
+    self.assertTrue(cache.delete(lm, lf.UserMessage('c'), seed=0))
+    self.assertEqual(
+        list(cache.keys('StaticSequence')),
+        [
+            ('a', (None, None, 1, 40, None, None), 0),
+            ('a', (None, None, 1, 40, None, None), 1),
+            ('b', (None, None, 1, 40, None, None), 0),
+        ],
+    )
+    self.assertEqual(cache.stats.num_deletes, 1)
+  def test_cache_with_modalities(self):
+    class CustomModality(lf.Modality):
+      content: str
+      def to_bytes(self):
+        return self.content.encode()
+    cache = in_memory.InMemory()
+    lm = fake.StaticSequence(['1', '2', '3', '4', '5', '6'], cache=cache)
+    lm(lf.UserMessage('hi <<[[image]]>>', image=CustomModality('foo')))
+    lm(lf.UserMessage('hi <<[[image]]>>', image=CustomModality('bar')))
+    self.assertEqual(
+        list(cache.keys()),
+        [
+            (
+                'hi <<[[image]]>><image>acbd18db</image>',
+                (None, None, 1, 40, None, None),
+                0,
+            ),
+            (
+                'hi <<[[image]]>><image>37b51d19</image>',
+                (None, None, 1, 40, None, None),
+                0,
+            ),
+        ],
+    )
   def test_ttl(self):
     cache = in_memory.InMemory(ttl=1)
     lm = fake.StaticSequence(['1', '2', '3'], cache=cache)
@@ -160,6 +205,7 @@ class InMemoryLMCacheTest(unittest.TestCase):
     self.assertEqual(cache.stats.num_hits, 1)
     self.assertEqual(cache.stats.num_hit_expires, 1)
     self.assertEqual(cache.stats.num_misses, 1)
+    self.assertEqual(cache.stats.num_deletes, 1)
   def test_different_sampling_options(self):
     cache = in_memory.InMemory()
@@ -249,6 +295,11 @@ class InMemoryLMCacheTest(unittest.TestCase):
     self.assertEqual(cache2.stats.num_updates, 2)
     cache2.save()
+    # Corrupted file.
+    pg.io.writefile(path, 'bad_content')
+    cache3 = in_memory.InMemory(path)
+    self.assertEqual(len(cache3), 0)
 class LmCacheTest(unittest.TestCase):

langfun/core/llms/compositional.py ADDED Viewed

@@ -0,0 +1,101 @@
+# Copyright 2024 The Langfun Authors
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""Compositions of different LLM models."""
+import random
+from typing import Annotated
+import langfun.core as lf
+import pyglove as pg
+@pg.use_init_args(['candidates', 'seed'])
+class RandomChoice(lf.LanguageModel):
+  """Random choice of a list of LLM models."""
+  candidates: Annotated[
+      list[lf.LanguageModel],
+      (
+          'A list of LLMs as candidates to choose from.'
+      )
+  ]
+  seed: Annotated[
+      int,
+      (
+          'The random seed to use for the random choice.'
+      )
+  ] = 0
+  def _on_bound(self):
+    super()._on_bound()
+    self._rand = random.Random(self.seed)
+    # Applying sampling options to all candidates.
+    parent_non_default = self.sampling_options.sym_nondefault()
+    if parent_non_default:
+      for c in self.candidates:
+        c.sampling_options.rebind(
+            parent_non_default, notify_parents=False, raise_on_no_change=False
+        )
+  @property
+  def model_id(self) -> str:
+    model_ids = ', '.join(
+        sorted(c.model_id for c in self.candidates)
+    )
+    return f'RandomChoice({model_ids})'
+  @property
+  def resource_id(self) -> str:
+    resource_ids = ', '.join(
+        sorted(c.resource_id for c in self.candidates)
+    )
+    return f'RandomChoice({resource_ids})'
+  def _select_lm(self) -> lf.LanguageModel:
+    """Selects a random LLM from the candidates."""
+    return self._rand.choice(self.candidates)
+  def sample(
+      self,
+      prompts: list[str | lf.Message],
+      *,
+      cache_seed: int = 0,
+      **kwargs,
+  ) -> list[lf.LMSamplingResult]:
+    return self._select_lm().sample(
+        prompts, cache_seed=cache_seed, **kwargs
+    )
+  def __call__(
+      self, prompt: lf.Message, *, cache_seed: int = 0, **kwargs
+  ) -> lf.Message:
+    return self._select_lm()(prompt, cache_seed=cache_seed, **kwargs)
+  def score(
+      self,
+      prompt: str | lf.Message | list[lf.Message],
+      completions: list[str | lf.Message],
+      **kwargs,
+  ) -> list[lf.LMScoringResult]:
+    return self._select_lm().score(prompt, completions, **kwargs)
+  def tokenize(
+      self,
+      prompt: str | lf.Message,
+      **kwargs,
+  ) -> list[tuple[str | bytes, int]]:
+    return self._select_lm().tokenize(prompt, **kwargs)
+  def _sample(self, *arg, **kwargs):
+    assert False, 'Should never trigger.'

langfun/core/llms/compositional_test.py ADDED Viewed

@@ -0,0 +1,73 @@
+# Copyright 2024 The Langfun Authors
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""Tests for compositional models."""
+import unittest
+import langfun.core as lf
+from langfun.core.llms import compositional
+from langfun.core.llms import fake
+class RandomChoiceTest(unittest.TestCase):
+  def test_basic(self):
+    lm = compositional.RandomChoice([
+        fake.StaticResponse('hi'),
+        fake.StaticSequence(['hello', 'world'])
+    ])
+    self.assertEqual(
+        lm.model_id,
+        'RandomChoice(StaticResponse, StaticSequence)'
+    )
+    self.assertEqual(
+        lm.resource_id,
+        'RandomChoice(StaticResponse, StaticSequence)'
+    )
+    self.assertEqual(
+        [lm('a'), lm('b'), lm('c')],
+        ['hello', 'world', 'hi']
+    )
+    lm = lm.clone()
+    self.assertEqual(
+        [
+            x.samples[0].response for x in [
+                lm.sample(['a'])[0],
+                lm.sample(['b'])[0],
+                lm.sample(['c'])[0],
+            ]
+        ],
+        ['hello', 'world', 'hi']
+    )
+    self.assertEqual(
+        lm.score('hello', ['world']),
+        [lf.LMScoringResult(0.0)]
+    )
+    self.assertEqual(
+        lm.tokenize('hello'),
+        [('hello', 0)]
+    )
+  def test_sampling_options(self):
+    lm = compositional.RandomChoice([
+        fake.StaticResponse('hi'),
+        fake.StaticSequence(['hello', 'world'])
+    ], temperature=0.5)
+    self.assertEqual(
+        lm.candidates[0].sampling_options.temperature,
+        0.5
+    )
+if __name__ == '__main__':
+  unittest.main()

langfun/core/llms/deepseek.py ADDED Viewed

@@ -0,0 +1,117 @@
+# Copyright 2024 The Langfun Authors
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""Language models from DeepSeek."""
+import os
+from typing import Annotated, Any
+import langfun.core as lf
+from langfun.core.llms import openai_compatible
+import pyglove as pg
+SUPPORTED_MODELS_AND_SETTINGS = {
+    # pylint: disable=g-line-too-long
+    # TODO(yifenglu): The RPM and TPM are arbitrary numbers. Update them once DeepSeek provides concrete guidelines.
+    # DeepSeek doesn't control the rate limit at the moment: https://api-docs.deepseek.com/quick_start/rate_limit
+    # The cost is based on: https://api-docs.deepseek.com/quick_start/pricing
+    'deepseek-chat': pg.Dict(
+        in_service=True,
+        rpm=100,
+        tpm=1000000,
+        cost_per_1k_input_tokens=0.00014,
+        cost_per_1k_output_tokens=0.00028,
+    ),
+}
+# DeepSeek API uses an API format compatible with OpenAI.
+# Reference: https://api-docs.deepseek.com/
+@lf.use_init_args(['model'])
+class DeepSeek(openai_compatible.OpenAICompatible):
+  """DeepSeek model."""
+  model: pg.typing.Annotated[
+      pg.typing.Enum(
+          pg.MISSING_VALUE, list(SUPPORTED_MODELS_AND_SETTINGS.keys())
+      ),
+      'The name of the model to use.',
+  ]
+  api_endpoint: str = 'https://api.deepseek.com/chat/completions'
+  api_key: Annotated[
+      str | None,
+      (
+          'API key. If None, the key will be read from environment variable '
+          "'DEEPSEEK_API_KEY'."
+      ),
+  ] = None
+  @property
+  def headers(self) -> dict[str, Any]:
+    api_key = self.api_key or os.environ.get('DEEPSEEK_API_KEY', None)
+    if not api_key:
+      raise ValueError(
+          'Please specify `api_key` during `__init__` or set environment '
+          'variable `DEEPSEEK_API_KEY` with your DeepSeek API key.'
+      )
+    headers = super().headers
+    headers.update({
+        'Authorization': f'Bearer {api_key}',
+    })
+    return headers
+  @property
+  def model_id(self) -> str:
+    """Returns a string to identify the model."""
+    return f'DeepSeek({self.model})'
+  @property
+  def max_concurrency(self) -> int:
+    rpm = SUPPORTED_MODELS_AND_SETTINGS[self.model].get('rpm', 0)
+    tpm = SUPPORTED_MODELS_AND_SETTINGS[self.model].get('tpm', 0)
+    return self.rate_to_max_concurrency(
+        requests_per_min=rpm, tokens_per_min=tpm
+    )
+  def estimate_cost(
+      self, num_input_tokens: int, num_output_tokens: int
+  ) -> float | None:
+    """Estimate the cost based on usage."""
+    cost_per_1k_input_tokens = SUPPORTED_MODELS_AND_SETTINGS[self.model].get(
+        'cost_per_1k_input_tokens', None
+    )
+    cost_per_1k_output_tokens = SUPPORTED_MODELS_AND_SETTINGS[self.model].get(
+        'cost_per_1k_output_tokens', None
+    )
+    if cost_per_1k_output_tokens is None or cost_per_1k_input_tokens is None:
+      return None
+    return (
+        cost_per_1k_input_tokens * num_input_tokens
+        + cost_per_1k_output_tokens * num_output_tokens
+    ) / 1000
+  @classmethod
+  def dir(cls):
+    return [k for k, v in SUPPORTED_MODELS_AND_SETTINGS.items() if v.in_service]
+class DeepSeekChat(DeepSeek):
+  """DeepSeek Chat model.
+  Currently, it is powered by DeepSeek-V3 model, 64K input contenxt window and
+  8k max output tokens.
+  """
+  model = 'deepseek-chat'

langfun/core/llms/deepseek_test.py ADDED Viewed

@@ -0,0 +1,61 @@
+# Copyright 2023 The Langfun Authors
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import unittest
+from langfun.core.llms import deepseek
+class DeepSeekTest(unittest.TestCase):
+  """Tests for DeepSeek language model."""
+  def test_dir(self):
+    self.assertIn('deepseek-chat', deepseek.DeepSeek.dir())
+  def test_key(self):
+    with self.assertRaisesRegex(ValueError, 'Please specify `api_key`'):
+      _ = deepseek.DeepSeekChat().headers
+    self.assertEqual(
+        deepseek.DeepSeekChat(api_key='test_key').headers,
+        {
+            'Content-Type': 'application/json',
+            'Authorization': 'Bearer test_key',
+        }
+    )
+  def test_model_id(self):
+    self.assertEqual(
+        deepseek.DeepSeekChat(api_key='test_key').model_id,
+        'DeepSeek(deepseek-chat)',
+    )
+  def test_resource_id(self):
+    self.assertEqual(
+        deepseek.DeepSeekChat(api_key='test_key').resource_id,
+        'DeepSeek(deepseek-chat)',
+    )
+  def test_max_concurrency(self):
+    self.assertGreater(
+        deepseek.DeepSeekChat(api_key='test_key').max_concurrency, 0
+    )
+  def test_estimate_cost(self):
+    self.assertEqual(
+        deepseek.DeepSeekChat(api_key='test_key').estimate_cost(
+            num_input_tokens=100, num_output_tokens=100
+        ),
+        4.2e-5
+    )
+if __name__ == '__main__':
+  unittest.main()

langfun 0.0.2.dev20240429__py3-none-any.whl → 0.1.2.dev202501150804__py3-none-any.whl

langfun 0.0.2.dev20240429__py3-none-any.whl → 0.1.2.dev202501150804__py3-none-any.whl