edsl 0.1.58__py3-none-any.whl → 0.1.60__py3-none-any.whl
This diff shows the changes between publicly available package versions as they appear in their respective public registries. It is provided for informational purposes only.
- edsl/__version__.py +1 -1
- edsl/agents/agent.py +23 -4
- edsl/agents/agent_list.py +36 -6
- edsl/base/data_transfer_models.py +5 -0
- edsl/base/enums.py +7 -2
- edsl/coop/coop.py +103 -1
- edsl/dataset/dataset.py +74 -0
- edsl/dataset/dataset_operations_mixin.py +69 -64
- edsl/inference_services/services/__init__.py +3 -1
- edsl/inference_services/services/open_ai_service_v2.py +243 -0
- edsl/inference_services/services/test_service.py +1 -1
- edsl/interviews/exception_tracking.py +66 -20
- edsl/invigilators/invigilators.py +5 -1
- edsl/invigilators/prompt_constructor.py +299 -136
- edsl/jobs/data_structures.py +3 -0
- edsl/jobs/html_table_job_logger.py +18 -1
- edsl/jobs/jobs_pricing_estimation.py +6 -2
- edsl/jobs/jobs_remote_inference_logger.py +2 -0
- edsl/jobs/remote_inference.py +34 -7
- edsl/key_management/key_lookup_builder.py +25 -3
- edsl/language_models/language_model.py +41 -3
- edsl/language_models/raw_response_handler.py +126 -7
- edsl/prompts/prompt.py +1 -0
- edsl/questions/question_list.py +76 -20
- edsl/results/result.py +37 -0
- edsl/results/results.py +9 -1
- edsl/scenarios/file_store.py +8 -12
- edsl/scenarios/scenario.py +50 -2
- edsl/scenarios/scenario_list.py +34 -12
- edsl/surveys/survey.py +4 -0
- edsl/tasks/task_history.py +180 -6
- edsl/utilities/wikipedia.py +194 -0
- {edsl-0.1.58.dist-info → edsl-0.1.60.dist-info}/METADATA +5 -4
- {edsl-0.1.58.dist-info → edsl-0.1.60.dist-info}/RECORD +37 -35
- {edsl-0.1.58.dist-info → edsl-0.1.60.dist-info}/LICENSE +0 -0
- {edsl-0.1.58.dist-info → edsl-0.1.60.dist-info}/WHEEL +0 -0
- {edsl-0.1.58.dist-info → edsl-0.1.60.dist-info}/entry_points.txt +0 -0
edsl/inference_services/services/open_ai_service_v2.py (new file)
@@ -0,0 +1,243 @@
+from __future__ import annotations
+from typing import Any, List, Optional, Dict, NewType, TYPE_CHECKING
+import os
+
+import openai
+
+from ..inference_service_abc import InferenceServiceABC
+
+# Use TYPE_CHECKING to avoid circular imports at runtime
+if TYPE_CHECKING:
+    from ...language_models import LanguageModel
+    from ..rate_limits_cache import rate_limits
+
+# Default to completions API but can use responses API with parameter
+
+if TYPE_CHECKING:
+    from ....scenarios.file_store import FileStore as Files
+    from ....invigilators.invigilator_base import InvigilatorBase as InvigilatorAI
+
+
+APIToken = NewType("APIToken", str)
+
+
+class OpenAIServiceV2(InferenceServiceABC):
+    """OpenAI service class using the Responses API."""
+
+    _inference_service_ = "openai_v2"
+    _env_key_name_ = "OPENAI_API_KEY"
+    _base_url_ = None
+
+    _sync_client_ = openai.OpenAI
+    _async_client_ = openai.AsyncOpenAI
+
+    _sync_client_instances: Dict[APIToken, openai.OpenAI] = {}
+    _async_client_instances: Dict[APIToken, openai.AsyncOpenAI] = {}
+
+    # sequence to extract text from response.output
+    key_sequence = ["output", 1, "content", 0, "text"]
+    usage_sequence = ["usage"]
+    # sequence to extract reasoning summary from response.output
+    reasoning_sequence = ["output", 0, "summary"]
+    input_token_name = "prompt_tokens"
+    output_token_name = "completion_tokens"
+
+    available_models_url = "https://platform.openai.com/docs/models/gp"
+
+    def __init_subclass__(cls, **kwargs):
+        super().__init_subclass__(**kwargs)
+        cls._sync_client_instances = {}
+        cls._async_client_instances = {}
+
+    @classmethod
+    def sync_client(cls, api_key: str) -> openai.OpenAI:
+        if api_key not in cls._sync_client_instances:
+            client = cls._sync_client_(
+                api_key=api_key,
+                base_url=cls._base_url_,
+            )
+            cls._sync_client_instances[api_key] = client
+        return cls._sync_client_instances[api_key]
+
+    @classmethod
+    def async_client(cls, api_key: str) -> openai.AsyncOpenAI:
+        if api_key not in cls._async_client_instances:
+            client = cls._async_client_(
+                api_key=api_key,
+                base_url=cls._base_url_,
+            )
+            cls._async_client_instances[api_key] = client
+        return cls._async_client_instances[api_key]
+
+    model_exclude_list = [
+        "whisper-1",
+        "davinci-002",
+        "dall-e-2",
+        "tts-1-hd-1106",
+        "tts-1-hd",
+        "dall-e-3",
+        "tts-1",
+        "babbage-002",
+        "tts-1-1106",
+        "text-embedding-3-large",
+        "text-embedding-3-small",
+        "text-embedding-ada-002",
+        "ft:davinci-002:mit-horton-lab::8OfuHgoo",
+        "gpt-3.5-turbo-instruct-0914",
+        "gpt-3.5-turbo-instruct",
+    ]
+    _models_list_cache: List[str] = []
+
+    @classmethod
+    def get_model_list(cls, api_key: str | None = None) -> List[str]:
+        if api_key is None:
+            api_key = os.getenv(cls._env_key_name_)
+        raw = cls.sync_client(api_key).models.list()
+        return raw.data if hasattr(raw, "data") else raw
+
+    @classmethod
+    def available(cls, api_token: str | None = None) -> List[str]:
+        if api_token is None:
+            api_token = os.getenv(cls._env_key_name_)
+        if not cls._models_list_cache:
+            data = cls.get_model_list(api_key=api_token)
+            cls._models_list_cache = [
+                m.id for m in data if m.id not in cls.model_exclude_list
+            ]
+        return cls._models_list_cache
+
+    @classmethod
+    def create_model(
+        cls,
+        model_name: str,
+        model_class_name: str | None = None,
+    ) -> LanguageModel:
+        if model_class_name is None:
+            model_class_name = cls.to_class_name(model_name)
+
+        from ...language_models import LanguageModel
+
+        class LLM(LanguageModel):
+            """Child class for OpenAI Responses API"""
+
+            key_sequence = cls.key_sequence
+            usage_sequence = cls.usage_sequence
+            reasoning_sequence = cls.reasoning_sequence
+            input_token_name = cls.input_token_name
+            output_token_name = cls.output_token_name
+            _inference_service_ = cls._inference_service_
+            _model_ = model_name
+            _parameters_ = {
+                "temperature": 0.5,
+                "max_tokens": 2000,
+                "top_p": 1,
+                "frequency_penalty": 0,
+                "presence_penalty": 0,
+                "logprobs": False,
+                "top_logprobs": 3,
+            }
+
+            def sync_client(self) -> openai.OpenAI:
+                return cls.sync_client(api_key=self.api_token)
+
+            def async_client(self) -> openai.AsyncOpenAI:
+                return cls.async_client(api_key=self.api_token)
+
+            @classmethod
+            def available(cls) -> list[str]:
+                return cls.sync_client().models.list().data
+
+            def get_headers(self) -> dict[str, Any]:
+                client = self.sync_client()
+                response = client.responses.with_raw_response.create(
+                    model=self.model,
+                    input=[{"role": "user", "content": "Say this is a test"}],
+                    store=False,
+                )
+                return dict(response.headers)
+
+            def get_rate_limits(self) -> dict[str, Any]:
+                try:
+                    headers = rate_limits.get("openai", self.get_headers())
+                except Exception:
+                    return {"rpm": 10000, "tpm": 2000000}
+                return {
+                    "rpm": int(headers["x-ratelimit-limit-requests"]),
+                    "tpm": int(headers["x-ratelimit-limit-tokens"]),
+                }
+
+            async def async_execute_model_call(
+                self,
+                user_prompt: str,
+                system_prompt: str = "",
+                files_list: Optional[List[Files]] = None,
+                invigilator: Optional[InvigilatorAI] = None,
+            ) -> dict[str, Any]:
+                content = user_prompt
+                if files_list:
+                    # embed files as separate inputs
+                    content = [{"type": "text", "text": user_prompt}]
+                    for f in files_list:
+                        content.append(
+                            {
+                                "type": "image_url",
+                                "image_url": {
+                                    "url": f"data:{f.mime_type};base64,{f.base64_string}"
+                                },
+                            }
+                        )
+                # build input sequence
+                messages: Any
+                if system_prompt and not self.omit_system_prompt_if_empty:
+                    messages = [
+                        {"role": "system", "content": system_prompt},
+                        {"role": "user", "content": content},
+                    ]
+                else:
+                    messages = [{"role": "user", "content": content}]
+
+                # All OpenAI models with the responses API use these base parameters
+                params = {
+                    "model": self.model,
+                    "input": messages,
+                    "temperature": self.temperature,
+                    "top_p": self.top_p,
+                    "store": False,
+                }
+
+                # Check if this is a reasoning model (o-series models)
+                is_reasoning_model = any(tag in self.model for tag in ["o1", "o1-mini", "o3", "o3-mini", "o1-pro", "o4-mini"])
+
+                # Only add reasoning parameter for reasoning models
+                if is_reasoning_model:
+                    params["reasoning"] = {"summary": "auto"}
+
+                # For all models using the responses API, use max_output_tokens
+                # instead of max_tokens (which is for the completions API)
+                params["max_output_tokens"] = self.max_tokens
+
+                # Specifically for o-series, we also set temperature to 1
+                if is_reasoning_model:
+                    params["temperature"] = 1
+
+                client = self.async_client()
+                try:
+                    response = await client.responses.create(**params)
+
+                except Exception as e:
+                    return {"message": str(e)}
+
+                # convert to dict
+                response_dict = response.model_dump()
+                return response_dict
+
+        LLM.__name__ = model_class_name
+        return LLM
+
+    @staticmethod
+    def _create_reasoning_sequence():
+        """Create the reasoning sequence for extracting reasoning summaries from model responses."""
+        # For OpenAI responses, the reasoning summary is typically found at:
+        # ["output", 0, "summary"]
+        # This is the path to the 'summary' field in the first item of the 'output' array
+        return ["output", 0, "summary"]
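For orientation, a minimal usage sketch of the new Responses-API service. Only create_model and async_execute_model_call come from the hunk above; instantiating the generated class is hypothetical here, since the LanguageModel constructor and its accepted keyword arguments are not part of this diff.

import asyncio

from edsl.inference_services.services.open_ai_service_v2 import OpenAIServiceV2

# create_model (defined in the hunk above) builds a LanguageModel subclass
# bound to a specific model name.
LLM = OpenAIServiceV2.create_model("gpt-4o")

# Hypothetical instantiation: constructor arguments depend on LanguageModel,
# which is not shown in this diff.
model = LLM(temperature=0.5)

# async_execute_model_call routes the prompt through client.responses.create
# and returns the raw response dict (or {"message": ...} if the call raised).
raw = asyncio.run(
    model.async_execute_model_call(
        user_prompt="Say this is a test",
        system_prompt="You are a helpful assistant.",
    )
)
print(raw.get("usage"))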
edsl/interviews/exception_tracking.py
@@ -16,8 +16,9 @@ class InterviewExceptionEntry:
         invigilator: "InvigilatorBase",
         traceback_format="text",
         answers=None,
+        time=None,  # Added time parameter for deserialization
     ):
-        self.time = datetime.datetime.now().isoformat()
+        self.time = time or datetime.datetime.now().isoformat()
         self.exception = exception
         self.invigilator = invigilator
         self.traceback_format = traceback_format
@@ -130,7 +131,12 @@ class InterviewExceptionEntry:
         'Traceback (most recent call last):...'
         """
         e = self.exception
-
+        # Check if the exception has a traceback attribute
+        if hasattr(e, "__traceback__") and e.__traceback__:
+            tb_str = "".join(traceback.format_exception(type(e), e, e.__traceback__))
+        else:
+            # Use the message as traceback if no traceback available
+            tb_str = f"Exception: {str(e)}"
         return tb_str

     @property
@@ -144,14 +150,19 @@ class InterviewExceptionEntry:

         console = Console(file=html_output, record=True)

-
-
-
-
-
-
-
-
+        # Check if the exception has a traceback attribute
+        if hasattr(self.exception, "__traceback__") and self.exception.__traceback__:
+            tb = Traceback.from_exception(
+                type(self.exception),
+                self.exception,
+                self.exception.__traceback__,
+                show_locals=True,
+            )
+            console.print(tb)
+            return html_output.getvalue()
+        else:
+            # Return a simple string if no traceback available
+            return f"<pre>Exception: {str(self.exception)}</pre>"

     @staticmethod
     def serialize_exception(exception: Exception) -> dict:
@@ -160,14 +171,25 @@ class InterviewExceptionEntry:
         >>> entry = InterviewExceptionEntry.example()
         >>> _ = entry.serialize_exception(entry.exception)
         """
-
-
-
-
+        # Store the original exception type for proper reconstruction
+        exception_type = type(exception).__name__
+        module_name = getattr(type(exception), "__module__", "builtins")
+
+        # Extract traceback if available
+        if hasattr(exception, "__traceback__") and exception.__traceback__:
+            tb_str = "".join(
                 traceback.format_exception(
                     type(exception), exception, exception.__traceback__
                 )
-        )
+            )
+        else:
+            tb_str = f"Exception: {str(exception)}"
+
+        return {
+            "type": exception_type,
+            "module": module_name,
+            "message": str(exception),
+            "traceback": tb_str,
         }

     @staticmethod
@@ -177,11 +199,31 @@ class InterviewExceptionEntry:
         >>> entry = InterviewExceptionEntry.example()
         >>> _ = entry.deserialize_exception(entry.to_dict()["exception"])
         """
+        exception_type = data.get("type", "Exception")
+        module_name = data.get("module", "builtins")
+        message = data.get("message", "")
+
         try:
-
-
-
-
+            # Try to import the module and get the exception class
+            # if module_name != "builtins":
+            #     import importlib
+
+            #     module = importlib.import_module(module_name)
+            #     exception_class = getattr(module, exception_type, Exception)
+            # else:
+            #     # Look for exception in builtins
+            import builtins
+
+            exception_class = getattr(builtins, exception_type, Exception)
+
+        except (ImportError, AttributeError):
+            # Fall back to a generic Exception but preserve the type name
+            exception = Exception(message)
+            exception.__class__.__name__ = exception_type
+            return exception
+
+        # Create instance of the original exception type if possible
+        return exception_class(message)

     def to_dict(self) -> dict:
         """Return the exception as a dictionary.
@@ -221,7 +263,11 @@ class InterviewExceptionEntry:
             invigilator = None
         else:
            invigilator = InvigilatorAI.from_dict(data["invigilator"])
-
+
+        # Use the original timestamp from serialization
+        time = data.get("time")
+
+        return cls(exception=exception, invigilator=invigilator, time=time)


 class InterviewExceptionCollection(UserDict):
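A small sketch of the round-trip these exception_tracking changes enable, using only the methods shown above (example, serialize_exception, deserialize_exception, to_dict, from_dict); whether to_dict emits a "time" field is assumed, since that part of the file is not in this excerpt.

from edsl.interviews.exception_tracking import InterviewExceptionEntry

entry = InterviewExceptionEntry.example()

# serialize_exception now records type, module, message, and traceback
# (or just the message when no traceback is attached to the exception).
payload = InterviewExceptionEntry.serialize_exception(entry.exception)
print(sorted(payload))  # ['message', 'module', 'traceback', 'type']

# deserialize_exception rebuilds a builtin exception of the recorded type,
# falling back to a generic Exception that keeps the original type name.
restored = InterviewExceptionEntry.deserialize_exception(payload)
print(type(restored).__name__, restored)

# from_dict now forwards the serialized timestamp to __init__ via the new
# time parameter, so round-tripping no longer re-stamps the entry
# (assuming to_dict emits "time", which this excerpt does not show).
copy = InterviewExceptionEntry.from_dict(entry.to_dict())
print(copy.time, entry.time)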
edsl/invigilators/invigilators.py
@@ -105,7 +105,11 @@ class InvigilatorBase(ABC):
         value = getattr(self, attr)
         if value is None:
             return None
-        if hasattr(value, "to_dict"):
+        if attr == "scenario" and hasattr(value, "offload"):
+            # Use the scenario's offload method to replace base64_string values
+            offloaded = value.offload()
+            return offloaded.to_dict()
+        elif hasattr(value, "to_dict"):
             return value.to_dict()
         if isinstance(value, (int, float, str, bool, dict, list)):
             return value