PyPI - edsl - Versions diffs - 0.1.58__py3-none-any.whl → 0.1.60__py3-none-any.whl - Mend

edsl 0.1.58__py3-none-any.whl → 0.1.60__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37) hide show

edsl/__version__.py +1 -1
edsl/agents/agent.py +23 -4
edsl/agents/agent_list.py +36 -6
edsl/base/data_transfer_models.py +5 -0
edsl/base/enums.py +7 -2
edsl/coop/coop.py +103 -1
edsl/dataset/dataset.py +74 -0
edsl/dataset/dataset_operations_mixin.py +69 -64
edsl/inference_services/services/__init__.py +3 -1
edsl/inference_services/services/open_ai_service_v2.py +243 -0
edsl/inference_services/services/test_service.py +1 -1
edsl/interviews/exception_tracking.py +66 -20
edsl/invigilators/invigilators.py +5 -1
edsl/invigilators/prompt_constructor.py +299 -136
edsl/jobs/data_structures.py +3 -0
edsl/jobs/html_table_job_logger.py +18 -1
edsl/jobs/jobs_pricing_estimation.py +6 -2
edsl/jobs/jobs_remote_inference_logger.py +2 -0
edsl/jobs/remote_inference.py +34 -7
edsl/key_management/key_lookup_builder.py +25 -3
edsl/language_models/language_model.py +41 -3
edsl/language_models/raw_response_handler.py +126 -7
edsl/prompts/prompt.py +1 -0
edsl/questions/question_list.py +76 -20
edsl/results/result.py +37 -0
edsl/results/results.py +9 -1
edsl/scenarios/file_store.py +8 -12
edsl/scenarios/scenario.py +50 -2
edsl/scenarios/scenario_list.py +34 -12
edsl/surveys/survey.py +4 -0
edsl/tasks/task_history.py +180 -6
edsl/utilities/wikipedia.py +194 -0
{edsl-0.1.58.dist-info → edsl-0.1.60.dist-info}/METADATA +5 -4
{edsl-0.1.58.dist-info → edsl-0.1.60.dist-info}/RECORD +37 -35
{edsl-0.1.58.dist-info → edsl-0.1.60.dist-info}/LICENSE +0 -0
{edsl-0.1.58.dist-info → edsl-0.1.60.dist-info}/WHEEL +0 -0
{edsl-0.1.58.dist-info → edsl-0.1.60.dist-info}/entry_points.txt +0 -0

edsl/results/result.py CHANGED Viewed

@@ -95,6 +95,7 @@ class Result(Base, UserDict):
         question_to_attributes: Optional[dict[QuestionName, Any]] = None,
         generated_tokens: Optional[dict] = None,
         comments_dict: Optional[dict] = None,
+        reasoning_summaries_dict: Optional[dict] = None,
         cache_used_dict: Optional[dict[QuestionName, bool]] = None,
         indices: Optional[dict] = None,
         cache_keys: Optional[dict[QuestionName, str]] = None,
@@ -112,6 +113,7 @@ class Result(Base, UserDict):
         :param question_to_attributes: A dictionary of question attributes.
         :param generated_tokens: A dictionary of generated tokens.
         :param comments_dict: A dictionary of comments.
+        :param reasoning_summaries_dict: A dictionary of reasoning summaries.
         :param cache_used_dict: A dictionary of cache usage.
         :param indices: A dictionary of indices.
@@ -130,6 +132,7 @@ class Result(Base, UserDict):
             "question_to_attributes": self.question_to_attributes,
             "generated_tokens": generated_tokens or {},
             "comments_dict": comments_dict or {},
+            "reasoning_summaries_dict": reasoning_summaries_dict or {},
             "cache_used_dict": cache_used_dict or {},
             "cache_keys": cache_keys or {},
         }
@@ -236,6 +239,7 @@ class Result(Base, UserDict):
             "answer": self.data["answer"],
             "prompt": self.data["prompt"],
             "comment": self.data["comments_dict"],
+            "reasoning_summary": self.data["reasoning_summaries_dict"],
             "generated_tokens": self.data["generated_tokens"],
             "raw_model_response": self.data["raw_model_response"],
             "question_text": sub_dicts_needing_new_keys["question_text"],
@@ -497,6 +501,7 @@ class Result(Base, UserDict):
             question_to_attributes=json_dict.get("question_to_attributes", None),
             generated_tokens=json_dict.get("generated_tokens", {}),
             comments_dict=json_dict.get("comments_dict", {}),
+            reasoning_summaries_dict=json_dict.get("reasoning_summaries_dict", {}),
             cache_used_dict=json_dict.get("cache_used_dict", {}),
             cache_keys=json_dict.get("cache_keys", {}),
             indices=json_dict.get("indices", None),
@@ -631,6 +636,36 @@ class Result(Base, UserDict):
             }
             return comments_dict
+        def get_reasoning_summaries_dict(answer_key_names) -> dict[str, Any]:  # builds {"<name>_reasoning_summary": summary-or-None} for the given question names
+            reasoning_summaries_dict = {}
+            for k in answer_key_names:
+                reasoning_summary = question_results[k].reasoning_summary  # question_results is read from the enclosing scope
+                # If reasoning summary is None but we have a raw model response, try to extract it
+                if reasoning_summary is None and hasattr(question_results[k], 'raw_model_response'):
+                    try:
+                        # Get the model class to access the reasoning_sequence
+                        model_class = interview.model.__class__ if hasattr(interview, 'model') else None  # interview also comes from the enclosing scope
+                        if model_class and hasattr(model_class, 'reasoning_sequence'):
+                            from ..language_models.raw_response_handler import RawResponseHandler  # imported only on this fallback path
+                            # Create a handler with the model's reasoning sequence
+                            handler = RawResponseHandler(
+                                key_sequence=model_class.key_sequence if hasattr(model_class, 'key_sequence') else None,
+                                usage_sequence=model_class.usage_sequence if hasattr(model_class, 'usage_sequence') else None,
+                                reasoning_sequence=model_class.reasoning_sequence
+                            )
+                            # Try to extract the reasoning summary
+                            reasoning_summary = handler.get_reasoning_summary(question_results[k].raw_model_response)
+                    except Exception:  # NOTE(review): broad catch; any failure in the try body (import included) is discarded without logging
+                        # If extraction fails, keep it as None
+                        pass
+                reasoning_summaries_dict[k + "_reasoning_summary"] = reasoning_summary  # the key is written even when the summary is still None
+            return reasoning_summaries_dict
         def get_question_name_to_prompts(
             model_response_objects,
         ) -> dict[str, dict[str, str]]:
@@ -705,6 +740,7 @@ class Result(Base, UserDict):
         answer_key_names = list(question_results.keys())
         generated_tokens_dict = get_generated_tokens_dict(answer_key_names) if answer_key_names else {}
         comments_dict = get_comments_dict(answer_key_names) if answer_key_names else {}
+        reasoning_summaries_dict = get_reasoning_summaries_dict(answer_key_names) if answer_key_names else {}
         # Get answers that are in the question results
         answer_dict = {}
@@ -735,6 +771,7 @@ class Result(Base, UserDict):
             survey=survey_copy,
             generated_tokens=generated_tokens_dict,
             comments_dict=comments_dict,
+            reasoning_summaries_dict=reasoning_summaries_dict,
             cache_used_dict=cache_used_dictionary,
             indices=indices_copy,
             cache_keys=cache_keys,

edsl/results/results.py CHANGED Viewed

@@ -273,6 +273,7 @@ class Results(MutableSequence, ResultsOperationsMixin, Base):
         "generated_tokens",
         "cache_used",
         "cache_keys",
+        "reasoning_summary",
     ]
     @classmethod
@@ -771,6 +772,10 @@ class Results(MutableSequence, ResultsOperationsMixin, Base):
     def to_dataset(self) -> "Dataset":
         return self.select()
+    def optimzie_scenarios(self):  # NOTE(review): name is a misspelling of "optimize"; to_dict() calls it under this exact spelling
+        for result in self.data:  # visits every result held in self.data
+            result.scenario.offload(inplace=True)  # inplace=True modifies the scenario object itself; nothing is returned to the caller
     def to_dict(
         self,
         sort: bool = False,
@@ -778,9 +783,12 @@ class Results(MutableSequence, ResultsOperationsMixin, Base):
         include_cache: bool = True,
         include_task_history: bool = False,
         include_cache_info: bool = True,
+        offload_scenarios: bool = True,
     ) -> dict[str, Any]:
         from ..caching import Cache
+        if offload_scenarios:
+            self.optimzie_scenarios()
         if sort:
             data = sorted([result for result in self.data], key=lambda x: hash(x))
         else:
@@ -809,7 +817,7 @@ class Results(MutableSequence, ResultsOperationsMixin, Base):
             )
         if self.task_history.has_unfixed_exceptions or include_task_history:
-            d.update({"task_history": self.task_history.to_dict()})
+            d.update({"task_history": self.task_history.to_dict(offload_content=True)})
         if add_edsl_version:
             from .. import __version__

edsl/scenarios/file_store.py CHANGED Viewed

@@ -446,9 +446,7 @@ class FileStore(Scenario):
         if suffix is None:
             suffix = self.suffix
         if self.binary:
-            file_like_object = self.base64_to_file(
-                self["base64_string"], is_binary=True
-            )
+            file_like_object = self.base64_to_file(self.base64_string, is_binary=True)
         else:
             file_like_object = self.base64_to_text_file(self.base64_string)
@@ -765,15 +763,13 @@ class FileStore(Scenario):
         if name.startswith("__") and name.endswith("__"):
             raise AttributeError(name)
-        # Only try to access suffix if it's in our __dict__
-        if hasattr(self, "_data") and "suffix" in self._data:
-            if self._data["suffix"] == "csv":
-                # Get the pandas DataFrame
-                df = self.to_pandas()
-                # Check if the requested attribute exists in the DataFrame
-                if hasattr(df, name):
-                    return getattr(df, name)
-        # If not a CSV or attribute doesn't exist in DataFrame, raise AttributeError
+        # Check for _data directly in __dict__ to avoid recursion
+        _data = self.__dict__.get("_data", None)
+        if _data and _data.get("suffix") == "csv":
+            df = self.to_pandas()
+            if hasattr(df, name):
+                return getattr(df, name)
         raise AttributeError(
             f"'{self.__class__.__name__}' object has no attribute '{name}'"
         )

edsl/scenarios/scenario.py CHANGED Viewed

@@ -264,9 +264,49 @@ class Scenario(Base, UserDict):
         """Display a scenario as a table."""
         return self.to_dataset().table(tablefmt=tablefmt)
-    def to_dict(self, add_edsl_version: bool = True) -> dict:
+    def offload(self, inplace=False) -> "Scenario":
+        """
+        Offloads base64-encoded content from the scenario by replacing 'base64_string'
+        fields with 'offloaded'. This reduces memory usage.
+        Args:
+            inplace (bool): If True, modify the current scenario. If False, return a new one.
+        Returns:
+            Scenario: The modified scenario (either self or a new instance).
+        """
+        from edsl.scenarios import FileStore
+        from edsl.prompts import Prompt  # NOTE(review): Prompt is not referenced anywhere in this method body
+        target = self if inplace else Scenario()  # the non-inplace result is always a plain Scenario(), whatever type(self) is
+        for key, value in self.items():
+            if isinstance(value, FileStore):
+                file_store_dict = value.to_dict()
+                if "base64_string" in file_store_dict:
+                    file_store_dict["base64_string"] = "offloaded"
+                modified_value = FileStore.from_dict(file_store_dict)  # rebuilt from the dict, so it carries the placeholder string
+            elif isinstance(value, dict) and "base64_string" in value:
+                value_copy = value.copy()  # shallow copy: the original dict keeps its base64_string
+                value_copy["base64_string"] = "offloaded"
+                modified_value = value_copy
+            else:
+                modified_value = value  # other values are passed through by reference, not copied
+            target[key] = modified_value  # when inplace=True this only reassigns keys that already exist in self
+        return target
+    def to_dict(
+        self, add_edsl_version: bool = True, offload_base64: bool = False
+    ) -> dict:
         """Convert a scenario to a dictionary.
+        Args:
+            add_edsl_version: If True, adds the EDSL version to the returned dictionary.
+            offload_base64: If True, replaces any base64_string fields with 'offloaded'
+                           to reduce memory usage.
         Example:
         >>> s = Scenario({"food": "wood chips"})
@@ -283,7 +323,15 @@ class Scenario(Base, UserDict):
         d = self.data.copy()
         for key, value in d.items():
             if isinstance(value, FileStore) or isinstance(value, Prompt):
-                d[key] = value.to_dict(add_edsl_version=add_edsl_version)
+                value_dict = value.to_dict(add_edsl_version=add_edsl_version)
+                if (
+                    offload_base64
+                    and isinstance(value_dict, dict)
+                    and "base64_string" in value_dict
+                ):
+                    value_dict["base64_string"] = "offloaded"
+                d[key] = value_dict
         if add_edsl_version:
             from edsl import __version__

edsl/scenarios/scenario_list.py CHANGED Viewed

@@ -145,22 +145,18 @@ class ScenarioList(MutableSequence, Base, ScenarioListOperationsMixin):
         """Initialize a new ScenarioList with optional data and codebook."""
         self._data_class = data_class
         self.data = self._data_class([])
-        warned = False
         for item in data or []:
-            try:
-                _ = json.dumps(item.to_dict())
-            except:
-                import warnings
-                if not warned:
-                    warnings.warn(
-                        f"One or more items in the data list are not JSON serializable. "
-                        "This would prevent running a job that uses this ScenarioList."
-                        "One solution is to use 'str(item)' to convert the item to a string before adding."
-                    )
-                    warned = True
             self.data.append(item)
         self.codebook = codebook or {}
+    def is_serializable(self):  # returns True only if json.dumps(item.to_dict()) succeeds for every item in self.data
+        for item in self.data:
+            try:
+                _ = json.dumps(item.to_dict())  # the encoded string is discarded; only success or failure matters
+            except Exception as e:  # NOTE(review): `e` is unused; an error raised by to_dict() itself also yields False
+                return False  # stops at the first failing item
+        return True  # also reached when self.data is empty
     # Required MutableSequence abstract methods
     def __getitem__(self, index):
         """Get item at index."""
@@ -360,6 +356,32 @@ class ScenarioList(MutableSequence, Base, ScenarioListOperationsMixin):
                 new_scenarios.append(Scenario(new_scenario))
         return new_scenarios
+    @classmethod
+    def from_search_terms(cls, search_terms: List[str]) -> ScenarioList:
+        """Create a ScenarioList from a list of search terms, using Wikipedia.
+        Args:
+            search_terms: A list of search terms.
+        """
+        from ..utilities.wikipedia import fetch_wikipedia_content  # imported at call time rather than at module import
+        results = fetch_wikipedia_content(search_terms)  # presumably one mapping per term; confirm against fetch_wikipedia_content
+        return cls([Scenario(result) for result in results])  # each returned result is wrapped in its own Scenario
+    def augment_with_wikipedia(self, search_key:str, content_only: bool = True, key_name: str = "wikipedia_content") -> ScenarioList:
+        """Augment the ScenarioList with Wikipedia content."""
+        search_terms = self.select(search_key).to_list()  # values stored under search_key become the search terms
+        wikipedia_results = ScenarioList.from_search_terms(search_terms)
+        new_sl = ScenarioList(data = [], codebook = self.codebook)  # the codebook object is passed along, not copied
+        for scenario, wikipedia_result in zip(self, wikipedia_results):  # zip stops at the shorter input, so unmatched scenarios are left out of new_sl
+            if content_only:
+                scenario[key_name] = wikipedia_result["content"]  # NOTE(review): presumably the same object held by self, so self would be modified too; confirm
+                new_sl.append(scenario)
+            else:
+                scenario[key_name] = wikipedia_result  # stores the whole result Scenario rather than only its "content" entry
+                new_sl.append(scenario)
+        return new_sl
     def pivot(
         self,

edsl/surveys/survey.py CHANGED Viewed

@@ -384,6 +384,10 @@ class Survey(Base):
         if question_name not in self.question_name_to_index:
             raise SurveyError(f"Question name {question_name} not found in survey.")
         return self.questions[self.question_name_to_index[question_name]]
+    def get(self, question_name: str) -> QuestionBase:
+        """Return the question object given the question name."""
+        return self._get_question_by_name(question_name)  # pure delegation; presumably raises SurveyError for unknown names, confirm in _get_question_by_name
     def question_names_to_questions(self) -> dict:
         """Return a dictionary mapping question names to question attributes."""

edsl/tasks/task_history.py CHANGED Viewed

@@ -43,6 +43,7 @@ class TaskHistory(RepresentationMixin):
     - Generates interactive HTML reports with filtering and drill-down
     - Computes statistics across interviews (by model, question type, etc.)
     - Exports to various formats (HTML, notebook, etc.)
+    - Memory optimization via offloading of large file content
     """
     def __init__(
@@ -191,8 +192,22 @@ class TaskHistory(RepresentationMixin):
         """Return a string representation of the TaskHistory."""
         return f"TaskHistory(interviews={self.total_interviews})."
-    def to_dict(self, add_edsl_version=True):
-        """Return the TaskHistory as a dictionary."""
+    def to_dict(self, add_edsl_version=True, offload_content=False):
+        """
+        Return the TaskHistory as a dictionary.
+        Parameters:
+            add_edsl_version: Whether to include EDSL version in the output
+            offload_content: Whether to offload large file content like videos and images
+                            to reduce memory usage
+        Returns:
+            A dictionary representation of this TaskHistory instance
+        """
+        # Offload large file content if requested
+        if offload_content:
+            self.offload_files_content()
         # Serialize each interview object
         interview_dicts = []
         for i in self.total_interviews:
@@ -255,27 +270,60 @@ class TaskHistory(RepresentationMixin):
                             InterviewExceptionCollection,
                         )
+                        # Store the original data in full
+                        self._original_data = data
+                        # Preserve the original interview id
+                        self._interview_id = data.get("id", None)
+                        # Store exceptions using the original data structure
+                        # This ensures when we re-serialize, we keep original data intact
+                        self._exceptions_data = data.get("exceptions", {})
+                        # Create the InterviewExceptionCollection for runtime use
                         exceptions_data = data.get("exceptions", {})
                         self.exceptions = (
                             InterviewExceptionCollection.from_dict(exceptions_data)
                             if exceptions_data
                             else InterviewExceptionCollection()
                         )
+                        # Store other fields
                         self.task_status_logs = data.get("task_status_logs", {})
                         self.model = data.get("model", {})
                         self.survey = data.get("survey", {})
                     def to_dict(self, add_edsl_version=True):
-                        return {
+                        # Use the original exceptions data structure when serializing again
+                        # This preserves all exception details exactly as they were
+                        data = {
                             "type": "InterviewReference",
-                            "exceptions": self.exceptions.to_dict()
-                            if hasattr(self.exceptions, "to_dict")
-                            else self.exceptions,
+                            "exceptions": self._exceptions_data
+                            if hasattr(self, "_exceptions_data")
+                            else (
+                                self.exceptions.to_dict()
+                                if hasattr(self.exceptions, "to_dict")
+                                else self.exceptions
+                            ),
                             "task_status_logs": self.task_status_logs,
                             "model": self.model,
                             "survey": self.survey,
                         }
+                        # Preserve the original interview id if it exists
+                        if self._interview_id:
+                            data["id"] = self._interview_id
+                        # Preserve original version info
+                        if (
+                            add_edsl_version
+                            and hasattr(self, "_original_data")
+                            and "edsl_version" in self._original_data
+                        ):
+                            data["edsl_version"] = self._original_data["edsl_version"]
+                        return data
                 # Create the reference and add it directly
                 ref = DeserializedInterviewRef(interview_data)
                 instance.total_interviews.append(ref)
@@ -728,6 +776,132 @@ class TaskHistory(RepresentationMixin):
         return nb
+    def offload_files_content(self):
+        """
+        Offload large file content from scenarios in interview exceptions.
+        This method iterates over all the interview exceptions and calls the offload method
+        for any scenario components in the invigilator. This significantly reduces memory usage
+        by replacing base64-encoded content with a placeholder string, while preserving the
+        structure of the scenarios.
+        Returns:
+            self: Returns the TaskHistory instance for method chaining
+        This is particularly useful for TaskHistory instances containing interviews with
+        large file content, such as videos, images, or other binary data.
+        """
+        for interview in self.total_interviews:
+            if not hasattr(interview, "exceptions") or not interview.exceptions:
+                continue  # interviews with no recorded exceptions are left untouched
+            for question_name, exceptions in interview.exceptions.items():  # question_name is not used inside the loop
+                for exception in exceptions:
+                    # Check if exception has an invigilator with scenario
+                    if hasattr(exception, "invigilator") and exception.invigilator:
+                        if (
+                            hasattr(exception.invigilator, "scenario")
+                            and exception.invigilator.scenario
+                        ):
+                            # Call the offload method on the scenario
+                            if hasattr(exception.invigilator.scenario, "offload"):
+                                try:
+                                    # Replace the original scenario with the offloaded version
+                                    exception.invigilator.scenario = (
+                                        exception.invigilator.scenario.offload()
+                                    )
+                                except Exception as e:  # NOTE(review): `e` is unused and the failure is not logged anywhere
+                                    # Silently continue if offloading fails for any reason
+                                    pass
+        return self
+    def deduplicate_and_clean_interviews(self):
+        """
+        Deduplicates exception entries in this task history to reduce memory usage.
+        This method removes duplicate error messages across interviews while preserving
+        the first occurrence of each unique error. This significantly reduces the size
+        of serialized task history data, especially for jobs with many similar errors.
+        Returns:
+            self: Returns the TaskHistory instance for method chaining.
+        """
+        seen = set()  # (question_name, message) pairs already kept; shared across all interviews
+        cleaned_interviews = []
+        for interview in self.total_interviews:
+            # Skip if interview has no exceptions
+            if not hasattr(interview, "exceptions") or not interview.exceptions:
+                continue  # skipped interviews are never appended below, so they are removed from total_interviews
+            keep_interview = False
+            questions_to_modify = {}
+            questions_to_remove = []
+            # First pass: Collect all modifications without changing the dictionary
+            if hasattr(interview.exceptions, "items"):
+                for question_name, exceptions in list(interview.exceptions.items()):
+                    filtered_exceptions = []
+                    for exception in exceptions:
+                        # Get the exception message (may require different access based on structure)
+                        if hasattr(exception, "exception") and hasattr(
+                            exception.exception, "args"
+                        ):
+                            message = (
+                                str(exception.exception.args[0])
+                                if exception.exception.args
+                                else ""
+                            )
+                        else:
+                            message = str(exception)  # fallback when there is no wrapped .exception with .args
+                        # Create a unique key for this exception
+                        key = (question_name, message)
+                        # Only keep exceptions we haven't seen before
+                        if key not in seen:
+                            seen.add(key)
+                            filtered_exceptions.append(exception)
+                    # Track what should happen to this question's exceptions
+                    if filtered_exceptions:
+                        keep_interview = True
+                        questions_to_modify[question_name] = filtered_exceptions
+                    else:
+                        questions_to_remove.append(question_name)
+            # Second pass: Apply all modifications safely
+            if hasattr(interview.exceptions, "items"):
+                # Add/replace filtered exceptions
+                for question_name, filtered_exceptions in questions_to_modify.items():
+                    interview.exceptions[question_name] = filtered_exceptions  # mutates the interview's own exceptions mapping
+                # Remove questions with all duplicate exceptions
+                for question_name in questions_to_remove:
+                    if hasattr(interview.exceptions, "pop"):
+                        interview.exceptions.pop(question_name, None)
+                    elif (
+                        hasattr(interview.exceptions, "__delitem__")
+                        and question_name in interview.exceptions
+                    ):
+                        del interview.exceptions[question_name]
+            # Only keep the interview if it still has exceptions after filtering
+            if keep_interview:
+                cleaned_interviews.append(interview)
+        # Replace the total_interviews with our cleaned list
+        self.total_interviews = cleaned_interviews
+        # Rebuild the _interviews dictionary
+        self._interviews = {
+            index: interview for index, interview in enumerate(self.total_interviews)
+        }  # keys are positions in the cleaned list, starting at 0
+        return self
 if __name__ == "__main__":
     import doctest

edsl 0.1.58__py3-none-any.whl → 0.1.60__py3-none-any.whl

edsl 0.1.58__py3-none-any.whl → 0.1.60__py3-none-any.whl