PyPI - edsl - Versions diffs - 0.1.38.dev4__py3-none-any.whl → 0.1.39__py3-none-any.whl - Mend

edsl 0.1.38.dev4__py3-none-any.whl → 0.1.39__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (212) hide show

edsl/Base.py +197 -116
edsl/__init__.py +15 -7
edsl/__version__.py +1 -1
edsl/agents/Agent.py +351 -147
edsl/agents/AgentList.py +211 -73
edsl/agents/Invigilator.py +101 -50
edsl/agents/InvigilatorBase.py +62 -70
edsl/agents/PromptConstructor.py +143 -225
edsl/agents/QuestionInstructionPromptBuilder.py +128 -0
edsl/agents/QuestionTemplateReplacementsBuilder.py +137 -0
edsl/agents/__init__.py +0 -1
edsl/agents/prompt_helpers.py +3 -3
edsl/agents/question_option_processor.py +172 -0
edsl/auto/AutoStudy.py +18 -5
edsl/auto/StageBase.py +53 -40
edsl/auto/StageQuestions.py +2 -1
edsl/auto/utilities.py +0 -6
edsl/config.py +22 -2
edsl/conversation/car_buying.py +2 -1
edsl/coop/CoopFunctionsMixin.py +15 -0
edsl/coop/ExpectedParrotKeyHandler.py +125 -0
edsl/coop/PriceFetcher.py +1 -1
edsl/coop/coop.py +125 -47
edsl/coop/utils.py +14 -14
edsl/data/Cache.py +45 -27
edsl/data/CacheEntry.py +12 -15
edsl/data/CacheHandler.py +31 -12
edsl/data/RemoteCacheSync.py +154 -46
edsl/data/__init__.py +4 -3
edsl/data_transfer_models.py +2 -1
edsl/enums.py +27 -0
edsl/exceptions/__init__.py +50 -50
edsl/exceptions/agents.py +12 -0
edsl/exceptions/inference_services.py +5 -0
edsl/exceptions/questions.py +24 -6
edsl/exceptions/scenarios.py +7 -0
edsl/inference_services/AnthropicService.py +38 -19
edsl/inference_services/AvailableModelCacheHandler.py +184 -0
edsl/inference_services/AvailableModelFetcher.py +215 -0
edsl/inference_services/AwsBedrock.py +0 -2
edsl/inference_services/AzureAI.py +0 -2
edsl/inference_services/GoogleService.py +7 -12
edsl/inference_services/InferenceServiceABC.py +18 -85
edsl/inference_services/InferenceServicesCollection.py +120 -79
edsl/inference_services/MistralAIService.py +0 -3
edsl/inference_services/OpenAIService.py +47 -35
edsl/inference_services/PerplexityService.py +0 -3
edsl/inference_services/ServiceAvailability.py +135 -0
edsl/inference_services/TestService.py +11 -10
edsl/inference_services/TogetherAIService.py +5 -3
edsl/inference_services/data_structures.py +134 -0
edsl/jobs/AnswerQuestionFunctionConstructor.py +223 -0
edsl/jobs/Answers.py +1 -14
edsl/jobs/FetchInvigilator.py +47 -0
edsl/jobs/InterviewTaskManager.py +98 -0
edsl/jobs/InterviewsConstructor.py +50 -0
edsl/jobs/Jobs.py +356 -431
edsl/jobs/JobsChecks.py +35 -10
edsl/jobs/JobsComponentConstructor.py +189 -0
edsl/jobs/JobsPrompts.py +6 -4
edsl/jobs/JobsRemoteInferenceHandler.py +205 -133
edsl/jobs/JobsRemoteInferenceLogger.py +239 -0
edsl/jobs/RequestTokenEstimator.py +30 -0
edsl/jobs/async_interview_runner.py +138 -0
edsl/jobs/buckets/BucketCollection.py +44 -3
edsl/jobs/buckets/TokenBucket.py +53 -21
edsl/jobs/buckets/TokenBucketAPI.py +211 -0
edsl/jobs/buckets/TokenBucketClient.py +191 -0
edsl/jobs/check_survey_scenario_compatibility.py +85 -0
edsl/jobs/data_structures.py +120 -0
edsl/jobs/decorators.py +35 -0
edsl/jobs/interviews/Interview.py +143 -408
edsl/jobs/jobs_status_enums.py +9 -0
edsl/jobs/loggers/HTMLTableJobLogger.py +304 -0
edsl/jobs/results_exceptions_handler.py +98 -0
edsl/jobs/runners/JobsRunnerAsyncio.py +88 -403
edsl/jobs/runners/JobsRunnerStatus.py +133 -165
edsl/jobs/tasks/QuestionTaskCreator.py +21 -19
edsl/jobs/tasks/TaskHistory.py +38 -18
edsl/jobs/tasks/task_status_enum.py +0 -2
edsl/language_models/ComputeCost.py +63 -0
edsl/language_models/LanguageModel.py +194 -236
edsl/language_models/ModelList.py +28 -19
edsl/language_models/PriceManager.py +127 -0
edsl/language_models/RawResponseHandler.py +106 -0
edsl/language_models/ServiceDataSources.py +0 -0
edsl/language_models/__init__.py +1 -2
edsl/language_models/key_management/KeyLookup.py +63 -0
edsl/language_models/key_management/KeyLookupBuilder.py +273 -0
edsl/language_models/key_management/KeyLookupCollection.py +38 -0
edsl/language_models/key_management/__init__.py +0 -0
edsl/language_models/key_management/models.py +131 -0
edsl/language_models/model.py +256 -0
edsl/language_models/repair.py +2 -2
edsl/language_models/utilities.py +5 -4
edsl/notebooks/Notebook.py +19 -14
edsl/notebooks/NotebookToLaTeX.py +142 -0
edsl/prompts/Prompt.py +29 -39
edsl/questions/ExceptionExplainer.py +77 -0
edsl/questions/HTMLQuestion.py +103 -0
edsl/questions/QuestionBase.py +68 -214
edsl/questions/QuestionBasePromptsMixin.py +7 -3
edsl/questions/QuestionBudget.py +1 -1
edsl/questions/QuestionCheckBox.py +3 -3
edsl/questions/QuestionExtract.py +5 -7
edsl/questions/QuestionFreeText.py +2 -3
edsl/questions/QuestionList.py +10 -18
edsl/questions/QuestionMatrix.py +265 -0
edsl/questions/QuestionMultipleChoice.py +67 -23
edsl/questions/QuestionNumerical.py +2 -4
edsl/questions/QuestionRank.py +7 -17
edsl/questions/SimpleAskMixin.py +4 -3
edsl/questions/__init__.py +2 -1
edsl/questions/{AnswerValidatorMixin.py → answer_validator_mixin.py} +47 -2
edsl/questions/data_structures.py +20 -0
edsl/questions/derived/QuestionLinearScale.py +6 -3
edsl/questions/derived/QuestionTopK.py +1 -1
edsl/questions/descriptors.py +17 -3
edsl/questions/loop_processor.py +149 -0
edsl/questions/{QuestionBaseGenMixin.py → question_base_gen_mixin.py} +57 -50
edsl/questions/question_registry.py +1 -1
edsl/questions/{ResponseValidatorABC.py → response_validator_abc.py} +40 -26
edsl/questions/response_validator_factory.py +34 -0
edsl/questions/templates/matrix/__init__.py +1 -0
edsl/questions/templates/matrix/answering_instructions.jinja +5 -0
edsl/questions/templates/matrix/question_presentation.jinja +20 -0
edsl/results/CSSParameterizer.py +1 -1
edsl/results/Dataset.py +170 -7
edsl/results/DatasetExportMixin.py +168 -305
edsl/results/DatasetTree.py +28 -8
edsl/results/MarkdownToDocx.py +122 -0
edsl/results/MarkdownToPDF.py +111 -0
edsl/results/Result.py +298 -206
edsl/results/Results.py +149 -131
edsl/results/ResultsExportMixin.py +2 -0
edsl/results/TableDisplay.py +98 -171
edsl/results/TextEditor.py +50 -0
edsl/results/__init__.py +1 -1
edsl/results/file_exports.py +252 -0
edsl/results/{Selector.py → results_selector.py} +23 -13
edsl/results/smart_objects.py +96 -0
edsl/results/table_data_class.py +12 -0
edsl/results/table_renderers.py +118 -0
edsl/scenarios/ConstructDownloadLink.py +109 -0
edsl/scenarios/DocumentChunker.py +102 -0
edsl/scenarios/DocxScenario.py +16 -0
edsl/scenarios/FileStore.py +150 -239
edsl/scenarios/PdfExtractor.py +40 -0
edsl/scenarios/Scenario.py +90 -193
edsl/scenarios/ScenarioHtmlMixin.py +4 -3
edsl/scenarios/ScenarioList.py +415 -244
edsl/scenarios/ScenarioListExportMixin.py +0 -7
edsl/scenarios/ScenarioListPdfMixin.py +15 -37
edsl/scenarios/__init__.py +1 -2
edsl/scenarios/directory_scanner.py +96 -0
edsl/scenarios/file_methods.py +85 -0
edsl/scenarios/handlers/__init__.py +13 -0
edsl/scenarios/handlers/csv.py +49 -0
edsl/scenarios/handlers/docx.py +76 -0
edsl/scenarios/handlers/html.py +37 -0
edsl/scenarios/handlers/json.py +111 -0
edsl/scenarios/handlers/latex.py +5 -0
edsl/scenarios/handlers/md.py +51 -0
edsl/scenarios/handlers/pdf.py +68 -0
edsl/scenarios/handlers/png.py +39 -0
edsl/scenarios/handlers/pptx.py +105 -0
edsl/scenarios/handlers/py.py +294 -0
edsl/scenarios/handlers/sql.py +313 -0
edsl/scenarios/handlers/sqlite.py +149 -0
edsl/scenarios/handlers/txt.py +33 -0
edsl/scenarios/{ScenarioJoin.py → scenario_join.py} +10 -6
edsl/scenarios/scenario_selector.py +156 -0
edsl/study/ObjectEntry.py +1 -1
edsl/study/SnapShot.py +1 -1
edsl/study/Study.py +5 -12
edsl/surveys/ConstructDAG.py +92 -0
edsl/surveys/EditSurvey.py +221 -0
edsl/surveys/InstructionHandler.py +100 -0
edsl/surveys/MemoryManagement.py +72 -0
edsl/surveys/Rule.py +5 -4
edsl/surveys/RuleCollection.py +25 -27
edsl/surveys/RuleManager.py +172 -0
edsl/surveys/Simulator.py +75 -0
edsl/surveys/Survey.py +270 -791
edsl/surveys/SurveyCSS.py +20 -8
edsl/surveys/{SurveyFlowVisualizationMixin.py → SurveyFlowVisualization.py} +11 -9
edsl/surveys/SurveyToApp.py +141 -0
edsl/surveys/__init__.py +4 -2
edsl/surveys/descriptors.py +6 -2
edsl/surveys/instructions/ChangeInstruction.py +1 -2
edsl/surveys/instructions/Instruction.py +4 -13
edsl/surveys/instructions/InstructionCollection.py +11 -6
edsl/templates/error_reporting/interview_details.html +1 -1
edsl/templates/error_reporting/report.html +1 -1
edsl/tools/plotting.py +1 -1
edsl/utilities/PrettyList.py +56 -0
edsl/utilities/is_notebook.py +18 -0
edsl/utilities/is_valid_variable_name.py +11 -0
edsl/utilities/remove_edsl_version.py +24 -0
edsl/utilities/utilities.py +35 -23
{edsl-0.1.38.dev4.dist-info → edsl-0.1.39.dist-info}/METADATA +12 -10
edsl-0.1.39.dist-info/RECORD +358 -0
{edsl-0.1.38.dev4.dist-info → edsl-0.1.39.dist-info}/WHEEL +1 -1
edsl/language_models/KeyLookup.py +0 -30
edsl/language_models/registry.py +0 -190
edsl/language_models/unused/ReplicateBase.py +0 -83
edsl/results/ResultsDBMixin.py +0 -238
edsl-0.1.38.dev4.dist-info/RECORD +0 -277
/edsl/questions/{RegisterQuestionsMeta.py → register_questions_meta.py} +0 -0
/edsl/results/{ResultsFetchMixin.py → results_fetch_mixin.py} +0 -0
/edsl/results/{ResultsToolsMixin.py → results_tools_mixin.py} +0 -0
{edsl-0.1.38.dev4.dist-info → edsl-0.1.39.dist-info}/LICENSE +0 -0

edsl/results/Results.py CHANGED Viewed

@@ -9,13 +9,9 @@ import random
 from collections import UserList, defaultdict
 from typing import Optional, Callable, Any, Type, Union, List, TYPE_CHECKING
-if TYPE_CHECKING:
-    from edsl import Survey, Cache, AgentList, ModelList, ScenarioList
-    from edsl.results.Result import Result
-    from edsl.jobs.tasks.TaskHistory import TaskHistory
-from simpleeval import EvalWithCompoundTypes
+from bisect import bisect_left
+from edsl.Base import Base
 from edsl.exceptions.results import (
     ResultsError,
     ResultsBadMutationstringError,
@@ -26,25 +22,27 @@ from edsl.exceptions.results import (
     ResultsDeserializationError,
 )
+if TYPE_CHECKING:
+    from edsl.surveys.Survey import Survey
+    from edsl.data.Cache import Cache
+    from edsl.agents.AgentList import AgentList
+    from edsl.language_models.model import Model
+    from edsl.scenarios.ScenarioList import ScenarioList
+    from edsl.results.Result import Result
+    from edsl.jobs.tasks.TaskHistory import TaskHistory
+    from edsl.language_models.ModelList import ModelList
+    from simpleeval import EvalWithCompoundTypes
 from edsl.results.ResultsExportMixin import ResultsExportMixin
-from edsl.results.ResultsToolsMixin import ResultsToolsMixin
-from edsl.results.ResultsDBMixin import ResultsDBMixin
 from edsl.results.ResultsGGMixin import ResultsGGMixin
-from edsl.results.ResultsFetchMixin import ResultsFetchMixin
-from edsl.utilities.decorators import remove_edsl_version
-from edsl.utilities.utilities import dict_hash
-from edsl.Base import Base
+from edsl.results.results_fetch_mixin import ResultsFetchMixin
+from edsl.utilities.remove_edsl_version import remove_edsl_version
 class Mixins(
     ResultsExportMixin,
-    ResultsDBMixin,
     ResultsFetchMixin,
     ResultsGGMixin,
-    ResultsToolsMixin,
 ):
     def long(self):
         return self.table().long()
@@ -91,6 +89,7 @@ class Results(UserList, Mixins, Base):
         "question_type",
         "comment",
         "generated_tokens",
+        "cache_used",
     ]
     def __init__(
@@ -129,22 +128,43 @@ class Results(UserList, Mixins, Base):
     def _summary(self) -> dict:
         import reprlib
-        # import yaml
         d = {
-            "EDSL Class": "Results",
-            # "docs_url": self.__documentation__,
-            "# of agents": len(set(self.agents)),
-            "# of distinct models": len(set(self.models)),
-            "# of observations": len(self),
-            "# Scenarios": len(set(self.scenarios)),
-            "Survey Length (# questions)": len(self.survey),
+            "observations": len(self),
+            "agents": len(set(self.agents)),
+            "models": len(set(self.models)),
+            "scenarios": len(set(self.scenarios)),
+            "questions": len(self.survey),
             "Survey question names": reprlib.repr(self.survey.question_names),
-            "Object hash": hash(self),
         }
         return d
-    def compute_job_cost(self, include_cached_responses_in_cost=False) -> float:
+    def insert(self, item):
+        item_order = getattr(item, "order", None)
+        if item_order is not None:
+            # Get list of orders, putting None at the end
+            orders = [getattr(x, "order", None) for x in self]
+            # Filter to just the non-None orders for bisect
+            sorted_orders = [x for x in orders if x is not None]
+            if sorted_orders:
+                index = bisect_left(sorted_orders, item_order)
+                # Account for any None values before this position
+                index += orders[:index].count(None)
+            else:
+                # If no sorted items yet, insert before any unordered items
+                index = 0
+            self.data.insert(index, item)
+        else:
+            # No order - append to end
+            self.data.append(item)
+    def append(self, item):
+        self.insert(item)
+    def extend(self, other):
+        for item in other:
+            self.insert(item)
+    def compute_job_cost(self, include_cached_responses_in_cost: bool = False) -> float:
         """
         Computes the cost of a completed job in USD.
         """
@@ -258,24 +278,6 @@ class Results(UserList, Mixins, Base):
         raise TypeError("Invalid argument type")
-    def _update_results(self) -> None:
-        from edsl import Agent, Scenario
-        from edsl.language_models import LanguageModel
-        from edsl.results import Result
-        if self._job_uuid and len(self.data) < self._total_results:
-            results = [
-                Result(
-                    agent=Agent.from_dict(json.loads(r.agent)),
-                    scenario=Scenario.from_dict(json.loads(r.scenario)),
-                    model=LanguageModel.from_dict(json.loads(r.model)),
-                    iteration=1,
-                    answer=json.loads(r.answer),
-                )
-                for r in CRUD.read_results(self._job_uuid)
-            ]
-            self.data = results
     def __add__(self, other: Results) -> Results:
         """Add two Results objects together.
         They must have the same survey and created columns.
@@ -303,13 +305,10 @@ class Results(UserList, Mixins, Base):
         )
     def __repr__(self) -> str:
-        import reprlib
-        return f"Results(data = {reprlib.repr(self.data)}, survey = {repr(self.survey)}, created_columns = {self.created_columns})"
+        return f"Results(data = {self.data}, survey = {repr(self.survey)}, created_columns = {self.created_columns})"
     def table(
         self,
-        # selector_string: Optional[str] = "*.*",
         *fields,
         tablefmt: Optional[str] = None,
         pretty_labels: Optional[dict] = None,
@@ -345,28 +344,14 @@ class Results(UserList, Mixins, Base):
                 print_parameters=print_parameters,
             )
         )
-        # return (
-        #     self.select(f"{selector_string}")
-        #     .to_scenario_list()
-        #     .table(*fields, tablefmt=tablefmt)
-        # )
-    def _repr_html_(self) -> str:
-        d = self._summary()
-        from edsl import Scenario
-        footer = f"<a href={self.__documentation__}>(docs)</a>"
-        s = Scenario(d)
-        td = s.to_dataset().table(tablefmt="html")
-        return td._repr_html_() + footer
     def to_dict(
         self,
-        sort=False,
-        add_edsl_version=False,
-        include_cache=False,
-        include_task_history=False,
+        sort: bool = False,
+        add_edsl_version: bool = False,
+        include_cache: bool = False,
+        include_task_history: bool = False,
+        include_cache_info: bool = True,
     ) -> dict[str, Any]:
         from edsl.data.Cache import Cache
@@ -377,7 +362,11 @@ class Results(UserList, Mixins, Base):
         d = {
             "data": [
-                result.to_dict(add_edsl_version=add_edsl_version) for result in data
+                result.to_dict(
+                    add_edsl_version=add_edsl_version,
+                    include_cache_info=include_cache_info,
+                )
+                for result in data
             ],
             "survey": self.survey.to_dict(add_edsl_version=add_edsl_version),
             "created_columns": self.created_columns,
@@ -404,7 +393,7 @@ class Results(UserList, Mixins, Base):
         return d
-    def compare(self, other_results):
+    def compare(self, other_results: Results) -> dict:
         """
         Compare two Results objects and return the differences.
         """
@@ -422,11 +411,15 @@ class Results(UserList, Mixins, Base):
         }
     @property
-    def has_unfixed_exceptions(self):
+    def has_unfixed_exceptions(self) -> bool:
         return self.task_history.has_unfixed_exceptions
     def __hash__(self) -> int:
-        return dict_hash(self.to_dict(sort=True, add_edsl_version=False))
+        from edsl.utilities.utilities import dict_hash
+        return dict_hash(
+            self.to_dict(sort=True, add_edsl_version=False, include_cache_info=False)
+        )
     @property
     def hashes(self) -> set:
@@ -472,32 +465,35 @@ class Results(UserList, Mixins, Base):
         >>> r == r2
         True
         """
-        from edsl import Survey, Cache
+        from edsl.surveys.Survey import Survey
+        from edsl.data.Cache import Cache
         from edsl.results.Result import Result
         from edsl.jobs.tasks.TaskHistory import TaskHistory
+        from edsl.agents.Agent import Agent
+        survey = Survey.from_dict(data["survey"])
+        results_data = [Result.from_dict(r) for r in data["data"]]
+        created_columns = data.get("created_columns", None)
+        cache = Cache.from_dict(data.get("cache")) if "cache" in data else Cache()
+        task_history = (
+            TaskHistory.from_dict(data.get("task_history"))
+            if "task_history" in data
+            else TaskHistory(interviews=[])
+        )
+        params = {
+            "survey": survey,
+            "data": results_data,
+            "created_columns": created_columns,
+            "cache": cache,
+            "task_history": task_history,
+        }
         try:
-            results = cls(
-                survey=Survey.from_dict(data["survey"]),
-                data=[Result.from_dict(r) for r in data["data"]],
-                created_columns=data.get("created_columns", None),
-                cache=(
-                    Cache.from_dict(data.get("cache")) if "cache" in data else Cache()
-                ),
-                task_history=(
-                    TaskHistory.from_dict(data.get("task_history"))
-                    if "task_history" in data
-                    else TaskHistory(interviews=[])
-                ),
-            )
+            results = cls(**params)
         except Exception as e:
             raise ResultsDeserializationError(f"Error in Results.from_dict: {e}")
         return results
-    ######################
-    ## Convenience methods
-    ## & Report methods
-    ######################
     @property
     def _key_to_data_type(self) -> dict[str, str]:
         """
@@ -544,10 +540,12 @@ class Results(UserList, Mixins, Base):
         >>> r = Results.example()
         >>> r.columns
-        ['agent.agent_instruction', ...]
+        ['agent.agent_index', ...]
         """
         column_names = [f"{v}.{k}" for k, v in self._key_to_data_type.items()]
-        return sorted(column_names)
+        from edsl.utilities.PrettyList import PrettyList
+        return PrettyList(sorted(column_names))
     @property
     def answer_keys(self) -> dict[str, str]:
@@ -567,7 +565,7 @@ class Results(UserList, Mixins, Base):
         answer_keys = self._data_type_to_keys["answer"]
         answer_keys = {k for k in answer_keys if "_comment" not in k}
         questions_text = [
-            self.survey.get_question(k).question_text for k in answer_keys
+            self.survey._get_question_by_name(k).question_text for k in answer_keys
         ]
         short_question_text = [shorten_string(q, 80) for q in questions_text]
         initial_dict = dict(zip(answer_keys, short_question_text))
@@ -584,7 +582,7 @@ class Results(UserList, Mixins, Base):
         >>> r.agents
         AgentList([Agent(traits = {'status': 'Joyful'}), Agent(traits = {'status': 'Joyful'}), Agent(traits = {'status': 'Sad'}), Agent(traits = {'status': 'Sad'})])
         """
-        from edsl import AgentList
+        from edsl.agents.AgentList import AgentList
         return AgentList([r.agent for r in self.data])
@@ -598,10 +596,13 @@ class Results(UserList, Mixins, Base):
         >>> r.models[0]
         Model(model_name = ...)
         """
-        from edsl import ModelList
+        from edsl.language_models.ModelList import ModelList
         return ModelList([r.model for r in self.data])
+    def __eq__(self, other):
+        return hash(self) == hash(other)
     @property
     def scenarios(self) -> ScenarioList:
         """Return a list of all of the scenarios in the Results.
@@ -610,9 +611,9 @@ class Results(UserList, Mixins, Base):
         >>> r = Results.example()
         >>> r.scenarios
-        ScenarioList([Scenario({'period': 'morning'}), Scenario({'period': 'afternoon'}), Scenario({'period': 'morning'}), Scenario({'period': 'afternoon'})])
+        ScenarioList([Scenario({'period': 'morning', 'scenario_index': 0}), Scenario({'period': 'afternoon', 'scenario_index': 1}), Scenario({'period': 'morning', 'scenario_index': 0}), Scenario({'period': 'afternoon', 'scenario_index': 1})])
         """
-        from edsl import ScenarioList
+        from edsl.scenarios.ScenarioList import ScenarioList
         return ScenarioList([r.scenario for r in self.data])
@@ -624,7 +625,7 @@ class Results(UserList, Mixins, Base):
         >>> r = Results.example()
         >>> r.agent_keys
-        ['agent_instruction', 'agent_name', 'status']
+        ['agent_index', 'agent_instruction', 'agent_name', 'status']
         """
         return sorted(self._data_type_to_keys["agent"])
@@ -634,7 +635,7 @@ class Results(UserList, Mixins, Base):
         >>> r = Results.example()
         >>> r.model_keys
-        ['frequency_penalty', 'logprobs', 'max_tokens', 'model', 'presence_penalty', 'temperature', 'top_logprobs', 'top_p']
+        ['frequency_penalty', 'logprobs', 'max_tokens', 'model', 'model_index', 'presence_penalty', 'temperature', 'top_logprobs', 'top_p']
         """
         return sorted(self._data_type_to_keys["model"])
@@ -644,7 +645,7 @@ class Results(UserList, Mixins, Base):
         >>> r = Results.example()
         >>> r.scenario_keys
-        ['period']
+        ['period', 'scenario_index']
         """
         return sorted(self._data_type_to_keys["scenario"])
@@ -670,7 +671,7 @@ class Results(UserList, Mixins, Base):
         >>> r = Results.example()
         >>> r.all_keys
-        ['agent_instruction', 'agent_name', 'frequency_penalty', 'how_feeling', 'how_feeling_yesterday', 'logprobs', 'max_tokens', 'model', 'period', 'presence_penalty', 'status', 'temperature', 'top_logprobs', 'top_p']
+        ['agent_index', ...]
         """
         answer_keys = set(self.answer_keys)
         all_keys = (
@@ -691,13 +692,19 @@ class Results(UserList, Mixins, Base):
         """
         return self.data[0]
-    def answer_truncate(self, column: str, top_n=5, new_var_name=None) -> Results:
+    def answer_truncate(
+        self, column: str, top_n: int = 5, new_var_name: str = None
+    ) -> Results:
         """Create a new variable that truncates the answers to the top_n.
         :param column: The column to truncate.
         :param top_n: The number of top answers to keep.
         :param new_var_name: The name of the new variable. If None, it is the original name + '_truncated'.
+        Example:
+        >>> r = Results.example()
+        >>> r.answer_truncate('how_feeling', top_n = 2).select('how_feeling', 'how_feeling_truncated')
+        Dataset([{'answer.how_feeling': ['OK', 'Great', 'Terrible', 'OK']}, {'answer.how_feeling_truncated': ['Other', 'Other', 'Other', 'Other']}])
         """
@@ -777,7 +784,7 @@ class Results(UserList, Mixins, Base):
     @staticmethod
     def _create_evaluator(
         result: Result, functions_dict: Optional[dict] = None
-    ) -> EvalWithCompoundTypes:
+    ) -> "EvalWithCompoundTypes":
         """Create an evaluator for the expression.
         >>> from unittest.mock import Mock
@@ -800,6 +807,8 @@ class Results(UserList, Mixins, Base):
         ...
         simpleeval.NameNotDefined: 'how_feeling' is not defined for expression 'how_feeling== 'OK''
         """
+        from simpleeval import EvalWithCompoundTypes
         if functions_dict is None:
             functions_dict = {}
         evaluator = EvalWithCompoundTypes(
@@ -858,6 +867,26 @@ class Results(UserList, Mixins, Base):
             created_columns=self.created_columns + [var_name],
         )
+    def add_column(self, column_name: str, values: list) -> Results:
+        """Adds columns to Results
+        >>> r = Results.example()
+        >>> r.add_column('a', [1,2,3, 4]).select('a')
+        Dataset([{'answer.a': [1, 2, 3, 4]}])
+        """
+        assert len(values) == len(
+            self.data
+        ), "The number of values must match the number of results."
+        new_results = self.data.copy()
+        for i, result in enumerate(new_results):
+            result["answer"][column_name] = values[i]
+        return Results(
+            survey=self.survey,
+            data=new_results,
+            created_columns=self.created_columns + [column_name],
+        )
     def rename(self, old_name: str, new_name: str) -> Results:
         """Rename an answer column in a Results object.
@@ -896,7 +925,7 @@ class Results(UserList, Mixins, Base):
         n: Optional[int] = None,
         frac: Optional[float] = None,
         with_replacement: bool = True,
-        seed: Optional[str] = "edsl",
+        seed: Optional[str] = None,
     ) -> Results:
         """Sample the results.
@@ -911,7 +940,7 @@ class Results(UserList, Mixins, Base):
         >>> len(r.sample(2))
         2
         """
-        if seed != "edsl":
+        if seed:
             random.seed(seed)
         if n is None and frac is None:
@@ -949,7 +978,7 @@ class Results(UserList, Mixins, Base):
         Dataset([{'answer.how_feeling_yesterday': ['Great', 'Good', 'OK', 'Terrible']}])
         """
-        from edsl.results.Selector import Selector
+        from edsl.results.results_selector import Selector
         if len(self) == 0:
             raise Exception("No data to select from---the Results object is empty.")
@@ -964,6 +993,7 @@ class Results(UserList, Mixins, Base):
         return selector.select(*columns)
     def sort_by(self, *columns: str, reverse: bool = False) -> Results:
+        """Sort the results by one or more columns."""
         import warnings
         warnings.warn(
@@ -972,6 +1002,7 @@ class Results(UserList, Mixins, Base):
         return self.order_by(*columns, reverse=reverse)
     def _parse_column(self, column: str) -> tuple[str, str]:
+        """Parse a column name into a data type and key."""
         if "." in column:
             return column.split(".")
         return self._key_to_data_type[column], column
@@ -987,20 +1018,12 @@ class Results(UserList, Mixins, Base):
         Example:
         >>> r = Results.example()
-        >>> r.sort_by('how_feeling', reverse=False).select('how_feeling').print()
-        answer.how_feeling
-        --------------------
-        Great
-        OK
-        OK
-        Terrible
-        >>> r.sort_by('how_feeling', reverse=True).select('how_feeling').print()
-        answer.how_feeling
-        --------------------
-        Terrible
-        OK
-        OK
-        Great
+        >>> r.sort_by('how_feeling', reverse=False).select('how_feeling')
+        Dataset([{'answer.how_feeling': ['Great', 'OK', 'OK', 'Terrible']}])
+        >>> r.sort_by('how_feeling', reverse=True).select('how_feeling')
+        Dataset([{'answer.how_feeling': ['Terrible', 'OK', 'OK', 'Great']}])
         """
         def to_numeric_if_possible(v):
@@ -1032,24 +1055,19 @@ class Results(UserList, Mixins, Base):
         Example usage: Create an example `Results` instance and apply filters to it:
         >>> r = Results.example()
-        >>> r.filter("how_feeling == 'Great'").select('how_feeling').print()
-        answer.how_feeling
-        --------------------
-        Great
+        >>> r.filter("how_feeling == 'Great'").select('how_feeling')
+        Dataset([{'answer.how_feeling': ['Great']}])
         Example usage: Using an OR operator in the filter expression.
-        >>> r = Results.example().filter("how_feeling = 'Great'").select('how_feeling').print()
+        >>> r = Results.example().filter("how_feeling = 'Great'").select('how_feeling')
         Traceback (most recent call last):
         ...
         edsl.exceptions.results.ResultsFilterError: You must use '==' instead of '=' in the filter expression.
         ...
-        >>> r.filter("how_feeling == 'Great' or how_feeling == 'Terrible'").select('how_feeling').print()
-        answer.how_feeling
-        --------------------
-        Great
-        Terrible
+        >>> r.filter("how_feeling == 'Great' or how_feeling == 'Terrible'").select('how_feeling')
+        Dataset([{'answer.how_feeling': ['Great', 'Terrible']}])
         """
         def has_single_equals(string):

edsl/results/ResultsExportMixin.py CHANGED Viewed

@@ -14,6 +14,8 @@ def to_dataset(func):
         """Return the function with the Results object converted to a Dataset object."""
         if self.__class__.__name__ == "Results":
             return func(self.select(), *args, **kwargs)
+        elif self.__class__.__name__ == "AgentList":
+            return func(self.to_dataset(), *args, **kwargs)
         else:
             return func(self, *args, **kwargs)

edsl 0.1.38.dev4__py3-none-any.whl → 0.1.39__py3-none-any.whl

edsl 0.1.38.dev4__py3-none-any.whl → 0.1.39__py3-none-any.whl