PyPI - edsl - Versions diffs - 0.1.38.dev3__py3-none-any.whl → 0.1.38.dev4__py3-none-any.whl - Mend

edsl 0.1.38.dev3py3-none-any.whl → 0.1.38.dev4py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (256) hide show

edsl/Base.py +332 -303
edsl/BaseDiff.py +260 -260
edsl/TemplateLoader.py +24 -24
edsl/__init__.py +49 -49
edsl/__version__.py +1 -1
edsl/agents/Agent.py +867 -858
edsl/agents/AgentList.py +413 -362
edsl/agents/Invigilator.py +233 -222
edsl/agents/InvigilatorBase.py +265 -284
edsl/agents/PromptConstructor.py +354 -353
edsl/agents/__init__.py +3 -3
edsl/agents/descriptors.py +99 -99
edsl/agents/prompt_helpers.py +129 -129
edsl/auto/AutoStudy.py +117 -117
edsl/auto/StageBase.py +230 -230
edsl/auto/StageGenerateSurvey.py +178 -178
edsl/auto/StageLabelQuestions.py +125 -125
edsl/auto/StagePersona.py +61 -61
edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
edsl/auto/StagePersonaDimensionValues.py +74 -74
edsl/auto/StagePersonaDimensions.py +69 -69
edsl/auto/StageQuestions.py +73 -73
edsl/auto/SurveyCreatorPipeline.py +21 -21
edsl/auto/utilities.py +224 -224
edsl/base/Base.py +279 -279
edsl/config.py +157 -149
edsl/conversation/Conversation.py +290 -290
edsl/conversation/car_buying.py +58 -58
edsl/conversation/chips.py +95 -95
edsl/conversation/mug_negotiation.py +81 -81
edsl/conversation/next_speaker_utilities.py +93 -93
edsl/coop/PriceFetcher.py +54 -54
edsl/coop/__init__.py +2 -2
edsl/coop/coop.py +1028 -961
edsl/coop/utils.py +131 -131
edsl/data/Cache.py +555 -530
edsl/data/CacheEntry.py +233 -228
edsl/data/CacheHandler.py +149 -149
edsl/data/RemoteCacheSync.py +78 -97
edsl/data/SQLiteDict.py +292 -292
edsl/data/__init__.py +4 -4
edsl/data/orm.py +10 -10
edsl/data_transfer_models.py +73 -73
edsl/enums.py +175 -173
edsl/exceptions/BaseException.py +21 -21
edsl/exceptions/__init__.py +54 -54
edsl/exceptions/agents.py +42 -42
edsl/exceptions/cache.py +5 -5
edsl/exceptions/configuration.py +16 -16
edsl/exceptions/coop.py +10 -10
edsl/exceptions/data.py +14 -14
edsl/exceptions/general.py +34 -34
edsl/exceptions/jobs.py +33 -33
edsl/exceptions/language_models.py +63 -63
edsl/exceptions/prompts.py +15 -15
edsl/exceptions/questions.py +91 -91
edsl/exceptions/results.py +29 -29
edsl/exceptions/scenarios.py +22 -22
edsl/exceptions/surveys.py +37 -37
edsl/inference_services/AnthropicService.py +87 -87
edsl/inference_services/AwsBedrock.py +120 -120
edsl/inference_services/AzureAI.py +217 -217
edsl/inference_services/DeepInfraService.py +18 -18
edsl/inference_services/GoogleService.py +148 -156
edsl/inference_services/GroqService.py +20 -20
edsl/inference_services/InferenceServiceABC.py +147 -147
edsl/inference_services/InferenceServicesCollection.py +97 -97
edsl/inference_services/MistralAIService.py +123 -123
edsl/inference_services/OllamaService.py +18 -18
edsl/inference_services/OpenAIService.py +224 -224
edsl/inference_services/PerplexityService.py +163 -0
edsl/inference_services/TestService.py +89 -89
edsl/inference_services/TogetherAIService.py +170 -170
edsl/inference_services/models_available_cache.py +118 -118
edsl/inference_services/rate_limits_cache.py +25 -25
edsl/inference_services/registry.py +41 -39
edsl/inference_services/write_available.py +10 -10
edsl/jobs/Answers.py +56 -56
edsl/jobs/Jobs.py +898 -1358
edsl/jobs/JobsChecks.py +147 -0
edsl/jobs/JobsPrompts.py +268 -0
edsl/jobs/JobsRemoteInferenceHandler.py +239 -0
edsl/jobs/__init__.py +1 -1
edsl/jobs/buckets/BucketCollection.py +63 -63
edsl/jobs/buckets/ModelBuckets.py +65 -65
edsl/jobs/buckets/TokenBucket.py +251 -251
edsl/jobs/interviews/Interview.py +661 -661
edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
edsl/jobs/interviews/InterviewExceptionEntry.py +186 -186
edsl/jobs/interviews/InterviewStatistic.py +63 -63
edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
edsl/jobs/interviews/InterviewStatusLog.py +92 -92
edsl/jobs/interviews/ReportErrors.py +66 -66
edsl/jobs/interviews/interview_status_enum.py +9 -9
edsl/jobs/runners/JobsRunnerAsyncio.py +466 -361
edsl/jobs/runners/JobsRunnerStatus.py +330 -332
edsl/jobs/tasks/QuestionTaskCreator.py +242 -242
edsl/jobs/tasks/TaskCreators.py +64 -64
edsl/jobs/tasks/TaskHistory.py +450 -451
edsl/jobs/tasks/TaskStatusLog.py +23 -23
edsl/jobs/tasks/task_status_enum.py +163 -163
edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
edsl/jobs/tokens/TokenUsage.py +34 -34
edsl/language_models/KeyLookup.py +30 -30
edsl/language_models/LanguageModel.py +668 -708
edsl/language_models/ModelList.py +155 -109
edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
edsl/language_models/__init__.py +3 -3
edsl/language_models/fake_openai_call.py +15 -15
edsl/language_models/fake_openai_service.py +61 -61
edsl/language_models/registry.py +190 -137
edsl/language_models/repair.py +156 -156
edsl/language_models/unused/ReplicateBase.py +83 -83
edsl/language_models/utilities.py +64 -64
edsl/notebooks/Notebook.py +258 -258
edsl/notebooks/__init__.py +1 -1
edsl/prompts/Prompt.py +362 -357
edsl/prompts/__init__.py +2 -2
edsl/questions/AnswerValidatorMixin.py +289 -289
edsl/questions/QuestionBase.py +664 -660
edsl/questions/QuestionBaseGenMixin.py +161 -161
edsl/questions/QuestionBasePromptsMixin.py +217 -217
edsl/questions/QuestionBudget.py +227 -227
edsl/questions/QuestionCheckBox.py +359 -359
edsl/questions/QuestionExtract.py +182 -183
edsl/questions/QuestionFreeText.py +114 -114
edsl/questions/QuestionFunctional.py +166 -166
edsl/questions/QuestionList.py +231 -231
edsl/questions/QuestionMultipleChoice.py +286 -286
edsl/questions/QuestionNumerical.py +153 -153
edsl/questions/QuestionRank.py +324 -324
edsl/questions/Quick.py +41 -41
edsl/questions/RegisterQuestionsMeta.py +71 -71
edsl/questions/ResponseValidatorABC.py +174 -174
edsl/questions/SimpleAskMixin.py +73 -73
edsl/questions/__init__.py +26 -26
edsl/questions/compose_questions.py +98 -98
edsl/questions/decorators.py +21 -21
edsl/questions/derived/QuestionLikertFive.py +76 -76
edsl/questions/derived/QuestionLinearScale.py +87 -87
edsl/questions/derived/QuestionTopK.py +93 -93
edsl/questions/derived/QuestionYesNo.py +82 -82
edsl/questions/descriptors.py +413 -413
edsl/questions/prompt_templates/question_budget.jinja +13 -13
edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
edsl/questions/prompt_templates/question_extract.jinja +11 -11
edsl/questions/prompt_templates/question_free_text.jinja +3 -3
edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
edsl/questions/prompt_templates/question_list.jinja +17 -17
edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
edsl/questions/prompt_templates/question_numerical.jinja +36 -36
edsl/questions/question_registry.py +177 -147
edsl/questions/settings.py +12 -12
edsl/questions/templates/budget/answering_instructions.jinja +7 -7
edsl/questions/templates/budget/question_presentation.jinja +7 -7
edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
edsl/questions/templates/extract/answering_instructions.jinja +7 -7
edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
edsl/questions/templates/list/answering_instructions.jinja +3 -3
edsl/questions/templates/list/question_presentation.jinja +5 -5
edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
edsl/questions/templates/numerical/question_presentation.jinja +6 -6
edsl/questions/templates/rank/answering_instructions.jinja +11 -11
edsl/questions/templates/rank/question_presentation.jinja +15 -15
edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
edsl/questions/templates/top_k/question_presentation.jinja +22 -22
edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
edsl/results/CSSParameterizer.py +108 -0
edsl/results/Dataset.py +424 -293
edsl/results/DatasetExportMixin.py +731 -717
edsl/results/DatasetTree.py +275 -145
edsl/results/Result.py +465 -456
edsl/results/Results.py +1165 -1071
edsl/results/ResultsDBMixin.py +238 -238
edsl/results/ResultsExportMixin.py +43 -43
edsl/results/ResultsFetchMixin.py +33 -33
edsl/results/ResultsGGMixin.py +121 -121
edsl/results/ResultsToolsMixin.py +98 -98
edsl/results/Selector.py +135 -135
edsl/results/TableDisplay.py +198 -0
edsl/results/__init__.py +2 -2
edsl/results/table_display.css +78 -0
edsl/results/tree_explore.py +115 -115
edsl/scenarios/FileStore.py +632 -458
edsl/scenarios/Scenario.py +601 -544
edsl/scenarios/ScenarioHtmlMixin.py +64 -64
edsl/scenarios/ScenarioJoin.py +127 -0
edsl/scenarios/ScenarioList.py +1287 -1112
edsl/scenarios/ScenarioListExportMixin.py +52 -52
edsl/scenarios/ScenarioListPdfMixin.py +261 -261
edsl/scenarios/__init__.py +4 -4
edsl/shared.py +1 -1
edsl/study/ObjectEntry.py +173 -173
edsl/study/ProofOfWork.py +113 -113
edsl/study/SnapShot.py +80 -80
edsl/study/Study.py +528 -528
edsl/study/__init__.py +4 -4
edsl/surveys/DAG.py +148 -148
edsl/surveys/Memory.py +31 -31
edsl/surveys/MemoryPlan.py +244 -244
edsl/surveys/Rule.py +326 -326
edsl/surveys/RuleCollection.py +387 -387
edsl/surveys/Survey.py +1801 -1787
edsl/surveys/SurveyCSS.py +261 -261
edsl/surveys/SurveyExportMixin.py +259 -259
edsl/surveys/SurveyFlowVisualizationMixin.py +179 -121
edsl/surveys/SurveyQualtricsImport.py +284 -284
edsl/surveys/__init__.py +3 -3
edsl/surveys/base.py +53 -53
edsl/surveys/descriptors.py +56 -56
edsl/surveys/instructions/ChangeInstruction.py +49 -49
edsl/surveys/instructions/Instruction.py +65 -53
edsl/surveys/instructions/InstructionCollection.py +77 -77
edsl/templates/error_reporting/base.html +23 -23
edsl/templates/error_reporting/exceptions_by_model.html +34 -34
edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
edsl/templates/error_reporting/exceptions_by_type.html +16 -16
edsl/templates/error_reporting/interview_details.html +115 -115
edsl/templates/error_reporting/interviews.html +19 -10
edsl/templates/error_reporting/overview.html +4 -4
edsl/templates/error_reporting/performance_plot.html +1 -1
edsl/templates/error_reporting/report.css +73 -73
edsl/templates/error_reporting/report.html +117 -117
edsl/templates/error_reporting/report.js +25 -25
edsl/tools/__init__.py +1 -1
edsl/tools/clusters.py +192 -192
edsl/tools/embeddings.py +27 -27
edsl/tools/embeddings_plotting.py +118 -118
edsl/tools/plotting.py +112 -112
edsl/tools/summarize.py +18 -18
edsl/utilities/SystemInfo.py +28 -28
edsl/utilities/__init__.py +22 -22
edsl/utilities/ast_utilities.py +25 -25
edsl/utilities/data/Registry.py +6 -6
edsl/utilities/data/__init__.py +1 -1
edsl/utilities/data/scooter_results.json +1 -1
edsl/utilities/decorators.py +77 -77
edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
edsl/utilities/interface.py +627 -627
edsl/utilities/naming_utilities.py +263 -263
edsl/utilities/repair_functions.py +28 -28
edsl/utilities/restricted_python.py +70 -70
edsl/utilities/utilities.py +424 -409
{edsl-0.1.38.dev3.dist-info → edsl-0.1.38.dev4.dist-info}/LICENSE +21 -21
{edsl-0.1.38.dev3.dist-info → edsl-0.1.38.dev4.dist-info}/METADATA +2 -1
edsl-0.1.38.dev4.dist-info/RECORD +277 -0
edsl-0.1.38.dev3.dist-info/RECORD +0 -269
{edsl-0.1.38.dev3.dist-info → edsl-0.1.38.dev4.dist-info}/WHEEL +0 -0

edsl/results/Results.py CHANGED Viewed

@@ -1,1071 +1,1165 @@
-"""
-The Results object is the result of running a survey.
-It is not typically instantiated directly, but is returned by the run method of a `Job` object.
-"""
-from __future__ import annotations
-import json
-import random
-from collections import UserList, defaultdict
-from typing import Optional, Callable, Any, Type, Union, List, TYPE_CHECKING
-if TYPE_CHECKING:
-    from edsl import Survey, Cache, AgentList, ModelList, ScenarioList
-    from edsl.results.Result import Result
-    from edsl.jobs.tasks.TaskHistory import TaskHistory
-from simpleeval import EvalWithCompoundTypes
-from edsl.exceptions.results import (
-    ResultsError,
-    ResultsBadMutationstringError,
-    ResultsColumnNotFoundError,
-    ResultsInvalidNameError,
-    ResultsMutateError,
-    ResultsFilterError,
-    ResultsDeserializationError,
-)
-from edsl.results.ResultsExportMixin import ResultsExportMixin
-from edsl.results.ResultsToolsMixin import ResultsToolsMixin
-from edsl.results.ResultsDBMixin import ResultsDBMixin
-from edsl.results.ResultsGGMixin import ResultsGGMixin
-from edsl.results.ResultsFetchMixin import ResultsFetchMixin
-from edsl.utilities.decorators import add_edsl_version, remove_edsl_version
-from edsl.utilities.utilities import dict_hash
-from edsl.Base import Base
-class Mixins(
-    ResultsExportMixin,
-    ResultsDBMixin,
-    ResultsFetchMixin,
-    ResultsGGMixin,
-    ResultsToolsMixin,
-):
-    def print_long(self, max_rows: int = None) -> None:
-        """Print the results in long format.
-        >>> from edsl.results import Results
-        >>> r = Results.example()
-        >>> r.select('how_feeling').print_long(max_rows = 2)
-        ┏━━━━━━━━━━━━━━┳━━━━━━━━━━━━━┳━━━━━━━┓
-        ┃ Result index ┃ Key         ┃ Value ┃
-        ┡━━━━━━━━━━━━━━╇━━━━━━━━━━━━━╇━━━━━━━┩
-        │ 0            │ how_feeling │ OK    │
-        │ 1            │ how_feeling │ Great │
-        └──────────────┴─────────────┴───────┘
-        """
-        from edsl.utilities.interface import print_results_long
-        print_results_long(self, max_rows=max_rows)
-class Results(UserList, Mixins, Base):
-    """
-    This class is a UserList of Result objects.
-    It is instantiated with a `Survey` and a list of `Result` objects.
-    It can be manipulated in various ways with select, filter, mutate, etc.
-    It also has a list of created_columns, which are columns that have been created with `mutate` and are not part of the original data.
-    """
-    known_data_types = [
-        "answer",
-        "scenario",
-        "agent",
-        "model",
-        "prompt",
-        "raw_model_response",
-        "iteration",
-        "question_text",
-        "question_options",
-        "question_type",
-        "comment",
-        "generated_tokens",
-    ]
-    def __init__(
-        self,
-        survey: Optional[Survey] = None,
-        data: Optional[list[Result]] = None,
-        created_columns: Optional[list[str]] = None,
-        cache: Optional[Cache] = None,
-        job_uuid: Optional[str] = None,
-        total_results: Optional[int] = None,
-        task_history: Optional[TaskHistory] = None,
-    ):
-        """Instantiate a `Results` object with a survey and a list of `Result` objects.
-        :param survey: A Survey object.
-        :param data: A list of Result objects.
-        :param created_columns: A list of strings that are created columns.
-        :param job_uuid: A string representing the job UUID.
-        :param total_results: An integer representing the total number of results.
-        """
-        super().__init__(data)
-        from edsl.data.Cache import Cache
-        from edsl.jobs.tasks.TaskHistory import TaskHistory
-        self.survey = survey
-        self.created_columns = created_columns or []
-        self._job_uuid = job_uuid
-        self._total_results = total_results
-        self.cache = cache or Cache()
-        self.task_history = task_history or TaskHistory(interviews=[])
-        if hasattr(self, "_add_output_functions"):
-            self._add_output_functions()
-    def leaves(self):
-        leaves = []
-        for result in self:
-            leaves.extend(result.leaves())
-        return leaves
-    def tree(
-        self,
-        fold_attributes: Optional[List[str]] = None,
-        drop: Optional[List[str]] = None,
-        open_file=True,
-    ) -> dict:
-        """Return the results as a tree."""
-        from edsl.results.tree_explore import FoldableHTMLTableGenerator
-        if drop is None:
-            drop = []
-        valid_attributes = [
-            "model",
-            "scenario",
-            "agent",
-            "answer",
-            "question",
-            "iteration",
-        ]
-        if fold_attributes is None:
-            fold_attributes = []
-        for attribute in fold_attributes:
-            if attribute not in valid_attributes:
-                raise ValueError(
-                    f"Invalid fold attribute: {attribute}; must be in {valid_attributes}"
-                )
-        data = self.leaves()
-        generator = FoldableHTMLTableGenerator(data)
-        tree = generator.tree(fold_attributes=fold_attributes, drop=drop)
-        html_content = generator.generate_html(tree, fold_attributes)
-        import tempfile
-        from edsl.utilities.utilities import is_notebook
-        from IPython.display import display, HTML
-        if is_notebook():
-            import html
-            from IPython.display import display, HTML
-            height = 1000
-            width = 1000
-            escaped_output = html.escape(html_content)
-            # escaped_output = rendered_html
-            iframe = f""""
-            <iframe srcdoc="{ escaped_output }" style="width: {width}px; height: {height}px;"></iframe>
-            """
-            display(HTML(iframe))
-            return None
-        with tempfile.NamedTemporaryFile(suffix=".html", delete=False) as f:
-            f.write(html_content.encode())
-            print(f"HTML file has been generated: {f.name}")
-            if open_file:
-                import webbrowser
-                import time
-                time.sleep(1)  # Wait for 1 second
-                # webbrowser.open(f.name)
-                import os
-                filename = f.name
-                webbrowser.open(f"file://{os.path.abspath(filename)}")
-            else:
-                return html_content
-    def code(self):
-        raise NotImplementedError
-    def __getitem__(self, i):
-        if isinstance(i, int):
-            return self.data[i]
-        if isinstance(i, slice):
-            return self.__class__(survey=self.survey, data=self.data[i])
-        if isinstance(i, str):
-            return self.to_dict()[i]
-        raise TypeError("Invalid argument type")
-    def _update_results(self) -> None:
-        from edsl import Agent, Scenario
-        from edsl.language_models import LanguageModel
-        from edsl.results import Result
-        if self._job_uuid and len(self.data) < self._total_results:
-            results = [
-                Result(
-                    agent=Agent.from_dict(json.loads(r.agent)),
-                    scenario=Scenario.from_dict(json.loads(r.scenario)),
-                    model=LanguageModel.from_dict(json.loads(r.model)),
-                    iteration=1,
-                    answer=json.loads(r.answer),
-                )
-                for r in CRUD.read_results(self._job_uuid)
-            ]
-            self.data = results
-    def __add__(self, other: Results) -> Results:
-        """Add two Results objects together.
-        They must have the same survey and created columns.
-        :param other: A Results object.
-        Example:
-        >>> r = Results.example()
-        >>> r2 = Results.example()
-        >>> r3 = r + r2
-        """
-        if self.survey != other.survey:
-            raise ResultsError(
-                "The surveys are not the same so the the results cannot be added together."
-            )
-        if self.created_columns != other.created_columns:
-            raise ResultsError(
-                "The created columns are not the same so they cannot be added together."
-            )
-        return Results(
-            survey=self.survey,
-            data=self.data + other.data,
-            created_columns=self.created_columns,
-        )
-    def __repr__(self) -> str:
-        import reprlib
-        return f"Results(data = {reprlib.repr(self.data)}, survey = {repr(self.survey)}, created_columns = {self.created_columns})"
-    def _repr_html_(self) -> str:
-        # from IPython.display import HTML
-        json_str = json.dumps(self.to_dict(add_edsl_version=False)["data"], indent=4)
-        return f"<pre>{json_str}</pre>"
-    def to_dict(self, sort=False, add_edsl_version=False) -> dict[str, Any]:
-        from edsl.data.Cache import Cache
-        if sort:
-            data = sorted([result for result in self.data], key=lambda x: hash(x))
-        else:
-            data = [result for result in self.data]
-        d = {
-            "data": [
-                result.to_dict(add_edsl_version=add_edsl_version) for result in data
-            ],
-            "survey": self.survey.to_dict(add_edsl_version=add_edsl_version),
-            "created_columns": self.created_columns,
-            "cache": (
-                Cache()
-                if not hasattr(self, "cache")
-                else self.cache.to_dict(add_edsl_version=add_edsl_version)
-            ),
-            "task_history": self.task_history.to_dict(),
-        }
-        if add_edsl_version:
-            from edsl import __version__
-            d["edsl_version"] = __version__
-            d["edsl_class_name"] = "Results"
-        return d
-    def compare(self, other_results):
-        """
-        Compare two Results objects and return the differences.
-        """
-        hashes_0 = [hash(result) for result in self]
-        hashes_1 = [hash(result) for result in other_results]
-        in_self_but_not_other = set(hashes_0).difference(set(hashes_1))
-        in_other_but_not_self = set(hashes_1).difference(set(hashes_0))
-        indicies_self = [hashes_0.index(h) for h in in_self_but_not_other]
-        indices_other = [hashes_1.index(h) for h in in_other_but_not_self]
-        return {
-            "a_not_b": [self[i] for i in indicies_self],
-            "b_not_a": [other_results[i] for i in indices_other],
-        }
-    @property
-    def has_unfixed_exceptions(self):
-        return self.task_history.has_unfixed_exceptions
-    def __hash__(self) -> int:
-        return dict_hash(self.to_dict(sort=True, add_edsl_version=False))
-    @property
-    def hashes(self) -> set:
-        return set(hash(result) for result in self.data)
-    def sample(self, n: int) -> Results:
-        """Return a random sample of the results.
-        :param n: The number of samples to return.
-        >>> from edsl.results import Results
-        >>> r = Results.example()
-        >>> len(r.sample(2))
-        2
-        """
-        indices = None
-        for entry in self:
-            key, values = list(entry.items())[0]
-            if indices is None:  # gets the indices for the first time
-                indices = list(range(len(values)))
-                sampled_indices = random.sample(indices, n)
-                if n > len(indices):
-                    raise ResultsError(
-                        f"Cannot sample {n} items from a list of length {len(indices)}."
-                    )
-            entry[key] = [values[i] for i in sampled_indices]
-        return self
-    @classmethod
-    @remove_edsl_version
-    def from_dict(cls, data: dict[str, Any]) -> Results:
-        """Convert a dictionary to a Results object.
-        :param data: A dictionary representation of a Results object.
-        Example:
-        >>> r = Results.example()
-        >>> d = r.to_dict()
-        >>> r2 = Results.from_dict(d)
-        >>> r == r2
-        True
-        """
-        from edsl import Survey, Cache
-        from edsl.results.Result import Result
-        from edsl.jobs.tasks.TaskHistory import TaskHistory
-        try:
-            results = cls(
-                survey=Survey.from_dict(data["survey"]),
-                data=[Result.from_dict(r) for r in data["data"]],
-                created_columns=data.get("created_columns", None),
-                cache=(
-                    Cache.from_dict(data.get("cache")) if "cache" in data else Cache()
-                ),
-                task_history=TaskHistory.from_dict(data.get("task_history")),
-            )
-        except Exception as e:
-            raise ResultsDeserializationError(f"Error in Results.from_dict: {e}")
-        return results
-    ######################
-    ## Convenience methods
-    ## & Report methods
-    ######################
-    @property
-    def _key_to_data_type(self) -> dict[str, str]:
-        """
-        Return a mapping of keys (how_feeling, status, etc.) to strings representing data types.
-        Objects such as Agent, Answer, Model, Scenario, etc.
-        - Uses the key_to_data_type property of the Result class.
-        - Includes any columns that the user has created with `mutate`
-        """
-        d: dict = {}
-        for result in self.data:
-            d.update(result.key_to_data_type)
-        for column in self.created_columns:
-            d[column] = "answer"
-        return d
-    @property
-    def _data_type_to_keys(self) -> dict[str, str]:
-        """
-        Return a mapping of strings representing data types (objects such as Agent, Answer, Model, Scenario, etc.) to keys (how_feeling, status, etc.)
-        - Uses the key_to_data_type property of the Result class.
-        - Includes any columns that the user has created with `mutate`
-        Example:
-        >>> r = Results.example()
-        >>> r._data_type_to_keys
-        defaultdict(...
-        """
-        d: dict = defaultdict(set)
-        for result in self.data:
-            for key, value in result.key_to_data_type.items():
-                d[value] = d[value].union(set({key}))
-        for column in self.created_columns:
-            d["answer"] = d["answer"].union(set({column}))
-        return d
-    @property
-    def columns(self) -> list[str]:
-        """Return a list of all of the columns that are in the Results.
-        Example:
-        >>> r = Results.example()
-        >>> r.columns
-        ['agent.agent_instruction', ...]
-        """
-        column_names = [f"{v}.{k}" for k, v in self._key_to_data_type.items()]
-        return sorted(column_names)
-    @property
-    def answer_keys(self) -> dict[str, str]:
-        """Return a mapping of answer keys to question text.
-        Example:
-        >>> r = Results.example()
-        >>> r.answer_keys
-        {'how_feeling': 'How are you this {{ period }}?', 'how_feeling_yesterday': 'How were you feeling yesterday {{ period }}?'}
-        """
-        from edsl.utilities.utilities import shorten_string
-        if not self.survey:
-            raise ResultsError("Survey is not defined so no answer keys are available.")
-        answer_keys = self._data_type_to_keys["answer"]
-        answer_keys = {k for k in answer_keys if "_comment" not in k}
-        questions_text = [
-            self.survey.get_question(k).question_text for k in answer_keys
-        ]
-        short_question_text = [shorten_string(q, 80) for q in questions_text]
-        initial_dict = dict(zip(answer_keys, short_question_text))
-        sorted_dict = {key: initial_dict[key] for key in sorted(initial_dict)}
-        return sorted_dict
-    @property
-    def agents(self) -> AgentList:
-        """Return a list of all of the agents in the Results.
-        Example:
-        >>> r = Results.example()
-        >>> r.agents
-        AgentList([Agent(traits = {'status': 'Joyful'}), Agent(traits = {'status': 'Joyful'}), Agent(traits = {'status': 'Sad'}), Agent(traits = {'status': 'Sad'})])
-        """
-        from edsl import AgentList
-        return AgentList([r.agent for r in self.data])
-    @property
-    def models(self) -> ModelList:
-        """Return a list of all of the models in the Results.
-        Example:
-        >>> r = Results.example()
-        >>> r.models[0]
-        Model(model_name = ...)
-        """
-        from edsl import ModelList
-        return ModelList([r.model for r in self.data])
-    @property
-    def scenarios(self) -> ScenarioList:
-        """Return a list of all of the scenarios in the Results.
-        Example:
-        >>> r = Results.example()
-        >>> r.scenarios
-        ScenarioList([Scenario({'period': 'morning'}), Scenario({'period': 'afternoon'}), Scenario({'period': 'morning'}), Scenario({'period': 'afternoon'})])
-        """
-        from edsl import ScenarioList
-        return ScenarioList([r.scenario for r in self.data])
-    @property
-    def agent_keys(self) -> list[str]:
-        """Return a set of all of the keys that are in the Agent data.
-        Example:
-        >>> r = Results.example()
-        >>> r.agent_keys
-        ['agent_instruction', 'agent_name', 'status']
-        """
-        return sorted(self._data_type_to_keys["agent"])
-    @property
-    def model_keys(self) -> list[str]:
-        """Return a set of all of the keys that are in the LanguageModel data.
-        >>> r = Results.example()
-        >>> r.model_keys
-        ['frequency_penalty', 'logprobs', 'max_tokens', 'model', 'presence_penalty', 'temperature', 'top_logprobs', 'top_p']
-        """
-        return sorted(self._data_type_to_keys["model"])
-    @property
-    def scenario_keys(self) -> list[str]:
-        """Return a set of all of the keys that are in the Scenario data.
-        >>> r = Results.example()
-        >>> r.scenario_keys
-        ['period']
-        """
-        return sorted(self._data_type_to_keys["scenario"])
-    @property
-    def question_names(self) -> list[str]:
-        """Return a list of all of the question names.
-        Example:
-        >>> r = Results.example()
-        >>> r.question_names
-        ['how_feeling', 'how_feeling_yesterday']
-        """
-        if self.survey is None:
-            return []
-        return sorted(list(self.survey.question_names))
-    @property
-    def all_keys(self) -> list[str]:
-        """Return a set of all of the keys that are in the Results.
-        Example:
-        >>> r = Results.example()
-        >>> r.all_keys
-        ['agent_instruction', 'agent_name', 'frequency_penalty', 'how_feeling', 'how_feeling_yesterday', 'logprobs', 'max_tokens', 'model', 'period', 'presence_penalty', 'status', 'temperature', 'top_logprobs', 'top_p']
-        """
-        answer_keys = set(self.answer_keys)
-        all_keys = (
-            answer_keys.union(self.agent_keys)
-            .union(self.scenario_keys)
-            .union(self.model_keys)
-        )
-        return sorted(list(all_keys))
-    def first(self) -> Result:
-        """Return the first observation in the results.
-        Example:
-        >>> r = Results.example()
-        >>> r.first()
-        Result(agent...
-        """
-        return self.data[0]
-    def answer_truncate(self, column: str, top_n=5, new_var_name=None) -> Results:
-        """Create a new variable that truncates the answers to the top_n.
-        :param column: The column to truncate.
-        :param top_n: The number of top answers to keep.
-        :param new_var_name: The name of the new variable. If None, it is the original name + '_truncated'.
-        """
-        if new_var_name is None:
-            new_var_name = column + "_truncated"
-        answers = list(self.select(column).tally().keys())
-        def f(x):
-            if x in answers[:top_n]:
-                return x
-            else:
-                return "Other"
-        return self.recode(column, recode_function=f, new_var_name=new_var_name)
-    def recode(
-        self, column: str, recode_function: Optional[Callable], new_var_name=None
-    ) -> Results:
-        """
-        Recode a column in the Results object.
-        >>> r = Results.example()
-        >>> r.recode('how_feeling', recode_function = lambda x: 1 if x == 'Great' else 0).select('how_feeling', 'how_feeling_recoded')
-        Dataset([{'answer.how_feeling': ['OK', 'Great', 'Terrible', 'OK']}, {'answer.how_feeling_recoded': [0, 1, 0, 0]}])
-        """
-        if new_var_name is None:
-            new_var_name = column + "_recoded"
-        new_data = []
-        for result in self.data:
-            new_result = result.copy()
-            value = new_result.get_value("answer", column)
-            # breakpoint()
-            new_result["answer"][new_var_name] = recode_function(value)
-            new_data.append(new_result)
-        # print("Created new variable", new_var_name)
-        return Results(
-            survey=self.survey,
-            data=new_data,
-            created_columns=self.created_columns + [new_var_name],
-        )
-    def add_column(self, column_name: str, values: list) -> Results:
-        """Adds columns to Results
-        >>> r = Results.example()
-        >>> r.add_column('a', [1,2,3, 4]).select('a')
-        Dataset([{'answer.a': [1, 2, 3, 4]}])
-        """
-        assert len(values) == len(
-            self.data
-        ), "The number of values must match the number of results."
-        new_results = self.data.copy()
-        for i, result in enumerate(new_results):
-            result["answer"][column_name] = values[i]
-        return Results(
-            survey=self.survey,
-            data=new_results,
-            created_columns=self.created_columns + [column_name],
-        )
-    def add_columns_from_dict(self, columns: List[dict]) -> Results:
-        """Adds columns to Results from a list of dictionaries.
-        >>> r = Results.example()
-        >>> r.add_columns_from_dict([{'a': 1, 'b': 2}, {'a': 3, 'b': 4}, {'a':3, 'b':2}, {'a':3, 'b':2}]).select('a', 'b')
-        Dataset([{'answer.a': [1, 3, 3, 3]}, {'answer.b': [2, 4, 2, 2]}])
-        """
-        keys = list(columns[0].keys())
-        for key in keys:
-            values = [d[key] for d in columns]
-            self = self.add_column(key, values)
-        return self
-    @staticmethod
-    def _create_evaluator(
-        result: Result, functions_dict: Optional[dict] = None
-    ) -> EvalWithCompoundTypes:
-        """Create an evaluator for the expression.
-        >>> from unittest.mock import Mock
-        >>> result = Mock()
-        >>> result.combined_dict = {'how_feeling': 'OK'}
-        >>> evaluator = Results._create_evaluator(result = result, functions_dict = {})
-        >>> evaluator.eval("how_feeling == 'OK'")
-        True
-        >>> result.combined_dict = {'answer': {'how_feeling': 'OK'}}
-        >>> evaluator = Results._create_evaluator(result = result, functions_dict = {})
-        >>> evaluator.eval("answer.how_feeling== 'OK'")
-        True
-        Note that you need to refer to the answer dictionary in the expression.
-        >>> evaluator.eval("how_feeling== 'OK'")
-        Traceback (most recent call last):
-        ...
-        simpleeval.NameNotDefined: 'how_feeling' is not defined for expression 'how_feeling== 'OK''
-        """
-        if functions_dict is None:
-            functions_dict = {}
-        evaluator = EvalWithCompoundTypes(
-            names=result.combined_dict, functions=functions_dict
-        )
-        evaluator.functions.update(int=int, float=float)
-        return evaluator
-    def mutate(
-        self, new_var_string: str, functions_dict: Optional[dict] = None
-    ) -> Results:
-        """
-        Creates a value in the Results object as if has been asked as part of the survey.
-        :param new_var_string: A string that is a valid Python expression.
-        :param functions_dict: A dictionary of functions that can be used in the expression. The keys are the function names and the values are the functions themselves.
-        It splits the new_var_string at the "=" and uses simple_eval
-        Example:
-        >>> r = Results.example()
-        >>> r.mutate('how_feeling_x = how_feeling + "x"').select('how_feeling_x')
-        Dataset([{'answer.how_feeling_x': ...
-        """
-        # extract the variable name and the expression
-        if "=" not in new_var_string:
-            raise ResultsBadMutationstringError(
-                f"Mutate requires an '=' in the string, but '{new_var_string}' doesn't have one."
-            )
-        raw_var_name, expression = new_var_string.split("=", 1)
-        var_name = raw_var_name.strip()
-        from edsl.utilities.utilities import is_valid_variable_name
-        if not is_valid_variable_name(var_name):
-            raise ResultsInvalidNameError(f"{var_name} is not a valid variable name.")
-        # create the evaluator
-        functions_dict = functions_dict or {}
-        def new_result(old_result: "Result", var_name: str) -> "Result":
-            evaluator = self._create_evaluator(old_result, functions_dict)
-            value = evaluator.eval(expression)
-            new_result = old_result.copy()
-            new_result["answer"][var_name] = value
-            return new_result
-        try:
-            new_data = [new_result(result, var_name) for result in self.data]
-        except Exception as e:
-            raise ResultsMutateError(f"Error in mutate. Exception:{e}")
-        return Results(
-            survey=self.survey,
-            data=new_data,
-            created_columns=self.created_columns + [var_name],
-        )
-    def rename(self, old_name: str, new_name: str) -> Results:
-        """Rename an answer column in a Results object.
-        >>> s = Results.example()
-        >>> s.rename('how_feeling', 'how_feeling_new').select('how_feeling_new')
-        Dataset([{'answer.how_feeling_new': ['OK', 'Great', 'Terrible', 'OK']}])
-        # TODO: Should we allow renaming of scenario fields as well? Probably.
-        """
-        for obs in self.data:
-            obs["answer"][new_name] = obs["answer"][old_name]
-            del obs["answer"][old_name]
-        return self
-    def shuffle(self, seed: Optional[str] = "edsl") -> Results:
-        """Shuffle the results.
-        Example:
-        >>> r = Results.example()
-        >>> r.shuffle(seed = 1)[0]
-        Result(...)
-        """
-        if seed != "edsl":
-            seed = random.seed(seed)
-        new_data = self.data.copy()
-        random.shuffle(new_data)
-        return Results(survey=self.survey, data=new_data, created_columns=None)
-    def sample(
-        self,
-        n: Optional[int] = None,
-        frac: Optional[float] = None,
-        with_replacement: bool = True,
-        seed: Optional[str] = "edsl",
-    ) -> Results:
-        """Sample the results.
-        :param n: An integer representing the number of samples to take.
-        :param frac: A float representing the fraction of samples to take.
-        :param with_replacement: A boolean representing whether to sample with replacement.
-        :param seed: An integer representing the seed for the random number generator.
-        Example:
-        >>> r = Results.example()
-        >>> len(r.sample(2))
-        2
-        """
-        if seed != "edsl":
-            random.seed(seed)
-        if n is None and frac is None:
-            raise Exception("You must specify either n or frac.")
-        if n is not None and frac is not None:
-            raise Exception("You cannot specify both n and frac.")
-        if frac is not None and n is None:
-            n = int(frac * len(self.data))
-        if with_replacement:
-            new_data = random.choices(self.data, k=n)
-        else:
-            new_data = random.sample(self.data, n)
-        return Results(survey=self.survey, data=new_data, created_columns=None)
-    def select(self, *columns: Union[str, list[str]]) -> Results:
-        """
-        Select data from the results and format it.
-        :param columns: A list of strings, each of which is a column name. The column name can be a single key, e.g. "how_feeling", or a dot-separated string, e.g. "answer.how_feeling".
-        Example:
-        >>> results = Results.example()
-        >>> results.select('how_feeling')
-        Dataset([{'answer.how_feeling': ['OK', 'Great', 'Terrible', 'OK']}])
-        >>> results.select('how_feeling', 'model', 'how_feeling')
-        Dataset([{'answer.how_feeling': ['OK', 'Great', 'Terrible', 'OK']}, {'answer.how_feeling': ['OK', 'Great', 'Terrible', 'OK']}, {'model.model': ['...', '...', '...', '...']}, {'answer.how_feeling': ['OK', 'Great', 'Terrible', 'OK']}, {'answer.how_feeling': ['OK', 'Great', 'Terrible', 'OK']}])
-        >>> from edsl import Results; r = Results.example(); r.select('answer.how_feeling_y')
-        Dataset([{'answer.how_feeling_yesterday': ['Great', 'Good', 'OK', 'Terrible']}])
-        """
-        from edsl.results.Selector import Selector
-        if len(self) == 0:
-            raise Exception("No data to select from---the Results object is empty.")
-        selector = Selector(
-            known_data_types=self.known_data_types,
-            data_type_to_keys=self._data_type_to_keys,
-            key_to_data_type=self._key_to_data_type,
-            fetch_list_func=self._fetch_list,
-            columns=self.columns,
-        )
-        return selector.select(*columns)
-    def sort_by(self, *columns: str, reverse: bool = False) -> Results:
-        import warnings
-        warnings.warn(
-            "sort_by is deprecated. Use order_by instead.", DeprecationWarning
-        )
-        return self.order_by(*columns, reverse=reverse)
-    def _parse_column(self, column: str) -> tuple[str, str]:
-        if "." in column:
-            return column.split(".")
-        return self._key_to_data_type[column], column
-    def order_by(self, *columns: str, reverse: bool = False) -> Results:
-        """Sort the results by one or more columns.
-        :param columns: One or more column names as strings.
-        :param reverse: A boolean that determines whether to sort in reverse order.
-        Each column name can be a single key, e.g. "how_feeling", or a dot-separated string, e.g. "answer.how_feeling".
-        Example:
-        >>> r = Results.example()
-        >>> r.sort_by('how_feeling', reverse=False).select('how_feeling').print()
-        ┏━━━━━━━━━━━━━━┓
-        ┃ answer       ┃
-        ┃ .how_feeling ┃
-        ┡━━━━━━━━━━━━━━┩
-        │ Great        │
-        ├──────────────┤
-        │ OK           │
-        ├──────────────┤
-        │ OK           │
-        ├──────────────┤
-        │ Terrible     │
-        └──────────────┘
-        >>> r.sort_by('how_feeling', reverse=True).select('how_feeling').print()
-        ┏━━━━━━━━━━━━━━┓
-        ┃ answer       ┃
-        ┃ .how_feeling ┃
-        ┡━━━━━━━━━━━━━━┩
-        │ Terrible     │
-        ├──────────────┤
-        │ OK           │
-        ├──────────────┤
-        │ OK           │
-        ├──────────────┤
-        │ Great        │
-        └──────────────┘
-        """
-        def to_numeric_if_possible(v):
-            try:
-                return float(v)
-            except:
-                return v
-        def sort_key(item):
-            key_components = []
-            for col in columns:
-                data_type, key = self._parse_column(col)
-                value = item.get_value(data_type, key)
-                key_components.append(to_numeric_if_possible(value))
-            return tuple(key_components)
-        new_data = sorted(self.data, key=sort_key, reverse=reverse)
-        return Results(survey=self.survey, data=new_data, created_columns=None)
-    def filter(self, expression: str) -> Results:
-        """
-        Filter based on the given expression and returns the filtered `Results`.
-        :param expression: A string expression that evaluates to a boolean. The expression is applied to each element in `Results` to determine whether it should be included in the filtered results.
-        The `expression` parameter is a string that must resolve to a boolean value when evaluated against each element in `Results`.
-        This expression is used to determine which elements to include in the returned `Results`.
-        Example usage: Create an example `Results` instance and apply filters to it:
-        >>> r = Results.example()
-        >>> r.filter("how_feeling == 'Great'").select('how_feeling').print()
-        ┏━━━━━━━━━━━━━━┓
-        ┃ answer       ┃
-        ┃ .how_feeling ┃
-        ┡━━━━━━━━━━━━━━┩
-        │ Great        │
-        └──────────────┘
-        Example usage: Using an OR operator in the filter expression.
-        >>> r = Results.example().filter("how_feeling = 'Great'").select('how_feeling').print()
-        Traceback (most recent call last):
-        ...
-        edsl.exceptions.results.ResultsFilterError: You must use '==' instead of '=' in the filter expression.
-        ...
-        >>> r.filter("how_feeling == 'Great' or how_feeling == 'Terrible'").select('how_feeling').print()
-        ┏━━━━━━━━━━━━━━┓
-        ┃ answer       ┃
-        ┃ .how_feeling ┃
-        ┡━━━━━━━━━━━━━━┩
-        │ Great        │
-        ├──────────────┤
-        │ Terrible     │
-        └──────────────┘
-        """
-        def has_single_equals(string):
-            if "!=" in string:
-                return False
-            if "=" in string and not (
-                "==" in string or "<=" in string or ">=" in string
-            ):
-                return True
-        if has_single_equals(expression):
-            raise ResultsFilterError(
-                "You must use '==' instead of '=' in the filter expression."
-            )
-        try:
-            # iterates through all the results and evaluates the expression
-            new_data = []
-            for result in self.data:
-                evaluator = self._create_evaluator(result)
-                result.check_expression(expression)  # check expression
-                if evaluator.eval(expression):
-                    new_data.append(result)
-        except ValueError as e:
-            raise ResultsFilterError(
-                f"Error in filter. Exception:{e}",
-                f"The expression you provided was: {expression}",
-                "See https://docs.expectedparrot.com/en/latest/results.html#filtering-results for more details.",
-            )
-        except Exception as e:
-            raise ResultsFilterError(
-                f"""Error in filter. Exception:{e}.""",
-                f"""The expression you provided was: {expression}.""",
-                """Please make sure that the expression is a valid Python expression that evaluates to a boolean.""",
-                """For example, 'how_feeling == "Great"' is a valid expression, as is 'how_feeling in ["Great", "Terrible"]'., """,
-                """However, 'how_feeling = "Great"' is not a valid expression.""",
-                """See https://docs.expectedparrot.com/en/latest/results.html#filtering-results for more details.""",
-            )
-        if len(new_data) == 0:
-            import warnings
-            warnings.warn("No results remain after applying the filter.")
-        return Results(survey=self.survey, data=new_data, created_columns=None)
-    @classmethod
-    def example(cls, randomize: bool = False) -> Results:
-        """Return an example `Results` object.
-        Example usage:
-        >>> r = Results.example()
-        :param debug: if False, uses actual API calls
-        """
-        from edsl.jobs.Jobs import Jobs
-        from edsl.data.Cache import Cache
-        c = Cache()
-        job = Jobs.example(randomize=randomize)
-        results = job.run(
-            cache=c,
-            stop_on_exception=True,
-            skip_retry=True,
-            raise_validation_errors=True,
-            disable_remote_cache=True,
-            disable_remote_inference=True,
-        )
-        return results
-    def rich_print(self):
-        """Display an object as a table."""
-        pass
-    def __str__(self):
-        data = self.to_dict()["data"]
-        return json.dumps(data, indent=4)
-    def show_exceptions(self, traceback=False):
-        """Print the exceptions."""
-        if hasattr(self, "task_history"):
-            self.task_history.show_exceptions(traceback)
-        else:
-            print("No exceptions to show.")
-    def score(self, f: Callable) -> list:
-        """Score the results using in a function.
-        :param f: A function that takes values from a Resul object and returns a score.
-        >>> r = Results.example()
-        >>> def f(status): return 1 if status == 'Joyful' else 0
-        >>> r.score(f)
-        [1, 1, 0, 0]
-        """
-        return [r.score(f) for r in self.data]
-def main():  # pragma: no cover
-    """Call the OpenAI API credits."""
-    from edsl.results.Results import Results
-    results = Results.example(debug=True)
-    print(results.filter("how_feeling == 'Great'").select("how_feeling"))
-    print(results.mutate("how_feeling_x = how_feeling + 'x'").select("how_feeling_x"))
-if __name__ == "__main__":
-    import doctest
-    doctest.testmod(optionflags=doctest.ELLIPSIS)
+"""
+The Results object is the result of running a survey.
+It is not typically instantiated directly, but is returned by the run method of a `Job` object.
+"""
+from __future__ import annotations
+import json
+import random
+from collections import UserList, defaultdict
+from typing import Optional, Callable, Any, Type, Union, List, TYPE_CHECKING
+if TYPE_CHECKING:
+    from edsl import Survey, Cache, AgentList, ModelList, ScenarioList
+    from edsl.results.Result import Result
+    from edsl.jobs.tasks.TaskHistory import TaskHistory
+from simpleeval import EvalWithCompoundTypes
+from edsl.exceptions.results import (
+    ResultsError,
+    ResultsBadMutationstringError,
+    ResultsColumnNotFoundError,
+    ResultsInvalidNameError,
+    ResultsMutateError,
+    ResultsFilterError,
+    ResultsDeserializationError,
+)
+from edsl.results.ResultsExportMixin import ResultsExportMixin
+from edsl.results.ResultsToolsMixin import ResultsToolsMixin
+from edsl.results.ResultsDBMixin import ResultsDBMixin
+from edsl.results.ResultsGGMixin import ResultsGGMixin
+from edsl.results.ResultsFetchMixin import ResultsFetchMixin
+from edsl.utilities.decorators import remove_edsl_version
+from edsl.utilities.utilities import dict_hash
+from edsl.Base import Base
+class Mixins(
+    ResultsExportMixin,
+    ResultsDBMixin,
+    ResultsFetchMixin,
+    ResultsGGMixin,
+    ResultsToolsMixin,
+):
+    def long(self):
+        return self.table().long()
+    def print_long(self, max_rows: int = None) -> None:
+        """Print the results in long format.
+        >>> from edsl.results import Results
+        >>> r = Results.example()
+        >>> r.select('how_feeling').print_long(max_rows = 2)
+        ┏━━━━━━━━━━━━━━┳━━━━━━━━━━━━━┳━━━━━━━┓
+        ┃ Result index ┃ Key         ┃ Value ┃
+        ┡━━━━━━━━━━━━━━╇━━━━━━━━━━━━━╇━━━━━━━┩
+        │ 0            │ how_feeling │ OK    │
+        │ 1            │ how_feeling │ Great │
+        └──────────────┴─────────────┴───────┘
+        """
+        from edsl.utilities.interface import print_results_long
+        print_results_long(self, max_rows=max_rows)
+class Results(UserList, Mixins, Base):
+    """
+    This class is a UserList of Result objects.
+    It is instantiated with a `Survey` and a list of `Result` objects.
+    It can be manipulated in various ways with select, filter, mutate, etc.
+    It also has a list of created_columns, which are columns that have been created with `mutate` and are not part of the original data.
+    """
+    __documentation__ = "https://docs.expectedparrot.com/en/latest/results.html"
+    known_data_types = [
+        "answer",
+        "scenario",
+        "agent",
+        "model",
+        "prompt",
+        "raw_model_response",
+        "iteration",
+        "question_text",
+        "question_options",
+        "question_type",
+        "comment",
+        "generated_tokens",
+    ]
+    def __init__(
+        self,
+        survey: Optional[Survey] = None,
+        data: Optional[list[Result]] = None,
+        created_columns: Optional[list[str]] = None,
+        cache: Optional[Cache] = None,
+        job_uuid: Optional[str] = None,
+        total_results: Optional[int] = None,
+        task_history: Optional[TaskHistory] = None,
+    ):
+        """Instantiate a `Results` object with a survey and a list of `Result` objects.
+        :param survey: A Survey object.
+        :param data: A list of Result objects.
+        :param created_columns: A list of strings that are created columns.
+        :param job_uuid: A string representing the job UUID.
+        :param total_results: An integer representing the total number of results.
+        """
+        super().__init__(data)
+        from edsl.data.Cache import Cache
+        from edsl.jobs.tasks.TaskHistory import TaskHistory
+        self.survey = survey
+        self.created_columns = created_columns or []
+        self._job_uuid = job_uuid
+        self._total_results = total_results
+        self.cache = cache or Cache()
+        self.task_history = task_history or TaskHistory(interviews=[])
+        if hasattr(self, "_add_output_functions"):
+            self._add_output_functions()
+    def _summary(self) -> dict:
+        import reprlib
+        # import yaml
+        d = {
+            "EDSL Class": "Results",
+            # "docs_url": self.__documentation__,
+            "# of agents": len(set(self.agents)),
+            "# of distinct models": len(set(self.models)),
+            "# of observations": len(self),
+            "# Scenarios": len(set(self.scenarios)),
+            "Survey Length (# questions)": len(self.survey),
+            "Survey question names": reprlib.repr(self.survey.question_names),
+            "Object hash": hash(self),
+        }
+        return d
+    def compute_job_cost(self, include_cached_responses_in_cost=False) -> float:
+        """
+        Computes the cost of a completed job in USD.
+        """
+        total_cost = 0
+        for result in self:
+            for key in result.raw_model_response:
+                if key.endswith("_cost"):
+                    result_cost = result.raw_model_response[key]
+                    question_name = key.removesuffix("_cost")
+                    cache_used = result.cache_used_dict[question_name]
+                    if isinstance(result_cost, (int, float)):
+                        if include_cached_responses_in_cost:
+                            total_cost += result_cost
+                        elif not include_cached_responses_in_cost and not cache_used:
+                            total_cost += result_cost
+        return total_cost
+    def leaves(self):
+        leaves = []
+        for result in self:
+            leaves.extend(result.leaves())
+        return leaves
+    def tree(self, node_list: Optional[List[str]] = None):
+        return self.to_scenario_list().tree(node_list)
+    def interactive_tree(
+        self,
+        fold_attributes: Optional[List[str]] = None,
+        drop: Optional[List[str]] = None,
+        open_file=True,
+    ) -> dict:
+        """Return the results as a tree."""
+        from edsl.results.tree_explore import FoldableHTMLTableGenerator
+        if drop is None:
+            drop = []
+        valid_attributes = [
+            "model",
+            "scenario",
+            "agent",
+            "answer",
+            "question",
+            "iteration",
+        ]
+        if fold_attributes is None:
+            fold_attributes = []
+        for attribute in fold_attributes:
+            if attribute not in valid_attributes:
+                raise ValueError(
+                    f"Invalid fold attribute: {attribute}; must be in {valid_attributes}"
+                )
+        data = self.leaves()
+        generator = FoldableHTMLTableGenerator(data)
+        tree = generator.tree(fold_attributes=fold_attributes, drop=drop)
+        html_content = generator.generate_html(tree, fold_attributes)
+        import tempfile
+        from edsl.utilities.utilities import is_notebook
+        from IPython.display import display, HTML
+        if is_notebook():
+            import html
+            from IPython.display import display, HTML
+            height = 1000
+            width = 1000
+            escaped_output = html.escape(html_content)
+            # escaped_output = rendered_html
+            iframe = f""""
+            <iframe srcdoc="{ escaped_output }" style="width: {width}px; height: {height}px;"></iframe>
+            """
+            display(HTML(iframe))
+            return None
+        with tempfile.NamedTemporaryFile(suffix=".html", delete=False) as f:
+            f.write(html_content.encode())
+            print(f"HTML file has been generated: {f.name}")
+            if open_file:
+                import webbrowser
+                import time
+                time.sleep(1)  # Wait for 1 second
+                # webbrowser.open(f.name)
+                import os
+                filename = f.name
+                webbrowser.open(f"file://{os.path.abspath(filename)}")
+            else:
+                return html_content
+    def code(self):
+        raise NotImplementedError
+    def __getitem__(self, i):
+        if isinstance(i, int):
+            return self.data[i]
+        if isinstance(i, slice):
+            return self.__class__(survey=self.survey, data=self.data[i])
+        if isinstance(i, str):
+            return self.to_dict()[i]
+        raise TypeError("Invalid argument type")
+    def _update_results(self) -> None:
+        from edsl import Agent, Scenario
+        from edsl.language_models import LanguageModel
+        from edsl.results import Result
+        if self._job_uuid and len(self.data) < self._total_results:
+            results = [
+                Result(
+                    agent=Agent.from_dict(json.loads(r.agent)),
+                    scenario=Scenario.from_dict(json.loads(r.scenario)),
+                    model=LanguageModel.from_dict(json.loads(r.model)),
+                    iteration=1,
+                    answer=json.loads(r.answer),
+                )
+                for r in CRUD.read_results(self._job_uuid)
+            ]
+            self.data = results
+    def __add__(self, other: Results) -> Results:
+        """Add two Results objects together.
+        They must have the same survey and created columns.
+        :param other: A Results object.
+        Example:
+        >>> r = Results.example()
+        >>> r2 = Results.example()
+        >>> r3 = r + r2
+        """
+        if self.survey != other.survey:
+            raise ResultsError(
+                "The surveys are not the same so the the results cannot be added together."
+            )
+        if self.created_columns != other.created_columns:
+            raise ResultsError(
+                "The created columns are not the same so they cannot be added together."
+            )
+        return Results(
+            survey=self.survey,
+            data=self.data + other.data,
+            created_columns=self.created_columns,
+        )
+    def __repr__(self) -> str:
+        import reprlib
+        return f"Results(data = {reprlib.repr(self.data)}, survey = {repr(self.survey)}, created_columns = {self.created_columns})"
+    def table(
+        self,
+        # selector_string: Optional[str] = "*.*",
+        *fields,
+        tablefmt: Optional[str] = None,
+        pretty_labels: Optional[dict] = None,
+        print_parameters: Optional[dict] = None,
+    ):
+        new_fields = []
+        for field in fields:
+            if "." in field:
+                data_type, key = field.split(".")
+                if data_type not in self.known_data_types:
+                    raise ResultsInvalidNameError(
+                        f"{data_type} is not a valid data type. Must be in {self.known_data_types}"
+                    )
+                if key == "*":
+                    for k in self._data_type_to_keys[data_type]:
+                        new_fields.append(k)
+                else:
+                    if key not in self._key_to_data_type:
+                        raise ResultsColumnNotFoundError(
+                            f"{key} is not a valid key. Must be in {self._key_to_data_type}"
+                        )
+                    new_fields.append(key)
+            else:
+                new_fields.append(field)
+        return (
+            self.to_scenario_list()
+            .to_dataset()
+            .table(
+                *new_fields,
+                tablefmt=tablefmt,
+                pretty_labels=pretty_labels,
+                print_parameters=print_parameters,
+            )
+        )
+        # return (
+        #     self.select(f"{selector_string}")
+        #     .to_scenario_list()
+        #     .table(*fields, tablefmt=tablefmt)
+        # )
+    def _repr_html_(self) -> str:
+        d = self._summary()
+        from edsl import Scenario
+        footer = f"<a href={self.__documentation__}>(docs)</a>"
+        s = Scenario(d)
+        td = s.to_dataset().table(tablefmt="html")
+        return td._repr_html_() + footer
+    def to_dict(
+        self,
+        sort=False,
+        add_edsl_version=False,
+        include_cache=False,
+        include_task_history=False,
+    ) -> dict[str, Any]:
+        from edsl.data.Cache import Cache
+        if sort:
+            data = sorted([result for result in self.data], key=lambda x: hash(x))
+        else:
+            data = [result for result in self.data]
+        d = {
+            "data": [
+                result.to_dict(add_edsl_version=add_edsl_version) for result in data
+            ],
+            "survey": self.survey.to_dict(add_edsl_version=add_edsl_version),
+            "created_columns": self.created_columns,
+        }
+        if include_cache:
+            d.update(
+                {
+                    "cache": (
+                        Cache()
+                        if not hasattr(self, "cache")
+                        else self.cache.to_dict(add_edsl_version=add_edsl_version)
+                    )
+                }
+            )
+        if self.task_history.has_unfixed_exceptions or include_task_history:
+            d.update({"task_history": self.task_history.to_dict()})
+        if add_edsl_version:
+            from edsl import __version__
+            d["edsl_version"] = __version__
+            d["edsl_class_name"] = "Results"
+        return d
+    def compare(self, other_results):
+        """
+        Compare two Results objects and return the differences.
+        """
+        hashes_0 = [hash(result) for result in self]
+        hashes_1 = [hash(result) for result in other_results]
+        in_self_but_not_other = set(hashes_0).difference(set(hashes_1))
+        in_other_but_not_self = set(hashes_1).difference(set(hashes_0))
+        indicies_self = [hashes_0.index(h) for h in in_self_but_not_other]
+        indices_other = [hashes_1.index(h) for h in in_other_but_not_self]
+        return {
+            "a_not_b": [self[i] for i in indicies_self],
+            "b_not_a": [other_results[i] for i in indices_other],
+        }
+    @property
+    def has_unfixed_exceptions(self):
+        return self.task_history.has_unfixed_exceptions
+    def __hash__(self) -> int:
+        return dict_hash(self.to_dict(sort=True, add_edsl_version=False))
+    @property
+    def hashes(self) -> set:
+        return set(hash(result) for result in self.data)
+    def sample(self, n: int) -> Results:
+        """Return a random sample of the results.
+        :param n: The number of samples to return.
+        >>> from edsl.results import Results
+        >>> r = Results.example()
+        >>> len(r.sample(2))
+        2
+        """
+        indices = None
+        for entry in self:
+            key, values = list(entry.items())[0]
+            if indices is None:  # gets the indices for the first time
+                indices = list(range(len(values)))
+                sampled_indices = random.sample(indices, n)
+                if n > len(indices):
+                    raise ResultsError(
+                        f"Cannot sample {n} items from a list of length {len(indices)}."
+                    )
+            entry[key] = [values[i] for i in sampled_indices]
+        return self
+    @classmethod
+    @remove_edsl_version
+    def from_dict(cls, data: dict[str, Any]) -> Results:
+        """Convert a dictionary to a Results object.
+        :param data: A dictionary representation of a Results object.
+        Example:
+        >>> r = Results.example()
+        >>> d = r.to_dict()
+        >>> r2 = Results.from_dict(d)
+        >>> r == r2
+        True
+        """
+        from edsl import Survey, Cache
+        from edsl.results.Result import Result
+        from edsl.jobs.tasks.TaskHistory import TaskHistory
+        try:
+            results = cls(
+                survey=Survey.from_dict(data["survey"]),
+                data=[Result.from_dict(r) for r in data["data"]],
+                created_columns=data.get("created_columns", None),
+                cache=(
+                    Cache.from_dict(data.get("cache")) if "cache" in data else Cache()
+                ),
+                task_history=(
+                    TaskHistory.from_dict(data.get("task_history"))
+                    if "task_history" in data
+                    else TaskHistory(interviews=[])
+                ),
+            )
+        except Exception as e:
+            raise ResultsDeserializationError(f"Error in Results.from_dict: {e}")
+        return results
+    ######################
+    ## Convenience methods
+    ## & Report methods
+    ######################
+    @property
+    def _key_to_data_type(self) -> dict[str, str]:
+        """
+        Return a mapping of keys (how_feeling, status, etc.) to strings representing data types.
+        Objects such as Agent, Answer, Model, Scenario, etc.
+        - Uses the key_to_data_type property of the Result class.
+        - Includes any columns that the user has created with `mutate`
+        """
+        d: dict = {}
+        for result in self.data:
+            d.update(result.key_to_data_type)
+        for column in self.created_columns:
+            d[column] = "answer"
+        return d
+    @property
+    def _data_type_to_keys(self) -> dict[str, str]:
+        """
+        Return a mapping of strings representing data types (objects such as Agent, Answer, Model, Scenario, etc.) to keys (how_feeling, status, etc.)
+        - Uses the key_to_data_type property of the Result class.
+        - Includes any columns that the user has created with `mutate`
+        Example:
+        >>> r = Results.example()
+        >>> r._data_type_to_keys
+        defaultdict(...
+        """
+        d: dict = defaultdict(set)
+        for result in self.data:
+            for key, value in result.key_to_data_type.items():
+                d[value] = d[value].union(set({key}))
+        for column in self.created_columns:
+            d["answer"] = d["answer"].union(set({column}))
+        return d
+    @property
+    def columns(self) -> list[str]:
+        """Return a list of all of the columns that are in the Results.
+        Example:
+        >>> r = Results.example()
+        >>> r.columns
+        ['agent.agent_instruction', ...]
+        """
+        column_names = [f"{v}.{k}" for k, v in self._key_to_data_type.items()]
+        return sorted(column_names)
+    @property
+    def answer_keys(self) -> dict[str, str]:
+        """Return a mapping of answer keys to question text.
+        Example:
+        >>> r = Results.example()
+        >>> r.answer_keys
+        {'how_feeling': 'How are you this {{ period }}?', 'how_feeling_yesterday': 'How were you feeling yesterday {{ period }}?'}
+        """
+        from edsl.utilities.utilities import shorten_string
+        if not self.survey:
+            raise ResultsError("Survey is not defined so no answer keys are available.")
+        answer_keys = self._data_type_to_keys["answer"]
+        answer_keys = {k for k in answer_keys if "_comment" not in k}
+        questions_text = [
+            self.survey.get_question(k).question_text for k in answer_keys
+        ]
+        short_question_text = [shorten_string(q, 80) for q in questions_text]
+        initial_dict = dict(zip(answer_keys, short_question_text))
+        sorted_dict = {key: initial_dict[key] for key in sorted(initial_dict)}
+        return sorted_dict
+    @property
+    def agents(self) -> AgentList:
+        """Return a list of all of the agents in the Results.
+        Example:
+        >>> r = Results.example()
+        >>> r.agents
+        AgentList([Agent(traits = {'status': 'Joyful'}), Agent(traits = {'status': 'Joyful'}), Agent(traits = {'status': 'Sad'}), Agent(traits = {'status': 'Sad'})])
+        """
+        from edsl import AgentList
+        return AgentList([r.agent for r in self.data])
+    @property
+    def models(self) -> ModelList:
+        """Return a list of all of the models in the Results.
+        Example:
+        >>> r = Results.example()
+        >>> r.models[0]
+        Model(model_name = ...)
+        """
+        from edsl import ModelList
+        return ModelList([r.model for r in self.data])
+    @property
+    def scenarios(self) -> ScenarioList:
+        """Return a list of all of the scenarios in the Results.
+        Example:
+        >>> r = Results.example()
+        >>> r.scenarios
+        ScenarioList([Scenario({'period': 'morning'}), Scenario({'period': 'afternoon'}), Scenario({'period': 'morning'}), Scenario({'period': 'afternoon'})])
+        """
+        from edsl import ScenarioList
+        return ScenarioList([r.scenario for r in self.data])
+    @property
+    def agent_keys(self) -> list[str]:
+        """Return a set of all of the keys that are in the Agent data.
+        Example:
+        >>> r = Results.example()
+        >>> r.agent_keys
+        ['agent_instruction', 'agent_name', 'status']
+        """
+        return sorted(self._data_type_to_keys["agent"])
+    @property
+    def model_keys(self) -> list[str]:
+        """Return a set of all of the keys that are in the LanguageModel data.
+        >>> r = Results.example()
+        >>> r.model_keys
+        ['frequency_penalty', 'logprobs', 'max_tokens', 'model', 'presence_penalty', 'temperature', 'top_logprobs', 'top_p']
+        """
+        return sorted(self._data_type_to_keys["model"])
+    @property
+    def scenario_keys(self) -> list[str]:
+        """Return a set of all of the keys that are in the Scenario data.
+        >>> r = Results.example()
+        >>> r.scenario_keys
+        ['period']
+        """
+        return sorted(self._data_type_to_keys["scenario"])
+    @property
+    def question_names(self) -> list[str]:
+        """Return a list of all of the question names.
+        Example:
+        >>> r = Results.example()
+        >>> r.question_names
+        ['how_feeling', 'how_feeling_yesterday']
+        """
+        if self.survey is None:
+            return []
+        return sorted(list(self.survey.question_names))
+    @property
+    def all_keys(self) -> list[str]:
+        """Return a set of all of the keys that are in the Results.
+        Example:
+        >>> r = Results.example()
+        >>> r.all_keys
+        ['agent_instruction', 'agent_name', 'frequency_penalty', 'how_feeling', 'how_feeling_yesterday', 'logprobs', 'max_tokens', 'model', 'period', 'presence_penalty', 'status', 'temperature', 'top_logprobs', 'top_p']
+        """
+        answer_keys = set(self.answer_keys)
+        all_keys = (
+            answer_keys.union(self.agent_keys)
+            .union(self.scenario_keys)
+            .union(self.model_keys)
+        )
+        return sorted(list(all_keys))
+    def first(self) -> Result:
+        """Return the first observation in the results.
+        Example:
+        >>> r = Results.example()
+        >>> r.first()
+        Result(agent...
+        """
+        return self.data[0]
+    def answer_truncate(self, column: str, top_n=5, new_var_name=None) -> Results:
+        """Create a new variable that truncates the answers to the top_n.
+        :param column: The column to truncate.
+        :param top_n: The number of top answers to keep.
+        :param new_var_name: The name of the new variable. If None, it is the original name + '_truncated'.
+        """
+        if new_var_name is None:
+            new_var_name = column + "_truncated"
+        answers = list(self.select(column).tally().keys())
+        def f(x):
+            if x in answers[:top_n]:
+                return x
+            else:
+                return "Other"
+        return self.recode(column, recode_function=f, new_var_name=new_var_name)
+    def recode(
+        self, column: str, recode_function: Optional[Callable], new_var_name=None
+    ) -> Results:
+        """
+        Recode a column in the Results object.
+        >>> r = Results.example()
+        >>> r.recode('how_feeling', recode_function = lambda x: 1 if x == 'Great' else 0).select('how_feeling', 'how_feeling_recoded')
+        Dataset([{'answer.how_feeling': ['OK', 'Great', 'Terrible', 'OK']}, {'answer.how_feeling_recoded': [0, 1, 0, 0]}])
+        """
+        if new_var_name is None:
+            new_var_name = column + "_recoded"
+        new_data = []
+        for result in self.data:
+            new_result = result.copy()
+            value = new_result.get_value("answer", column)
+            # breakpoint()
+            new_result["answer"][new_var_name] = recode_function(value)
+            new_data.append(new_result)
+        # print("Created new variable", new_var_name)
+        return Results(
+            survey=self.survey,
+            data=new_data,
+            created_columns=self.created_columns + [new_var_name],
+        )
+    def add_column(self, column_name: str, values: list) -> Results:
+        """Adds columns to Results
+        >>> r = Results.example()
+        >>> r.add_column('a', [1,2,3, 4]).select('a')
+        Dataset([{'answer.a': [1, 2, 3, 4]}])
+        """
+        assert len(values) == len(
+            self.data
+        ), "The number of values must match the number of results."
+        new_results = self.data.copy()
+        for i, result in enumerate(new_results):
+            result["answer"][column_name] = values[i]
+        return Results(
+            survey=self.survey,
+            data=new_results,
+            created_columns=self.created_columns + [column_name],
+        )
+    def add_columns_from_dict(self, columns: List[dict]) -> Results:
+        """Adds columns to Results from a list of dictionaries.
+        >>> r = Results.example()
+        >>> r.add_columns_from_dict([{'a': 1, 'b': 2}, {'a': 3, 'b': 4}, {'a':3, 'b':2}, {'a':3, 'b':2}]).select('a', 'b')
+        Dataset([{'answer.a': [1, 3, 3, 3]}, {'answer.b': [2, 4, 2, 2]}])
+        """
+        keys = list(columns[0].keys())
+        for key in keys:
+            values = [d[key] for d in columns]
+            self = self.add_column(key, values)
+        return self
+    @staticmethod
+    def _create_evaluator(
+        result: Result, functions_dict: Optional[dict] = None
+    ) -> EvalWithCompoundTypes:
+        """Create an evaluator for the expression.
+        >>> from unittest.mock import Mock
+        >>> result = Mock()
+        >>> result.combined_dict = {'how_feeling': 'OK'}
+        >>> evaluator = Results._create_evaluator(result = result, functions_dict = {})
+        >>> evaluator.eval("how_feeling == 'OK'")
+        True
+        >>> result.combined_dict = {'answer': {'how_feeling': 'OK'}}
+        >>> evaluator = Results._create_evaluator(result = result, functions_dict = {})
+        >>> evaluator.eval("answer.how_feeling== 'OK'")
+        True
+        Note that you need to refer to the answer dictionary in the expression.
+        >>> evaluator.eval("how_feeling== 'OK'")
+        Traceback (most recent call last):
+        ...
+        simpleeval.NameNotDefined: 'how_feeling' is not defined for expression 'how_feeling== 'OK''
+        """
+        if functions_dict is None:
+            functions_dict = {}
+        evaluator = EvalWithCompoundTypes(
+            names=result.combined_dict, functions=functions_dict
+        )
+        evaluator.functions.update(int=int, float=float)
+        return evaluator
+    def mutate(
+        self, new_var_string: str, functions_dict: Optional[dict] = None
+    ) -> Results:
+        """
+        Creates a value in the Results object as if has been asked as part of the survey.
+        :param new_var_string: A string that is a valid Python expression.
+        :param functions_dict: A dictionary of functions that can be used in the expression. The keys are the function names and the values are the functions themselves.
+        It splits the new_var_string at the "=" and uses simple_eval
+        Example:
+        >>> r = Results.example()
+        >>> r.mutate('how_feeling_x = how_feeling + "x"').select('how_feeling_x')
+        Dataset([{'answer.how_feeling_x': ...
+        """
+        # extract the variable name and the expression
+        if "=" not in new_var_string:
+            raise ResultsBadMutationstringError(
+                f"Mutate requires an '=' in the string, but '{new_var_string}' doesn't have one."
+            )
+        raw_var_name, expression = new_var_string.split("=", 1)
+        var_name = raw_var_name.strip()
+        from edsl.utilities.utilities import is_valid_variable_name
+        if not is_valid_variable_name(var_name):
+            raise ResultsInvalidNameError(f"{var_name} is not a valid variable name.")
+        # create the evaluator
+        functions_dict = functions_dict or {}
+        def new_result(old_result: "Result", var_name: str) -> "Result":
+            evaluator = self._create_evaluator(old_result, functions_dict)
+            value = evaluator.eval(expression)
+            new_result = old_result.copy()
+            new_result["answer"][var_name] = value
+            return new_result
+        try:
+            new_data = [new_result(result, var_name) for result in self.data]
+        except Exception as e:
+            raise ResultsMutateError(f"Error in mutate. Exception:{e}")
+        return Results(
+            survey=self.survey,
+            data=new_data,
+            created_columns=self.created_columns + [var_name],
+        )
+    def rename(self, old_name: str, new_name: str) -> Results:
+        """Rename an answer column in a Results object.
+        >>> s = Results.example()
+        >>> s.rename('how_feeling', 'how_feeling_new').select('how_feeling_new')
+        Dataset([{'answer.how_feeling_new': ['OK', 'Great', 'Terrible', 'OK']}])
+        # TODO: Should we allow renaming of scenario fields as well? Probably.
+        """
+        for obs in self.data:
+            obs["answer"][new_name] = obs["answer"][old_name]
+            del obs["answer"][old_name]
+        return self
+    def shuffle(self, seed: Optional[str] = "edsl") -> Results:
+        """Shuffle the results.
+        Example:
+        >>> r = Results.example()
+        >>> r.shuffle(seed = 1)[0]
+        Result(...)
+        """
+        if seed != "edsl":
+            seed = random.seed(seed)
+        new_data = self.data.copy()
+        random.shuffle(new_data)
+        return Results(survey=self.survey, data=new_data, created_columns=None)
+    def sample(
+        self,
+        n: Optional[int] = None,
+        frac: Optional[float] = None,
+        with_replacement: bool = True,
+        seed: Optional[str] = "edsl",
+    ) -> Results:
+        """Sample the results.
+        :param n: An integer representing the number of samples to take.
+        :param frac: A float representing the fraction of samples to take.
+        :param with_replacement: A boolean representing whether to sample with replacement.
+        :param seed: An integer representing the seed for the random number generator.
+        Example:
+        >>> r = Results.example()
+        >>> len(r.sample(2))
+        2
+        """
+        if seed != "edsl":
+            random.seed(seed)
+        if n is None and frac is None:
+            raise Exception("You must specify either n or frac.")
+        if n is not None and frac is not None:
+            raise Exception("You cannot specify both n and frac.")
+        if frac is not None and n is None:
+            n = int(frac * len(self.data))
+        if with_replacement:
+            new_data = random.choices(self.data, k=n)
+        else:
+            new_data = random.sample(self.data, n)
+        return Results(survey=self.survey, data=new_data, created_columns=None)
+    def select(self, *columns: Union[str, list[str]]) -> Results:
+        """
+        Select data from the results and format it.
+        :param columns: A list of strings, each of which is a column name. The column name can be a single key, e.g. "how_feeling", or a dot-separated string, e.g. "answer.how_feeling".
+        Example:
+        >>> results = Results.example()
+        >>> results.select('how_feeling')
+        Dataset([{'answer.how_feeling': ['OK', 'Great', 'Terrible', 'OK']}])
+        >>> results.select('how_feeling', 'model', 'how_feeling')
+        Dataset([{'answer.how_feeling': ['OK', 'Great', 'Terrible', 'OK']}, {'answer.how_feeling': ['OK', 'Great', 'Terrible', 'OK']}, {'model.model': ['...', '...', '...', '...']}, {'answer.how_feeling': ['OK', 'Great', 'Terrible', 'OK']}, {'answer.how_feeling': ['OK', 'Great', 'Terrible', 'OK']}])
+        >>> from edsl import Results; r = Results.example(); r.select('answer.how_feeling_y')
+        Dataset([{'answer.how_feeling_yesterday': ['Great', 'Good', 'OK', 'Terrible']}])
+        """
+        from edsl.results.Selector import Selector
+        if len(self) == 0:
+            raise Exception("No data to select from---the Results object is empty.")
+        selector = Selector(
+            known_data_types=self.known_data_types,
+            data_type_to_keys=self._data_type_to_keys,
+            key_to_data_type=self._key_to_data_type,
+            fetch_list_func=self._fetch_list,
+            columns=self.columns,
+        )
+        return selector.select(*columns)
+    def sort_by(self, *columns: str, reverse: bool = False) -> Results:
+        import warnings
+        warnings.warn(
+            "sort_by is deprecated. Use order_by instead.", DeprecationWarning
+        )
+        return self.order_by(*columns, reverse=reverse)
+    def _parse_column(self, column: str) -> tuple[str, str]:
+        if "." in column:
+            return column.split(".")
+        return self._key_to_data_type[column], column
+    def order_by(self, *columns: str, reverse: bool = False) -> Results:
+        """Sort the results by one or more columns.
+        :param columns: One or more column names as strings.
+        :param reverse: A boolean that determines whether to sort in reverse order.
+        Each column name can be a single key, e.g. "how_feeling", or a dot-separated string, e.g. "answer.how_feeling".
+        Example:
+        >>> r = Results.example()
+        >>> r.sort_by('how_feeling', reverse=False).select('how_feeling').print()
+        answer.how_feeling
+        --------------------
+        Great
+        OK
+        OK
+        Terrible
+        >>> r.sort_by('how_feeling', reverse=True).select('how_feeling').print()
+        answer.how_feeling
+        --------------------
+        Terrible
+        OK
+        OK
+        Great
+        """
+        def to_numeric_if_possible(v):
+            try:
+                return float(v)
+            except:
+                return v
+        def sort_key(item):
+            key_components = []
+            for col in columns:
+                data_type, key = self._parse_column(col)
+                value = item.get_value(data_type, key)
+                key_components.append(to_numeric_if_possible(value))
+            return tuple(key_components)
+        new_data = sorted(self.data, key=sort_key, reverse=reverse)
+        return Results(survey=self.survey, data=new_data, created_columns=None)
+    def filter(self, expression: str) -> Results:
+        """
+        Filter based on the given expression and returns the filtered `Results`.
+        :param expression: A string expression that evaluates to a boolean. The expression is applied to each element in `Results` to determine whether it should be included in the filtered results.
+        The `expression` parameter is a string that must resolve to a boolean value when evaluated against each element in `Results`.
+        This expression is used to determine which elements to include in the returned `Results`.
+        Example usage: Create an example `Results` instance and apply filters to it:
+        >>> r = Results.example()
+        >>> r.filter("how_feeling == 'Great'").select('how_feeling').print()
+        answer.how_feeling
+        --------------------
+        Great
+        Example usage: Using an OR operator in the filter expression.
+        >>> r = Results.example().filter("how_feeling = 'Great'").select('how_feeling').print()
+        Traceback (most recent call last):
+        ...
+        edsl.exceptions.results.ResultsFilterError: You must use '==' instead of '=' in the filter expression.
+        ...
+        >>> r.filter("how_feeling == 'Great' or how_feeling == 'Terrible'").select('how_feeling').print()
+        answer.how_feeling
+        --------------------
+        Great
+        Terrible
+        """
+        def has_single_equals(string):
+            if "!=" in string:
+                return False
+            if "=" in string and not (
+                "==" in string or "<=" in string or ">=" in string
+            ):
+                return True
+        if has_single_equals(expression):
+            raise ResultsFilterError(
+                "You must use '==' instead of '=' in the filter expression."
+            )
+        try:
+            # iterates through all the results and evaluates the expression
+            new_data = []
+            for result in self.data:
+                evaluator = self._create_evaluator(result)
+                result.check_expression(expression)  # check expression
+                if evaluator.eval(expression):
+                    new_data.append(result)
+        except ValueError as e:
+            raise ResultsFilterError(
+                f"Error in filter. Exception:{e}",
+                f"The expression you provided was: {expression}",
+                "See https://docs.expectedparrot.com/en/latest/results.html#filtering-results for more details.",
+            )
+        except Exception as e:
+            raise ResultsFilterError(
+                f"""Error in filter. Exception:{e}.""",
+                f"""The expression you provided was: {expression}.""",
+                """Please make sure that the expression is a valid Python expression that evaluates to a boolean.""",
+                """For example, 'how_feeling == "Great"' is a valid expression, as is 'how_feeling in ["Great", "Terrible"]'., """,
+                """However, 'how_feeling = "Great"' is not a valid expression.""",
+                """See https://docs.expectedparrot.com/en/latest/results.html#filtering-results for more details.""",
+            )
+        if len(new_data) == 0:
+            import warnings
+            warnings.warn("No results remain after applying the filter.")
+        return Results(survey=self.survey, data=new_data, created_columns=None)
+    @classmethod
+    def example(cls, randomize: bool = False) -> Results:
+        """Return an example `Results` object.
+        Example usage:
+        >>> r = Results.example()
+        :param debug: if False, uses actual API calls
+        """
+        from edsl.jobs.Jobs import Jobs
+        from edsl.data.Cache import Cache
+        c = Cache()
+        job = Jobs.example(randomize=randomize)
+        results = job.run(
+            cache=c,
+            stop_on_exception=True,
+            skip_retry=True,
+            raise_validation_errors=True,
+            disable_remote_cache=True,
+            disable_remote_inference=True,
+        )
+        return results
+    def rich_print(self):
+        """Display an object as a table."""
+        pass
+    def __str__(self):
+        data = self.to_dict()["data"]
+        return json.dumps(data, indent=4)
+    def show_exceptions(self, traceback=False):
+        """Print the exceptions."""
+        if hasattr(self, "task_history"):
+            self.task_history.show_exceptions(traceback)
+        else:
+            print("No exceptions to show.")
+    def score(self, f: Callable) -> list:
+        """Score the results using in a function.
+        :param f: A function that takes values from a Resul object and returns a score.
+        >>> r = Results.example()
+        >>> def f(status): return 1 if status == 'Joyful' else 0
+        >>> r.score(f)
+        [1, 1, 0, 0]
+        """
+        return [r.score(f) for r in self.data]
+def main():  # pragma: no cover
+    """Call the OpenAI API credits."""
+    from edsl.results.Results import Results
+    results = Results.example(debug=True)
+    print(results.filter("how_feeling == 'Great'").select("how_feeling"))
+    print(results.mutate("how_feeling_x = how_feeling + 'x'").select("how_feeling_x"))
+if __name__ == "__main__":
+    import doctest
+    doctest.testmod(optionflags=doctest.ELLIPSIS)

edsl 0.1.38.dev3__py3-none-any.whl → 0.1.38.dev4__py3-none-any.whl

edsl 0.1.38.dev3py3-none-any.whl → 0.1.38.dev4py3-none-any.whl