PyPI - edsl - Versions diffs - 0.1.39.dev2__py3-none-any.whl → 0.1.39.dev3__py3-none-any.whl - Mend

edsl 0.1.39.dev2__py3-none-any.whl → 0.1.39.dev3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (334) hide show

edsl/Base.py +332 -385
edsl/BaseDiff.py +260 -260
edsl/TemplateLoader.py +24 -24
edsl/__init__.py +49 -57
edsl/__version__.py +1 -1
edsl/agents/Agent.py +867 -1079
edsl/agents/AgentList.py +413 -551
edsl/agents/Invigilator.py +233 -285
edsl/agents/InvigilatorBase.py +270 -254
edsl/agents/PromptConstructor.py +354 -252
edsl/agents/__init__.py +3 -2
edsl/agents/descriptors.py +99 -99
edsl/agents/prompt_helpers.py +129 -129
edsl/auto/AutoStudy.py +117 -117
edsl/auto/StageBase.py +230 -230
edsl/auto/StageGenerateSurvey.py +178 -178
edsl/auto/StageLabelQuestions.py +125 -125
edsl/auto/StagePersona.py +61 -61
edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
edsl/auto/StagePersonaDimensionValues.py +74 -74
edsl/auto/StagePersonaDimensions.py +69 -69
edsl/auto/StageQuestions.py +73 -73
edsl/auto/SurveyCreatorPipeline.py +21 -21
edsl/auto/utilities.py +224 -224
edsl/base/Base.py +279 -279
edsl/config.py +157 -177
edsl/conversation/Conversation.py +290 -290
edsl/conversation/car_buying.py +58 -59
edsl/conversation/chips.py +95 -95
edsl/conversation/mug_negotiation.py +81 -81
edsl/conversation/next_speaker_utilities.py +93 -93
edsl/coop/PriceFetcher.py +54 -54
edsl/coop/__init__.py +2 -2
edsl/coop/coop.py +1028 -1090
edsl/coop/utils.py +131 -131
edsl/data/Cache.py +555 -562
edsl/data/CacheEntry.py +233 -230
edsl/data/CacheHandler.py +149 -170
edsl/data/RemoteCacheSync.py +78 -78
edsl/data/SQLiteDict.py +292 -292
edsl/data/__init__.py +4 -5
edsl/data/orm.py +10 -10
edsl/data_transfer_models.py +73 -74
edsl/enums.py +175 -195
edsl/exceptions/BaseException.py +21 -21
edsl/exceptions/__init__.py +54 -54
edsl/exceptions/agents.py +42 -54
edsl/exceptions/cache.py +5 -5
edsl/exceptions/configuration.py +16 -16
edsl/exceptions/coop.py +10 -10
edsl/exceptions/data.py +14 -14
edsl/exceptions/general.py +34 -34
edsl/exceptions/jobs.py +33 -33
edsl/exceptions/language_models.py +63 -63
edsl/exceptions/prompts.py +15 -15
edsl/exceptions/questions.py +91 -109
edsl/exceptions/results.py +29 -29
edsl/exceptions/scenarios.py +22 -29
edsl/exceptions/surveys.py +37 -37
edsl/inference_services/AnthropicService.py +87 -84
edsl/inference_services/AwsBedrock.py +120 -118
edsl/inference_services/AzureAI.py +217 -215
edsl/inference_services/DeepInfraService.py +18 -18
edsl/inference_services/GoogleService.py +148 -139
edsl/inference_services/GroqService.py +20 -20
edsl/inference_services/InferenceServiceABC.py +147 -80
edsl/inference_services/InferenceServicesCollection.py +97 -122
edsl/inference_services/MistralAIService.py +123 -120
edsl/inference_services/OllamaService.py +18 -18
edsl/inference_services/OpenAIService.py +224 -221
edsl/inference_services/PerplexityService.py +163 -160
edsl/inference_services/TestService.py +89 -92
edsl/inference_services/TogetherAIService.py +170 -170
edsl/inference_services/models_available_cache.py +118 -118
edsl/inference_services/rate_limits_cache.py +25 -25
edsl/inference_services/registry.py +41 -41
edsl/inference_services/write_available.py +10 -10
edsl/jobs/Answers.py +56 -43
edsl/jobs/Jobs.py +898 -757
edsl/jobs/JobsChecks.py +147 -172
edsl/jobs/JobsPrompts.py +268 -270
edsl/jobs/JobsRemoteInferenceHandler.py +239 -287
edsl/jobs/__init__.py +1 -1
edsl/jobs/buckets/BucketCollection.py +63 -104
edsl/jobs/buckets/ModelBuckets.py +65 -65
edsl/jobs/buckets/TokenBucket.py +251 -283
edsl/jobs/interviews/Interview.py +661 -358
edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
edsl/jobs/interviews/InterviewExceptionEntry.py +186 -186
edsl/jobs/interviews/InterviewStatistic.py +63 -63
edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
edsl/jobs/interviews/InterviewStatusLog.py +92 -92
edsl/jobs/interviews/ReportErrors.py +66 -66
edsl/jobs/interviews/interview_status_enum.py +9 -9
edsl/jobs/runners/JobsRunnerAsyncio.py +466 -421
edsl/jobs/runners/JobsRunnerStatus.py +330 -330
edsl/jobs/tasks/QuestionTaskCreator.py +242 -244
edsl/jobs/tasks/TaskCreators.py +64 -64
edsl/jobs/tasks/TaskHistory.py +450 -449
edsl/jobs/tasks/TaskStatusLog.py +23 -23
edsl/jobs/tasks/task_status_enum.py +163 -161
edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
edsl/jobs/tokens/TokenUsage.py +34 -34
edsl/language_models/KeyLookup.py +30 -0
edsl/language_models/LanguageModel.py +668 -571
edsl/language_models/ModelList.py +155 -153
edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
edsl/language_models/__init__.py +3 -2
edsl/language_models/fake_openai_call.py +15 -15
edsl/language_models/fake_openai_service.py +61 -61
edsl/language_models/registry.py +190 -180
edsl/language_models/repair.py +156 -156
edsl/language_models/unused/ReplicateBase.py +83 -0
edsl/language_models/utilities.py +64 -65
edsl/notebooks/Notebook.py +258 -263
edsl/notebooks/__init__.py +1 -1
edsl/prompts/Prompt.py +362 -352
edsl/prompts/__init__.py +2 -2
edsl/questions/AnswerValidatorMixin.py +289 -334
edsl/questions/QuestionBase.py +664 -509
edsl/questions/QuestionBaseGenMixin.py +161 -165
edsl/questions/QuestionBasePromptsMixin.py +217 -221
edsl/questions/QuestionBudget.py +227 -227
edsl/questions/QuestionCheckBox.py +359 -359
edsl/questions/QuestionExtract.py +182 -182
edsl/questions/QuestionFreeText.py +114 -113
edsl/questions/QuestionFunctional.py +166 -166
edsl/questions/QuestionList.py +231 -229
edsl/questions/QuestionMultipleChoice.py +286 -330
edsl/questions/QuestionNumerical.py +153 -151
edsl/questions/QuestionRank.py +324 -314
edsl/questions/Quick.py +41 -41
edsl/questions/RegisterQuestionsMeta.py +71 -71
edsl/questions/ResponseValidatorABC.py +174 -200
edsl/questions/SimpleAskMixin.py +73 -74
edsl/questions/__init__.py +26 -27
edsl/questions/compose_questions.py +98 -98
edsl/questions/decorators.py +21 -21
edsl/questions/derived/QuestionLikertFive.py +76 -76
edsl/questions/derived/QuestionLinearScale.py +87 -90
edsl/questions/derived/QuestionTopK.py +93 -93
edsl/questions/derived/QuestionYesNo.py +82 -82
edsl/questions/descriptors.py +413 -427
edsl/questions/prompt_templates/question_budget.jinja +13 -13
edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
edsl/questions/prompt_templates/question_extract.jinja +11 -11
edsl/questions/prompt_templates/question_free_text.jinja +3 -3
edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
edsl/questions/prompt_templates/question_list.jinja +17 -17
edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
edsl/questions/prompt_templates/question_numerical.jinja +36 -36
edsl/questions/question_registry.py +177 -177
edsl/questions/settings.py +12 -12
edsl/questions/templates/budget/answering_instructions.jinja +7 -7
edsl/questions/templates/budget/question_presentation.jinja +7 -7
edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
edsl/questions/templates/extract/answering_instructions.jinja +7 -7
edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
edsl/questions/templates/list/answering_instructions.jinja +3 -3
edsl/questions/templates/list/question_presentation.jinja +5 -5
edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
edsl/questions/templates/numerical/question_presentation.jinja +6 -6
edsl/questions/templates/rank/answering_instructions.jinja +11 -11
edsl/questions/templates/rank/question_presentation.jinja +15 -15
edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
edsl/questions/templates/top_k/question_presentation.jinja +22 -22
edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
edsl/results/CSSParameterizer.py +108 -108
edsl/results/Dataset.py +424 -587
edsl/results/DatasetExportMixin.py +731 -653
edsl/results/DatasetTree.py +275 -295
edsl/results/Result.py +465 -451
edsl/results/Results.py +1165 -1172
edsl/results/ResultsDBMixin.py +238 -0
edsl/results/ResultsExportMixin.py +43 -45
edsl/results/ResultsFetchMixin.py +33 -33
edsl/results/ResultsGGMixin.py +121 -121
edsl/results/ResultsToolsMixin.py +98 -98
edsl/results/Selector.py +135 -145
edsl/results/TableDisplay.py +198 -125
edsl/results/__init__.py +2 -2
edsl/results/table_display.css +77 -77
edsl/results/tree_explore.py +115 -115
edsl/scenarios/FileStore.py +632 -511
edsl/scenarios/Scenario.py +601 -498
edsl/scenarios/ScenarioHtmlMixin.py +64 -65
edsl/scenarios/ScenarioJoin.py +127 -131
edsl/scenarios/ScenarioList.py +1287 -1430
edsl/scenarios/ScenarioListExportMixin.py +52 -45
edsl/scenarios/ScenarioListPdfMixin.py +261 -239
edsl/scenarios/__init__.py +4 -3
edsl/shared.py +1 -1
edsl/study/ObjectEntry.py +173 -173
edsl/study/ProofOfWork.py +113 -113
edsl/study/SnapShot.py +80 -80
edsl/study/Study.py +528 -521
edsl/study/__init__.py +4 -4
edsl/surveys/DAG.py +148 -148
edsl/surveys/Memory.py +31 -31
edsl/surveys/MemoryPlan.py +244 -244
edsl/surveys/Rule.py +326 -327
edsl/surveys/RuleCollection.py +387 -385
edsl/surveys/Survey.py +1801 -1229
edsl/surveys/SurveyCSS.py +261 -273
edsl/surveys/SurveyExportMixin.py +259 -259
edsl/surveys/{SurveyFlowVisualization.py → SurveyFlowVisualizationMixin.py} +179 -181
edsl/surveys/SurveyQualtricsImport.py +284 -284
edsl/surveys/__init__.py +3 -5
edsl/surveys/base.py +53 -53
edsl/surveys/descriptors.py +56 -60
edsl/surveys/instructions/ChangeInstruction.py +49 -48
edsl/surveys/instructions/Instruction.py +65 -56
edsl/surveys/instructions/InstructionCollection.py +77 -82
edsl/templates/error_reporting/base.html +23 -23
edsl/templates/error_reporting/exceptions_by_model.html +34 -34
edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
edsl/templates/error_reporting/exceptions_by_type.html +16 -16
edsl/templates/error_reporting/interview_details.html +115 -115
edsl/templates/error_reporting/interviews.html +19 -19
edsl/templates/error_reporting/overview.html +4 -4
edsl/templates/error_reporting/performance_plot.html +1 -1
edsl/templates/error_reporting/report.css +73 -73
edsl/templates/error_reporting/report.html +117 -117
edsl/templates/error_reporting/report.js +25 -25
edsl/tools/__init__.py +1 -1
edsl/tools/clusters.py +192 -192
edsl/tools/embeddings.py +27 -27
edsl/tools/embeddings_plotting.py +118 -118
edsl/tools/plotting.py +112 -112
edsl/tools/summarize.py +18 -18
edsl/utilities/SystemInfo.py +28 -28
edsl/utilities/__init__.py +22 -22
edsl/utilities/ast_utilities.py +25 -25
edsl/utilities/data/Registry.py +6 -6
edsl/utilities/data/__init__.py +1 -1
edsl/utilities/data/scooter_results.json +1 -1
edsl/utilities/decorators.py +77 -77
edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
edsl/utilities/interface.py +627 -627
edsl/utilities/naming_utilities.py +263 -263
edsl/utilities/repair_functions.py +28 -28
edsl/utilities/restricted_python.py +70 -70
edsl/utilities/utilities.py +424 -436
{edsl-0.1.39.dev2.dist-info → edsl-0.1.39.dev3.dist-info}/LICENSE +21 -21
{edsl-0.1.39.dev2.dist-info → edsl-0.1.39.dev3.dist-info}/METADATA +10 -12
edsl-0.1.39.dev3.dist-info/RECORD +277 -0
edsl/agents/QuestionInstructionPromptBuilder.py +0 -128
edsl/agents/QuestionOptionProcessor.py +0 -172
edsl/agents/QuestionTemplateReplacementsBuilder.py +0 -137
edsl/coop/CoopFunctionsMixin.py +0 -15
edsl/coop/ExpectedParrotKeyHandler.py +0 -125
edsl/exceptions/inference_services.py +0 -5
edsl/inference_services/AvailableModelCacheHandler.py +0 -184
edsl/inference_services/AvailableModelFetcher.py +0 -209
edsl/inference_services/ServiceAvailability.py +0 -135
edsl/inference_services/data_structures.py +0 -62
edsl/jobs/AnswerQuestionFunctionConstructor.py +0 -188
edsl/jobs/FetchInvigilator.py +0 -40
edsl/jobs/InterviewTaskManager.py +0 -98
edsl/jobs/InterviewsConstructor.py +0 -48
edsl/jobs/JobsComponentConstructor.py +0 -189
edsl/jobs/JobsRemoteInferenceLogger.py +0 -239
edsl/jobs/RequestTokenEstimator.py +0 -30
edsl/jobs/buckets/TokenBucketAPI.py +0 -211
edsl/jobs/buckets/TokenBucketClient.py +0 -191
edsl/jobs/decorators.py +0 -35
edsl/jobs/jobs_status_enums.py +0 -9
edsl/jobs/loggers/HTMLTableJobLogger.py +0 -304
edsl/language_models/ComputeCost.py +0 -63
edsl/language_models/PriceManager.py +0 -127
edsl/language_models/RawResponseHandler.py +0 -106
edsl/language_models/ServiceDataSources.py +0 -0
edsl/language_models/key_management/KeyLookup.py +0 -63
edsl/language_models/key_management/KeyLookupBuilder.py +0 -273
edsl/language_models/key_management/KeyLookupCollection.py +0 -38
edsl/language_models/key_management/__init__.py +0 -0
edsl/language_models/key_management/models.py +0 -131
edsl/notebooks/NotebookToLaTeX.py +0 -142
edsl/questions/ExceptionExplainer.py +0 -77
edsl/questions/HTMLQuestion.py +0 -103
edsl/questions/LoopProcessor.py +0 -149
edsl/questions/QuestionMatrix.py +0 -265
edsl/questions/ResponseValidatorFactory.py +0 -28
edsl/questions/templates/matrix/__init__.py +0 -1
edsl/questions/templates/matrix/answering_instructions.jinja +0 -5
edsl/questions/templates/matrix/question_presentation.jinja +0 -20
edsl/results/MarkdownToDocx.py +0 -122
edsl/results/MarkdownToPDF.py +0 -111
edsl/results/TextEditor.py +0 -50
edsl/results/smart_objects.py +0 -96
edsl/results/table_data_class.py +0 -12
edsl/results/table_renderers.py +0 -118
edsl/scenarios/ConstructDownloadLink.py +0 -109
edsl/scenarios/DirectoryScanner.py +0 -96
edsl/scenarios/DocumentChunker.py +0 -102
edsl/scenarios/DocxScenario.py +0 -16
edsl/scenarios/PdfExtractor.py +0 -40
edsl/scenarios/ScenarioSelector.py +0 -156
edsl/scenarios/file_methods.py +0 -85
edsl/scenarios/handlers/__init__.py +0 -13
edsl/scenarios/handlers/csv.py +0 -38
edsl/scenarios/handlers/docx.py +0 -76
edsl/scenarios/handlers/html.py +0 -37
edsl/scenarios/handlers/json.py +0 -111
edsl/scenarios/handlers/latex.py +0 -5
edsl/scenarios/handlers/md.py +0 -51
edsl/scenarios/handlers/pdf.py +0 -68
edsl/scenarios/handlers/png.py +0 -39
edsl/scenarios/handlers/pptx.py +0 -105
edsl/scenarios/handlers/py.py +0 -294
edsl/scenarios/handlers/sql.py +0 -313
edsl/scenarios/handlers/sqlite.py +0 -149
edsl/scenarios/handlers/txt.py +0 -33
edsl/surveys/ConstructDAG.py +0 -92
edsl/surveys/EditSurvey.py +0 -221
edsl/surveys/InstructionHandler.py +0 -100
edsl/surveys/MemoryManagement.py +0 -72
edsl/surveys/RuleManager.py +0 -172
edsl/surveys/Simulator.py +0 -75
edsl/surveys/SurveyToApp.py +0 -141
edsl/utilities/PrettyList.py +0 -56
edsl/utilities/is_notebook.py +0 -18
edsl/utilities/is_valid_variable_name.py +0 -11
edsl/utilities/remove_edsl_version.py +0 -24
edsl-0.1.39.dev2.dist-info/RECORD +0 -352
{edsl-0.1.39.dev2.dist-info → edsl-0.1.39.dev3.dist-info}/WHEEL +0 -0

edsl/results/DatasetExportMixin.py CHANGED Viewed

@@ -1,653 +1,731 @@
-"""Mixin class for exporting results."""
-import base64
-import csv
-import io
-import warnings
-import textwrap
-from typing import Optional, Tuple, Union, List
-class DatasetExportMixin:
-    """Mixin class for exporting Dataset objects."""
-    def relevant_columns(
-        self, data_type: Optional[str] = None, remove_prefix=False
-    ) -> list:
-        """Return the set of keys that are present in the dataset.
-        :param data_type: The data type to filter by.
-        :param remove_prefix: Whether to remove the prefix from the column names.
-        >>> from edsl.results.Dataset import Dataset
-        >>> d = Dataset([{'a.b':[1,2,3,4]}])
-        >>> d.relevant_columns()
-        ['a.b']
-        >>> d.relevant_columns(remove_prefix=True)
-        ['b']
-        >>> d = Dataset([{'a':[1,2,3,4]}, {'b':[5,6,7,8]}])
-        >>> d.relevant_columns()
-        ['a', 'b']
-        >>> from edsl.results import Results; Results.example().select('how_feeling', 'how_feeling_yesterday').relevant_columns()
-        ['answer.how_feeling', 'answer.how_feeling_yesterday']
-        >>> from edsl.results import Results
-        >>> sorted(Results.example().select().relevant_columns(data_type = "model"))
-        ['model.frequency_penalty', ...]
-        >>> Results.example().relevant_columns(data_type = "flimflam")
-        Traceback (most recent call last):
-        ...
-        ValueError: No columns found for data type: flimflam. Available data types are: ...
-        """
-        columns = [list(x.keys())[0] for x in self]
-        if remove_prefix:
-            columns = [column.split(".")[-1] for column in columns]
-        def get_data_type(column):
-            if "." in column:
-                return column.split(".")[0]
-            else:
-                return None
-        if data_type:
-            all_columns = columns[:]
-            columns = [
-                column for column in columns if get_data_type(column) == data_type
-            ]
-            if len(columns) == 0:
-                all_data_types = sorted(
-                    list(set(get_data_type(column) for column in all_columns))
-                )
-                raise ValueError(
-                    f"No columns found for data type: {data_type}. Available data types are: {all_data_types}."
-                )
-        return columns
-    def num_observations(self):
-        """Return the number of observations in the dataset.
-        >>> from edsl.results.Results import Results
-        >>> Results.example().num_observations()
-        4
-        """
-        _num_observations = None
-        for entry in self:
-            key, values = list(entry.items())[0]
-            if _num_observations is None:
-                _num_observations = len(values)
-            else:
-                if len(values) != _num_observations:
-                    raise ValueError(
-                        "The number of observations is not consistent across columns."
-                    )
-        return _num_observations
-    def _make_tabular(
-        self, remove_prefix: bool, pretty_labels: Optional[dict] = None
-    ) -> tuple[list, List[list]]:
-        """Turn the results into a tabular format.
-        :param remove_prefix: Whether to remove the prefix from the column names.
-        >>> from edsl.results import Results
-        >>> r = Results.example()
-        >>> r.select('how_feeling')._make_tabular(remove_prefix = True)
-        (['how_feeling'], [['OK'], ['Great'], ['Terrible'], ['OK']])
-        >>> r.select('how_feeling')._make_tabular(remove_prefix = True, pretty_labels = {'how_feeling': "How are you feeling"})
-        (['How are you feeling'], [['OK'], ['Great'], ['Terrible'], ['OK']])
-        """
-        def create_dict_from_list_of_dicts(list_of_dicts):
-            for entry in list_of_dicts:
-                key, list_of_values = list(entry.items())[0]
-                yield key, list_of_values
-        tabular_repr = dict(create_dict_from_list_of_dicts(self.data))
-        full_header = [list(x.keys())[0] for x in self]
-        rows = []
-        for i in range(self.num_observations()):
-            row = [tabular_repr[h][i] for h in full_header]
-            rows.append(row)
-        if remove_prefix:
-            header = [h.split(".")[-1] for h in full_header]
-        else:
-            header = full_header
-        if pretty_labels is not None:
-            header = [pretty_labels.get(h, h) for h in header]
-        return header, rows
-    def print_long(self):
-        """Print the results in a long format.
-        >>> from edsl.results import Results
-        >>> r = Results.example()
-        >>> r.select('how_feeling').print_long()
-        answer.how_feeling: OK
-        answer.how_feeling: Great
-        answer.how_feeling: Terrible
-        answer.how_feeling: OK
-        """
-        for entry in self:
-            key, list_of_values = list(entry.items())[0]
-            for value in list_of_values:
-                print(f"{key}: {value}")
-    def _get_tabular_data(
-        self,
-        remove_prefix: bool = False,
-        pretty_labels: Optional[dict] = None,
-    ) -> Tuple[List[str], List[List]]:
-        """Internal method to get tabular data in a standard format.
-        Args:
-            remove_prefix: Whether to remove the prefix from column names
-            pretty_labels: Dictionary mapping original column names to pretty labels
-        Returns:
-            Tuple containing (header_row, data_rows)
-        """
-        if pretty_labels is None:
-            pretty_labels = {}
-        return self._make_tabular(
-            remove_prefix=remove_prefix, pretty_labels=pretty_labels
-        )
-    def to_jsonl(self, filename: Optional[str] = None) -> "FileStore":
-        """Export the results to a FileStore instance containing JSONL data.
-        Args:
-            filename: Optional filename for the JSONL file (defaults to "results.jsonl")
-        Returns:
-            FileStore: Instance containing the JSONL data
-        """
-        if filename is None:
-            filename = "results.jsonl"
-        # Write to string buffer
-        output = io.StringIO()
-        for entry in self:
-            key, values = list(entry.items())[0]
-            output.write(f'{{"{key}": {values}}}\n')
-        # Get the CSV string and encode to base64
-        jsonl_string = output.getvalue()
-        base64_string = base64.b64encode(jsonl_string.encode()).decode()
-        from edsl.scenarios.FileStore import FileStore
-        return FileStore(
-            path=filename,
-            mime_type="application/jsonl",
-            binary=False,
-            suffix="jsonl",
-            base64_string=base64_string,
-        )
-    def to_csv(
-        self,
-        filename: Optional[str] = None,
-        remove_prefix: bool = False,
-        pretty_labels: Optional[dict] = None,
-    ) -> "FileStore":
-        """Export the results to a FileStore instance containing CSV data.
-        Args:
-            filename: Optional filename for the CSV (defaults to "results.csv")
-            remove_prefix: Whether to remove the prefix from column names
-            pretty_labels: Dictionary mapping original column names to pretty labels
-        Returns:
-            FileStore: Instance containing the CSV data
-        """
-        if filename is None:
-            filename = "results.csv"
-        # Get the tabular data
-        header, rows = self._get_tabular_data(
-            remove_prefix=remove_prefix, pretty_labels=pretty_labels
-        )
-        # Write to string buffer
-        output = io.StringIO()
-        writer = csv.writer(output)
-        writer.writerow(header)
-        writer.writerows(rows)
-        # Get the CSV string and encode to base64
-        csv_string = output.getvalue()
-        base64_string = base64.b64encode(csv_string.encode()).decode()
-        from edsl.scenarios.FileStore import FileStore
-        return FileStore(
-            path=filename,
-            mime_type="text/csv",
-            binary=False,
-            suffix="csv",
-            base64_string=base64_string,
-        )
-    def to_excel(
-        self,
-        filename: Optional[str] = None,
-        remove_prefix: bool = False,
-        pretty_labels: Optional[dict] = None,
-        sheet_name: Optional[str] = None,
-    ) -> "FileStore":
-        """Export the results to a FileStore instance containing Excel data.
-        Args:
-            filename: Optional filename for the Excel file (defaults to "results.xlsx")
-            remove_prefix: Whether to remove the prefix from column names
-            pretty_labels: Dictionary mapping original column names to pretty labels
-            sheet_name: Name of the worksheet (defaults to "Results")
-        Returns:
-            FileStore: Instance containing the Excel data
-        """
-        from openpyxl import Workbook
-        if filename is None:
-            filename = "results.xlsx"
-        if sheet_name is None:
-            sheet_name = "Results"
-        # Get the tabular data
-        header, rows = self._get_tabular_data(
-            remove_prefix=remove_prefix, pretty_labels=pretty_labels
-        )
-        # Create Excel workbook in memory
-        wb = Workbook()
-        ws = wb.active
-        ws.title = sheet_name
-        # Write header
-        for col, value in enumerate(header, 1):
-            ws.cell(row=1, column=col, value=value)
-        # Write data rows
-        for row_idx, row_data in enumerate(rows, 2):
-            for col, value in enumerate(row_data, 1):
-                ws.cell(row=row_idx, column=col, value=value)
-        # Save to bytes buffer
-        buffer = io.BytesIO()
-        wb.save(buffer)
-        buffer.seek(0)
-        # Convert to base64
-        base64_string = base64.b64encode(buffer.getvalue()).decode()
-        from edsl.scenarios.FileStore import FileStore
-        return FileStore(
-            path=filename,
-            mime_type="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet",
-            binary=True,
-            suffix="xlsx",
-            base64_string=base64_string,
-        )
-    def _db(self, remove_prefix: bool = True):
-        """Create a SQLite database in memory and return the connection.
-        Args:
-            shape: The shape of the data in the database (wide or long)
-            remove_prefix: Whether to remove the prefix from the column names
-        Returns:
-            A database connection
-        """
-        from sqlalchemy import create_engine
-        engine = create_engine("sqlite:///:memory:")
-        if remove_prefix:
-            df = self.remove_prefix().to_pandas(lists_as_strings=True)
-        else:
-            df = self.to_pandas(lists_as_strings=True)
-        df.to_sql(
-            "self",
-            engine,
-            index=False,
-            if_exists="replace",
-        )
-        return engine.connect()
-    def sql(
-        self,
-        query: str,
-        transpose: bool = None,
-        transpose_by: str = None,
-        remove_prefix: bool = True,
-    ) -> Union["pd.DataFrame", str]:
-        """Execute a SQL query and return the results as a DataFrame.
-        Args:
-            query: The SQL query to execute
-            shape: The shape of the data in the database (wide or long)
-            remove_prefix: Whether to remove the prefix from the column names
-            transpose: Whether to transpose the DataFrame
-            transpose_by: The column to use as the index when transposing
-            csv: Whether to return the DataFrame as a CSV string
-            to_list: Whether to return the results as a list
-            to_latex: Whether to return the results as LaTeX
-            filename: Optional filename to save the results to
-        Returns:
-            DataFrame, CSV string, list, or LaTeX string depending on parameters
-        """
-        import pandas as pd
-        conn = self._db(remove_prefix=remove_prefix)
-        df = pd.read_sql_query(query, conn)
-        # Transpose the DataFrame if transpose is True
-        if transpose or transpose_by:
-            df = pd.DataFrame(df)
-            if transpose_by:
-                df = df.set_index(transpose_by)
-            else:
-                df = df.set_index(df.columns[0])
-            df = df.transpose()
-        from edsl.results.Dataset import Dataset
-        return Dataset.from_pandas_dataframe(df)
-    def to_pandas(
-        self, remove_prefix: bool = False, lists_as_strings=False
-    ) -> "DataFrame":
-        """Convert the results to a pandas DataFrame, ensuring that lists remain as lists.
-        :param remove_prefix: Whether to remove the prefix from the column names.
-        """
-        return self._to_pandas_strings(remove_prefix)
-    def _to_pandas_strings(self, remove_prefix: bool = False) -> "pd.DataFrame":
-        """Convert the results to a pandas DataFrame.
-        :param remove_prefix: Whether to remove the prefix from the column names.
-        >>> from edsl.results import Results
-        >>> r = Results.example()
-        >>> r.select('how_feeling').to_pandas()
-          answer.how_feeling
-        0                 OK
-        1              Great
-        2           Terrible
-        3                 OK
-        """
-        import pandas as pd
-        csv_string = self.to_csv(remove_prefix=remove_prefix).text
-        csv_buffer = io.StringIO(csv_string)
-        df = pd.read_csv(csv_buffer)
-        # df_sorted = df.sort_index(axis=1)  # Sort columns alphabetically
-        return df
-    def to_scenario_list(self, remove_prefix: bool = True) -> list[dict]:
-        """Convert the results to a list of dictionaries, one per scenario.
-        :param remove_prefix: Whether to remove the prefix from the column names.
-        >>> from edsl.results import Results
-        >>> r = Results.example()
-        >>> r.select('how_feeling').to_scenario_list()
-        ScenarioList([Scenario({'how_feeling': 'OK'}), Scenario({'how_feeling': 'Great'}), Scenario({'how_feeling': 'Terrible'}), Scenario({'how_feeling': 'OK'})])
-        """
-        from edsl.scenarios.ScenarioList import ScenarioList
-        from edsl.scenarios.Scenario import Scenario
-        list_of_dicts = self.to_dicts(remove_prefix=remove_prefix)
-        scenarios = []
-        for d in list_of_dicts:
-            scenarios.append(Scenario(d))
-        return ScenarioList(scenarios)
-    def to_agent_list(self, remove_prefix: bool = True):
-        """Convert the results to a list of dictionaries, one per agent.
-        :param remove_prefix: Whether to remove the prefix from the column names.
-        >>> from edsl.results import Results
-        >>> r = Results.example()
-        >>> r.select('how_feeling').to_agent_list()
-        AgentList([Agent(traits = {'how_feeling': 'OK'}), Agent(traits = {'how_feeling': 'Great'}), Agent(traits = {'how_feeling': 'Terrible'}), Agent(traits = {'how_feeling': 'OK'})])
-        """
-        from edsl.agents import Agent
-        from edsl.agents.AgentList import AgentList
-        list_of_dicts = self.to_dicts(remove_prefix=remove_prefix)
-        agents = []
-        for d in list_of_dicts:
-            if "name" in d:
-                d["agent_name"] = d.pop("name")
-                agents.append(Agent(d, name=d["agent_name"]))
-            if "agent_parameters" in d:
-                agent_parameters = d.pop("agent_parameters")
-                agent_name = agent_parameters.get("name", None)
-                instruction = agent_parameters.get("instruction", None)
-                agents.append(Agent(d, name=agent_name, instruction=instruction))
-            else:
-                agents.append(Agent(d))
-        return AgentList(agents)
-    def to_dicts(self, remove_prefix: bool = True) -> list[dict]:
-        """Return the dataset row by row, as one dictionary per observation.
-        :param remove_prefix: Whether to remove the prefix from the column names.
-        >>> from edsl.results import Results
-        >>> r = Results.example()
-        >>> r.select('how_feeling').to_dicts()
-        [{'how_feeling': 'OK'}, {'how_feeling': 'Great'}, {'how_feeling': 'Terrible'}, {'how_feeling': 'OK'}]
-        """
-        # Each entry is a single-item mapping of column name -> list of values.
-        pairs = [list(entry.items())[0] for entry in self]
-        names = [name for name, _ in pairs]
-        columns = [values for _, values in pairs]
-        if remove_prefix:
-            names = [name.split(".")[-1] for name in names]
-        # Transpose the columns into rows and label every row with the names.
-        return [dict(zip(names, row)) for row in zip(*columns)]
-    def to_list(self, flatten=False, remove_none=False, unzipped=False) -> list[list]:
-        """Return the selected column(s) as a PrettyList.
-        A single column yields its values; several columns yield one tuple per row.
-        :param flatten: Whether to flatten the list of lists.
-        :param remove_none: Whether to remove None values from the list.
-        :param unzipped: Accepted but not used by this method.
-        >>> from edsl.results import Results
-        >>> Results.example().select('how_feeling', 'how_feeling_yesterday')
-        Dataset([{'answer.how_feeling': ['OK', 'Great', 'Terrible', 'OK']}, {'answer.how_feeling_yesterday': ['Great', 'Good', 'OK', 'Terrible']}])
-        >>> Results.example().select('how_feeling', 'how_feeling_yesterday').to_list()
-        [('OK', 'Great'), ('Great', 'Good'), ('Terrible', 'OK'), ('OK', 'Terrible')]
-        >>> r = Results.example()
-        >>> r.select('how_feeling').to_list()
-        ['OK', 'Great', 'Terrible', 'OK']
-        >>> from edsl.results.Dataset import Dataset
-        >>> Dataset([{'a.b': [[1, 9], 2, 3, 4]}]).select('a.b').to_list(flatten = True)
-        [1, 9, 2, 3, 4]
-        >>> from edsl.results.Dataset import Dataset
-        >>> Dataset([{'a.b': [[1, 9], 2, 3, 4]}, {'c': [6, 2, 3, 4]}]).select('a.b', 'c').to_list(flatten = True)
-        Traceback (most recent call last):
-        ...
-        ValueError: Cannot flatten a list of lists when there are multiple columns selected.
-        """
-        from edsl.utilities.PrettyList import PrettyList
-        columns = self.relevant_columns()
-        if flatten and len(columns) > 1:
-            raise ValueError(
-                "Cannot flatten a list of lists when there are multiple columns selected."
-            )
-        if len(columns) == 1:
-            # The typical case: hand back the values of the only column.
-            result = list(self[0].values())[0]
-        else:
-            rows = self.to_dicts(remove_prefix=False)
-            result = [tuple([row[column] for column in columns]) for row in rows]
-        if remove_none:
-            result = [item for item in result if item is not None]
-        if flatten:
-            flattened = []
-            for item in result:
-                # Only one level of nesting is expanded.
-                flattened += item if isinstance(item, list) else [item]
-            result = flattened
-        return PrettyList(result)
-    def html(
-        self,
-        filename: Optional[str] = None,
-        cta: str = "Open in browser",
-        return_link: bool = False,
-    ):
-        """Write the dataset to an HTML file and open it or display a link to it.
-        The table is produced by ``self.to_pandas().to_html()``. When ``is_notebook()``
-        is true a link to the file is displayed; otherwise the path is printed and the
-        file is opened with ``webbrowser``.
-        :param filename: Where to write the HTML. If None, a new ``.html`` file is created in the current working directory.
-        :param cta: The text of the link shown in a notebook.
-        :param return_link: Whether to return the filename that was written.
-        :return: The filename if ``return_link`` is true, otherwise None.
-        """
-        import os
-        import tempfile
-        from edsl.utilities.utilities import is_notebook
-        df = self.to_pandas()
-        if filename is None:
-            # Only the generated name is needed: close the handle right away so it
-            # is not leaked. delete=False keeps the file on disk.
-            with tempfile.NamedTemporaryFile(
-                "w", delete=False, suffix=".html", dir=os.getcwd()
-            ) as tmp:
-                filename = tmp.name
-        with open(filename, "w") as f:
-            f.write(df.to_html())
-        if is_notebook():
-            # IPython is only required on the notebook path.
-            from IPython.display import HTML, display
-            html_url = f"/files/{filename}"
-            html_link = f'<a href="{html_url}" target="_blank">{cta}</a>'
-            display(HTML(html_link))
-        else:
-            import webbrowser
-            print(f"Saved to {filename}")
-            webbrowser.open(f"file://{os.path.abspath(filename)}")
-        if return_link:
-            return filename
-    def tally(
-        self, *fields: Optional[str], top_n: Optional[int] = None, output="Dataset"
-    ) -> Union[dict, "Dataset"]:
-        """Tally the values of a field or perform a cross-tab of multiple fields.
-        Counts are sorted from most to least frequent. Values that are lists are
-        converted to tuples so that they can be counted.
-        :param fields: The field(s) to tally, multiple fields for cross-tabulation. Defaults to all columns.
-        :param top_n: If given, keep only the ``top_n`` most frequent entries.
-        :param output: "dict" returns a plain dict (and emits a warning); "Dataset" returns a Dataset. Any other value returns None.
-        :raises ValueError: If a requested field is not a column of the dataset.
-        >>> from edsl.results import Results
-        >>> r = Results.example()
-        >>> r.select('how_feeling').tally('answer.how_feeling', output = "dict")
-        {'OK': 2, 'Great': 1, 'Terrible': 1}
-        >>> from edsl.results.Dataset import Dataset
-        >>> expected = Dataset([{'answer.how_feeling': ['OK', 'Great', 'Terrible']}, {'count': [2, 1, 1]}])
-        >>> r.select('how_feeling').tally('answer.how_feeling', output = "Dataset") == expected
-        True
-        """
-        from collections import Counter
-        columns = self.relevant_columns()
-        if len(fields) == 0:
-            fields = columns
-        relevant_columns_without_prefix = [column.split(".")[-1] for column in columns]
-        if not all(
-            f in columns or f in relevant_columns_without_prefix for f in fields
-        ):
-            raise ValueError("One or more specified fields are not in the dataset.")
-        if len(fields) == 1:
-            values = self._key_to_value(fields[0])
-        else:
-            values = list(zip(*(self._key_to_value(field) for field in fields)))
-        # Lists are unhashable and cannot be counted; build a new sequence with them
-        # turned into tuples (rebinding the loop variable would change nothing).
-        values = [tuple(value) if isinstance(value, list) else value for value in values]
-        tally = dict(Counter(values))
-        sorted_tally = dict(sorted(tally.items(), key=lambda item: -item[1]))
-        if top_n is not None:
-            sorted_tally = dict(list(sorted_tally.items())[:top_n])
-        if output == "dict":
-            warnings.warn(
-                textwrap.dedent(
-                    """\
-                        The default output from tally will change to Dataset in the future.
-                        Use output='Dataset' to get the Dataset object for now.
-                        """
-                )
-            )
-            return sorted_tally
-        elif output == "Dataset":
-            # Imported here so the plain-dict path does not need the Dataset class.
-            from edsl.results.Dataset import Dataset
-            dataset = Dataset(
-                [
-                    {"value": list(sorted_tally.keys())},
-                    {"count": list(sorted_tally.values())},
-                ]
-            )
-            sl = dataset.to_scenario_list().unpack(
-                "value",
-                new_names=[fields] if isinstance(fields, str) else fields,
-                keep_original=False,
-            )
-            # Move "count" to the end so the tallied fields come first.
-            keys = list(sl[0].keys())
-            keys.remove("count")
-            keys.append("count")
-            return sl.reorder_keys(keys).to_dataset()
-if __name__ == "__main__":
-    # When run as a script, execute the docstring examples in this module.
-    # ELLIPSIS lets "..." in an expected output match any text.
-    import doctest
-    doctest.testmod(optionflags=doctest.ELLIPSIS)
+"""Mixin class for exporting results."""
+import base64
+import csv
+import io
+import html
+from typing import Optional
+from typing import Literal, Optional, Union, List
+class DatasetExportMixin:
+    """Mixin class for exporting Dataset objects."""
+    def relevant_columns(
+        self, data_type: Optional[str] = None, remove_prefix=False
+    ) -> list:
+        """Return the column names (keys) present in the dataset, in order.
+        :param data_type: If given, keep only the columns whose data type (the text before the first ".") equals this value.
+        :param remove_prefix: Whether to remove the prefix from the column names.
+        :raises ValueError: If ``data_type`` is given and no column has that data type.
+        >>> from edsl.results.Dataset import Dataset
+        >>> d = Dataset([{'a.b':[1,2,3,4]}])
+        >>> d.relevant_columns()
+        ['a.b']
+        >>> d.relevant_columns(remove_prefix=True)
+        ['b']
+        >>> d = Dataset([{'a':[1,2,3,4]}, {'b':[5,6,7,8]}])
+        >>> d.relevant_columns()
+        ['a', 'b']
+        >>> from edsl.results import Results; Results.example().select('how_feeling', 'how_feeling_yesterday').relevant_columns()
+        ['answer.how_feeling', 'answer.how_feeling_yesterday']
+        >>> from edsl.results import Results
+        >>> sorted(Results.example().select().relevant_columns(data_type = "model"))
+        ['model.frequency_penalty', 'model.logprobs', 'model.max_tokens', 'model.model', 'model.presence_penalty', 'model.temperature', 'model.top_logprobs', 'model.top_p']
+        >>> Results.example().relevant_columns(data_type = "flimflam")
+        Traceback (most recent call last):
+        ...
+        ValueError: No columns found for data type: flimflam. Available data types are: ...
+        """
+        def get_data_type(column):
+            # A column without a "." carries no data type.
+            return column.split(".")[0] if "." in column else None
+        columns = [list(x.keys())[0] for x in self]
+        if data_type:
+            # Filter on the full names: once the prefix is stripped the data type
+            # can no longer be read off the column name.
+            matching = [
+                column for column in columns if get_data_type(column) == data_type
+            ]
+            if len(matching) == 0:
+                # Leave out None (columns without a prefix) so sorting never has to
+                # compare None with a string.
+                all_data_types = sorted(
+                    {
+                        found
+                        for found in (get_data_type(column) for column in columns)
+                        if found is not None
+                    }
+                )
+                raise ValueError(
+                    f"No columns found for data type: {data_type}. Available data types are: {all_data_types}."
+                )
+            columns = matching
+        if remove_prefix:
+            columns = [column.split(".")[-1] for column in columns]
+        return columns
+    def num_observations(self):
+        """Return how many observations (rows) every column of the dataset holds.
+        Returns None when the dataset has no columns.
+        :raises ValueError: If the columns do not all have the same length.
+        >>> from edsl.results import Results
+        >>> Results.example().num_observations()
+        4
+        """
+        expected = None
+        for entry in self:
+            _, values = list(entry.items())[0]
+            count = len(values)
+            if expected is None:
+                # The first column fixes the length all others must match.
+                expected = count
+                continue
+            if count != expected:
+                raise ValueError(
+                    "The number of observations is not consistent across columns."
+                )
+        return expected
+    def _make_tabular(
+        self, remove_prefix: bool, pretty_labels: Optional[dict] = None
+    ) -> tuple[list, List[list]]:
+        """Turn the results into a tabular format: a header and a list of rows.
+        An empty dataset yields an empty header and no rows.
+        :param remove_prefix: Whether to remove the prefix from the column names.
+        :param pretty_labels: Optional mapping from a header name (after any prefix removal) to the label to show instead.
+        :return: A ``(header, rows)`` tuple; each row lists the values in header order.
+        >>> from edsl.results import Results
+        >>> r = Results.example()
+        >>> r.select('how_feeling')._make_tabular(remove_prefix = True)
+        (['how_feeling'], [['OK'], ['Great'], ['Terrible'], ['OK']])
+        >>> r.select('how_feeling')._make_tabular(remove_prefix = True, pretty_labels = {'how_feeling': "How are you feeling"})
+        (['How are you feeling'], [['OK'], ['Great'], ['Terrible'], ['OK']])
+        """
+        # Column name -> list of values, built from the single-item entries.
+        tabular_repr = dict(list(entry.items())[0] for entry in self.data)
+        full_header = [list(x.keys())[0] for x in self]
+        # num_observations() returns None for a dataset without columns; treat that
+        # as zero rows instead of passing None to range().
+        num_rows = self.num_observations() or 0
+        rows = [[tabular_repr[h][i] for h in full_header] for i in range(num_rows)]
+        if remove_prefix:
+            header = [h.split(".")[-1] for h in full_header]
+        else:
+            header = full_header
+        if pretty_labels is not None:
+            header = [pretty_labels.get(h, h) for h in header]
+        return header, rows
+    def print_long(self):
+        """Print every value on its own line, prefixed with its column name.
+        >>> from edsl.results import Results
+        >>> r = Results.example()
+        >>> r.select('how_feeling').print_long()
+        answer.how_feeling: OK
+        answer.how_feeling: Great
+        answer.how_feeling: Terrible
+        answer.how_feeling: OK
+        """
+        for column in self:
+            label, observations = list(column.items())[0]
+            for observation in observations:
+                print(f"{label}: {observation}")
+    # def print(
+    #     self,
+    #     pretty_labels: Optional[dict] = None,
+    #     filename: Optional[str] = None,
+    #     format: Optional[Literal["rich", "html", "markdown", "latex"]] = None,
+    #     interactive: bool = False,
+    #     split_at_dot: bool = True,
+    #     max_rows=None,
+    #     tee=False,
+    #     iframe=False,
+    #     iframe_height: int = 200,
+    #     iframe_width: int = 600,
+    #     web=False,
+    #     return_string: bool = False,
+    # ) -> Union[None, str, "Results"]:
+    #     """Print the results in a pretty format.
+    #     :param pretty_labels: A dictionary of pretty labels for the columns.
+    #     :param filename: The filename to save the results to.
+    #     :param format: The format to print the results in. Options are 'rich', 'html', 'markdown', or 'latex'.
+    #     :param interactive: Whether to print the results interactively in a Jupyter notebook.
+    #     :param split_at_dot: Whether to split the column names at the last dot w/ a newline.
+    #     :param max_rows: The maximum number of rows to print.
+    #     :param tee: Whether to return the dataset.
+    #     :param iframe: Whether to display the table in an iframe.
+    #     :param iframe_height: The height of the iframe.
+    #     :param iframe_width: The width of the iframe.
+    #     :param web: Whether to display the table in a web browser.
+    #     :param return_string: Whether to return the output as a string instead of printing.
+    #     :return: None if tee is False and return_string is False, the dataset if tee is True, or a string if return_string is True.
+    #     Example: Print in rich format at the terminal
+    #     >>> from edsl.results import Results
+    #     >>> r = Results.example()
+    #     >>> r.select('how_feeling').print(format = "rich")
+    #     ┏━━━━━━━━━━━━━━┓
+    #     ┃ answer       ┃
+    #     ┃ .how_feeling ┃
+    #     ┡━━━━━━━━━━━━━━┩
+    #     │ OK           │
+    #     ├──────────────┤
+    #     │ Great        │
+    #     ├──────────────┤
+    #     │ Terrible     │
+    #     ├──────────────┤
+    #     │ OK           │
+    #     └──────────────┘
+    #     >>> r = Results.example()
+    #     >>> r2 = r.select("how_feeling").print(format = "rich", tee = True, max_rows = 2)
+    #     ┏━━━━━━━━━━━━━━┓
+    #     ┃ answer       ┃
+    #     ┃ .how_feeling ┃
+    #     ┡━━━━━━━━━━━━━━┩
+    #     │ OK           │
+    #     ├──────────────┤
+    #     │ Great        │
+    #     └──────────────┘
+    #     >>> r2
+    #     Dataset([{'answer.how_feeling': ['OK', 'Great', 'Terrible', 'OK']}])
+    #     >>> r.select('how_feeling').print(format = "rich", max_rows = 2)
+    #     ┏━━━━━━━━━━━━━━┓
+    #     ┃ answer       ┃
+    #     ┃ .how_feeling ┃
+    #     ┡━━━━━━━━━━━━━━┩
+    #     │ OK           │
+    #     ├──────────────┤
+    #     │ Great        │
+    #     └──────────────┘
+    #     >>> r.select('how_feeling').print(format = "rich", split_at_dot = False)
+    #     ┏━━━━━━━━━━━━━━━━━━━━┓
+    #     ┃ answer.how_feeling ┃
+    #     ┡━━━━━━━━━━━━━━━━━━━━┩
+    #     │ OK                 │
+    #     ├────────────────────┤
+    #     │ Great              │
+    #     ├────────────────────┤
+    #     │ Terrible           │
+    #     ├────────────────────┤
+    #     │ OK                 │
+    #     └────────────────────┘
+    #     Example: using the pretty_labels parameter
+    #     >>> r.select('how_feeling').print(format="rich", pretty_labels = {'answer.how_feeling': "How are you feeling"})
+    #     ┏━━━━━━━━━━━━━━━━━━━━━┓
+    #     ┃ How are you feeling ┃
+    #     ┡━━━━━━━━━━━━━━━━━━━━━┩
+    #     │ OK                  │
+    #     ├─────────────────────┤
+    #     │ Great               │
+    #     ├─────────────────────┤
+    #     │ Terrible            │
+    #     ├─────────────────────┤
+    #     │ OK                  │
+    #     └─────────────────────┘
+    #     Example: printing in markdown format
+    #     >>> r.select('how_feeling').print(format='markdown')
+    #     | answer.how_feeling |
+    #     |--|
+    #     | OK |
+    #     | Great |
+    #     | Terrible |
+    #     | OK |
+    #     ...
+    #     >>> r.select('how_feeling').print(format='latex')
+    #     \\begin{tabular}{l}
+    #     ...
+    #     \\end{tabular}
+    #     <BLANKLINE>
+    #     """
+    #     from IPython.display import HTML, display
+    #     from edsl.utilities.utilities import is_notebook
+    #     import io
+    #     import sys
+    #     def _determine_format(format):
+    #         if format is None:
+    #             if is_notebook():
+    #                 format = "html"
+    #             else:
+    #                 format = "rich"
+    #         if format not in ["rich", "html", "markdown", "latex"]:
+    #             raise ValueError(
+    #                 "format must be one of 'rich', 'html', 'markdown', or 'latex'."
+    #             )
+    #         return format
+    #     format = _determine_format(format)
+    #     if pretty_labels is None:
+    #         pretty_labels = {}
+    #     if pretty_labels != {}:  # only split at dot if there are no pretty labels
+    #         split_at_dot = False
+    #     def _create_data():
+    #         for index, entry in enumerate(self):
+    #             key, list_of_values = list(entry.items())[0]
+    #             yield {pretty_labels.get(key, key): list_of_values[:max_rows]}
+    #     new_data = list(_create_data())
+    #     # Capture output if return_string is True
+    #     if return_string:
+    #         old_stdout = sys.stdout
+    #         sys.stdout = io.StringIO()
+    #     output = None
+    #     if format == "rich":
+    #         from edsl.utilities.interface import print_dataset_with_rich
+    #         output = print_dataset_with_rich(
+    #             new_data, filename=filename, split_at_dot=split_at_dot
+    #         )
+    #     elif format == "markdown":
+    #         from edsl.utilities.interface import print_list_of_dicts_as_markdown_table
+    #         output = print_list_of_dicts_as_markdown_table(new_data, filename=filename)
+    #     elif format == "latex":
+    #         df = self.to_pandas()
+    #         df.columns = [col.replace("_", " ") for col in df.columns]
+    #         latex_string = df.to_latex(index=False)
+    #         if filename is not None:
+    #             with open(filename, "w") as f:
+    #                 f.write(latex_string)
+    #         else:
+    #             print(latex_string)
+    #             output = latex_string
+    #     elif format == "html":
+    #         from edsl.utilities.interface import print_list_of_dicts_as_html_table
+    #         html_source = print_list_of_dicts_as_html_table(
+    #             new_data, interactive=interactive
+    #         )
+    #         if iframe:
+    #             iframe = f""""
+    #             <iframe srcdoc="{ html.escape(html_source) }" style="width: {iframe_width}px; height: {iframe_height}px;"></iframe>
+    #             """
+    #             display(HTML(iframe))
+    #         elif is_notebook():
+    #             display(HTML(html_source))
+    #         else:
+    #             from edsl.utilities.interface import view_html
+    #             view_html(html_source)
+    #         output = html_source
+    #     # Restore stdout and get captured output if return_string is True
+    #     if return_string:
+    #         captured_output = sys.stdout.getvalue()
+    #         sys.stdout = old_stdout
+    #         return captured_output or output
+    #     if tee:
+    #         return self
+    #     return None
+    def to_csv(
+        self,
+        filename: Optional[str] = None,
+        remove_prefix: bool = False,
+        download_link: bool = False,
+        pretty_labels: Optional[dict] = None,
+    ):
+        """Export the results to a CSV file, a CSV string or a notebook download link.
+        :param filename: The filename to save the CSV file to. If given, nothing is returned.
+        :param remove_prefix: Whether to remove the prefix from the column names.
+        :param download_link: Whether to display a download link in a Jupyter notebook (only used when no filename is given).
+        :param pretty_labels: Optional mapping from column names to the labels written in the header.
+        :return: The CSV text when neither ``filename`` nor ``download_link`` is set, otherwise None.
+        Example:
+        >>> from edsl.results import Results
+        >>> r = Results.example()
+        >>> r.select('how_feeling').to_csv()
+        'answer.how_feeling\\r\\nOK\\r\\nGreat\\r\\nTerrible\\r\\nOK\\r\\n'
+        >>> r.select('how_feeling').to_csv(pretty_labels = {'answer.how_feeling': "How are you feeling"})
+        'How are you feeling\\r\\nOK\\r\\nGreat\\r\\nTerrible\\r\\nOK\\r\\n'
+        >>> import tempfile
+        >>> filename = tempfile.NamedTemporaryFile(delete=False).name
+        >>> r.select('how_feeling').to_csv(filename = filename)
+        >>> import os
+        >>> import csv
+        >>> with open(filename, newline='') as f:
+        ...     reader = csv.reader(f)
+        ...     for row in reader:
+        ...         print(row)
+        ['answer.how_feeling']
+        ['OK']
+        ['Great']
+        ['Terrible']
+        ['OK']
+        """
+        if pretty_labels is None:
+            pretty_labels = {}
+        header, rows = self._make_tabular(
+            remove_prefix=remove_prefix, pretty_labels=pretty_labels
+        )
+        if filename is not None:
+            # newline="" leaves line endings to the csv writer; without it some
+            # platforms translate "\r\n" again and produce blank rows.
+            with open(filename, "w", newline="") as f:
+                writer = csv.writer(f)
+                writer.writerow(header)
+                writer.writerows(rows)
+            return None
+        output = io.StringIO()
+        writer = csv.writer(output)
+        writer.writerow(header)
+        writer.writerows(rows)
+        csv_file = output.getvalue()
+        if not download_link:
+            return csv_file
+        from IPython.display import HTML, display
+        b64 = base64.b64encode(csv_file.encode()).decode()
+        # A separate name keeps the boolean parameter from being overwritten.
+        link_html = f'<a href="data:file/csv;base64,{b64}" download="my_data.csv">Download CSV file</a>'
+        display(HTML(link_html))
+        return None
+    def download_link(self, pretty_labels: Optional[dict] = None) -> str:
+        """Build an HTML anchor that embeds the CSV export as a base64 data URI.
+        :param pretty_labels: A dictionary of pretty labels for the columns.
+        >>> from edsl.results import Results
+        >>> r = Results.example()
+        >>> r.select('how_feeling').download_link()
+        '<a href="data:file/csv;base64,YW5zd2VyLmhvd19mZWVsaW5nDQpPSw0KR3JlYXQNClRlcnJpYmxlDQpPSw0K" download="my_data.csv">Download CSV file</a>'
+        """
+        import base64
+        csv_bytes = self.to_csv(pretty_labels=pretty_labels).encode()
+        b64 = base64.b64encode(csv_bytes).decode()
+        return f'<a href="data:file/csv;base64,{b64}" download="my_data.csv">Download CSV file</a>'
+    def to_pandas(
+        self, remove_prefix: bool = False, lists_as_strings=False
+    ) -> "DataFrame":
+        """Convert the results to a pandas DataFrame.
+        The conversion is delegated to ``_to_pandas_strings``.
+        :param remove_prefix: Whether to remove the prefix from the column names.
+        :param lists_as_strings: Accepted but not used by this method.
+        """
+        # A direct pd.DataFrame(self.data) construction used to live here; only
+        # the string-based conversion is active.
+        return self._to_pandas_strings(remove_prefix=remove_prefix)
+    def _to_pandas_strings(self, remove_prefix: bool = False) -> "pd.DataFrame":
+        """Build a pandas DataFrame by exporting to CSV text and parsing it back.
+        Column order follows the CSV header; columns are not sorted.
+        :param remove_prefix: Whether to remove the prefix from the column names.
+        >>> from edsl.results import Results
+        >>> r = Results.example()
+        >>> r.select('how_feeling').to_pandas()
+          answer.how_feeling
+        0                 OK
+        1              Great
+        2           Terrible
+        3                 OK
+        """
+        import pandas as pd
+        csv_text = self.to_csv(remove_prefix=remove_prefix)
+        return pd.read_csv(io.StringIO(csv_text))
+    def to_scenario_list(self, remove_prefix: bool = True) -> list[dict]:
+        """Convert the results to a ScenarioList with one Scenario per row.
+        :param remove_prefix: Whether to remove the prefix from the column names.
+        >>> from edsl.results import Results
+        >>> r = Results.example()
+        >>> r.select('how_feeling').to_scenario_list()
+        ScenarioList([Scenario({'how_feeling': 'OK'}), Scenario({'how_feeling': 'Great'}), Scenario({'how_feeling': 'Terrible'}), Scenario({'how_feeling': 'OK'})])
+        """
+        from edsl import ScenarioList, Scenario
+        rows = self.to_dicts(remove_prefix=remove_prefix)
+        return ScenarioList([Scenario(row) for row in rows])
+    def to_agent_list(self, remove_prefix: bool = True):
+        """Convert the results to an AgentList with one Agent per row.
+        The columns of a row become the agent's traits. A ``name`` column is renamed
+        to the ``agent_name`` trait and also passed as the agent's name.
+        :param remove_prefix: Whether to remove the prefix from the column names.
+        >>> from edsl.results import Results
+        >>> r = Results.example()
+        >>> r.select('how_feeling').to_agent_list()
+        AgentList([Agent(traits = {'how_feeling': 'OK'}), Agent(traits = {'how_feeling': 'Great'}), Agent(traits = {'how_feeling': 'Terrible'}), Agent(traits = {'how_feeling': 'OK'})])
+        """
+        from edsl import AgentList, Agent
+        agents = []
+        for row in self.to_dicts(remove_prefix=remove_prefix):
+            if "name" not in row:
+                agents.append(Agent(row))
+                continue
+            # Move the value under "agent_name" before it is used as the agent's name.
+            row["agent_name"] = row.pop("name")
+            agents.append(Agent(row, name=row["agent_name"]))
+        return AgentList(agents)
+    def to_dicts(self, remove_prefix: bool = True) -> list[dict]:
+        """Return the dataset row by row, as one dictionary per observation.
+        :param remove_prefix: Whether to remove the prefix from the column names.
+        >>> from edsl.results import Results
+        >>> r = Results.example()
+        >>> r.select('how_feeling').to_dicts()
+        [{'how_feeling': 'OK'}, {'how_feeling': 'Great'}, {'how_feeling': 'Terrible'}, {'how_feeling': 'OK'}]
+        """
+        # Each entry is a single-item mapping of column name -> list of values.
+        pairs = [list(entry.items())[0] for entry in self]
+        names = [name for name, _ in pairs]
+        columns = [values for _, values in pairs]
+        if remove_prefix:
+            names = [name.split(".")[-1] for name in names]
+        # Transpose the columns into rows and label every row with the names.
+        return [dict(zip(names, row)) for row in zip(*columns)]
+    def to_list(self, flatten=False, remove_none=False, unzipped=False) -> list[list]:
+        """Return the selected column(s) as a list.
+        A single column yields its values; several columns yield one tuple per row.
+        :param flatten: Whether to flatten the list of lists.
+        :param remove_none: Whether to remove None values from the list.
+        :param unzipped: Accepted but not used by this method.
+        >>> from edsl.results import Results
+        >>> Results.example().select('how_feeling', 'how_feeling_yesterday')
+        Dataset([{'answer.how_feeling': ['OK', 'Great', 'Terrible', 'OK']}, {'answer.how_feeling_yesterday': ['Great', 'Good', 'OK', 'Terrible']}])
+        >>> Results.example().select('how_feeling', 'how_feeling_yesterday').to_list()
+        [('OK', 'Great'), ('Great', 'Good'), ('Terrible', 'OK'), ('OK', 'Terrible')]
+        >>> r = Results.example()
+        >>> r.select('how_feeling').to_list()
+        ['OK', 'Great', 'Terrible', 'OK']
+        >>> from edsl.results.Dataset import Dataset
+        >>> Dataset([{'a.b': [[1, 9], 2, 3, 4]}]).select('a.b').to_list(flatten = True)
+        [1, 9, 2, 3, 4]
+        >>> from edsl.results.Dataset import Dataset
+        >>> Dataset([{'a.b': [[1, 9], 2, 3, 4]}, {'c': [6, 2, 3, 4]}]).select('a.b', 'c').to_list(flatten = True)
+        Traceback (most recent call last):
+        ...
+        ValueError: Cannot flatten a list of lists when there are multiple columns selected.
+        """
+        columns = self.relevant_columns()
+        if flatten and len(columns) > 1:
+            raise ValueError(
+                "Cannot flatten a list of lists when there are multiple columns selected."
+            )
+        if len(columns) == 1:
+            # The typical case: hand back the values of the only column.
+            result = list(self[0].values())[0]
+        else:
+            rows = self.to_dicts(remove_prefix=False)
+            result = [tuple([row[column] for column in columns]) for row in rows]
+        if remove_none:
+            result = [item for item in result if item is not None]
+        if flatten:
+            flattened = []
+            for item in result:
+                # Only one level of nesting is expanded.
+                flattened += item if isinstance(item, list) else [item]
+            result = flattened
+        return result
+    def html(
+        self,
+        filename: Optional[str] = None,
+        cta: str = "Open in browser",
+        return_link: bool = False,
+    ):
+        """Write the dataset to an HTML file and open it or display a link to it.
+        The table is produced by ``self.to_pandas().to_html()``. When ``is_notebook()``
+        is true a link to the file is displayed; otherwise the path is printed and the
+        file is opened with ``webbrowser``.
+        :param filename: Where to write the HTML. If None, a new ``.html`` file is created in the current working directory.
+        :param cta: The text of the link shown in a notebook.
+        :param return_link: Whether to return the filename that was written.
+        :return: The filename if ``return_link`` is true, otherwise None.
+        """
+        import os
+        import tempfile
+        from edsl.utilities.utilities import is_notebook
+        df = self.to_pandas()
+        if filename is None:
+            # Only the generated name is needed: close the handle right away so it
+            # is not leaked. delete=False keeps the file on disk.
+            with tempfile.NamedTemporaryFile(
+                "w", delete=False, suffix=".html", dir=os.getcwd()
+            ) as tmp:
+                filename = tmp.name
+        with open(filename, "w") as f:
+            f.write(df.to_html())
+        if is_notebook():
+            # IPython is only required on the notebook path.
+            from IPython.display import HTML, display
+            html_url = f"/files/{filename}"
+            html_link = f'<a href="{html_url}" target="_blank">{cta}</a>'
+            display(HTML(html_link))
+        else:
+            import webbrowser
+            print(f"Saved to {filename}")
+            webbrowser.open(f"file://{os.path.abspath(filename)}")
+        if return_link:
+            return filename
+    def tally(
+        self, *fields: Optional[str], top_n: Optional[int] = None, output="Dataset"
+    ) -> Union[dict, "Dataset"]:
+        """Tally the values of a field or perform a cross-tab of multiple fields.
+        Counts are sorted from most to least frequent. Values that are lists are
+        converted to tuples so that they can be counted.
+        :param fields: The field(s) to tally, multiple fields for cross-tabulation. Defaults to all columns.
+        :param top_n: If given, keep only the ``top_n`` most frequent entries.
+        :param output: "dict" returns a plain dict (and emits a warning); "Dataset" returns a Dataset. Any other value returns None.
+        :raises ValueError: If a requested field is not a column of the dataset.
+        >>> from edsl.results import Results
+        >>> r = Results.example()
+        >>> r.select('how_feeling').tally('answer.how_feeling', output = "dict")
+        {'OK': 2, 'Great': 1, 'Terrible': 1}
+        >>> r.select('how_feeling').tally('answer.how_feeling', output = "Dataset")
+        Dataset([{'answer.how_feeling': ['OK', 'Great', 'Terrible']}, {'count': [2, 1, 1]}])
+        """
+        from collections import Counter
+        columns = self.relevant_columns()
+        if len(fields) == 0:
+            fields = columns
+        relevant_columns_without_prefix = [column.split(".")[-1] for column in columns]
+        if not all(
+            f in columns or f in relevant_columns_without_prefix for f in fields
+        ):
+            raise ValueError("One or more specified fields are not in the dataset.")
+        if len(fields) == 1:
+            values = self._key_to_value(fields[0])
+        else:
+            values = list(zip(*(self._key_to_value(field) for field in fields)))
+        # Lists are unhashable and cannot be counted; build a new sequence with them
+        # turned into tuples (rebinding the loop variable would change nothing).
+        values = [tuple(value) if isinstance(value, list) else value for value in values]
+        tally = dict(Counter(values))
+        sorted_tally = dict(sorted(tally.items(), key=lambda item: -item[1]))
+        if top_n is not None:
+            sorted_tally = dict(list(sorted_tally.items())[:top_n])
+        import warnings
+        import textwrap
+        if output == "dict":
+            warnings.warn(
+                textwrap.dedent(
+                    """\
+                        The default output from tally will change to Dataset in the future.
+                        Use output='Dataset' to get the Dataset object for now.
+                        """
+                )
+            )
+            return sorted_tally
+        elif output == "Dataset":
+            # Imported here so the plain-dict path does not need the Dataset class.
+            from edsl.results.Dataset import Dataset
+            dataset = Dataset(
+                [
+                    {"value": list(sorted_tally.keys())},
+                    {"count": list(sorted_tally.values())},
+                ]
+            )
+            sl = dataset.to_scenario_list().unpack(
+                "value",
+                new_names=[fields] if isinstance(fields, str) else fields,
+                keep_original=False,
+            )
+            # Move "count" to the end so the tallied fields come first.
+            keys = list(sl[0].keys())
+            keys.remove("count")
+            keys.append("count")
+            return sl.reorder_keys(keys).to_dataset()
+if __name__ == "__main__":
+    # When run as a script, execute the docstring examples in this module.
+    # ELLIPSIS lets "..." in an expected output match any text.
+    import doctest
+    doctest.testmod(optionflags=doctest.ELLIPSIS)

edsl 0.1.39.dev2__py3-none-any.whl → 0.1.39.dev3__py3-none-any.whl

edsl 0.1.39.dev2py3-none-any.whl → 0.1.39.dev3py3-none-any.whl