PyPI - edsl - Versions diffs - 0.1.47__py3-none-any.whl → 0.1.48__py3-none-any.whl - Mend

edsl 0.1.47 py3-none-any.whl → 0.1.48 py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (314)

edsl/__init__.py +44 -39
edsl/__version__.py +1 -1
edsl/agents/__init__.py +4 -2
edsl/agents/{Agent.py → agent.py} +442 -152
edsl/agents/{AgentList.py → agent_list.py} +220 -162
edsl/agents/descriptors.py +46 -7
edsl/{exceptions/agents.py → agents/exceptions.py} +3 -12
edsl/base/__init__.py +75 -0
edsl/base/base_class.py +1303 -0
edsl/base/data_transfer_models.py +114 -0
edsl/base/enums.py +215 -0
edsl/base.py +8 -0
edsl/buckets/__init__.py +25 -0
edsl/buckets/bucket_collection.py +324 -0
edsl/buckets/model_buckets.py +206 -0
edsl/buckets/token_bucket.py +502 -0
edsl/{jobs/buckets/TokenBucketAPI.py → buckets/token_bucket_api.py} +1 -1
edsl/buckets/token_bucket_client.py +509 -0
edsl/caching/__init__.py +20 -0
edsl/caching/cache.py +814 -0
edsl/caching/cache_entry.py +427 -0
edsl/{data/CacheHandler.py → caching/cache_handler.py} +14 -15
edsl/caching/exceptions.py +24 -0
edsl/caching/orm.py +30 -0
edsl/{data/RemoteCacheSync.py → caching/remote_cache_sync.py} +3 -3
edsl/caching/sql_dict.py +441 -0
edsl/config/__init__.py +8 -0
edsl/config/config_class.py +177 -0
edsl/config.py +4 -176
edsl/conversation/Conversation.py +7 -7
edsl/conversation/car_buying.py +4 -4
edsl/conversation/chips.py +6 -6
edsl/coop/__init__.py +25 -2
edsl/coop/coop.py +303 -67
edsl/coop/{ExpectedParrotKeyHandler.py → ep_key_handling.py} +86 -10
edsl/coop/exceptions.py +62 -0
edsl/coop/price_fetcher.py +126 -0
edsl/coop/utils.py +89 -24
edsl/data_transfer_models.py +5 -72
edsl/dataset/__init__.py +10 -0
edsl/{results/Dataset.py → dataset/dataset.py} +116 -36
edsl/{results/DatasetExportMixin.py → dataset/dataset_operations_mixin.py} +606 -122
edsl/{results/DatasetTree.py → dataset/dataset_tree.py} +156 -75
edsl/{results/TableDisplay.py → dataset/display/table_display.py} +18 -7
edsl/{results → dataset/display}/table_renderers.py +58 -2
edsl/{results → dataset}/file_exports.py +4 -5
edsl/{results → dataset}/smart_objects.py +2 -2
edsl/enums.py +5 -205
edsl/inference_services/__init__.py +5 -0
edsl/inference_services/{AvailableModelCacheHandler.py → available_model_cache_handler.py} +2 -3
edsl/inference_services/{AvailableModelFetcher.py → available_model_fetcher.py} +8 -14
edsl/inference_services/data_structures.py +3 -2
edsl/{exceptions/inference_services.py → inference_services/exceptions.py} +1 -1
edsl/inference_services/{InferenceServiceABC.py → inference_service_abc.py} +1 -1
edsl/inference_services/{InferenceServicesCollection.py → inference_services_collection.py} +8 -7
edsl/inference_services/registry.py +4 -41
edsl/inference_services/{ServiceAvailability.py → service_availability.py} +5 -25
edsl/inference_services/services/__init__.py +31 -0
edsl/inference_services/{AnthropicService.py → services/anthropic_service.py} +3 -3
edsl/inference_services/{AwsBedrock.py → services/aws_bedrock.py} +2 -2
edsl/inference_services/{AzureAI.py → services/azure_ai.py} +2 -2
edsl/inference_services/{DeepInfraService.py → services/deep_infra_service.py} +1 -3
edsl/inference_services/{DeepSeekService.py → services/deep_seek_service.py} +2 -4
edsl/inference_services/{GoogleService.py → services/google_service.py} +5 -4
edsl/inference_services/{GroqService.py → services/groq_service.py} +1 -1
edsl/inference_services/{MistralAIService.py → services/mistral_ai_service.py} +3 -3
edsl/inference_services/{OllamaService.py → services/ollama_service.py} +1 -7
edsl/inference_services/{OpenAIService.py → services/open_ai_service.py} +5 -6
edsl/inference_services/{PerplexityService.py → services/perplexity_service.py} +3 -7
edsl/inference_services/{TestService.py → services/test_service.py} +7 -6
edsl/inference_services/{TogetherAIService.py → services/together_ai_service.py} +2 -6
edsl/inference_services/{XAIService.py → services/xai_service.py} +1 -1
edsl/inference_services/write_available.py +1 -2
edsl/instructions/__init__.py +6 -0
edsl/{surveys/instructions/Instruction.py → instructions/instruction.py} +11 -6
edsl/{surveys/instructions/InstructionCollection.py → instructions/instruction_collection.py} +10 -5
edsl/{surveys/InstructionHandler.py → instructions/instruction_handler.py} +3 -3
edsl/{jobs/interviews → interviews}/ReportErrors.py +2 -2
edsl/interviews/__init__.py +4 -0
edsl/{jobs/AnswerQuestionFunctionConstructor.py → interviews/answering_function.py} +45 -18
edsl/{jobs/interviews/InterviewExceptionEntry.py → interviews/exception_tracking.py} +107 -22
edsl/interviews/interview.py +638 -0
edsl/{jobs/interviews/InterviewStatusDictionary.py → interviews/interview_status_dictionary.py} +21 -12
edsl/{jobs/interviews/InterviewStatusLog.py → interviews/interview_status_log.py} +16 -7
edsl/{jobs/InterviewTaskManager.py → interviews/interview_task_manager.py} +12 -7
edsl/{jobs/RequestTokenEstimator.py → interviews/request_token_estimator.py} +8 -3
edsl/{jobs/interviews/InterviewStatistic.py → interviews/statistics.py} +36 -10
edsl/invigilators/__init__.py +38 -0
edsl/invigilators/invigilator_base.py +477 -0
edsl/{agents/Invigilator.py → invigilators/invigilators.py} +263 -10
edsl/invigilators/prompt_constructor.py +476 -0
edsl/{agents → invigilators}/prompt_helpers.py +2 -1
edsl/{agents/QuestionInstructionPromptBuilder.py → invigilators/question_instructions_prompt_builder.py} +18 -13
edsl/{agents → invigilators}/question_option_processor.py +96 -21
edsl/{agents/QuestionTemplateReplacementsBuilder.py → invigilators/question_template_replacements_builder.py} +64 -12
edsl/jobs/__init__.py +7 -1
edsl/jobs/async_interview_runner.py +99 -35
edsl/jobs/check_survey_scenario_compatibility.py +7 -5
edsl/jobs/data_structures.py +153 -22
edsl/{exceptions/jobs.py → jobs/exceptions.py} +2 -1
edsl/jobs/{FetchInvigilator.py → fetch_invigilator.py} +4 -4
edsl/jobs/{loggers/HTMLTableJobLogger.py → html_table_job_logger.py} +6 -2
edsl/jobs/{Jobs.py → jobs.py} +313 -167
edsl/jobs/{JobsChecks.py → jobs_checks.py} +15 -7
edsl/jobs/{JobsComponentConstructor.py → jobs_component_constructor.py} +19 -17
edsl/jobs/{InterviewsConstructor.py → jobs_interview_constructor.py} +10 -5
edsl/jobs/jobs_pricing_estimation.py +347 -0
edsl/jobs/{JobsRemoteInferenceLogger.py → jobs_remote_inference_logger.py} +4 -3
edsl/jobs/jobs_runner_asyncio.py +282 -0
edsl/jobs/{JobsRemoteInferenceHandler.py → remote_inference.py} +19 -22
edsl/jobs/results_exceptions_handler.py +2 -2
edsl/key_management/__init__.py +28 -0
edsl/key_management/key_lookup.py +161 -0
edsl/{language_models/key_management/KeyLookupBuilder.py → key_management/key_lookup_builder.py} +118 -47
edsl/key_management/key_lookup_collection.py +82 -0
edsl/key_management/models.py +218 -0
edsl/language_models/__init__.py +7 -2
edsl/language_models/{ComputeCost.py → compute_cost.py} +18 -3
edsl/{exceptions/language_models.py → language_models/exceptions.py} +2 -1
edsl/language_models/language_model.py +1080 -0
edsl/language_models/model.py +10 -25
edsl/language_models/{ModelList.py → model_list.py} +9 -14
edsl/language_models/{RawResponseHandler.py → raw_response_handler.py} +1 -1
edsl/language_models/{RegisterLanguageModelsMeta.py → registry.py} +1 -1
edsl/language_models/repair.py +4 -4
edsl/language_models/utilities.py +4 -4
edsl/notebooks/__init__.py +3 -1
edsl/notebooks/{Notebook.py → notebook.py} +7 -8
edsl/prompts/__init__.py +1 -1
edsl/{exceptions/prompts.py → prompts/exceptions.py} +3 -1
edsl/prompts/{Prompt.py → prompt.py} +101 -95
edsl/questions/HTMLQuestion.py +1 -1
edsl/questions/__init__.py +154 -25
edsl/questions/answer_validator_mixin.py +1 -1
edsl/questions/compose_questions.py +4 -3
edsl/questions/derived/question_likert_five.py +166 -0
edsl/questions/derived/{QuestionLinearScale.py → question_linear_scale.py} +4 -4
edsl/questions/derived/{QuestionTopK.py → question_top_k.py} +4 -4
edsl/questions/derived/{QuestionYesNo.py → question_yes_no.py} +4 -5
edsl/questions/descriptors.py +24 -30
edsl/questions/loop_processor.py +65 -19
edsl/questions/question_base.py +881 -0
edsl/questions/question_base_gen_mixin.py +15 -16
edsl/questions/{QuestionBasePromptsMixin.py → question_base_prompts_mixin.py} +2 -2
edsl/questions/{QuestionBudget.py → question_budget.py} +3 -4
edsl/questions/{QuestionCheckBox.py → question_check_box.py} +16 -16
edsl/questions/{QuestionDict.py → question_dict.py} +39 -5
edsl/questions/{QuestionExtract.py → question_extract.py} +9 -9
edsl/questions/question_free_text.py +282 -0
edsl/questions/{QuestionFunctional.py → question_functional.py} +6 -5
edsl/questions/{QuestionList.py → question_list.py} +6 -7
edsl/questions/{QuestionMatrix.py → question_matrix.py} +6 -5
edsl/questions/{QuestionMultipleChoice.py → question_multiple_choice.py} +126 -21
edsl/questions/{QuestionNumerical.py → question_numerical.py} +5 -5
edsl/questions/{QuestionRank.py → question_rank.py} +6 -6
edsl/questions/question_registry.py +4 -9
edsl/questions/register_questions_meta.py +8 -4
edsl/questions/response_validator_abc.py +17 -16
edsl/results/__init__.py +4 -1
edsl/{exceptions/results.py → results/exceptions.py} +1 -1
edsl/results/report.py +197 -0
edsl/results/{Result.py → result.py} +131 -45
edsl/results/{Results.py → results.py} +365 -220
edsl/results/results_selector.py +344 -25
edsl/scenarios/__init__.py +30 -3
edsl/scenarios/{ConstructDownloadLink.py → construct_download_link.py} +7 -0
edsl/scenarios/directory_scanner.py +156 -13
edsl/scenarios/document_chunker.py +186 -0
edsl/scenarios/exceptions.py +101 -0
edsl/scenarios/file_methods.py +2 -3
edsl/scenarios/{FileStore.py → file_store.py} +275 -189
edsl/scenarios/handlers/__init__.py +14 -14
edsl/scenarios/handlers/{csv.py → csv_file_store.py} +1 -2
edsl/scenarios/handlers/{docx.py → docx_file_store.py} +8 -7
edsl/scenarios/handlers/{html.py → html_file_store.py} +1 -2
edsl/scenarios/handlers/{jpeg.py → jpeg_file_store.py} +1 -1
edsl/scenarios/handlers/{json.py → json_file_store.py} +1 -1
edsl/scenarios/handlers/latex_file_store.py +5 -0
edsl/scenarios/handlers/{md.py → md_file_store.py} +1 -1
edsl/scenarios/handlers/{pdf.py → pdf_file_store.py} +2 -2
edsl/scenarios/handlers/{png.py → png_file_store.py} +1 -1
edsl/scenarios/handlers/{pptx.py → pptx_file_store.py} +8 -7
edsl/scenarios/handlers/{py.py → py_file_store.py} +1 -3
edsl/scenarios/handlers/{sql.py → sql_file_store.py} +2 -1
edsl/scenarios/handlers/{sqlite.py → sqlite_file_store.py} +2 -3
edsl/scenarios/handlers/{txt.py → txt_file_store.py} +1 -1
edsl/scenarios/scenario.py +928 -0
edsl/scenarios/scenario_join.py +18 -5
edsl/scenarios/{ScenarioList.py → scenario_list.py} +294 -106
edsl/scenarios/{ScenarioListPdfMixin.py → scenario_list_pdf_tools.py} +16 -15
edsl/scenarios/scenario_selector.py +5 -1
edsl/study/ObjectEntry.py +2 -2
edsl/study/SnapShot.py +5 -5
edsl/study/Study.py +18 -19
edsl/study/__init__.py +6 -4
edsl/surveys/__init__.py +7 -4
edsl/surveys/dag/__init__.py +2 -0
edsl/surveys/{ConstructDAG.py → dag/construct_dag.py} +3 -3
edsl/surveys/{DAG.py → dag/dag.py} +13 -10
edsl/surveys/descriptors.py +1 -1
edsl/surveys/{EditSurvey.py → edit_survey.py} +9 -9
edsl/{exceptions/surveys.py → surveys/exceptions.py} +1 -2
edsl/surveys/memory/__init__.py +3 -0
edsl/surveys/{MemoryPlan.py → memory/memory_plan.py} +10 -9
edsl/surveys/rules/__init__.py +3 -0
edsl/surveys/{Rule.py → rules/rule.py} +103 -43
edsl/surveys/{RuleCollection.py → rules/rule_collection.py} +21 -30
edsl/surveys/{RuleManager.py → rules/rule_manager.py} +19 -13
edsl/surveys/survey.py +1743 -0
edsl/surveys/{SurveyExportMixin.py → survey_export.py} +22 -27
edsl/surveys/{SurveyFlowVisualization.py → survey_flow_visualization.py} +11 -2
edsl/surveys/{Simulator.py → survey_simulator.py} +10 -3
edsl/tasks/__init__.py +32 -0
edsl/{jobs/tasks/QuestionTaskCreator.py → tasks/question_task_creator.py} +115 -57
edsl/tasks/task_creators.py +135 -0
edsl/{jobs/tasks/TaskHistory.py → tasks/task_history.py} +86 -47
edsl/{jobs/tasks → tasks}/task_status_enum.py +91 -7
edsl/tasks/task_status_log.py +85 -0
edsl/tokens/__init__.py +2 -0
edsl/tokens/interview_token_usage.py +53 -0
edsl/utilities/PrettyList.py +1 -1
edsl/utilities/SystemInfo.py +25 -22
edsl/utilities/__init__.py +29 -21
edsl/utilities/gcp_bucket/__init__.py +2 -0
edsl/utilities/gcp_bucket/cloud_storage.py +99 -96
edsl/utilities/interface.py +44 -536
edsl/{results/MarkdownToPDF.py → utilities/markdown_to_pdf.py} +13 -5
edsl/utilities/repair_functions.py +1 -1
{edsl-0.1.47.dist-info → edsl-0.1.48.dist-info}/METADATA +1 -1
edsl-0.1.48.dist-info/RECORD +347 -0
edsl/Base.py +0 -493
edsl/BaseDiff.py +0 -260
edsl/agents/InvigilatorBase.py +0 -260
edsl/agents/PromptConstructor.py +0 -318
edsl/coop/PriceFetcher.py +0 -54
edsl/data/Cache.py +0 -582
edsl/data/CacheEntry.py +0 -238
edsl/data/SQLiteDict.py +0 -292
edsl/data/__init__.py +0 -5
edsl/data/orm.py +0 -10
edsl/exceptions/cache.py +0 -5
edsl/exceptions/coop.py +0 -14
edsl/exceptions/data.py +0 -14
edsl/exceptions/scenarios.py +0 -29
edsl/jobs/Answers.py +0 -43
edsl/jobs/JobsPrompts.py +0 -354
edsl/jobs/buckets/BucketCollection.py +0 -134
edsl/jobs/buckets/ModelBuckets.py +0 -65
edsl/jobs/buckets/TokenBucket.py +0 -283
edsl/jobs/buckets/TokenBucketClient.py +0 -191
edsl/jobs/interviews/Interview.py +0 -395
edsl/jobs/interviews/InterviewExceptionCollection.py +0 -99
edsl/jobs/interviews/InterviewStatisticsCollection.py +0 -25
edsl/jobs/runners/JobsRunnerAsyncio.py +0 -163
edsl/jobs/runners/JobsRunnerStatusData.py +0 -0
edsl/jobs/tasks/TaskCreators.py +0 -64
edsl/jobs/tasks/TaskStatusLog.py +0 -23
edsl/jobs/tokens/InterviewTokenUsage.py +0 -27
edsl/language_models/LanguageModel.py +0 -635
edsl/language_models/ServiceDataSources.py +0 -0
edsl/language_models/key_management/KeyLookup.py +0 -63
edsl/language_models/key_management/KeyLookupCollection.py +0 -38
edsl/language_models/key_management/models.py +0 -137
edsl/questions/QuestionBase.py +0 -544
edsl/questions/QuestionFreeText.py +0 -130
edsl/questions/derived/QuestionLikertFive.py +0 -76
edsl/results/ResultsExportMixin.py +0 -45
edsl/results/TextEditor.py +0 -50
edsl/results/results_fetch_mixin.py +0 -33
edsl/results/results_tools_mixin.py +0 -98
edsl/scenarios/DocumentChunker.py +0 -104
edsl/scenarios/Scenario.py +0 -548
edsl/scenarios/ScenarioHtmlMixin.py +0 -65
edsl/scenarios/ScenarioListExportMixin.py +0 -45
edsl/scenarios/handlers/latex.py +0 -5
edsl/shared.py +0 -1
edsl/surveys/Survey.py +0 -1301
edsl/surveys/SurveyQualtricsImport.py +0 -284
edsl/surveys/SurveyToApp.py +0 -141
edsl/surveys/instructions/__init__.py +0 -0
edsl/tools/__init__.py +0 -1
edsl/tools/clusters.py +0 -192
edsl/tools/embeddings.py +0 -27
edsl/tools/embeddings_plotting.py +0 -118
edsl/tools/plotting.py +0 -112
edsl/tools/summarize.py +0 -18
edsl/utilities/data/Registry.py +0 -6
edsl/utilities/data/__init__.py +0 -1
edsl/utilities/data/scooter_results.json +0 -1
edsl-0.1.47.dist-info/RECORD +0 -354
/edsl/coop/{CoopFunctionsMixin.py → coop_functions.py} +0 -0
/edsl/{results → dataset/display}/CSSParameterizer.py +0 -0
/edsl/{language_models/key_management → dataset/display}/__init__.py +0 -0
/edsl/{results → dataset/display}/table_data_class.py +0 -0
/edsl/{results → dataset/display}/table_display.css +0 -0
/edsl/{results/ResultsGGMixin.py → dataset/r/ggplot.py} +0 -0
/edsl/{results → dataset}/tree_explore.py +0 -0
/edsl/{surveys/instructions/ChangeInstruction.py → instructions/change_instruction.py} +0 -0
/edsl/{jobs/interviews → interviews}/interview_status_enum.py +0 -0
/edsl/jobs/{runners/JobsRunnerStatus.py → jobs_runner_status.py} +0 -0
/edsl/language_models/{PriceManager.py → price_manager.py} +0 -0
/edsl/language_models/{fake_openai_call.py → unused/fake_openai_call.py} +0 -0
/edsl/language_models/{fake_openai_service.py → unused/fake_openai_service.py} +0 -0
/edsl/notebooks/{NotebookToLaTeX.py → notebook_to_latex.py} +0 -0
/edsl/{exceptions/questions.py → questions/exceptions.py} +0 -0
/edsl/questions/{SimpleAskMixin.py → simple_ask_mixin.py} +0 -0
/edsl/surveys/{Memory.py → memory/memory.py} +0 -0
/edsl/surveys/{MemoryManagement.py → memory/memory_management.py} +0 -0
/edsl/surveys/{SurveyCSS.py → survey_css.py} +0 -0
/edsl/{jobs/tokens/TokenUsage.py → tokens/token_usage.py} +0 -0
/edsl/{results/MarkdownToDocx.py → utilities/markdown_to_docx.py} +0 -0
/edsl/{TemplateLoader.py → utilities/template_loader.py} +0 -0
{edsl-0.1.47.dist-info → edsl-0.1.48.dist-info}/LICENSE +0 -0
{edsl-0.1.47.dist-info → edsl-0.1.48.dist-info}/WHEEL +0 -0

edsl/{jobs/tasks/TaskHistory.py → tasks/task_history.py} RENAMED Viewed

@@ -1,11 +1,47 @@
-from typing import List, Optional
+"""
+This module provides the TaskHistory class for tracking and analyzing task execution history.
+The TaskHistory class maintains a record of all interviews conducted by EDSL, including
+their task execution histories, exceptions, and performance metrics. It supports rich
+visualization and reporting to help users understand task execution patterns and diagnose
+issues.
+"""
+from typing import List, Optional, Dict, Any, Union
 from io import BytesIO
 import base64
-from edsl.jobs.tasks.task_status_enum import TaskStatus
-from edsl.Base import RepresentationMixin
+import os
+import tempfile
+from .task_status_enum import TaskStatus
+from ..base import RepresentationMixin
 class TaskHistory(RepresentationMixin):
+    """
+    Records and analyzes the execution history of tasks across multiple interviews.
+    The TaskHistory class serves as a central repository for tracking task execution
+    across multiple interviews. It provides methods for:
+    1. Error Analysis - Collecting, categorizing, and reporting exceptions
+    2. Execution Visualization - Generating plots of task status over time
+    3. Performance Metrics - Calculating timing statistics for tasks
+    4. HTML Reports - Creating detailed interactive reports of execution
+    This class is particularly useful for debugging complex interview workflows,
+    identifying performance bottlenecks, and understanding patterns in task execution.
+    It supports both interactive exploration in notebooks and standalone report
+    generation.
+    Key features:
+    - Tracks exceptions with optional traceback storage
+    - Provides visualizations of task status transitions
+    - Generates interactive HTML reports with filtering and drill-down
+    - Computes statistics across interviews (by model, question type, etc.)
+    - Exports to various formats (HTML, notebook, etc.)
+    """
     def __init__(
         self,
         interviews: List["Interview"] = None,
@@ -14,12 +50,16 @@ class TaskHistory(RepresentationMixin):
         interviews_with_exceptions_only: bool = False,
     ):
         """
-        The structure of a TaskHistory exception
-        [Interview.exceptions, Interview.exceptions, Interview.exceptions, ...]
-        >>> _ = TaskHistory.example()
-        ...
+        Initialize a TaskHistory to track execution across multiple interviews.
+        Parameters:
+            interviews: List of Interview objects to track
+            include_traceback: Whether to include full exception tracebacks
+            max_interviews: Maximum number of interviews to display in reports
+            interviews_with_exceptions_only: If True, only track interviews with exceptions
+        Example:
+            >>> _ = TaskHistory.example()  # Create a sample TaskHistory
         """
         self.interviews_with_exceptions_only = interviews_with_exceptions_only
         self._interviews = {}
@@ -34,10 +74,8 @@ class TaskHistory(RepresentationMixin):
         }
         self.max_interviews = max_interviews
-        # self.total_interviews = interviews
         self.include_traceback = include_traceback
-        # self._interviews = {index: i for index, i in enumerate(self.total_interviews)}
         self.max_interviews = max_interviews
     def add_interview(self, interview: "Interview"):
@@ -51,9 +89,8 @@ class TaskHistory(RepresentationMixin):
     @classmethod
     def example(cls):
         """ """
-        from edsl.jobs.interviews.Interview import Interview
-        from edsl.jobs.Jobs import Jobs
+        from ..interviews import Interview
+        from ..jobs import Jobs
         j = Jobs.example(throw_exception_probability=1, test_model=True)
@@ -120,7 +157,7 @@ class TaskHistory(RepresentationMixin):
         if data is None:
             return cls([], include_traceback=False)
-        from edsl.jobs.interviews.Interview import Interview
+        from ..interviews import Interview
         interviews = [Interview.from_dict(i) for i in data["interviews"]]
         return cls(interviews, include_traceback=data["include_traceback"])
@@ -273,15 +310,15 @@ class TaskHistory(RepresentationMixin):
                 for exception in exceptions:
                     key = (
                         exception.exception.__class__.__name__,  # Exception type
-                        interview.model._inference_service_,    # Service
-                        interview.model.model,                  # Model
-                        question_name                           # Question name
+                        interview.model._inference_service_,  # Service
+                        interview.model.model,  # Model
+                        question_name,  # Question name
                     )
                     if key not in exceptions_table:
                         exceptions_table[key] = 0
                     exceptions_table[key] += 1
         return exceptions_table
     @property
     def exceptions_by_type(self) -> dict:
         """Return a dictionary of exceptions tallied by type."""
@@ -342,27 +379,6 @@ class TaskHistory(RepresentationMixin):
         }
         return sorted_exceptions_by_question_name
-    # @property
-    # def exceptions_by_model(self) -> dict:
-    #     """Return a dictionary of exceptions tallied by model and question name."""
-    #     exceptions_by_model = {}
-    #     for interview in self.total_interviews:
-    #         model = interview.model.model
-    #         service = interview.model._inference_service_
-    #         if (service, model) not in exceptions_by_model:
-    #             exceptions_by_model[(service, model)] = 0
-    #         if interview.exceptions != {}:
-    #             exceptions_by_model[(service, model)] += len(interview.exceptions)
-    #     # sort the exceptions by model
-    #     sorted_exceptions_by_model = {
-    #         k: v
-    #         for k, v in sorted(
-    #             exceptions_by_model.items(), key=lambda item: item[1], reverse=True
-    #         )
-    #     }
-    #     return sorted_exceptions_by_model
     @property
     def exceptions_by_model(self) -> dict:
         """Return a dictionary of exceptions tallied by model and question name."""
@@ -389,7 +405,7 @@ class TaskHistory(RepresentationMixin):
         models_used = set([i.model.model for index, i in self._interviews.items()])
         from jinja2 import Environment, FileSystemLoader
-        from edsl.TemplateLoader import TemplateLoader
+        from edsl.utilities import TemplateLoader
         env = Environment(loader=TemplateLoader("edsl", "templates/error_reporting"))
@@ -417,12 +433,35 @@ class TaskHistory(RepresentationMixin):
     def html(
         self,
         filename: Optional[str] = None,
-        return_link=False,
-        css=None,
-        cta="<br><span style='font-size: 18px; font-weight: medium-bold; text-decoration: underline;'>Click to open the report in a new tab</span><br><br>",
-        open_in_browser=False,
-    ):
-        """Return an HTML report."""
+        return_link: bool = False,
+        css: Optional[str] = None,
+        cta: str = "<br><span style='font-size: 18px; font-weight: medium-bold; text-decoration: underline;'>Click to open the report in a new tab</span><br><br>",
+        open_in_browser: bool = False,
+    ) -> Optional[str]:
+        """
+        Generate and display an interactive HTML report of task execution.
+        This method creates a comprehensive HTML report showing task execution details,
+        exceptions, timing information, and statistics across all tracked interviews.
+        In notebook environments, it displays an embedded preview with a link to open
+        the full report in a new tab.
+        Parameters:
+            filename: Path to save the HTML report (if None, a temporary file is created)
+            return_link: If True, return the path to the saved HTML file
+            css: Custom CSS to apply to the report (if None, uses default styling)
+            cta: HTML for the "Call to Action" link text
+            open_in_browser: If True, automatically open the report in the default browser
+        Returns:
+            If return_link is True, returns the path to the saved HTML file; otherwise None
+        Notes:
+            - In Jupyter notebooks, displays an embedded preview with a link
+            - In terminal environments, saves the file and prints its location
+            - The report includes interactive elements for filtering and drill-down
+            - Exception details, status transitions, and timing are all included
+        """
         from IPython.display import display, HTML
         import tempfile
         import os

edsl/{jobs/tasks → tasks}/task_status_enum.py RENAMED Viewed

@@ -5,7 +5,27 @@ import time
 class TaskStatus(enum.Enum):
-    "These are the possible states a task can be in."
+    """
+    Enumeration of possible states for a task in the EDSL task system.
+    Each task moves through various states during its lifecycle, from creation
+    to completion. This enum defines all possible states to track task progress
+    and diagnose issues.
+    States:
+        NOT_STARTED: Initial state - task has been created but not yet started
+        WAITING_FOR_DEPENDENCIES: Task is waiting for prerequisite tasks to complete
+        CANCELLED: Task was explicitly cancelled by the user or system
+        PARENT_FAILED: Task cannot run because a dependency task failed
+        WAITING_FOR_REQUEST_CAPACITY: Task is waiting due to API rate limits
+        WAITING_FOR_TOKEN_CAPACITY: Task is waiting due to token usage limits
+        API_CALL_IN_PROGRESS: Task is actively executing an API call
+        SUCCESS: Task completed successfully
+        FAILED: Task encountered an error and failed to complete
+    These states are used throughout EDSL to track task progress, generate
+    visualizations, and provide detailed error reports.
+    """
     NOT_STARTED = enum.auto()
     WAITING_FOR_DEPENDENCIES = enum.auto()
     CANCELLED = enum.auto()
@@ -18,30 +38,80 @@ class TaskStatus(enum.Enum):
 class TaskStatusLogEntry(UserDict):
-    def __init__(self, log_time, value):
+    """
+    A timestamped record of a task's status change.
+    This class records both the time when a task's status changed and the new status value.
+    It uses the UserDict interface for convenient dictionary-like access while maintaining
+    the structured nature of status log entries.
+    Attributes:
+        log_time: The time (from time.monotonic()) when the status change occurred
+        value: The new TaskStatus value
+    """
+    def __init__(self, log_time: float, value: TaskStatus):
+        """
+        Create a new task status log entry.
+        Parameters:
+            log_time: The time when this status change occurred (from time.monotonic())
+            value: The TaskStatus value that the task transitioned to
+        """
         self.data = {"log_time": log_time, "value": value}
         super().__init__(self.data)
 class TaskStatusDescriptor:
-    "The descriptor ensures that the task status is always an instance of the TaskStatus enum."
+    """
+    A descriptor that enforces TaskStatus type safety and logs status changes.
+    This descriptor is used to create task_status properties in task-related classes.
+    It performs two key functions:
+    1. Type Enforcement: Ensures that task_status is always set to a valid TaskStatus enum
+    2. Logging: Automatically adds entries to the task's status_log when status changes
+    By using this descriptor, EDSL ensures consistent status tracking across all tasks
+    while providing a rich history of status changes for debugging and visualization.
+    """
     def __init__(self):
+        """Initialize the descriptor with a null status value."""
         self._task_status = None
     def __get__(self, instance, owner):
+        """Return the current task status."""
         return self._task_status
     def __set__(self, instance, value):
-        """Ensure that the value is an instance of TaskStatus."""
+        """
+        Set a new task status and record the change in the status log.
+        This method enforces that the value is a valid TaskStatus enum and
+        automatically adds an entry to the instance's status_log (if it exists).
+        Parameters:
+            instance: The object instance that owns this descriptor
+            value: The new TaskStatus value to set
+        Raises:
+            ValueError: If value is not an instance of TaskStatus enum
+        """
         if not isinstance(value, TaskStatus):
             raise ValueError("Value must be an instance of TaskStatus enum")
+        # Record the current time for the status change
         t = time.monotonic()
+        # Add an entry to the status log if the instance has one
         if hasattr(instance, "status_log"):
             instance.status_log.append(TaskStatusLogEntry(t, value))
+        # Update the actual status value
         self._task_status = value
     def __delete__(self, instance):
+        """Reset the task status to None when deleted."""
         self._task_status = None
@@ -69,9 +139,23 @@ def get_enum_from_string(str_key):
 class InterviewTaskLogDict(UserDict):
-    """A dictionary of TaskStatusLog objects.
-    The key is the name of the task.
+    """
+    A collection of task status logs for all tasks in an interview.
+    This dictionary-like object maps task names to their individual TaskStatusLog objects,
+    providing methods to analyze task execution across an entire interview. It supports
+    calculating timing metrics, generating status matrices for visualization, and
+    rendering graphical representations of task execution flow.
+    The InterviewTaskLogDict is a key component in EDSL's task monitoring system,
+    enabling both debugging of individual interviews and aggregate analysis of
+    execution patterns.
+    Key features:
+    - Temporal analysis (min/max execution times)
+    - Status matrix generation for visualization
+    - Visual representation of task status changes over time
+    - Color-coded status visualization
     """
     @property

edsl/tasks/task_status_log.py ADDED Viewed

@@ -0,0 +1,85 @@
+"""
+This module provides the TaskStatusLog class for tracking the status history of tasks.
+The TaskStatusLog class maintains an ordered list of status changes for a specific task,
+with timestamps and status values. This history allows for detailed analysis of task
+execution, including timing, state transitions, and status at any point in time.
+"""
+from collections import UserList
+from typing import List, Optional, Union
+from .task_status_enum import TaskStatus, TaskStatusLogEntry
+class TaskStatusLog(UserList):
+    """
+    An ordered history of status changes for a single task.
+    This class extends UserList to provide a chronological record of all status changes
+    that a task undergoes during its lifecycle. Each entry in the list is a
+    TaskStatusLogEntry object containing a timestamp and status value.
+    The TaskStatusLog provides methods to analyze the timing of task execution and
+    determine task status at any point in time. This information is valuable for
+    debugging, performance analysis, and visualization of task execution flow.
+    Key features:
+    - Records all status transitions with timestamps
+    - Provides min/max execution time calculations
+    - Supports interpolation to determine status at any given time
+    - Used by visualization tools to render task execution timelines
+    """
+    @property
+    def min_time(self) -> float:
+        """
+        Get the timestamp of the first status change.
+        Returns:
+            The timestamp (from time.monotonic()) of the earliest status entry
+        Note:
+            This is typically when the task was first created and set to NOT_STARTED
+        """
+        return self[0]["log_time"]
+    @property
+    def max_time(self) -> float:
+        """
+        Get the timestamp of the last status change.
+        Returns:
+            The timestamp (from time.monotonic()) of the most recent status entry
+        Note:
+            This is typically when the task reached its final state (SUCCESS, FAILED, etc.)
+        """
+        return self[-1]["log_time"]
+    def status_at_time(self, t: float) -> TaskStatus:
+        """
+        Determine what status the task had at a specific point in time.
+        This method interpolates between status log entries to determine the task's
+        status at any arbitrary time point. It searches for the first status change
+        that occurred after time t and returns the status that was active at that time.
+        Parameters:
+            t: The timestamp to query (from time.monotonic())
+        Returns:
+            The TaskStatus that was active at time t
+        Note:
+            If t is after the last recorded status change, the final status is returned.
+            If t is before the first recorded status change, this method may not behave
+            as expected since it assumes ordered traversal through the log.
+        TODO:
+            Could re-factor with bisect to make this faster for large logs.
+        """
+        for entry in self:
+            if entry["log_time"] > t:
+                return entry["value"]
+        return self[-1]["value"]

edsl/tokens/__init__.py ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ from .token_usage import TokenUsage
2	+ from .interview_token_usage import InterviewTokenUsage

edsl/tokens/interview_token_usage.py ADDED Viewed

@@ -0,0 +1,53 @@
+from typing import Optional
+from .token_usage import TokenUsage
+from edsl.enums import TokenPricing
+class InterviewTokenUsage:
+    """A class to represent the token usage of an interview."""
+    def __init__(
+        self, new_token_usage: Optional[TokenUsage] = None, cached_token_usage: Optional[TokenUsage] = None
+    ):
+        """Initialize the InterviewTokenUsage.
+        >>> usage = InterviewTokenUsage()
+        """
+        self.new_token_usage = new_token_usage or TokenUsage(from_cache=False)
+        self.cached_token_usage = cached_token_usage or TokenUsage(from_cache=True)
+    def __add__(self, other: "InterviewTokenUsage") -> "InterviewTokenUsage":
+        """Add two InterviewTokenUsage objects together.
+        >>> usage1 = InterviewTokenUsage()
+        >>> usage2 = InterviewTokenUsage()
+        >>> usage3 = usage1 + usage2
+        """
+        if not isinstance(other, InterviewTokenUsage):
+            raise ValueError(f"Can't add {type(other)} to InterviewTokenSummary")
+        return InterviewTokenUsage(
+            new_token_usage=self.new_token_usage + other.new_token_usage,
+            cached_token_usage=self.cached_token_usage + other.cached_token_usage,
+        )
+    def __repr__(self):
+        return f"InterviewTokenUsage(new_token_usage={self.new_token_usage}, cached_token_usage={self.cached_token_usage})"
+    def cost(self, prices: TokenPricing) -> float:
+        """Return the cost of the new and cached token usage.
+        >>> usage = InterviewTokenUsage()
+        >>> usage.cost(TokenPricing.example())
+        0.0
+        """
+        return self.new_token_usage.cost(prices)
+    def saved(self, prices: TokenPricing) -> float:
+        """Return the saved cost of the cached token usage.
+        """
+        return self.cached_token_usage.cost(prices)
+if __name__ == "__main__":
+    import doctest
+    doctest.testmod(optionflags=doctest.ELLIPSIS)

edsl/utilities/PrettyList.py CHANGED Viewed

@@ -1,5 +1,5 @@
 from collections import UserList
-from edsl.results.Dataset import Dataset
+from ..dataset import Dataset
 class Markkdown:

edsl/utilities/SystemInfo.py CHANGED Viewed

@@ -1,28 +1,31 @@
 """Module to store system information."""
-from dataclasses import dataclass
-import getpass
-import platform
-import pkg_resources
+# This module is not currently used by any part of the codebase.
+# Keeping it commented out for potential future use.
+# from dataclasses import dataclass
+# import getpass
+# import platform
+# import pkg_resources
-@dataclass
-class SystemInfo:
-    """Dataclass to store system information."""
-    username: str
-    system_info: str
-    release_info: str
-    package_name: str
-    package_version: str
+# @dataclass
+# class SystemInfo:
+#     """Dataclass to store system information."""
-    def __init__(self, package_name: str):
-        """Initialize the dataclass with system."""
-        self.username = getpass.getuser()
-        self.system_info = platform.system()
-        self.release_info = platform.release()
-        self.package_name = package_name
-        try:
-            self.package_version = pkg_resources.get_distribution(package_name).version
-        except pkg_resources.DistributionNotFound:
-            self.package_version = "Not installed"
+#     username: str
+#     system_info: str
+#     release_info: str
+#     package_name: str
+#     package_version: str
+#     def __init__(self, package_name: str):
+#         """Initialize the dataclass with system."""
+#         self.username = getpass.getuser()
+#         self.system_info = platform.system()
+#         self.release_info = platform.release()
+#         self.package_name = package_name
+#         try:
+#             self.package_version = pkg_resources.get_distribution(package_name).version
+#         except pkg_resources.DistributionNotFound:
+#             self.package_version = "Not installed"

edsl/utilities/__init__.py CHANGED Viewed

@@ -1,22 +1,30 @@
-# from edsl.utilities.interface import (
-#     print_dict_as_html_table,
-#     print_dict_with_rich,
-#     print_list_of_dicts_as_html_table,
-#     print_table_with_rich,
-#     print_public_methods_with_doc,
-#     print_list_of_dicts_as_markdown_table,
-# )
+# Core utilities - used across the codebase
+from .template_loader import TemplateLoader
+from .PrettyList import PrettyList
+from .restricted_python import create_restricted_function
+from .remove_edsl_version import remove_edsl_version
+from .ast_utilities import extract_variable_names
+# Functions from utilities.py
+from .utilities import (
+    clean_json,
+    dict_hash,
+    hash_value,
+    repair_json,
+    create_valid_var_name,
+    random_string,
+    shorten_string,
+    is_gzipped
+)
+# Decorator utilities
+from .decorators import sync_wrapper, jupyter_nb_handler
+# Standalone utilities
+from .is_notebook import is_notebook
+from .is_valid_variable_name import is_valid_variable_name
+from .naming_utilities import sanitize_string
+# Interface module - note: print_results_long is imported directly in results.py
+from .interface import print_results_long
-# from edsl.utilities.utilities import (
-#     create_valid_var_name,
-#     dict_to_html,
-#     hash_value,
-#     HTMLSnippet,
-#     is_notebook,
-#     is_gzipped,
-#     is_valid_variable_name,
-#     random_string,
-#     repair_json,
-#     shorten_string,
-#     time_all_functions,
-# )

edsl/utilities/gcp_bucket/__init__.py CHANGED Viewed

	@@ -0,0 +1,2 @@
1	+ # GCP bucket utilities
2	+ # This package is currently not being used

edsl 0.1.47__py3-none-any.whl → 0.1.48__py3-none-any.whl

edsl 0.1.47__py3-none-any.whl → 0.1.48__py3-none-any.whl