PyPI - edsl - Versions diffs - 0.1.47__py3-none-any.whl → 0.1.49__py3-none-any.whl - Mend

edsl 0.1.47__py3-none-any.whl → 0.1.49__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (314) hide show

edsl/__init__.py +44 -39
edsl/__version__.py +1 -1
edsl/agents/__init__.py +4 -2
edsl/agents/{Agent.py → agent.py} +442 -152
edsl/agents/{AgentList.py → agent_list.py} +220 -162
edsl/agents/descriptors.py +46 -7
edsl/{exceptions/agents.py → agents/exceptions.py} +3 -12
edsl/base/__init__.py +75 -0
edsl/base/base_class.py +1303 -0
edsl/base/data_transfer_models.py +114 -0
edsl/base/enums.py +215 -0
edsl/base.py +8 -0
edsl/buckets/__init__.py +25 -0
edsl/buckets/bucket_collection.py +324 -0
edsl/buckets/model_buckets.py +206 -0
edsl/buckets/token_bucket.py +502 -0
edsl/{jobs/buckets/TokenBucketAPI.py → buckets/token_bucket_api.py} +1 -1
edsl/buckets/token_bucket_client.py +509 -0
edsl/caching/__init__.py +20 -0
edsl/caching/cache.py +814 -0
edsl/caching/cache_entry.py +427 -0
edsl/{data/CacheHandler.py → caching/cache_handler.py} +14 -15
edsl/caching/exceptions.py +24 -0
edsl/caching/orm.py +30 -0
edsl/{data/RemoteCacheSync.py → caching/remote_cache_sync.py} +3 -3
edsl/caching/sql_dict.py +441 -0
edsl/config/__init__.py +8 -0
edsl/config/config_class.py +177 -0
edsl/config.py +4 -176
edsl/conversation/Conversation.py +7 -7
edsl/conversation/car_buying.py +4 -4
edsl/conversation/chips.py +6 -6
edsl/coop/__init__.py +25 -2
edsl/coop/coop.py +311 -75
edsl/coop/{ExpectedParrotKeyHandler.py → ep_key_handling.py} +86 -10
edsl/coop/exceptions.py +62 -0
edsl/coop/price_fetcher.py +126 -0
edsl/coop/utils.py +89 -24
edsl/data_transfer_models.py +5 -72
edsl/dataset/__init__.py +10 -0
edsl/{results/Dataset.py → dataset/dataset.py} +116 -36
edsl/{results/DatasetExportMixin.py → dataset/dataset_operations_mixin.py} +606 -122
edsl/{results/DatasetTree.py → dataset/dataset_tree.py} +156 -75
edsl/{results/TableDisplay.py → dataset/display/table_display.py} +18 -7
edsl/{results → dataset/display}/table_renderers.py +58 -2
edsl/{results → dataset}/file_exports.py +4 -5
edsl/{results → dataset}/smart_objects.py +2 -2
edsl/enums.py +5 -205
edsl/inference_services/__init__.py +5 -0
edsl/inference_services/{AvailableModelCacheHandler.py → available_model_cache_handler.py} +2 -3
edsl/inference_services/{AvailableModelFetcher.py → available_model_fetcher.py} +8 -14
edsl/inference_services/data_structures.py +3 -2
edsl/{exceptions/inference_services.py → inference_services/exceptions.py} +1 -1
edsl/inference_services/{InferenceServiceABC.py → inference_service_abc.py} +1 -1
edsl/inference_services/{InferenceServicesCollection.py → inference_services_collection.py} +8 -7
edsl/inference_services/registry.py +4 -41
edsl/inference_services/{ServiceAvailability.py → service_availability.py} +5 -25
edsl/inference_services/services/__init__.py +31 -0
edsl/inference_services/{AnthropicService.py → services/anthropic_service.py} +3 -3
edsl/inference_services/{AwsBedrock.py → services/aws_bedrock.py} +2 -2
edsl/inference_services/{AzureAI.py → services/azure_ai.py} +2 -2
edsl/inference_services/{DeepInfraService.py → services/deep_infra_service.py} +1 -3
edsl/inference_services/{DeepSeekService.py → services/deep_seek_service.py} +2 -4
edsl/inference_services/{GoogleService.py → services/google_service.py} +5 -4
edsl/inference_services/{GroqService.py → services/groq_service.py} +1 -1
edsl/inference_services/{MistralAIService.py → services/mistral_ai_service.py} +3 -3
edsl/inference_services/{OllamaService.py → services/ollama_service.py} +1 -7
edsl/inference_services/{OpenAIService.py → services/open_ai_service.py} +5 -6
edsl/inference_services/{PerplexityService.py → services/perplexity_service.py} +3 -7
edsl/inference_services/{TestService.py → services/test_service.py} +7 -6
edsl/inference_services/{TogetherAIService.py → services/together_ai_service.py} +2 -6
edsl/inference_services/{XAIService.py → services/xai_service.py} +1 -1
edsl/inference_services/write_available.py +1 -2
edsl/instructions/__init__.py +6 -0
edsl/{surveys/instructions/Instruction.py → instructions/instruction.py} +11 -6
edsl/{surveys/instructions/InstructionCollection.py → instructions/instruction_collection.py} +10 -5
edsl/{surveys/InstructionHandler.py → instructions/instruction_handler.py} +3 -3
edsl/{jobs/interviews → interviews}/ReportErrors.py +2 -2
edsl/interviews/__init__.py +4 -0
edsl/{jobs/AnswerQuestionFunctionConstructor.py → interviews/answering_function.py} +45 -18
edsl/{jobs/interviews/InterviewExceptionEntry.py → interviews/exception_tracking.py} +107 -22
edsl/interviews/interview.py +638 -0
edsl/{jobs/interviews/InterviewStatusDictionary.py → interviews/interview_status_dictionary.py} +21 -12
edsl/{jobs/interviews/InterviewStatusLog.py → interviews/interview_status_log.py} +16 -7
edsl/{jobs/InterviewTaskManager.py → interviews/interview_task_manager.py} +12 -7
edsl/{jobs/RequestTokenEstimator.py → interviews/request_token_estimator.py} +8 -3
edsl/{jobs/interviews/InterviewStatistic.py → interviews/statistics.py} +36 -10
edsl/invigilators/__init__.py +38 -0
edsl/invigilators/invigilator_base.py +477 -0
edsl/{agents/Invigilator.py → invigilators/invigilators.py} +263 -10
edsl/invigilators/prompt_constructor.py +476 -0
edsl/{agents → invigilators}/prompt_helpers.py +2 -1
edsl/{agents/QuestionInstructionPromptBuilder.py → invigilators/question_instructions_prompt_builder.py} +18 -13
edsl/{agents → invigilators}/question_option_processor.py +96 -21
edsl/{agents/QuestionTemplateReplacementsBuilder.py → invigilators/question_template_replacements_builder.py} +64 -12
edsl/jobs/__init__.py +7 -1
edsl/jobs/async_interview_runner.py +99 -35
edsl/jobs/check_survey_scenario_compatibility.py +7 -5
edsl/jobs/data_structures.py +153 -22
edsl/{exceptions/jobs.py → jobs/exceptions.py} +2 -1
edsl/jobs/{FetchInvigilator.py → fetch_invigilator.py} +4 -4
edsl/jobs/{loggers/HTMLTableJobLogger.py → html_table_job_logger.py} +6 -2
edsl/jobs/{Jobs.py → jobs.py} +313 -167
edsl/jobs/{JobsChecks.py → jobs_checks.py} +15 -7
edsl/jobs/{JobsComponentConstructor.py → jobs_component_constructor.py} +19 -17
edsl/jobs/{InterviewsConstructor.py → jobs_interview_constructor.py} +10 -5
edsl/jobs/jobs_pricing_estimation.py +347 -0
edsl/jobs/{JobsRemoteInferenceLogger.py → jobs_remote_inference_logger.py} +4 -3
edsl/jobs/jobs_runner_asyncio.py +282 -0
edsl/jobs/{JobsRemoteInferenceHandler.py → remote_inference.py} +19 -22
edsl/jobs/results_exceptions_handler.py +2 -2
edsl/key_management/__init__.py +28 -0
edsl/key_management/key_lookup.py +161 -0
edsl/{language_models/key_management/KeyLookupBuilder.py → key_management/key_lookup_builder.py} +118 -47
edsl/key_management/key_lookup_collection.py +82 -0
edsl/key_management/models.py +218 -0
edsl/language_models/__init__.py +7 -2
edsl/language_models/{ComputeCost.py → compute_cost.py} +18 -3
edsl/{exceptions/language_models.py → language_models/exceptions.py} +2 -1
edsl/language_models/language_model.py +1080 -0
edsl/language_models/model.py +10 -25
edsl/language_models/{ModelList.py → model_list.py} +9 -14
edsl/language_models/{RawResponseHandler.py → raw_response_handler.py} +1 -1
edsl/language_models/{RegisterLanguageModelsMeta.py → registry.py} +1 -1
edsl/language_models/repair.py +4 -4
edsl/language_models/utilities.py +4 -4
edsl/notebooks/__init__.py +3 -1
edsl/notebooks/{Notebook.py → notebook.py} +7 -8
edsl/prompts/__init__.py +1 -1
edsl/{exceptions/prompts.py → prompts/exceptions.py} +3 -1
edsl/prompts/{Prompt.py → prompt.py} +101 -95
edsl/questions/HTMLQuestion.py +1 -1
edsl/questions/__init__.py +154 -25
edsl/questions/answer_validator_mixin.py +1 -1
edsl/questions/compose_questions.py +4 -3
edsl/questions/derived/question_likert_five.py +166 -0
edsl/questions/derived/{QuestionLinearScale.py → question_linear_scale.py} +4 -4
edsl/questions/derived/{QuestionTopK.py → question_top_k.py} +4 -4
edsl/questions/derived/{QuestionYesNo.py → question_yes_no.py} +4 -5
edsl/questions/descriptors.py +24 -30
edsl/questions/loop_processor.py +65 -19
edsl/questions/question_base.py +881 -0
edsl/questions/question_base_gen_mixin.py +15 -16
edsl/questions/{QuestionBasePromptsMixin.py → question_base_prompts_mixin.py} +2 -2
edsl/questions/{QuestionBudget.py → question_budget.py} +3 -4
edsl/questions/{QuestionCheckBox.py → question_check_box.py} +16 -16
edsl/questions/{QuestionDict.py → question_dict.py} +39 -5
edsl/questions/{QuestionExtract.py → question_extract.py} +9 -9
edsl/questions/question_free_text.py +282 -0
edsl/questions/{QuestionFunctional.py → question_functional.py} +6 -5
edsl/questions/{QuestionList.py → question_list.py} +6 -7
edsl/questions/{QuestionMatrix.py → question_matrix.py} +6 -5
edsl/questions/{QuestionMultipleChoice.py → question_multiple_choice.py} +126 -21
edsl/questions/{QuestionNumerical.py → question_numerical.py} +5 -5
edsl/questions/{QuestionRank.py → question_rank.py} +6 -6
edsl/questions/question_registry.py +4 -9
edsl/questions/register_questions_meta.py +8 -4
edsl/questions/response_validator_abc.py +17 -16
edsl/results/__init__.py +4 -1
edsl/{exceptions/results.py → results/exceptions.py} +1 -1
edsl/results/report.py +197 -0
edsl/results/{Result.py → result.py} +131 -45
edsl/results/{Results.py → results.py} +365 -220
edsl/results/results_selector.py +344 -25
edsl/scenarios/__init__.py +30 -3
edsl/scenarios/{ConstructDownloadLink.py → construct_download_link.py} +7 -0
edsl/scenarios/directory_scanner.py +156 -13
edsl/scenarios/document_chunker.py +186 -0
edsl/scenarios/exceptions.py +101 -0
edsl/scenarios/file_methods.py +2 -3
edsl/scenarios/{FileStore.py → file_store.py} +275 -189
edsl/scenarios/handlers/__init__.py +14 -14
edsl/scenarios/handlers/{csv.py → csv_file_store.py} +1 -2
edsl/scenarios/handlers/{docx.py → docx_file_store.py} +8 -7
edsl/scenarios/handlers/{html.py → html_file_store.py} +1 -2
edsl/scenarios/handlers/{jpeg.py → jpeg_file_store.py} +1 -1
edsl/scenarios/handlers/{json.py → json_file_store.py} +1 -1
edsl/scenarios/handlers/latex_file_store.py +5 -0
edsl/scenarios/handlers/{md.py → md_file_store.py} +1 -1
edsl/scenarios/handlers/{pdf.py → pdf_file_store.py} +2 -2
edsl/scenarios/handlers/{png.py → png_file_store.py} +1 -1
edsl/scenarios/handlers/{pptx.py → pptx_file_store.py} +8 -7
edsl/scenarios/handlers/{py.py → py_file_store.py} +1 -3
edsl/scenarios/handlers/{sql.py → sql_file_store.py} +2 -1
edsl/scenarios/handlers/{sqlite.py → sqlite_file_store.py} +2 -3
edsl/scenarios/handlers/{txt.py → txt_file_store.py} +1 -1
edsl/scenarios/scenario.py +928 -0
edsl/scenarios/scenario_join.py +18 -5
edsl/scenarios/{ScenarioList.py → scenario_list.py} +294 -106
edsl/scenarios/{ScenarioListPdfMixin.py → scenario_list_pdf_tools.py} +16 -15
edsl/scenarios/scenario_selector.py +5 -1
edsl/study/ObjectEntry.py +2 -2
edsl/study/SnapShot.py +5 -5
edsl/study/Study.py +18 -19
edsl/study/__init__.py +6 -4
edsl/surveys/__init__.py +7 -4
edsl/surveys/dag/__init__.py +2 -0
edsl/surveys/{ConstructDAG.py → dag/construct_dag.py} +3 -3
edsl/surveys/{DAG.py → dag/dag.py} +13 -10
edsl/surveys/descriptors.py +1 -1
edsl/surveys/{EditSurvey.py → edit_survey.py} +9 -9
edsl/{exceptions/surveys.py → surveys/exceptions.py} +1 -2
edsl/surveys/memory/__init__.py +3 -0
edsl/surveys/{MemoryPlan.py → memory/memory_plan.py} +10 -9
edsl/surveys/rules/__init__.py +3 -0
edsl/surveys/{Rule.py → rules/rule.py} +103 -43
edsl/surveys/{RuleCollection.py → rules/rule_collection.py} +21 -30
edsl/surveys/{RuleManager.py → rules/rule_manager.py} +19 -13
edsl/surveys/survey.py +1743 -0
edsl/surveys/{SurveyExportMixin.py → survey_export.py} +22 -27
edsl/surveys/{SurveyFlowVisualization.py → survey_flow_visualization.py} +11 -2
edsl/surveys/{Simulator.py → survey_simulator.py} +10 -3
edsl/tasks/__init__.py +32 -0
edsl/{jobs/tasks/QuestionTaskCreator.py → tasks/question_task_creator.py} +115 -57
edsl/tasks/task_creators.py +135 -0
edsl/{jobs/tasks/TaskHistory.py → tasks/task_history.py} +86 -47
edsl/{jobs/tasks → tasks}/task_status_enum.py +91 -7
edsl/tasks/task_status_log.py +85 -0
edsl/tokens/__init__.py +2 -0
edsl/tokens/interview_token_usage.py +53 -0
edsl/utilities/PrettyList.py +1 -1
edsl/utilities/SystemInfo.py +25 -22
edsl/utilities/__init__.py +29 -21
edsl/utilities/gcp_bucket/__init__.py +2 -0
edsl/utilities/gcp_bucket/cloud_storage.py +99 -96
edsl/utilities/interface.py +44 -536
edsl/{results/MarkdownToPDF.py → utilities/markdown_to_pdf.py} +13 -5
edsl/utilities/repair_functions.py +1 -1
{edsl-0.1.47.dist-info → edsl-0.1.49.dist-info}/METADATA +1 -1
edsl-0.1.49.dist-info/RECORD +347 -0
edsl/Base.py +0 -493
edsl/BaseDiff.py +0 -260
edsl/agents/InvigilatorBase.py +0 -260
edsl/agents/PromptConstructor.py +0 -318
edsl/coop/PriceFetcher.py +0 -54
edsl/data/Cache.py +0 -582
edsl/data/CacheEntry.py +0 -238
edsl/data/SQLiteDict.py +0 -292
edsl/data/__init__.py +0 -5
edsl/data/orm.py +0 -10
edsl/exceptions/cache.py +0 -5
edsl/exceptions/coop.py +0 -14
edsl/exceptions/data.py +0 -14
edsl/exceptions/scenarios.py +0 -29
edsl/jobs/Answers.py +0 -43
edsl/jobs/JobsPrompts.py +0 -354
edsl/jobs/buckets/BucketCollection.py +0 -134
edsl/jobs/buckets/ModelBuckets.py +0 -65
edsl/jobs/buckets/TokenBucket.py +0 -283
edsl/jobs/buckets/TokenBucketClient.py +0 -191
edsl/jobs/interviews/Interview.py +0 -395
edsl/jobs/interviews/InterviewExceptionCollection.py +0 -99
edsl/jobs/interviews/InterviewStatisticsCollection.py +0 -25
edsl/jobs/runners/JobsRunnerAsyncio.py +0 -163
edsl/jobs/runners/JobsRunnerStatusData.py +0 -0
edsl/jobs/tasks/TaskCreators.py +0 -64
edsl/jobs/tasks/TaskStatusLog.py +0 -23
edsl/jobs/tokens/InterviewTokenUsage.py +0 -27
edsl/language_models/LanguageModel.py +0 -635
edsl/language_models/ServiceDataSources.py +0 -0
edsl/language_models/key_management/KeyLookup.py +0 -63
edsl/language_models/key_management/KeyLookupCollection.py +0 -38
edsl/language_models/key_management/models.py +0 -137
edsl/questions/QuestionBase.py +0 -544
edsl/questions/QuestionFreeText.py +0 -130
edsl/questions/derived/QuestionLikertFive.py +0 -76
edsl/results/ResultsExportMixin.py +0 -45
edsl/results/TextEditor.py +0 -50
edsl/results/results_fetch_mixin.py +0 -33
edsl/results/results_tools_mixin.py +0 -98
edsl/scenarios/DocumentChunker.py +0 -104
edsl/scenarios/Scenario.py +0 -548
edsl/scenarios/ScenarioHtmlMixin.py +0 -65
edsl/scenarios/ScenarioListExportMixin.py +0 -45
edsl/scenarios/handlers/latex.py +0 -5
edsl/shared.py +0 -1
edsl/surveys/Survey.py +0 -1301
edsl/surveys/SurveyQualtricsImport.py +0 -284
edsl/surveys/SurveyToApp.py +0 -141
edsl/surveys/instructions/__init__.py +0 -0
edsl/tools/__init__.py +0 -1
edsl/tools/clusters.py +0 -192
edsl/tools/embeddings.py +0 -27
edsl/tools/embeddings_plotting.py +0 -118
edsl/tools/plotting.py +0 -112
edsl/tools/summarize.py +0 -18
edsl/utilities/data/Registry.py +0 -6
edsl/utilities/data/__init__.py +0 -1
edsl/utilities/data/scooter_results.json +0 -1
edsl-0.1.47.dist-info/RECORD +0 -354
/edsl/coop/{CoopFunctionsMixin.py → coop_functions.py} +0 -0
/edsl/{results → dataset/display}/CSSParameterizer.py +0 -0
/edsl/{language_models/key_management → dataset/display}/__init__.py +0 -0
/edsl/{results → dataset/display}/table_data_class.py +0 -0
/edsl/{results → dataset/display}/table_display.css +0 -0
/edsl/{results/ResultsGGMixin.py → dataset/r/ggplot.py} +0 -0
/edsl/{results → dataset}/tree_explore.py +0 -0
/edsl/{surveys/instructions/ChangeInstruction.py → instructions/change_instruction.py} +0 -0
/edsl/{jobs/interviews → interviews}/interview_status_enum.py +0 -0
/edsl/jobs/{runners/JobsRunnerStatus.py → jobs_runner_status.py} +0 -0
/edsl/language_models/{PriceManager.py → price_manager.py} +0 -0
/edsl/language_models/{fake_openai_call.py → unused/fake_openai_call.py} +0 -0
/edsl/language_models/{fake_openai_service.py → unused/fake_openai_service.py} +0 -0
/edsl/notebooks/{NotebookToLaTeX.py → notebook_to_latex.py} +0 -0
/edsl/{exceptions/questions.py → questions/exceptions.py} +0 -0
/edsl/questions/{SimpleAskMixin.py → simple_ask_mixin.py} +0 -0
/edsl/surveys/{Memory.py → memory/memory.py} +0 -0
/edsl/surveys/{MemoryManagement.py → memory/memory_management.py} +0 -0
/edsl/surveys/{SurveyCSS.py → survey_css.py} +0 -0
/edsl/{jobs/tokens/TokenUsage.py → tokens/token_usage.py} +0 -0
/edsl/{results/MarkdownToDocx.py → utilities/markdown_to_docx.py} +0 -0
/edsl/{TemplateLoader.py → utilities/template_loader.py} +0 -0
{edsl-0.1.47.dist-info → edsl-0.1.49.dist-info}/LICENSE +0 -0
{edsl-0.1.47.dist-info → edsl-0.1.49.dist-info}/WHEEL +0 -0

edsl/surveys/{SurveyExportMixin.py → survey_export.py} RENAMED Viewed

@@ -1,4 +1,4 @@
-"""A mixin class for exporting surveys to different formats."""
+"""A class for exporting surveys to different formats."""
 from typing import Union, Optional
@@ -24,11 +24,15 @@ def open_docx(file_path):
         subprocess.call(("xdg-open", file_path))
-class SurveyExportMixin:
-    """A mixin class for exporting surveys to different formats."""
+class SurveyExport:
+    """A class for exporting surveys to different formats."""
+    def __init__(self, survey):
+        """Initialize with a Survey object."""
+        self.survey = survey
     def css(self):
-        from edsl.surveys.SurveyCSS import SurveyCSS
+        from .survey_css import SurveyCSS
         return SurveyCSS.default_style().generate_css()
@@ -36,7 +40,7 @@ class SurveyExportMixin:
         """Return the description of the survey."""
         from edsl import QuestionFreeText
-        question_texts = "\n".join([q.question_text for q in self._questions])
+        question_texts = "\n".join([q.question_text for q in self.survey._questions])
         q = QuestionFreeText(
             question_name="description",
             question_text=f"""A survey was conducted with the following questions:
@@ -58,7 +62,7 @@ class SurveyExportMixin:
         doc = Document()
         doc.add_heading("EDSL Survey")
         doc.add_paragraph(f"\n")
-        for index, question in enumerate(self._questions):
+        for index, question in enumerate(self.survey._questions):
             h = doc.add_paragraph()  # Add question as a paragraph
             h.add_run(f"Question {index + 1} ({question.question_name})").bold = True
             h.add_run(f"; {question.question_type}").italic = True
@@ -72,20 +76,13 @@ class SurveyExportMixin:
                     for option in getattr(question, "question_options", []):
                         doc.add_paragraph(str(option), style="ListBullet")
-        if return_document_object and filename is None:
+        if return_document_object:
             return doc
-        if filename is None:
-            with tempfile.NamedTemporaryFile(
-                "w", delete=False, suffix=".docx", dir=os.getcwd()
-            ) as f:
-                filename = f.name
-        doc.save(filename)
-        print("The survey has been saved to", filename)
-        if open_file:
-            open_docx(filename)
-        return
+        else:
+            doc.save(filename)
+            if open_file:
+                os.system(f"open {filename}")
+            return None
     def show(self):
         self.to_scenario_list(questions_only=False, rename=True).print(format="rich")
@@ -93,14 +90,12 @@ class SurveyExportMixin:
     def to_scenario_list(
         self, questions_only: bool = True, rename=False
     ) -> "ScenarioList":
-        from edsl import ScenarioList, Scenario
-        # from edsl.questions import QuestionBase
+        from ..scenarios import ScenarioList, Scenario
         if questions_only:
-            to_iterate_over = self._questions
+            to_iterate_over = self.survey._questions
         else:
-            to_iterate_over = self.recombined_questions_and_instructions()
+            to_iterate_over = self.survey.recombined_questions_and_instructions()
         if rename:
             renaming_dict = {
@@ -150,13 +145,13 @@ class SurveyExportMixin:
         header_lines = ["from edsl.surveys.Survey import Survey"]
         header_lines.append("from edsl import Question")
         lines = ["\n".join(header_lines)]
-        for question in self._questions:
+        for question in self.survey._questions:
             question.question_text = question["question_text"].replace("\n", " ")
             # remove dublicate spaces
             question.question_text = " ".join(question.question_text.split())
             lines.append(f"{question.question_name} = " + repr(question))
         lines.append(
-            f"{survey_var_name} = Survey(questions = [{', '.join(self.question_names)}])"
+            f"{survey_var_name} = Survey(questions = [{', '.join(self.survey.question_names)}])"
         )
         # return lines
         code_string = "\n".join(lines)
@@ -216,7 +211,7 @@ class SurveyExportMixin:
         with open(filename, "w") as f:
             f.write(html_header)
-            for question in self._questions:
+            for question in self.survey._questions:
                 f.write(
                     question.html(
                         scenario=scenario, include_question_name=include_question_name

edsl/surveys/{SurveyFlowVisualization.py → survey_flow_visualization.py} RENAMED Viewed

@@ -47,7 +47,12 @@ class SurveyFlowVisualization:
                 for param in question.detailed_parameters:
                     if "agent." in param:
                         # Handle agent trait references
-                        trait_name = param.replace("agent.", "")
+                        #trait_name = param.replace("agent.", "")
+                        params_and_refs.add(param)
+                        if param not in param_to_questions:
+                            param_to_questions[param] = []
+                        param_to_questions[param].append(index)
+                    if "scenario." in param:
                         params_and_refs.add(param)
                         if param not in param_to_questions:
                             param_to_questions[param] = []
@@ -108,7 +113,7 @@ class SurveyFlowVisualization:
                     "label": f"Agent Trait\n{{{{ {param} }}}}"
                 })
             # Check if parameter exists in scenario
-            elif self.scenario and param in self.scenario:
+            elif self.scenario and param.startswith("scenario."):
                 node_attrs.update({
                     "fillcolor": "lightgreen",
                     "label": f"Scenario\n{{{{ {param} }}}}"
@@ -207,6 +212,10 @@ class SurveyFlowVisualization:
                     """File not found. Most likely it's because you don't have graphviz installed. Please install it and try again.
                         On Ubuntu, you can install it by running:
                         $ sudo apt-get install graphviz
+                        On Mac, you can install it by running:
+                        $ brew install graphviz
+                        On Windows, you can install it by running:
+                        $ choco install graphviz
                     """
                 )
             from edsl.utilities.is_notebook import is_notebook

edsl/surveys/{Simulator.py → survey_simulator.py} RENAMED Viewed

@@ -1,8 +1,15 @@
+from typing import TYPE_CHECKING
 from typing import Callable
+from edsl.agents import Agent
+#from edsl.surveys import Survey
+if TYPE_CHECKING:
+    from edsl.surveys import Survey
+    from edsl.results import Results
+    from edsl.questions import QuestionBase
 class Simulator:
-    def __init__(self, survey):
+    def __init__(self, survey: "Survey"):
         self.survey = survey
     @classmethod
@@ -10,7 +17,7 @@ class Simulator:
         """Create a random survey."""
         from edsl.questions import QuestionMultipleChoice, QuestionFreeText
         from random import choice
-        from edsl.surveys.Survey import Survey
+        from edsl.surveys import Survey
         num_questions = 10
         questions = []
@@ -57,7 +64,7 @@ class Simulator:
     def create_agent(self) -> "Agent":
         """Create an agent from the simulated answers."""
         answers_dict = self.survey.simulate()
-        from edsl.agents.Agent import Agent
+        from edsl.agents import Agent
         def construct_answer_dict_function(traits: dict) -> Callable:
             def func(self, question: "QuestionBase", scenario=None):

edsl/tasks/__init__.py ADDED Viewed

@@ -0,0 +1,32 @@
+"""
+The tasks module provides EDSL's task management system for tracking and controlling
+interview execution.
+This module implements a comprehensive system for creating, scheduling, executing, and
+monitoring tasks in EDSL. Tasks represent individual units of work, typically answering
+a question with an LLM, with features for dependency management, error handling, and
+execution status tracking.
+Key components:
+1. TaskHistory - Records and analyzes the execution history of tasks with error reporting
+2. QuestionTaskCreator - Creates and manages tasks for individual questions
+3. TaskCreators - Manages collections of tasks for an entire interview
+4. TaskStatus - Enumeration of possible task states (running, waiting, success, etc.)
+5. TaskStatusLog - Records the status changes of tasks over time
+The tasks system helps EDSL manage complex interview workflows by:
+- Handling dependencies between questions
+- Managing API rate limits and token usage
+- Providing detailed execution metrics
+- Generating error reports and visualizations
+- Supporting both synchronous and asynchronous execution
+For most users, this module works behind the scenes, but understanding it can
+be helpful when debugging or optimizing complex EDSL workflows.
+"""
+from .task_history import TaskHistory
+from .question_task_creator import QuestionTaskCreator
+from .task_creators import TaskCreators
+from .task_status_enum import TaskStatus, TaskStatusDescriptor

edsl/{jobs/tasks/QuestionTaskCreator.py → tasks/question_task_creator.py} RENAMED Viewed

@@ -1,34 +1,77 @@
+"""
+This module provides the QuestionTaskCreator class for executing individual questions as tasks.
+The QuestionTaskCreator is responsible for executing a single question within the EDSL system.
+It manages the entire lifecycle of a question task, including dependency resolution, rate
+limiting, token management, execution, and status tracking. It serves as the fundamental
+execution unit in EDSL's task system.
+"""
 import asyncio
-from typing import Callable, Union, List, TYPE_CHECKING
+from typing import Callable, Union, List, Dict, Any, Optional, TYPE_CHECKING
 from collections import UserList, UserDict
-from edsl.exceptions.jobs import InterviewErrorPriorTaskCanceled
+from ..jobs.exceptions import InterviewErrorPriorTaskCanceled
+from ..tokens import TokenUsage
+from ..data_transfer_models import Answers
-from edsl.jobs.tasks.task_status_enum import TaskStatus, TaskStatusDescriptor
-from edsl.jobs.tasks.TaskStatusLog import TaskStatusLog
-from edsl.jobs.tokens.TokenUsage import TokenUsage
-from edsl.jobs.Answers import Answers
+from .task_status_enum import TaskStatus, TaskStatusDescriptor
+from .task_status_log import TaskStatusLog
 if TYPE_CHECKING:
-    from edsl.questions.QuestionBase import QuestionBase
-    from edsl.jobs.buckets import ModelBuckets
+    from ..questions import QuestionBase
+    from ..buckets import ModelBuckets
 class TokensUsed(UserDict):
-    """ "Container for tokens used by a task."""
+    """
+    Container for tracking token usage for a task, separating cached and new tokens.
+    This class provides a structured way to track token usage for a single task,
+    distinguishing between tokens reused from cache and tokens freshly generated.
+    It uses a UserDict interface for convenient access to the underlying data.
+    Attributes:
+        cached_tokens: TokenUsage object tracking reused tokens from cache
+        new_tokens: TokenUsage object tracking freshly generated tokens
+    """
-    def __init__(self, cached_tokens, new_tokens):
+    def __init__(self, cached_tokens: TokenUsage, new_tokens: TokenUsage):
+        """
+        Initialize a TokensUsed container.
+        Parameters:
+            cached_tokens: TokenUsage object for tokens reused from cache
+            new_tokens: TokenUsage object for newly generated tokens
+        """
         d = {"cached_tokens": cached_tokens, "new_tokens": new_tokens}
         super().__init__(d)
 class QuestionTaskCreator(UserList):
-    """Class to create and manage a single question and its dependencies.
-    It is a UserList with all the tasks that must be completed before the focal task can be run.
-    The focal task is the question that we are interested in answering.
     """
+    Creates and manages the execution of a single question as an asyncio task.
+    The QuestionTaskCreator is a fundamental component of EDSL's task system,
+    responsible for executing a single question with its dependencies. It extends
+    UserList to maintain a list of dependent tasks that must complete before this
+    task can execute.
+    Key responsibilities:
+    1. Task Dependency Management - Tracks prerequisite tasks that must complete first
+    2. Resource Management - Handles rate limiting and token quota management
+    3. Task Status Tracking - Monitors and logs task state transitions
+    4. Token Usage Tracking - Records token consumption for both cached and new tokens
+    5. Task Execution - Runs the question answering function when dependencies are met
+    The class follows the state machine pattern, with task_status transitioning through
+    various TaskStatus states (NOT_STARTED, WAITING_FOR_DEPENDENCIES, etc.) as execution
+    progresses. All status changes are automatically logged to enable detailed analysis
+    and visualization.
+    This class is designed to work with asyncio for concurrent task execution, enabling
+    efficient processing of interviews with multiple questions and dependencies.
+    """
     task_status = TaskStatusDescriptor()
     def __init__(
@@ -37,17 +80,24 @@ class QuestionTaskCreator(UserList):
         question: "QuestionBase",
         answer_question_func: Callable,
         model_buckets: "ModelBuckets",
-        token_estimator: Union[Callable, None] = None,
+        token_estimator: Optional[Callable] = None,
         iteration: int = 0,
     ):
-        """Initialize the QuestionTaskCreator instance.
-        :param question: the question that we are interested in answering.
-        :param answer_question_func: the function that will answer the question.
-        :param model_buckets: the bucket collection that contains the requests and tokens buckets which control the rate of API calls and token usage.
-        :param token_estimator: a function that estimates the number of tokens required to answer the question.
-        :param iteration: the iteration number of the question.
+        """
+        Initialize a QuestionTaskCreator for a specific question.
+        Parameters:
+            question: The Question object to be answered
+            answer_question_func: Function that will execute the LLM call to answer the question
+            model_buckets: Container for rate limiting buckets (requests and tokens)
+            token_estimator: Function to estimate token usage for the question (for quota management)
+            iteration: The iteration number of this question (for repeated questions)
+        Notes:
+            - The QuestionTaskCreator starts in the NOT_STARTED state
+            - Dependencies can be added after initialization with add_dependency()
+            - Token usage is tracked separately for cached vs. new tokens
+            - This class works with asyncio for concurrent execution
         """
         super().__init__([])
         self.answer_question_func = answer_question_func
@@ -159,8 +209,8 @@ class QuestionTaskCreator(UserList):
     @classmethod
     def example(cls):
         """Return an example instance of the class."""
-        from edsl.questions.QuestionFreeText import QuestionFreeText
-        from edsl.jobs.buckets.ModelBuckets import ModelBuckets
+        from ..questions import QuestionFreeText
+        from ..buckets import ModelBuckets
         m = ModelBuckets.infinity_bucket()
@@ -180,37 +230,45 @@ class QuestionTaskCreator(UserList):
             iteration=0,
         )
-    async def _run_task_async(self) -> None:
-        """Run the task asynchronously, awaiting the tasks that must be completed before this one can be run.
-        >>> qt1 = QuestionTaskCreator.example()
-        >>> qt2 = QuestionTaskCreator.example()
-        >>> qt2.add_dependency(qt1)
-        The method follows these steps:
-            1. Set the task_status to TaskStatus.WAITING_FOR_DEPENDENCIES, indicating that the task is waiting for its dependencies to complete.
-            2. Await asyncio.gather(*self, return_exceptions=True) to run all the dependent tasks concurrently.
-            - the return_exceptions=True flag ensures that the task does not raise an exception if any of the dependencies fail.
-            3. If any of the dependencies raise an exception:
-            - If it is a CancelledError, set the current task's task_status to TaskStatus.CANCELLED, and re-raise the CancelledError,
-                terminating the execution of the current task.
-            - If it is any other exception, set the task_status to TaskStatus.PARENT_FAILED, and raise a custom exception
-                InterviewErrorPriorTaskCanceled with the original exception as the cause, terminating the execution of the current task.
-            4. If all the dependencies complete successfully without raising any exceptions, the code reaches the else block.
-            5. In the else block, run the focal task (self._run_focal_task(debug)).
-            If any of the dependencies fail (raise an exception), the focal task will not run. The execution will be terminated,
-            and an exception will be raised to indicate the failure of the dependencies.
-            The focal task (self._run_focal_task(debug)) is only executed if all the dependencies complete successfully.
-            Args:
-                debug: A boolean value indicating whether to run the task in debug mode.
-            Returns:
-                None
+    async def _run_task_async(self) -> Answers:
+        """
+        Execute the task with its dependencies in an async workflow.
+        This method implements the core task execution logic with dependency handling.
+        It manages the complete lifecycle of a task:
+        1. Waiting for dependencies to complete
+        2. Handling dependency failures appropriately
+        3. Executing the task itself when dependencies are satisfied
+        4. Tracking status transitions throughout execution
+        The method maintains the state machine pattern by updating task_status
+        at each stage of execution, allowing for detailed monitoring and visualization
+        of task progress.
+        Returns:
+            Answers object containing the question's answer and metadata
+        Raises:
+            asyncio.CancelledError: If the task or one of its dependencies is cancelled
+            InterviewErrorPriorTaskCanceled: If any dependency task fails with a non-cancellation exception
+        Example:
+            >>> qt1 = QuestionTaskCreator.example()
+            >>> qt2 = QuestionTaskCreator.example()
+            >>> qt2.add_dependency(qt1)
+        Implementation details:
+        1. Set status to WAITING_FOR_DEPENDENCIES and await all dependencies
+           - Using gather with return_exceptions=True returns dependency exceptions as results instead of raising them
+        2. Check dependency results for exceptions:
+           - If CancelledError: Set status to CANCELLED and propagate the cancellation
+           - If other exception: Set status to PARENT_FAILED and wrap in InterviewErrorPriorTaskCanceled
+        3. If all dependencies succeed, execute the focal task (_run_focal_task)
+           - The focal task handles its own status transitions during execution
         """
         try:
             self.task_status = TaskStatus.WAITING_FOR_DEPENDENCIES

edsl/tasks/task_creators.py ADDED Viewed

@@ -0,0 +1,135 @@
+"""
+This module provides the TaskCreators class, which manages all task creators for an interview.
+The TaskCreators class maintains a dictionary of QuestionTaskCreator objects, each responsible
+for executing a single question within an interview. It aggregates status and token usage
+information across all tasks, providing a complete view of interview execution.
+"""
+from typing import Callable, Union, List, Dict, TYPE_CHECKING
+from collections import UserDict
+if TYPE_CHECKING:
+    from ..tokens import TokenUsage
+    from ..tokens import InterviewTokenUsage
+    from ..interviews import InterviewStatusDictionary
+    from .task_status_log import TaskStatusLog
+    from .question_task_creator import QuestionTaskCreator
+class TaskCreators(UserDict):
+    """
+    A collection manager for all question tasks within an interview.
+    The TaskCreators class maintains a dictionary of QuestionTaskCreator objects,
+    where each key is a question name and each value is the corresponding task creator.
+    This class provides methods to aggregate information across all tasks, such as
+    token usage and status counts, enabling a holistic view of interview execution.
+    In the EDSL architecture, an interview consists of multiple questions, each executed
+    as a separate task. The TaskCreators class helps track and manage these tasks,
+    maintaining their execution status and resource usage.
+    Key features:
+    - Maintains a mapping of question names to their task creators
+    - Aggregates token usage across all tasks
+    - Tracks the status of all tasks in the interview
+    - Provides access to status logs for visualization and analysis
+    This class is typically used by the Interview class to manage task execution
+    and track the overall status of the interview.
+    """
+    def __init__(self, *args, **kwargs):
+        super().__init__(*args, **kwargs)
+    @property
+    def token_usage(self) -> 'InterviewTokenUsage':
+        """
+        Calculate the total token usage across all tasks in the interview.
+        This property aggregates token usage statistics from all task creators,
+        separating cached tokens (reused from cache) from new tokens (freshly generated).
+        The resulting InterviewTokenUsage object provides a complete picture of token
+        consumption for the entire interview.
+        Returns:
+            An InterviewTokenUsage object containing:
+            - Cached token usage (tokens reused from cache)
+            - New token usage (tokens freshly generated)
+        Notes:
+            - This is useful for cost estimation and quota management
+            - The separation of cached vs. new tokens helps analyze caching effectiveness
+            - Token usage is tracked separately for prompts and completions
+        """
+        from ..tokens import TokenUsage
+        from ..tokens import InterviewTokenUsage
+        cached_tokens = TokenUsage(from_cache=True)
+        new_tokens = TokenUsage(from_cache=False)
+        for task_creator in self.values():
+            token_usage = task_creator.token_usage()
+            cached_tokens += token_usage["cached_tokens"]
+            new_tokens += token_usage["new_tokens"]
+        return InterviewTokenUsage(
+            new_token_usage=new_tokens, cached_token_usage=cached_tokens
+        )
+    @property
+    def interview_status(self) -> 'InterviewStatusDictionary':
+        """
+        Get a summary of task statuses across the entire interview.
+        This property counts how many tasks are in each possible status state,
+        providing a snapshot of the interview's current execution state. The
+        resulting InterviewStatusDictionary maps each TaskStatus to a count
+        of tasks in that state, plus a special 'number_from_cache' counter.
+        Returns:
+            An InterviewStatusDictionary with counts for each task status
+        Notes:
+            - Used for monitoring interview progress
+            - Helps identify bottlenecks (many tasks waiting for capacity)
+            - Tracks cache utilization via the 'number_from_cache' count
+            - Useful for status dashboards and progress reporting
+        Example:
+            >>> t = TaskCreators()
+            >>> status = t.interview_status
+            >>> 'number_from_cache' in status
+            True
+            >>> status['number_from_cache']  # Check the cache count
+            0
+        """
+        from ..interviews import InterviewStatusDictionary
+        status_dict = InterviewStatusDictionary()
+        for task_creator in self.values():
+            status_dict[task_creator.task_status] += 1
+            status_dict["number_from_cache"] += task_creator.from_cache
+        return status_dict
+    def status_logs(self) -> List['TaskStatusLog']:
+        """
+        Get all task status logs for the interview.
+        This method collects the status logs from all task creators, providing
+        a complete history of status changes for every task in the interview.
+        The resulting list can be used for detailed analysis of task execution
+        patterns, timing, and visualization.
+        Returns:
+            A list of TaskStatusLog objects, one for each task in the interview
+        Notes:
+            - Used by visualization tools like task timeline charts
+            - Helpful for performance analysis and bottleneck identification
+            - Provides data for execution reports and dashboards
+        """
+        return [task_creator.status_log for task_creator in self.values()]
+if __name__ == "__main__":
+    import doctest
+    doctest.testmod(optionflags=doctest.ELLIPSIS)

edsl 0.1.47__py3-none-any.whl → 0.1.49__py3-none-any.whl

edsl 0.1.47__py3-none-any.whl → 0.1.49__py3-none-any.whl