PyPI - edsl - Versions diffs - 0.1.47__py3-none-any.whl → 0.1.48__py3-none-any.whl - Mend

edsl 0.1.47py3-none-any.whl → 0.1.48py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (314) hide show

edsl/__init__.py +44 -39
edsl/__version__.py +1 -1
edsl/agents/__init__.py +4 -2
edsl/agents/{Agent.py → agent.py} +442 -152
edsl/agents/{AgentList.py → agent_list.py} +220 -162
edsl/agents/descriptors.py +46 -7
edsl/{exceptions/agents.py → agents/exceptions.py} +3 -12
edsl/base/__init__.py +75 -0
edsl/base/base_class.py +1303 -0
edsl/base/data_transfer_models.py +114 -0
edsl/base/enums.py +215 -0
edsl/base.py +8 -0
edsl/buckets/__init__.py +25 -0
edsl/buckets/bucket_collection.py +324 -0
edsl/buckets/model_buckets.py +206 -0
edsl/buckets/token_bucket.py +502 -0
edsl/{jobs/buckets/TokenBucketAPI.py → buckets/token_bucket_api.py} +1 -1
edsl/buckets/token_bucket_client.py +509 -0
edsl/caching/__init__.py +20 -0
edsl/caching/cache.py +814 -0
edsl/caching/cache_entry.py +427 -0
edsl/{data/CacheHandler.py → caching/cache_handler.py} +14 -15
edsl/caching/exceptions.py +24 -0
edsl/caching/orm.py +30 -0
edsl/{data/RemoteCacheSync.py → caching/remote_cache_sync.py} +3 -3
edsl/caching/sql_dict.py +441 -0
edsl/config/__init__.py +8 -0
edsl/config/config_class.py +177 -0
edsl/config.py +4 -176
edsl/conversation/Conversation.py +7 -7
edsl/conversation/car_buying.py +4 -4
edsl/conversation/chips.py +6 -6
edsl/coop/__init__.py +25 -2
edsl/coop/coop.py +303 -67
edsl/coop/{ExpectedParrotKeyHandler.py → ep_key_handling.py} +86 -10
edsl/coop/exceptions.py +62 -0
edsl/coop/price_fetcher.py +126 -0
edsl/coop/utils.py +89 -24
edsl/data_transfer_models.py +5 -72
edsl/dataset/__init__.py +10 -0
edsl/{results/Dataset.py → dataset/dataset.py} +116 -36
edsl/{results/DatasetExportMixin.py → dataset/dataset_operations_mixin.py} +606 -122
edsl/{results/DatasetTree.py → dataset/dataset_tree.py} +156 -75
edsl/{results/TableDisplay.py → dataset/display/table_display.py} +18 -7
edsl/{results → dataset/display}/table_renderers.py +58 -2
edsl/{results → dataset}/file_exports.py +4 -5
edsl/{results → dataset}/smart_objects.py +2 -2
edsl/enums.py +5 -205
edsl/inference_services/__init__.py +5 -0
edsl/inference_services/{AvailableModelCacheHandler.py → available_model_cache_handler.py} +2 -3
edsl/inference_services/{AvailableModelFetcher.py → available_model_fetcher.py} +8 -14
edsl/inference_services/data_structures.py +3 -2
edsl/{exceptions/inference_services.py → inference_services/exceptions.py} +1 -1
edsl/inference_services/{InferenceServiceABC.py → inference_service_abc.py} +1 -1
edsl/inference_services/{InferenceServicesCollection.py → inference_services_collection.py} +8 -7
edsl/inference_services/registry.py +4 -41
edsl/inference_services/{ServiceAvailability.py → service_availability.py} +5 -25
edsl/inference_services/services/__init__.py +31 -0
edsl/inference_services/{AnthropicService.py → services/anthropic_service.py} +3 -3
edsl/inference_services/{AwsBedrock.py → services/aws_bedrock.py} +2 -2
edsl/inference_services/{AzureAI.py → services/azure_ai.py} +2 -2
edsl/inference_services/{DeepInfraService.py → services/deep_infra_service.py} +1 -3
edsl/inference_services/{DeepSeekService.py → services/deep_seek_service.py} +2 -4
edsl/inference_services/{GoogleService.py → services/google_service.py} +5 -4
edsl/inference_services/{GroqService.py → services/groq_service.py} +1 -1
edsl/inference_services/{MistralAIService.py → services/mistral_ai_service.py} +3 -3
edsl/inference_services/{OllamaService.py → services/ollama_service.py} +1 -7
edsl/inference_services/{OpenAIService.py → services/open_ai_service.py} +5 -6
edsl/inference_services/{PerplexityService.py → services/perplexity_service.py} +3 -7
edsl/inference_services/{TestService.py → services/test_service.py} +7 -6
edsl/inference_services/{TogetherAIService.py → services/together_ai_service.py} +2 -6
edsl/inference_services/{XAIService.py → services/xai_service.py} +1 -1
edsl/inference_services/write_available.py +1 -2
edsl/instructions/__init__.py +6 -0
edsl/{surveys/instructions/Instruction.py → instructions/instruction.py} +11 -6
edsl/{surveys/instructions/InstructionCollection.py → instructions/instruction_collection.py} +10 -5
edsl/{surveys/InstructionHandler.py → instructions/instruction_handler.py} +3 -3
edsl/{jobs/interviews → interviews}/ReportErrors.py +2 -2
edsl/interviews/__init__.py +4 -0
edsl/{jobs/AnswerQuestionFunctionConstructor.py → interviews/answering_function.py} +45 -18
edsl/{jobs/interviews/InterviewExceptionEntry.py → interviews/exception_tracking.py} +107 -22
edsl/interviews/interview.py +638 -0
edsl/{jobs/interviews/InterviewStatusDictionary.py → interviews/interview_status_dictionary.py} +21 -12
edsl/{jobs/interviews/InterviewStatusLog.py → interviews/interview_status_log.py} +16 -7
edsl/{jobs/InterviewTaskManager.py → interviews/interview_task_manager.py} +12 -7
edsl/{jobs/RequestTokenEstimator.py → interviews/request_token_estimator.py} +8 -3
edsl/{jobs/interviews/InterviewStatistic.py → interviews/statistics.py} +36 -10
edsl/invigilators/__init__.py +38 -0
edsl/invigilators/invigilator_base.py +477 -0
edsl/{agents/Invigilator.py → invigilators/invigilators.py} +263 -10
edsl/invigilators/prompt_constructor.py +476 -0
edsl/{agents → invigilators}/prompt_helpers.py +2 -1
edsl/{agents/QuestionInstructionPromptBuilder.py → invigilators/question_instructions_prompt_builder.py} +18 -13
edsl/{agents → invigilators}/question_option_processor.py +96 -21
edsl/{agents/QuestionTemplateReplacementsBuilder.py → invigilators/question_template_replacements_builder.py} +64 -12
edsl/jobs/__init__.py +7 -1
edsl/jobs/async_interview_runner.py +99 -35
edsl/jobs/check_survey_scenario_compatibility.py +7 -5
edsl/jobs/data_structures.py +153 -22
edsl/{exceptions/jobs.py → jobs/exceptions.py} +2 -1
edsl/jobs/{FetchInvigilator.py → fetch_invigilator.py} +4 -4
edsl/jobs/{loggers/HTMLTableJobLogger.py → html_table_job_logger.py} +6 -2
edsl/jobs/{Jobs.py → jobs.py} +313 -167
edsl/jobs/{JobsChecks.py → jobs_checks.py} +15 -7
edsl/jobs/{JobsComponentConstructor.py → jobs_component_constructor.py} +19 -17
edsl/jobs/{InterviewsConstructor.py → jobs_interview_constructor.py} +10 -5
edsl/jobs/jobs_pricing_estimation.py +347 -0
edsl/jobs/{JobsRemoteInferenceLogger.py → jobs_remote_inference_logger.py} +4 -3
edsl/jobs/jobs_runner_asyncio.py +282 -0
edsl/jobs/{JobsRemoteInferenceHandler.py → remote_inference.py} +19 -22
edsl/jobs/results_exceptions_handler.py +2 -2
edsl/key_management/__init__.py +28 -0
edsl/key_management/key_lookup.py +161 -0
edsl/{language_models/key_management/KeyLookupBuilder.py → key_management/key_lookup_builder.py} +118 -47
edsl/key_management/key_lookup_collection.py +82 -0
edsl/key_management/models.py +218 -0
edsl/language_models/__init__.py +7 -2
edsl/language_models/{ComputeCost.py → compute_cost.py} +18 -3
edsl/{exceptions/language_models.py → language_models/exceptions.py} +2 -1
edsl/language_models/language_model.py +1080 -0
edsl/language_models/model.py +10 -25
edsl/language_models/{ModelList.py → model_list.py} +9 -14
edsl/language_models/{RawResponseHandler.py → raw_response_handler.py} +1 -1
edsl/language_models/{RegisterLanguageModelsMeta.py → registry.py} +1 -1
edsl/language_models/repair.py +4 -4
edsl/language_models/utilities.py +4 -4
edsl/notebooks/__init__.py +3 -1
edsl/notebooks/{Notebook.py → notebook.py} +7 -8
edsl/prompts/__init__.py +1 -1
edsl/{exceptions/prompts.py → prompts/exceptions.py} +3 -1
edsl/prompts/{Prompt.py → prompt.py} +101 -95
edsl/questions/HTMLQuestion.py +1 -1
edsl/questions/__init__.py +154 -25
edsl/questions/answer_validator_mixin.py +1 -1
edsl/questions/compose_questions.py +4 -3
edsl/questions/derived/question_likert_five.py +166 -0
edsl/questions/derived/{QuestionLinearScale.py → question_linear_scale.py} +4 -4
edsl/questions/derived/{QuestionTopK.py → question_top_k.py} +4 -4
edsl/questions/derived/{QuestionYesNo.py → question_yes_no.py} +4 -5
edsl/questions/descriptors.py +24 -30
edsl/questions/loop_processor.py +65 -19
edsl/questions/question_base.py +881 -0
edsl/questions/question_base_gen_mixin.py +15 -16
edsl/questions/{QuestionBasePromptsMixin.py → question_base_prompts_mixin.py} +2 -2
edsl/questions/{QuestionBudget.py → question_budget.py} +3 -4
edsl/questions/{QuestionCheckBox.py → question_check_box.py} +16 -16
edsl/questions/{QuestionDict.py → question_dict.py} +39 -5
edsl/questions/{QuestionExtract.py → question_extract.py} +9 -9
edsl/questions/question_free_text.py +282 -0
edsl/questions/{QuestionFunctional.py → question_functional.py} +6 -5
edsl/questions/{QuestionList.py → question_list.py} +6 -7
edsl/questions/{QuestionMatrix.py → question_matrix.py} +6 -5
edsl/questions/{QuestionMultipleChoice.py → question_multiple_choice.py} +126 -21
edsl/questions/{QuestionNumerical.py → question_numerical.py} +5 -5
edsl/questions/{QuestionRank.py → question_rank.py} +6 -6
edsl/questions/question_registry.py +4 -9
edsl/questions/register_questions_meta.py +8 -4
edsl/questions/response_validator_abc.py +17 -16
edsl/results/__init__.py +4 -1
edsl/{exceptions/results.py → results/exceptions.py} +1 -1
edsl/results/report.py +197 -0
edsl/results/{Result.py → result.py} +131 -45
edsl/results/{Results.py → results.py} +365 -220
edsl/results/results_selector.py +344 -25
edsl/scenarios/__init__.py +30 -3
edsl/scenarios/{ConstructDownloadLink.py → construct_download_link.py} +7 -0
edsl/scenarios/directory_scanner.py +156 -13
edsl/scenarios/document_chunker.py +186 -0
edsl/scenarios/exceptions.py +101 -0
edsl/scenarios/file_methods.py +2 -3
edsl/scenarios/{FileStore.py → file_store.py} +275 -189
edsl/scenarios/handlers/__init__.py +14 -14
edsl/scenarios/handlers/{csv.py → csv_file_store.py} +1 -2
edsl/scenarios/handlers/{docx.py → docx_file_store.py} +8 -7
edsl/scenarios/handlers/{html.py → html_file_store.py} +1 -2
edsl/scenarios/handlers/{jpeg.py → jpeg_file_store.py} +1 -1
edsl/scenarios/handlers/{json.py → json_file_store.py} +1 -1
edsl/scenarios/handlers/latex_file_store.py +5 -0
edsl/scenarios/handlers/{md.py → md_file_store.py} +1 -1
edsl/scenarios/handlers/{pdf.py → pdf_file_store.py} +2 -2
edsl/scenarios/handlers/{png.py → png_file_store.py} +1 -1
edsl/scenarios/handlers/{pptx.py → pptx_file_store.py} +8 -7
edsl/scenarios/handlers/{py.py → py_file_store.py} +1 -3
edsl/scenarios/handlers/{sql.py → sql_file_store.py} +2 -1
edsl/scenarios/handlers/{sqlite.py → sqlite_file_store.py} +2 -3
edsl/scenarios/handlers/{txt.py → txt_file_store.py} +1 -1
edsl/scenarios/scenario.py +928 -0
edsl/scenarios/scenario_join.py +18 -5
edsl/scenarios/{ScenarioList.py → scenario_list.py} +294 -106
edsl/scenarios/{ScenarioListPdfMixin.py → scenario_list_pdf_tools.py} +16 -15
edsl/scenarios/scenario_selector.py +5 -1
edsl/study/ObjectEntry.py +2 -2
edsl/study/SnapShot.py +5 -5
edsl/study/Study.py +18 -19
edsl/study/__init__.py +6 -4
edsl/surveys/__init__.py +7 -4
edsl/surveys/dag/__init__.py +2 -0
edsl/surveys/{ConstructDAG.py → dag/construct_dag.py} +3 -3
edsl/surveys/{DAG.py → dag/dag.py} +13 -10
edsl/surveys/descriptors.py +1 -1
edsl/surveys/{EditSurvey.py → edit_survey.py} +9 -9
edsl/{exceptions/surveys.py → surveys/exceptions.py} +1 -2
edsl/surveys/memory/__init__.py +3 -0
edsl/surveys/{MemoryPlan.py → memory/memory_plan.py} +10 -9
edsl/surveys/rules/__init__.py +3 -0
edsl/surveys/{Rule.py → rules/rule.py} +103 -43
edsl/surveys/{RuleCollection.py → rules/rule_collection.py} +21 -30
edsl/surveys/{RuleManager.py → rules/rule_manager.py} +19 -13
edsl/surveys/survey.py +1743 -0
edsl/surveys/{SurveyExportMixin.py → survey_export.py} +22 -27
edsl/surveys/{SurveyFlowVisualization.py → survey_flow_visualization.py} +11 -2
edsl/surveys/{Simulator.py → survey_simulator.py} +10 -3
edsl/tasks/__init__.py +32 -0
edsl/{jobs/tasks/QuestionTaskCreator.py → tasks/question_task_creator.py} +115 -57
edsl/tasks/task_creators.py +135 -0
edsl/{jobs/tasks/TaskHistory.py → tasks/task_history.py} +86 -47
edsl/{jobs/tasks → tasks}/task_status_enum.py +91 -7
edsl/tasks/task_status_log.py +85 -0
edsl/tokens/__init__.py +2 -0
edsl/tokens/interview_token_usage.py +53 -0
edsl/utilities/PrettyList.py +1 -1
edsl/utilities/SystemInfo.py +25 -22
edsl/utilities/__init__.py +29 -21
edsl/utilities/gcp_bucket/__init__.py +2 -0
edsl/utilities/gcp_bucket/cloud_storage.py +99 -96
edsl/utilities/interface.py +44 -536
edsl/{results/MarkdownToPDF.py → utilities/markdown_to_pdf.py} +13 -5
edsl/utilities/repair_functions.py +1 -1
{edsl-0.1.47.dist-info → edsl-0.1.48.dist-info}/METADATA +1 -1
edsl-0.1.48.dist-info/RECORD +347 -0
edsl/Base.py +0 -493
edsl/BaseDiff.py +0 -260
edsl/agents/InvigilatorBase.py +0 -260
edsl/agents/PromptConstructor.py +0 -318
edsl/coop/PriceFetcher.py +0 -54
edsl/data/Cache.py +0 -582
edsl/data/CacheEntry.py +0 -238
edsl/data/SQLiteDict.py +0 -292
edsl/data/__init__.py +0 -5
edsl/data/orm.py +0 -10
edsl/exceptions/cache.py +0 -5
edsl/exceptions/coop.py +0 -14
edsl/exceptions/data.py +0 -14
edsl/exceptions/scenarios.py +0 -29
edsl/jobs/Answers.py +0 -43
edsl/jobs/JobsPrompts.py +0 -354
edsl/jobs/buckets/BucketCollection.py +0 -134
edsl/jobs/buckets/ModelBuckets.py +0 -65
edsl/jobs/buckets/TokenBucket.py +0 -283
edsl/jobs/buckets/TokenBucketClient.py +0 -191
edsl/jobs/interviews/Interview.py +0 -395
edsl/jobs/interviews/InterviewExceptionCollection.py +0 -99
edsl/jobs/interviews/InterviewStatisticsCollection.py +0 -25
edsl/jobs/runners/JobsRunnerAsyncio.py +0 -163
edsl/jobs/runners/JobsRunnerStatusData.py +0 -0
edsl/jobs/tasks/TaskCreators.py +0 -64
edsl/jobs/tasks/TaskStatusLog.py +0 -23
edsl/jobs/tokens/InterviewTokenUsage.py +0 -27
edsl/language_models/LanguageModel.py +0 -635
edsl/language_models/ServiceDataSources.py +0 -0
edsl/language_models/key_management/KeyLookup.py +0 -63
edsl/language_models/key_management/KeyLookupCollection.py +0 -38
edsl/language_models/key_management/models.py +0 -137
edsl/questions/QuestionBase.py +0 -544
edsl/questions/QuestionFreeText.py +0 -130
edsl/questions/derived/QuestionLikertFive.py +0 -76
edsl/results/ResultsExportMixin.py +0 -45
edsl/results/TextEditor.py +0 -50
edsl/results/results_fetch_mixin.py +0 -33
edsl/results/results_tools_mixin.py +0 -98
edsl/scenarios/DocumentChunker.py +0 -104
edsl/scenarios/Scenario.py +0 -548
edsl/scenarios/ScenarioHtmlMixin.py +0 -65
edsl/scenarios/ScenarioListExportMixin.py +0 -45
edsl/scenarios/handlers/latex.py +0 -5
edsl/shared.py +0 -1
edsl/surveys/Survey.py +0 -1301
edsl/surveys/SurveyQualtricsImport.py +0 -284
edsl/surveys/SurveyToApp.py +0 -141
edsl/surveys/instructions/__init__.py +0 -0
edsl/tools/__init__.py +0 -1
edsl/tools/clusters.py +0 -192
edsl/tools/embeddings.py +0 -27
edsl/tools/embeddings_plotting.py +0 -118
edsl/tools/plotting.py +0 -112
edsl/tools/summarize.py +0 -18
edsl/utilities/data/Registry.py +0 -6
edsl/utilities/data/__init__.py +0 -1
edsl/utilities/data/scooter_results.json +0 -1
edsl-0.1.47.dist-info/RECORD +0 -354
/edsl/coop/{CoopFunctionsMixin.py → coop_functions.py} +0 -0
/edsl/{results → dataset/display}/CSSParameterizer.py +0 -0
/edsl/{language_models/key_management → dataset/display}/__init__.py +0 -0
/edsl/{results → dataset/display}/table_data_class.py +0 -0
/edsl/{results → dataset/display}/table_display.css +0 -0
/edsl/{results/ResultsGGMixin.py → dataset/r/ggplot.py} +0 -0
/edsl/{results → dataset}/tree_explore.py +0 -0
/edsl/{surveys/instructions/ChangeInstruction.py → instructions/change_instruction.py} +0 -0
/edsl/{jobs/interviews → interviews}/interview_status_enum.py +0 -0
/edsl/jobs/{runners/JobsRunnerStatus.py → jobs_runner_status.py} +0 -0
/edsl/language_models/{PriceManager.py → price_manager.py} +0 -0
/edsl/language_models/{fake_openai_call.py → unused/fake_openai_call.py} +0 -0
/edsl/language_models/{fake_openai_service.py → unused/fake_openai_service.py} +0 -0
/edsl/notebooks/{NotebookToLaTeX.py → notebook_to_latex.py} +0 -0
/edsl/{exceptions/questions.py → questions/exceptions.py} +0 -0
/edsl/questions/{SimpleAskMixin.py → simple_ask_mixin.py} +0 -0
/edsl/surveys/{Memory.py → memory/memory.py} +0 -0
/edsl/surveys/{MemoryManagement.py → memory/memory_management.py} +0 -0
/edsl/surveys/{SurveyCSS.py → survey_css.py} +0 -0
/edsl/{jobs/tokens/TokenUsage.py → tokens/token_usage.py} +0 -0
/edsl/{results/MarkdownToDocx.py → utilities/markdown_to_docx.py} +0 -0
/edsl/{TemplateLoader.py → utilities/template_loader.py} +0 -0
{edsl-0.1.47.dist-info → edsl-0.1.48.dist-info}/LICENSE +0 -0
{edsl-0.1.47.dist-info → edsl-0.1.48.dist-info}/WHEEL +0 -0

edsl/{agents → invigilators}/question_option_processor.py RENAMED Viewed

@@ -2,6 +2,52 @@ from jinja2 import Environment, meta
 from typing import List, Optional, Union
+def extract_template_variables(ast) -> List[Union[str, tuple]]:
+    """
+    Extract variable expressions from a Jinja2 AST.
+    Args:
+        ast: Jinja2 AST
+    Returns:
+        List[Union[str, tuple]]: List of variable names or tuples for dotted paths
+    """
+    from jinja2 import nodes
+    from jinja2.visitor import NodeVisitor
+    variables = []
+    class VariableVisitor(NodeVisitor):
+        def visit_Name(self, node):
+            variables.append(node.name)
+        def visit_Getattr(self, node):
+            # For dotted access like scenario.question_options
+            parts = []
+            current = node
+            # Handle the leaf attribute
+            parts.append(node.attr)
+            # Walk up the chain to collect all parts
+            while isinstance(current.node, nodes.Getattr):
+                current = current.node
+                parts.append(current.attr)
+            # Add the root name
+            if isinstance(current.node, nodes.Name):
+                parts.append(current.node.name)
+            # Reverse to get the correct order
+            parts.reverse()
+            variables.append(tuple(parts))
+    visitor = VariableVisitor()
+    visitor.visit(ast)
+    return variables
 class QuestionOptionProcessor:
     """
     Class that manages the processing of question options.
@@ -16,7 +62,11 @@ class QuestionOptionProcessor:
         return cls(scenario, prior_answers_dict)
     def __init__(self, scenario: 'Scenario', prior_answers_dict: dict):
-        self.scenario = scenario
+        # This handles cases where the question has {{ scenario.key }} - eventually
+        # we might not allow 'naked' scenario keys w/o the scenario prefix
+        #new_scenario = scenario.copy()
+        #new_scenario.update({'scenario': new_scenario})
+        self.scenario = scenario
         self.prior_answers_dict = prior_answers_dict
     @staticmethod
@@ -25,18 +75,23 @@ class QuestionOptionProcessor:
         return [f"<< Option {i} - Placeholder >>" for i in range(1, 4)]
     @staticmethod
-    def _parse_template_variable(template_str: str) -> str:
+    def _parse_template_variable(template_str: str) -> Union[str, tuple]:
         """
         Extract the variable name from a template string.
+        If the variable contains dots (e.g., scenario.question_options),
+        returns a tuple of the path components.
         Args:
             template_str (str): Jinja template string
         Returns:
-            str: Name of the first undefined variable in the template
+            Union[str, tuple]: Name of the first undefined variable in the template,
+                              or a tuple of path components if the variable contains dots
         >>> QuestionOptionProcessor._parse_template_variable("Here are some {{ options }}")
         'options'
+        >>> QuestionOptionProcessor._parse_template_variable("Here are some {{ scenario.question_options }}")
+        ('scenario', 'question_options')
         >>> QuestionOptionProcessor._parse_template_variable("Here are some {{ options }} and {{ other }}")
         Traceback (most recent call last):
         ...
@@ -48,11 +103,13 @@ class QuestionOptionProcessor:
         """
         env = Environment()
         parsed_content = env.parse(template_str)
-        undeclared_variables = list(meta.find_undeclared_variables(parsed_content))
+        undeclared_variables = extract_template_variables(parsed_content)
         if not undeclared_variables:
             raise ValueError("No variables found in template string")
         if len(undeclared_variables) > 1:
             raise ValueError("Multiple variables found in template string")
         return undeclared_variables[0]
     @staticmethod
@@ -128,7 +185,7 @@ class QuestionOptionProcessor:
         The case where options are provided as a template string:
-        >>> question_data = {"question_options": "{{ options }}"}
+        >>> question_data = {"question_options": "{{ scenario.options }}"}
         >>> processor.get_question_options(question_data)
         ['Option 1', 'Option 2']
@@ -140,7 +197,7 @@ class QuestionOptionProcessor:
         >>> q0.answer = ["Option 1", "Option 2"]
         >>> mpc.prior_answers_dict = lambda: {'q0': q0}
         >>> processor = QuestionOptionProcessor.from_prompt_constructor(mpc)
-        >>> question_data = {"question_options": "{{ q0 }}"}
+        >>> question_data = {"question_options": "{{ q0.answer }}"}
         >>> processor.get_question_options(question_data)
         ['Option 1', 'Option 2']
@@ -156,21 +213,39 @@ class QuestionOptionProcessor:
             return options_entry if options_entry else self._get_default_options()
         # Parse template to get variable name
-        option_key = self._parse_template_variable(options_entry)
-        # Try getting options from scenario
-        scenario_options = self._get_options_from_scenario(
-            self.scenario, option_key
-        )
-        if scenario_options:
-            return scenario_options
-        # Try getting options from prior answers
-        prior_answer_options = self._get_options_from_prior_answers(
-            self.prior_answers_dict, option_key
-        )
-        if prior_answer_options:
-            return prior_answer_options
+        raw_option_key = self._parse_template_variable(options_entry)
+        source_type = None
+        if isinstance(raw_option_key, tuple):
+            if raw_option_key[0] == 'scenario':
+                source_type = 'scenario'
+                option_key = raw_option_key[-1]
+            else:
+                source_type = 'prior_answers'
+                option_key = raw_option_key[0]
+                #breakpoint()
+        else:
+            option_key = raw_option_key
+        #breakpoint()
+        if source_type == 'scenario':
+            # Try getting options from scenario
+            scenario_options = self._get_options_from_scenario(
+                self.scenario, option_key
+            )
+            if scenario_options:
+                return scenario_options
+        if source_type == 'prior_answers':
+            # Try getting options from prior answers
+            prior_answer_options = self._get_options_from_prior_answers(
+                self.prior_answers_dict, option_key
+            )
+            if prior_answer_options:
+                return prior_answer_options
         return self._get_default_options()

edsl/{agents/QuestionTemplateReplacementsBuilder.py → invigilators/question_template_replacements_builder.py} RENAMED Viewed

@@ -1,11 +1,12 @@
 from jinja2 import Environment, meta, TemplateSyntaxError
 from typing import Any, Set, TYPE_CHECKING
+from ..agents import Agent
+from ..scenarios import Scenario
 if TYPE_CHECKING:
-    from edsl.agents.PromptConstructor import PromptConstructor
-    from edsl.scenarios.Scenario import Scenario
-    from edsl.questions.QuestionBase import QuestionBase
-    from edsl.agents.Agent import Agent
+    from .prompt_constructor import PromptConstructor
+    from ..questions import QuestionBase
 class QuestionTemplateReplacementsBuilder:
@@ -33,17 +34,29 @@ class QuestionTemplateReplacementsBuilder:
     def question_file_keys(self):
         """
-        >>> from edsl import QuestionMultipleChoice, Scenario
+        >>> from ..questions import QuestionMultipleChoice
+        >>> from ..scenarios import Scenario
         >>> q = QuestionMultipleChoice(question_text="Do you like school?", question_name = "q0", question_options = ["yes", "no"])
         >>> qtrb = QuestionTemplateReplacementsBuilder(scenario = {"file1": "file1"}, question = q, prior_answers_dict = {'q0': 'q0'}, agent = "agent")
         >>> qtrb.question_file_keys()
         []
-        >>> from edsl import FileStore
+        >>> from ..scenarios import FileStore
         >>> fs = FileStore.example()
+        >>> # Test direct key reference
         >>> q = QuestionMultipleChoice(question_text="What do you think of this file: {{ file1 }}", question_name = "q0", question_options = ["good", "bad"])
         >>> qtrb = QuestionTemplateReplacementsBuilder(scenario = Scenario({"file1": fs}), question = q, prior_answers_dict = {'q0': 'q0'}, agent = "agent")
         >>> qtrb.question_file_keys()
         ['file1']
+        >>> # Test scenario.key reference
+        >>> q = QuestionMultipleChoice(question_text="What do you think of this file: {{ scenario.file2 }}", question_name = "q0", question_options = ["good", "bad"])
+        >>> qtrb = QuestionTemplateReplacementsBuilder(scenario = Scenario({"file2": fs}), question = q, prior_answers_dict = {'q0': 'q0'}, agent = "agent")
+        >>> qtrb.question_file_keys()
+        ['file2']
+        >>> # Test both formats in the same question
+        >>> q = QuestionMultipleChoice(question_text="Compare {{ file1 }} with {{ scenario.file2 }}", question_name = "q0", question_options = ["good", "bad"])
+        >>> qtrb = QuestionTemplateReplacementsBuilder(scenario = Scenario({"file1": fs, "file2": fs}), question = q, prior_answers_dict = {'q0': 'q0'}, agent = "agent")
+        >>> sorted(qtrb.question_file_keys())
+        ['file1', 'file2']
         """
         question_text = self.question.question_text
         file_keys = self._find_file_keys(self.scenario)
@@ -76,8 +89,8 @@ class QuestionTemplateReplacementsBuilder:
         """We need to find all the keys in the scenario that refer to FileStore objects.
         These will be used to append to the prompt a list of files that are part of the scenario.
-        >>> from edsl import Scenario
-        >>> from edsl.scenarios.FileStore import FileStore
+        >>> from ..scenarios import Scenario
+        >>> from ..scenarios import FileStore
         >>> import tempfile
         >>> with tempfile.NamedTemporaryFile() as f:
         ...     _ = f.write(b"Hello, world!")
@@ -87,7 +100,7 @@ class QuestionTemplateReplacementsBuilder:
         ...     QuestionTemplateReplacementsBuilder._find_file_keys(scenario)
         ['fs_file']
         """
-        from edsl.scenarios.FileStore import FileStore
+        from ..scenarios import FileStore
         file_entries = []
         for key, value in scenario.items():
@@ -100,10 +113,11 @@ class QuestionTemplateReplacementsBuilder:
         question_text: str, scenario_file_keys: list
     ) -> list:
         """
-        Extracts the file keys from a question text.
+        Extracts the file keys from a question text, handling both direct references ({{ file_key }})
+        and scenario-prefixed references ({{ scenario.file_key }}).
         >>> from edsl import Scenario
-        >>> from edsl.scenarios.FileStore import FileStore
+        >>> from edsl.scenarios import FileStore
         >>> import tempfile
         >>> with tempfile.NamedTemporaryFile() as f:
         ...     _ = f.write(b"Hello, world!")
@@ -112,15 +126,53 @@ class QuestionTemplateReplacementsBuilder:
         ...     scenario = Scenario({"fs_file": fs, 'a': 1})
         ...     QuestionTemplateReplacementsBuilder._extract_file_keys_from_question_text("{{ fs_file }}", ['fs_file'])
         ['fs_file']
+        >>> with tempfile.NamedTemporaryFile() as f:
+        ...     _ = f.write(b"Hello, world!")
+        ...     _ = f.seek(0)
+        ...     fs = FileStore(f.name)
+        ...     scenario = Scenario({"print": fs, 'a': 1})
+        ...     QuestionTemplateReplacementsBuilder._extract_file_keys_from_question_text("{{ scenario.print }}", ['print'])
+        ['print']
+        >>> with tempfile.NamedTemporaryFile() as f:
+        ...     _ = f.write(b"Hello, world!")
+        ...     _ = f.seek(0)
+        ...     fs = FileStore(f.name)
+        ...     scenario = Scenario({"file1": fs, "file2": fs})
+        ...     sorted(QuestionTemplateReplacementsBuilder._extract_file_keys_from_question_text("Compare {{ file1 }} with {{ scenario.file2 }}", ['file1', 'file2']))
+        ['file1', 'file2']
         """
         variables = QuestionTemplateReplacementsBuilder.get_jinja2_variables(
             question_text
         )
         question_file_keys = []
+        # Direct references: {{ file_key }}
         for var in variables:
             if var in scenario_file_keys:
                 question_file_keys.append(var)
-        return question_file_keys
+        # Scenario-prefixed references: {{ scenario.file_key }}
+        for var in variables:
+            if var == "scenario":
+                # If we find a scenario variable, we need to check for nested references
+                # Create a modified template with just {{ scenario.* }} expressions to isolate them
+                scenario_template = "".join([
+                    "{% for key, value in scenario.items() %}{{ key }}{% endfor %}"
+                ])
+                try:
+                    # This is a check to make sure there's scenario.something syntax in the template
+                    if "scenario." in question_text:
+                        # Extract dot-notation scenario references by parsing the template
+                        import re
+                        scenario_refs = re.findall(r'{{\s*scenario\.(\w+)\s*}}', question_text)
+                        for key in scenario_refs:
+                            if key in scenario_file_keys:
+                                question_file_keys.append(key)
+                except:
+                    # If there's any issue parsing, just continue with what we have
+                    pass
+        return list(set(question_file_keys))  # Remove duplicates
     def _scenario_replacements(
         self, replacement_string: str = "<see file {key}>"

edsl/jobs/__init__.py CHANGED Viewed

@@ -1 +1,7 @@
-from edsl.jobs.Jobs import Jobs
+from .jobs import Jobs
+from .jobs import RunConfig, RunParameters, RunEnvironment
+from .remote_inference import JobsRemoteInferenceHandler
+from .jobs_runner_status import JobsRunnerStatusBase
+__all__ = ["Jobs"]

edsl/jobs/async_interview_runner.py CHANGED Viewed

@@ -1,43 +1,94 @@
+"""
+Asynchronous interview runner module for conducting interviews concurrently.
+This module provides functionality to run multiple interviews in parallel
+with controlled concurrency, supporting both error handling and result collection.
+"""
 from collections.abc import AsyncGenerator
-from typing import List, TypeVar, Generator, Tuple, TYPE_CHECKING
+from typing import List, Generator, Tuple, TYPE_CHECKING
 from dataclasses import dataclass
 import asyncio
-from contextlib import asynccontextmanager
 from edsl.data_transfer_models import EDSLResultObjectInput
-from edsl.results.Result import Result
-from edsl.jobs.interviews.Interview import Interview
-from edsl.config import Config
+from ..results import Result
+from ..interviews import Interview
+from ..config import Config
 config = Config()
 if TYPE_CHECKING:
-    from edsl.jobs.Jobs import Jobs
+    from ..jobs import Jobs
+from .data_structures import RunConfig
 @dataclass
 class InterviewResult:
+    """Container for the result of an interview along with metadata.
+    Attributes:
+        result: The Result object containing the interview answers
+        interview: The Interview object used to conduct the interview
+        order: The original position of this interview in the processing queue
+    """
     result: Result
     interview: Interview
     order: int
-from edsl.jobs.data_structures import RunConfig
 class AsyncInterviewRunner:
+    """
+    Runs interviews asynchronously with controlled concurrency.
+    This class manages the parallel execution of multiple interviews while
+    respecting concurrency limits and handling errors appropriately.
+    Examples:
+        >>> from unittest.mock import MagicMock, AsyncMock
+        >>> mock_jobs = MagicMock()
+        >>> mock_run_config = MagicMock()
+        >>> mock_run_config.parameters.n = 1
+        >>> mock_run_config.environment.cache = None
+        >>> runner = AsyncInterviewRunner(mock_jobs, mock_run_config)
+        >>> isinstance(runner._initialized, asyncio.Event)
+        True
+    """
     MAX_CONCURRENT = int(config.EDSL_MAX_CONCURRENT_TASKS)
     def __init__(self, jobs: "Jobs", run_config: RunConfig):
+        """
+        Initialize the AsyncInterviewRunner.
+        Args:
+            jobs: The Jobs object that generates interviews
+            run_config: Configuration for running the interviews
+        """
         self.jobs = jobs
         self.run_config = run_config
         self._initialized = asyncio.Event()
     def _expand_interviews(self) -> Generator["Interview", None, None]:
-        """Populates self.total_interviews with n copies of each interview.
-        It also has to set the cache for each interview.
-        :param n: how many times to run each interview.
+        """
+        Create multiple copies of each interview based on the run configuration.
+        This method expands interviews for repeated runs and ensures each has
+        the proper cache configuration.
+        Yields:
+            Interview objects ready to be conducted
+        Examples:
+            >>> from unittest.mock import MagicMock
+            >>> mock_jobs = MagicMock()
+            >>> mock_interview = MagicMock()
+            >>> mock_jobs.generate_interviews.return_value = [mock_interview]
+            >>> mock_run_config = MagicMock()
+            >>> mock_run_config.parameters.n = 2
+            >>> mock_run_config.environment.cache = "mock_cache"
+            >>> runner = AsyncInterviewRunner(mock_jobs, mock_run_config)
+            >>> interviews = list(runner._expand_interviews())
+            >>> len(interviews)
+            2
         """
         for interview in self.jobs.generate_interviews():
             for iteration in range(self.run_config.parameters.n):
@@ -52,21 +103,22 @@ class AsyncInterviewRunner:
     async def _conduct_interview(
         self, interview: "Interview"
     ) -> Tuple["Result", "Interview"]:
-        """Conducts an interview and returns the result object, along with the associated interview.
-        We return the interview because it is not populated with exceptions, if any.
-        :param interview: the interview to conduct
-        :return: the result of the interview
-        'extracted_answers' is a dictionary of the answers to the questions in the interview.
-        This is not the same as the generated_tokens---it can include substantial cleaning and processing / validation.
         """
-        # the model buckets are used to track usage rates
-        # model_buckets = self.bucket_collection[interview.model]
-        # model_buckets = self.run_config.environment.bucket_collection[interview.model]
-        # get the results of the interview e.g., {'how_are_you':"Good" 'how_are_you_generated_tokens': "Good"}
+        Asynchronously conduct a single interview.
+        This method performs the interview and creates a Result object with
+        the extracted answers and model responses.
+        Args:
+            interview: The interview to conduct
+        Returns:
+            Tuple containing the Result object and the Interview object
+        Notes:
+            'extracted_answers' contains the processed and validated answers
+            from the interview, which may differ from the raw model output.
+        """
         extracted_answers: dict[str, str]
         model_response_objects: List[EDSLResultObjectInput]
@@ -83,10 +135,20 @@ class AsyncInterviewRunner:
     async def run(
         self,
     ) -> AsyncGenerator[tuple[Result, Interview], None]:
-        """Creates and processes tasks asynchronously, yielding results as they complete.
-        Uses TaskGroup for structured concurrency and automated cleanup.
-        Results are yielded as they become available while maintaining controlled concurrency.
+        """
+        Run all interviews asynchronously and yield results as they complete.
+        This method processes interviews in chunks based on MAX_CONCURRENT,
+        maintaining controlled concurrency while yielding results as soon as
+        they become available.
+        Yields:
+            Tuples of (Result, Interview) as interviews complete
+        Notes:
+            - Uses structured concurrency patterns for proper resource management
+            - Handles exceptions according to the run configuration
+            - Ensures task cleanup even in case of failures
         """
         interviews = list(self._expand_interviews())
         self._initialized.set()
@@ -102,10 +164,8 @@ class AsyncInterviewRunner:
                 result.order = idx
                 return InterviewResult(result, interview, idx)
             except Exception as e:
-                # breakpoint()
                 if self.run_config.parameters.stop_on_exception:
                     raise
-                # logger.error(f"Task failed with error: {e}")
                 return None
         # Process interviews in chunks
@@ -130,7 +190,6 @@ class AsyncInterviewRunner:
             except Exception as e:
                 if self.run_config.parameters.stop_on_exception:
                     raise
-                # logger.error(f"Chunk processing failed with error: {e}")
                 continue
             finally:
@@ -138,3 +197,8 @@ class AsyncInterviewRunner:
                 for task in tasks:
                     if not task.done():
                         task.cancel()
+if __name__ == "__main__":
+    import doctest
+    doctest.testmod()

edsl/jobs/check_survey_scenario_compatibility.py CHANGED Viewed

@@ -1,5 +1,7 @@
 import warnings
 from typing import TYPE_CHECKING
+from edsl.scenarios import ScenarioList
+from edsl.surveys import Survey
 if TYPE_CHECKING:
     from edsl.surveys.Survey import Survey
@@ -15,10 +17,10 @@ class CheckSurveyScenarioCompatibility:
     def check(self, strict: bool = False, warn: bool = False) -> None:
         """Check if the parameters in the survey and scenarios are consistent.
-        >>> from edsl.jobs.Jobs import Jobs
-        >>> from edsl.questions.QuestionFreeText import QuestionFreeText
-        >>> from edsl.surveys.Survey import Survey
-        >>> from edsl.scenarios.Scenario import Scenario
+        >>> from edsl.jobs import Jobs
+        >>> from edsl.questions import QuestionFreeText
+        >>> from edsl.surveys import Survey
+        >>> from edsl.scenarios import Scenario
         >>> q = QuestionFreeText(question_text = "{{poo}}", question_name = "ugly_question")
         >>> j = Jobs(survey = Survey(questions=[q]))
         >>> cs = CheckSurveyScenarioCompatibility(j.survey, j.scenarios)
@@ -39,7 +41,7 @@ class CheckSurveyScenarioCompatibility:
         >>> q = QuestionFreeText(question_text = "Hello", question_name = "ugly_question")
         >>> s = Scenario({'ugly_question': "B"})
-        >>> from edsl.scenarios.ScenarioList import ScenarioList
+        >>> from edsl.scenarios import ScenarioList
         >>> cs = CheckSurveyScenarioCompatibility(Survey(questions=[q]), ScenarioList([s]))
         >>> cs.check()
         Traceback (most recent call last):

edsl 0.1.47__py3-none-any.whl → 0.1.48__py3-none-any.whl

edsl 0.1.47__py3-none-any.whl → 0.1.48__py3-none-any.whl