PyPI - edsl - Versions diffs - 0.1.14__py3-none-any.whl → 0.1.40__py3-none-any.whl - Mend

edsl 0.1.14-py3-none-any.whl → 0.1.40-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (407) hide show

edsl/Base.py +348 -38
edsl/BaseDiff.py +260 -0
edsl/TemplateLoader.py +24 -0
edsl/__init__.py +46 -10
edsl/__version__.py +1 -0
edsl/agents/Agent.py +842 -144
edsl/agents/AgentList.py +521 -25
edsl/agents/Invigilator.py +250 -374
edsl/agents/InvigilatorBase.py +257 -0
edsl/agents/PromptConstructor.py +272 -0
edsl/agents/QuestionInstructionPromptBuilder.py +128 -0
edsl/agents/QuestionTemplateReplacementsBuilder.py +137 -0
edsl/agents/descriptors.py +43 -13
edsl/agents/prompt_helpers.py +129 -0
edsl/agents/question_option_processor.py +172 -0
edsl/auto/AutoStudy.py +130 -0
edsl/auto/StageBase.py +243 -0
edsl/auto/StageGenerateSurvey.py +178 -0
edsl/auto/StageLabelQuestions.py +125 -0
edsl/auto/StagePersona.py +61 -0
edsl/auto/StagePersonaDimensionValueRanges.py +88 -0
edsl/auto/StagePersonaDimensionValues.py +74 -0
edsl/auto/StagePersonaDimensions.py +69 -0
edsl/auto/StageQuestions.py +74 -0
edsl/auto/SurveyCreatorPipeline.py +21 -0
edsl/auto/utilities.py +218 -0
edsl/base/Base.py +279 -0
edsl/config.py +121 -104
edsl/conversation/Conversation.py +290 -0
edsl/conversation/car_buying.py +59 -0
edsl/conversation/chips.py +95 -0
edsl/conversation/mug_negotiation.py +81 -0
edsl/conversation/next_speaker_utilities.py +93 -0
edsl/coop/CoopFunctionsMixin.py +15 -0
edsl/coop/ExpectedParrotKeyHandler.py +125 -0
edsl/coop/PriceFetcher.py +54 -0
edsl/coop/__init__.py +1 -0
edsl/coop/coop.py +1029 -134
edsl/coop/utils.py +131 -0
edsl/data/Cache.py +560 -89
edsl/data/CacheEntry.py +230 -0
edsl/data/CacheHandler.py +168 -0
edsl/data/RemoteCacheSync.py +186 -0
edsl/data/SQLiteDict.py +292 -0
edsl/data/__init__.py +5 -3
edsl/data/orm.py +6 -33
edsl/data_transfer_models.py +74 -27
edsl/enums.py +165 -8
edsl/exceptions/BaseException.py +21 -0
edsl/exceptions/__init__.py +52 -46
edsl/exceptions/agents.py +33 -15
edsl/exceptions/cache.py +5 -0
edsl/exceptions/coop.py +8 -0
edsl/exceptions/general.py +34 -0
edsl/exceptions/inference_services.py +5 -0
edsl/exceptions/jobs.py +15 -0
edsl/exceptions/language_models.py +46 -1
edsl/exceptions/questions.py +80 -5
edsl/exceptions/results.py +16 -5
edsl/exceptions/scenarios.py +29 -0
edsl/exceptions/surveys.py +13 -10
edsl/inference_services/AnthropicService.py +106 -0
edsl/inference_services/AvailableModelCacheHandler.py +184 -0
edsl/inference_services/AvailableModelFetcher.py +215 -0
edsl/inference_services/AwsBedrock.py +118 -0
edsl/inference_services/AzureAI.py +215 -0
edsl/inference_services/DeepInfraService.py +18 -0
edsl/inference_services/GoogleService.py +143 -0
edsl/inference_services/GroqService.py +20 -0
edsl/inference_services/InferenceServiceABC.py +80 -0
edsl/inference_services/InferenceServicesCollection.py +138 -0
edsl/inference_services/MistralAIService.py +120 -0
edsl/inference_services/OllamaService.py +18 -0
edsl/inference_services/OpenAIService.py +236 -0
edsl/inference_services/PerplexityService.py +160 -0
edsl/inference_services/ServiceAvailability.py +135 -0
edsl/inference_services/TestService.py +90 -0
edsl/inference_services/TogetherAIService.py +172 -0
edsl/inference_services/data_structures.py +134 -0
edsl/inference_services/models_available_cache.py +118 -0
edsl/inference_services/rate_limits_cache.py +25 -0
edsl/inference_services/registry.py +41 -0
edsl/inference_services/write_available.py +10 -0
edsl/jobs/AnswerQuestionFunctionConstructor.py +223 -0
edsl/jobs/Answers.py +21 -20
edsl/jobs/FetchInvigilator.py +47 -0
edsl/jobs/InterviewTaskManager.py +98 -0
edsl/jobs/InterviewsConstructor.py +50 -0
edsl/jobs/Jobs.py +684 -204
edsl/jobs/JobsChecks.py +172 -0
edsl/jobs/JobsComponentConstructor.py +189 -0
edsl/jobs/JobsPrompts.py +270 -0
edsl/jobs/JobsRemoteInferenceHandler.py +311 -0
edsl/jobs/JobsRemoteInferenceLogger.py +239 -0
edsl/jobs/RequestTokenEstimator.py +30 -0
edsl/jobs/async_interview_runner.py +138 -0
edsl/jobs/buckets/BucketCollection.py +104 -0
edsl/jobs/buckets/ModelBuckets.py +65 -0
edsl/jobs/buckets/TokenBucket.py +283 -0
edsl/jobs/buckets/TokenBucketAPI.py +211 -0
edsl/jobs/buckets/TokenBucketClient.py +191 -0
edsl/jobs/check_survey_scenario_compatibility.py +85 -0
edsl/jobs/data_structures.py +120 -0
edsl/jobs/decorators.py +35 -0
edsl/jobs/interviews/Interview.py +392 -0
edsl/jobs/interviews/InterviewExceptionCollection.py +99 -0
edsl/jobs/interviews/InterviewExceptionEntry.py +186 -0
edsl/jobs/interviews/InterviewStatistic.py +63 -0
edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -0
edsl/jobs/interviews/InterviewStatusDictionary.py +78 -0
edsl/jobs/interviews/InterviewStatusLog.py +92 -0
edsl/jobs/interviews/ReportErrors.py +66 -0
edsl/jobs/interviews/interview_status_enum.py +9 -0
edsl/jobs/jobs_status_enums.py +9 -0
edsl/jobs/loggers/HTMLTableJobLogger.py +304 -0
edsl/jobs/results_exceptions_handler.py +98 -0
edsl/jobs/runners/JobsRunnerAsyncio.py +151 -110
edsl/jobs/runners/JobsRunnerStatus.py +298 -0
edsl/jobs/tasks/QuestionTaskCreator.py +244 -0
edsl/jobs/tasks/TaskCreators.py +64 -0
edsl/jobs/tasks/TaskHistory.py +470 -0
edsl/jobs/tasks/TaskStatusLog.py +23 -0
edsl/jobs/tasks/task_status_enum.py +161 -0
edsl/jobs/tokens/InterviewTokenUsage.py +27 -0
edsl/jobs/tokens/TokenUsage.py +34 -0
edsl/language_models/ComputeCost.py +63 -0
edsl/language_models/LanguageModel.py +507 -386
edsl/language_models/ModelList.py +164 -0
edsl/language_models/PriceManager.py +127 -0
edsl/language_models/RawResponseHandler.py +106 -0
edsl/language_models/RegisterLanguageModelsMeta.py +184 -0
edsl/language_models/__init__.py +1 -8
edsl/language_models/fake_openai_call.py +15 -0
edsl/language_models/fake_openai_service.py +61 -0
edsl/language_models/key_management/KeyLookup.py +63 -0
edsl/language_models/key_management/KeyLookupBuilder.py +273 -0
edsl/language_models/key_management/KeyLookupCollection.py +38 -0
edsl/language_models/key_management/__init__.py +0 -0
edsl/language_models/key_management/models.py +131 -0
edsl/language_models/model.py +256 -0
edsl/language_models/repair.py +109 -41
edsl/language_models/utilities.py +65 -0
edsl/notebooks/Notebook.py +263 -0
edsl/notebooks/NotebookToLaTeX.py +142 -0
edsl/notebooks/__init__.py +1 -0
edsl/prompts/Prompt.py +222 -93
edsl/prompts/__init__.py +1 -1
edsl/questions/ExceptionExplainer.py +77 -0
edsl/questions/HTMLQuestion.py +103 -0
edsl/questions/QuestionBase.py +518 -0
edsl/questions/QuestionBasePromptsMixin.py +221 -0
edsl/questions/QuestionBudget.py +164 -67
edsl/questions/QuestionCheckBox.py +281 -62
edsl/questions/QuestionDict.py +343 -0
edsl/questions/QuestionExtract.py +136 -50
edsl/questions/QuestionFreeText.py +79 -55
edsl/questions/QuestionFunctional.py +138 -41
edsl/questions/QuestionList.py +184 -57
edsl/questions/QuestionMatrix.py +265 -0
edsl/questions/QuestionMultipleChoice.py +293 -69
edsl/questions/QuestionNumerical.py +109 -56
edsl/questions/QuestionRank.py +244 -49
edsl/questions/Quick.py +41 -0
edsl/questions/SimpleAskMixin.py +74 -0
edsl/questions/__init__.py +9 -6
edsl/questions/{AnswerValidatorMixin.py → answer_validator_mixin.py} +153 -38
edsl/questions/compose_questions.py +13 -7
edsl/questions/data_structures.py +20 -0
edsl/questions/decorators.py +21 -0
edsl/questions/derived/QuestionLikertFive.py +28 -26
edsl/questions/derived/QuestionLinearScale.py +41 -28
edsl/questions/derived/QuestionTopK.py +34 -26
edsl/questions/derived/QuestionYesNo.py +40 -27
edsl/questions/descriptors.py +228 -74
edsl/questions/loop_processor.py +149 -0
edsl/questions/prompt_templates/question_budget.jinja +13 -0
edsl/questions/prompt_templates/question_checkbox.jinja +32 -0
edsl/questions/prompt_templates/question_extract.jinja +11 -0
edsl/questions/prompt_templates/question_free_text.jinja +3 -0
edsl/questions/prompt_templates/question_linear_scale.jinja +11 -0
edsl/questions/prompt_templates/question_list.jinja +17 -0
edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -0
edsl/questions/prompt_templates/question_numerical.jinja +37 -0
edsl/questions/question_base_gen_mixin.py +168 -0
edsl/questions/question_registry.py +130 -46
edsl/questions/register_questions_meta.py +71 -0
edsl/questions/response_validator_abc.py +188 -0
edsl/questions/response_validator_factory.py +34 -0
edsl/questions/settings.py +5 -2
edsl/questions/templates/__init__.py +0 -0
edsl/questions/templates/budget/__init__.py +0 -0
edsl/questions/templates/budget/answering_instructions.jinja +7 -0
edsl/questions/templates/budget/question_presentation.jinja +7 -0
edsl/questions/templates/checkbox/__init__.py +0 -0
edsl/questions/templates/checkbox/answering_instructions.jinja +10 -0
edsl/questions/templates/checkbox/question_presentation.jinja +22 -0
edsl/questions/templates/dict/__init__.py +0 -0
edsl/questions/templates/dict/answering_instructions.jinja +21 -0
edsl/questions/templates/dict/question_presentation.jinja +1 -0
edsl/questions/templates/extract/__init__.py +0 -0
edsl/questions/templates/extract/answering_instructions.jinja +7 -0
edsl/questions/templates/extract/question_presentation.jinja +1 -0
edsl/questions/templates/free_text/__init__.py +0 -0
edsl/questions/templates/free_text/answering_instructions.jinja +0 -0
edsl/questions/templates/free_text/question_presentation.jinja +1 -0
edsl/questions/templates/likert_five/__init__.py +0 -0
edsl/questions/templates/likert_five/answering_instructions.jinja +10 -0
edsl/questions/templates/likert_five/question_presentation.jinja +12 -0
edsl/questions/templates/linear_scale/__init__.py +0 -0
edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -0
edsl/questions/templates/linear_scale/question_presentation.jinja +5 -0
edsl/questions/templates/list/__init__.py +0 -0
edsl/questions/templates/list/answering_instructions.jinja +4 -0
edsl/questions/templates/list/question_presentation.jinja +5 -0
edsl/questions/templates/matrix/__init__.py +1 -0
edsl/questions/templates/matrix/answering_instructions.jinja +5 -0
edsl/questions/templates/matrix/question_presentation.jinja +20 -0
edsl/questions/templates/multiple_choice/__init__.py +0 -0
edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -0
edsl/questions/templates/multiple_choice/html.jinja +0 -0
edsl/questions/templates/multiple_choice/question_presentation.jinja +12 -0
edsl/questions/templates/numerical/__init__.py +0 -0
edsl/questions/templates/numerical/answering_instructions.jinja +7 -0
edsl/questions/templates/numerical/question_presentation.jinja +7 -0
edsl/questions/templates/rank/__init__.py +0 -0
edsl/questions/templates/rank/answering_instructions.jinja +11 -0
edsl/questions/templates/rank/question_presentation.jinja +15 -0
edsl/questions/templates/top_k/__init__.py +0 -0
edsl/questions/templates/top_k/answering_instructions.jinja +8 -0
edsl/questions/templates/top_k/question_presentation.jinja +22 -0
edsl/questions/templates/yes_no/__init__.py +0 -0
edsl/questions/templates/yes_no/answering_instructions.jinja +6 -0
edsl/questions/templates/yes_no/question_presentation.jinja +12 -0
edsl/results/CSSParameterizer.py +108 -0
edsl/results/Dataset.py +550 -19
edsl/results/DatasetExportMixin.py +594 -0
edsl/results/DatasetTree.py +295 -0
edsl/results/MarkdownToDocx.py +122 -0
edsl/results/MarkdownToPDF.py +111 -0
edsl/results/Result.py +477 -173
edsl/results/Results.py +987 -269
edsl/results/ResultsExportMixin.py +28 -125
edsl/results/ResultsGGMixin.py +83 -15
edsl/results/TableDisplay.py +125 -0
edsl/results/TextEditor.py +50 -0
edsl/results/__init__.py +1 -1
edsl/results/file_exports.py +252 -0
edsl/results/results_fetch_mixin.py +33 -0
edsl/results/results_selector.py +145 -0
edsl/results/results_tools_mixin.py +98 -0
edsl/results/smart_objects.py +96 -0
edsl/results/table_data_class.py +12 -0
edsl/results/table_display.css +78 -0
edsl/results/table_renderers.py +118 -0
edsl/results/tree_explore.py +115 -0
edsl/scenarios/ConstructDownloadLink.py +109 -0
edsl/scenarios/DocumentChunker.py +102 -0
edsl/scenarios/DocxScenario.py +16 -0
edsl/scenarios/FileStore.py +543 -0
edsl/scenarios/PdfExtractor.py +40 -0
edsl/scenarios/Scenario.py +431 -62
edsl/scenarios/ScenarioHtmlMixin.py +65 -0
edsl/scenarios/ScenarioList.py +1415 -45
edsl/scenarios/ScenarioListExportMixin.py +45 -0
edsl/scenarios/ScenarioListPdfMixin.py +239 -0
edsl/scenarios/__init__.py +2 -0
edsl/scenarios/directory_scanner.py +96 -0
edsl/scenarios/file_methods.py +85 -0
edsl/scenarios/handlers/__init__.py +13 -0
edsl/scenarios/handlers/csv.py +49 -0
edsl/scenarios/handlers/docx.py +76 -0
edsl/scenarios/handlers/html.py +37 -0
edsl/scenarios/handlers/json.py +111 -0
edsl/scenarios/handlers/latex.py +5 -0
edsl/scenarios/handlers/md.py +51 -0
edsl/scenarios/handlers/pdf.py +68 -0
edsl/scenarios/handlers/png.py +39 -0
edsl/scenarios/handlers/pptx.py +105 -0
edsl/scenarios/handlers/py.py +294 -0
edsl/scenarios/handlers/sql.py +313 -0
edsl/scenarios/handlers/sqlite.py +149 -0
edsl/scenarios/handlers/txt.py +33 -0
edsl/scenarios/scenario_join.py +131 -0
edsl/scenarios/scenario_selector.py +156 -0
edsl/shared.py +1 -0
edsl/study/ObjectEntry.py +173 -0
edsl/study/ProofOfWork.py +113 -0
edsl/study/SnapShot.py +80 -0
edsl/study/Study.py +521 -0
edsl/study/__init__.py +4 -0
edsl/surveys/ConstructDAG.py +92 -0
edsl/surveys/DAG.py +92 -11
edsl/surveys/EditSurvey.py +221 -0
edsl/surveys/InstructionHandler.py +100 -0
edsl/surveys/Memory.py +9 -4
edsl/surveys/MemoryManagement.py +72 -0
edsl/surveys/MemoryPlan.py +156 -35
edsl/surveys/Rule.py +221 -74
edsl/surveys/RuleCollection.py +241 -61
edsl/surveys/RuleManager.py +172 -0
edsl/surveys/Simulator.py +75 -0
edsl/surveys/Survey.py +1079 -339
edsl/surveys/SurveyCSS.py +273 -0
edsl/surveys/SurveyExportMixin.py +235 -40
edsl/surveys/SurveyFlowVisualization.py +181 -0
edsl/surveys/SurveyQualtricsImport.py +284 -0
edsl/surveys/SurveyToApp.py +141 -0
edsl/surveys/__init__.py +4 -2
edsl/surveys/base.py +19 -3
edsl/surveys/descriptors.py +17 -6
edsl/surveys/instructions/ChangeInstruction.py +48 -0
edsl/surveys/instructions/Instruction.py +56 -0
edsl/surveys/instructions/InstructionCollection.py +82 -0
edsl/surveys/instructions/__init__.py +0 -0
edsl/templates/error_reporting/base.html +24 -0
edsl/templates/error_reporting/exceptions_by_model.html +35 -0
edsl/templates/error_reporting/exceptions_by_question_name.html +17 -0
edsl/templates/error_reporting/exceptions_by_type.html +17 -0
edsl/templates/error_reporting/interview_details.html +116 -0
edsl/templates/error_reporting/interviews.html +19 -0
edsl/templates/error_reporting/overview.html +5 -0
edsl/templates/error_reporting/performance_plot.html +2 -0
edsl/templates/error_reporting/report.css +74 -0
edsl/templates/error_reporting/report.html +118 -0
edsl/templates/error_reporting/report.js +25 -0
edsl/tools/__init__.py +1 -0
edsl/tools/clusters.py +192 -0
edsl/tools/embeddings.py +27 -0
edsl/tools/embeddings_plotting.py +118 -0
edsl/tools/plotting.py +112 -0
edsl/tools/summarize.py +18 -0
edsl/utilities/PrettyList.py +56 -0
edsl/utilities/SystemInfo.py +5 -0
edsl/utilities/__init__.py +21 -20
edsl/utilities/ast_utilities.py +3 -0
edsl/utilities/data/Registry.py +2 -0
edsl/utilities/decorators.py +41 -0
edsl/utilities/gcp_bucket/__init__.py +0 -0
edsl/utilities/gcp_bucket/cloud_storage.py +96 -0
edsl/utilities/interface.py +310 -60
edsl/utilities/is_notebook.py +18 -0
edsl/utilities/is_valid_variable_name.py +11 -0
edsl/utilities/naming_utilities.py +263 -0
edsl/utilities/remove_edsl_version.py +24 -0
edsl/utilities/repair_functions.py +28 -0
edsl/utilities/restricted_python.py +70 -0
edsl/utilities/utilities.py +203 -13
edsl-0.1.40.dist-info/METADATA +111 -0
edsl-0.1.40.dist-info/RECORD +362 -0
{edsl-0.1.14.dist-info → edsl-0.1.40.dist-info}/WHEEL +1 -1
edsl/agents/AgentListExportMixin.py +0 -24
edsl/coop/old.py +0 -31
edsl/data/Database.py +0 -141
edsl/data/crud.py +0 -121
edsl/jobs/Interview.py +0 -417
edsl/jobs/JobsRunner.py +0 -63
edsl/jobs/JobsRunnerStatusMixin.py +0 -115
edsl/jobs/base.py +0 -47
edsl/jobs/buckets.py +0 -166
edsl/jobs/runners/JobsRunnerDryRun.py +0 -19
edsl/jobs/runners/JobsRunnerStreaming.py +0 -54
edsl/jobs/task_management.py +0 -218
edsl/jobs/token_tracking.py +0 -78
edsl/language_models/DeepInfra.py +0 -69
edsl/language_models/OpenAI.py +0 -98
edsl/language_models/model_interfaces/GeminiPro.py +0 -66
edsl/language_models/model_interfaces/LanguageModelOpenAIFour.py +0 -8
edsl/language_models/model_interfaces/LanguageModelOpenAIThreeFiveTurbo.py +0 -8
edsl/language_models/model_interfaces/LlamaTwo13B.py +0 -21
edsl/language_models/model_interfaces/LlamaTwo70B.py +0 -21
edsl/language_models/model_interfaces/Mixtral8x7B.py +0 -24
edsl/language_models/registry.py +0 -81
edsl/language_models/schemas.py +0 -15
edsl/language_models/unused/ReplicateBase.py +0 -83
edsl/prompts/QuestionInstructionsBase.py +0 -6
edsl/prompts/library/agent_instructions.py +0 -29
edsl/prompts/library/agent_persona.py +0 -17
edsl/prompts/library/question_budget.py +0 -26
edsl/prompts/library/question_checkbox.py +0 -32
edsl/prompts/library/question_extract.py +0 -19
edsl/prompts/library/question_freetext.py +0 -14
edsl/prompts/library/question_linear_scale.py +0 -20
edsl/prompts/library/question_list.py +0 -22
edsl/prompts/library/question_multiple_choice.py +0 -44
edsl/prompts/library/question_numerical.py +0 -31
edsl/prompts/library/question_rank.py +0 -21
edsl/prompts/prompt_config.py +0 -33
edsl/prompts/registry.py +0 -185
edsl/questions/Question.py +0 -240
edsl/report/InputOutputDataTypes.py +0 -134
edsl/report/RegressionMixin.py +0 -28
edsl/report/ReportOutputs.py +0 -1228
edsl/report/ResultsFetchMixin.py +0 -106
edsl/report/ResultsOutputMixin.py +0 -14
edsl/report/demo.ipynb +0 -645
edsl/results/ResultsDBMixin.py +0 -184
edsl/surveys/SurveyFlowVisualizationMixin.py +0 -92
edsl/trackers/Tracker.py +0 -91
edsl/trackers/TrackerAPI.py +0 -196
edsl/trackers/TrackerTasks.py +0 -70
edsl/utilities/pastebin.py +0 -141
edsl-0.1.14.dist-info/METADATA +0 -69
edsl-0.1.14.dist-info/RECORD +0 -141
/edsl/{language_models/model_interfaces → inference_services}/__init__.py +0 -0
/edsl/{report/__init__.py → jobs/runners/JobsRunnerStatusData.py} +0 -0
/edsl/{trackers/__init__.py → language_models/ServiceDataSources.py} +0 -0
{edsl-0.1.14.dist-info → edsl-0.1.40.dist-info}/LICENSE +0 -0

edsl/agents/Invigilator.py CHANGED Viewed

@@ -1,409 +1,285 @@
-from abc import ABC, abstractmethod
-import asyncio
-import json
-from typing import Coroutine, Dict, Any
-from collections import UserDict
-from edsl.exceptions import AgentRespondedWithBadJSONError
-from edsl.prompts.Prompt import Prompt
-from edsl.utilities.decorators import sync_wrapper, jupyter_nb_handler
-from edsl.prompts.registry import get_classes
-from edsl.exceptions import QuestionScenarioRenderError
-from edsl.data_transfer_models import AgentResponseDict
-from edsl.exceptions.agents import FailedTaskException
-class InvigilatorBase(ABC):
-    """An invigiator (someone who administers an exam) is a class that is responsible for administering a question to an agent."""
-    def __init__(
-        self, agent, question, scenario, model, memory_plan, current_answers: dict
-    ):
-        self.agent = agent
-        self.question = question
-        self.scenario = scenario
-        self.model = model
-        self.memory_plan = memory_plan
-        self.current_answers = current_answers
-    def get_failed_task_result(self):
-        return AgentResponseDict(
-            answer=None,
-            comment="Failed to get response",
-            question_name=self.question.question_name,
-            prompts=self.get_prompts(),
-        )
-    def get_prompts(self) -> Dict[str, Prompt]:
-        return {
-            "user_prompt": Prompt("NA").text,
-            "system_prompt": Prompt("NA").text,
-        }
+"""Module for creating Invigilators, which are objects to administer a question to an Agent."""
-    @classmethod
-    def example(cls):
-        """Returns an example invigilator."""
-        from edsl.agents.Agent import Agent
-        from edsl.questions import QuestionMultipleChoice
-        from edsl.scenarios.Scenario import Scenario
-        from edsl.language_models import LanguageModel
-        from edsl.enums import LanguageModelType, InferenceServiceType
-        class TestLanguageModelGood(LanguageModel):
-            _model_ = LanguageModelType.TEST.value
-            _parameters_ = {"temperature": 0.5}
-            _inference_service_ = InferenceServiceType.TEST.value
-            async def async_execute_model_call(
-                self, user_prompt: str, system_prompt: str
-            ) -> dict[str, Any]:
-                await asyncio.sleep(0.1)
-                return {"message": """{"answer": "SPAM!"}"""}
-            def parse_response(self, raw_response: dict[str, Any]) -> str:
-                return raw_response["message"]
-        model = TestLanguageModelGood()
-        agent = Agent.example()
-        question = QuestionMultipleChoice.example()
-        scenario = Scenario.example()
-        #        model = LanguageModel.example()
-        memory_plan = None
-        current_answers = None
-        return cls(
-            agent=agent,
-            question=question,
-            scenario=scenario,
-            model=model,
-            memory_plan=memory_plan,
-            current_answers=current_answers,
-        )
+from typing import Dict, Any, Optional, TYPE_CHECKING
-    @abstractmethod
-    async def async_answer_question(self):
-        "This is the async method that actually answers the question."
-        pass
+from edsl.utilities.decorators import sync_wrapper
+from edsl.exceptions.questions import QuestionAnswerValidationError
+from edsl.agents.InvigilatorBase import InvigilatorBase
+from edsl.data_transfer_models import AgentResponseDict, EDSLResultObjectInput
-    @jupyter_nb_handler
-    def answer_question(self) -> Coroutine:
-        async def main():
-            results = await asyncio.gather(self.async_answer_question())
-            return results[0]  # Since there's only one task, return its result
+if TYPE_CHECKING:
+    from edsl.prompts.Prompt import Prompt
+    from edsl.scenarios.Scenario import Scenario
+    from edsl.surveys.Survey import Survey
-        return main()
-    def create_memory_prompt(self, question_name):
-        """Creates a memory for the agent."""
-        return self.memory_plan.get_memory_prompt_fragment(
-            question_name, self.current_answers
-        )
+NA = "Not Applicable"
 class InvigilatorAI(InvigilatorBase):
     """An invigilator that uses an AI model to answer questions."""
-    async def async_answer_question(self, failed=False) -> AgentResponseDict:
-        data = {
-            "agent": self.agent,
-            "question": self.question,
-            "scenario": self.scenario,
-        }
-        # This calls the self.async_get_response method w/ the prompts
-        # The raw response is a dictionary.
-        raw_response = await self.async_get_response(**self.get_prompts())
-        assert "raw_model_response" in raw_response
-        response = self._format_raw_response(
-            **(
-                data
-                | {
-                    "raw_response": raw_response,
-                    "raw_model_response": raw_response["raw_model_response"],
-                }
-            )
-        )
-        return response
+    def get_prompts(self) -> Dict[str, "Prompt"]:
+        """Return the prompts used."""
+        return self.prompt_constructor.get_prompts()
-    async def async_get_response(self, user_prompt: Prompt, system_prompt: Prompt):
-        """Calls the LLM and gets a response. Used in the `answer_question` method."""
-        try:
-            response = await self.model.async_get_response(
-                user_prompt.text, system_prompt.text
-            )
-        except json.JSONDecodeError as e:
-            raise AgentRespondedWithBadJSONError(
-                f"Returned bad JSON: {e}"
-                f"Prompt: {user_prompt}"
-                f"System Prompt: {system_prompt}"
-            )
-        return response
-    def _format_raw_response(
-        self, agent, question, scenario, raw_response, raw_model_response
-    ) -> AgentResponseDict:
-        response = question.validate_answer(raw_response)
-        comment = response.get("comment", "")
-        answer_code = response["answer"]
-        answer = question.translate_answer_code_to_answer(answer_code, scenario)
-        raw_model_response = raw_model_response
-        data = {
-            "answer": answer,
-            "comment": comment,
-            "question_name": question.question_name,
-            "prompts": {k: v.to_dict() for k, v in self.get_prompts().items()},
-            "cached_response": raw_response["cached_response"],
-            "usage": raw_response.get("usage", {}),
-            "raw_model_response": raw_model_response,
+    async def async_get_agent_response(self) -> AgentResponseDict:
+        prompts = self.get_prompts()
+        params = {
+            "user_prompt": prompts["user_prompt"].text,
+            "system_prompt": prompts["system_prompt"].text,
         }
-        return AgentResponseDict(**data)
-    get_response = sync_wrapper(async_get_response)
-    def construct_system_prompt(self) -> Prompt:
-        """Constructs the system prompt for the LLM call."""
-        applicable_prompts = get_classes(
-            component_type="agent_instructions",
-            model=self.model.model,
-        )
-        if len(applicable_prompts) == 0:
-            raise Exception("No applicable prompts found")
-        agent_instructions = applicable_prompts[0](text=self.agent.instruction)
-        if not hasattr(self.agent, "agent_persona"):
-            applicable_prompts = get_classes(
-                component_type="agent_persona",
-                model=self.model.model,
-            )
-            persona_prompt_template = applicable_prompts[0]()
-        else:
-            persona_prompt_template = self.agent.agent_persona
-        if undefined := persona_prompt_template.undefined_template_variables(
-            self.agent.traits
-            | {"traits": self.agent.traits}
-            | {"codebook": self.agent.codebook}
-            | {"traits": self.agent.traits}
-        ):
-            raise QuestionScenarioRenderError(
-                f"Agent persona still has variables that were not rendered: {undefined}"
-            )
-        persona_prompt = persona_prompt_template.render(
-            self.agent.traits | {"traits": self.agent.traits},
-            codebook=self.agent.codebook,
-            traits=self.agent.traits,
-        )
-        if persona_prompt.has_variables:
-            raise QuestionScenarioRenderError(
-                "Agent persona still has variables that were not rendered."
-            )
-        return (
-            agent_instructions
-            + " " * int(len(persona_prompt.text) > 0)
-            + persona_prompt
+        if "encoded_image" in prompts:
+            params["encoded_image"] = prompts["encoded_image"]
+            raise NotImplementedError("encoded_image not implemented")
+        if "files_list" in prompts:
+            params["files_list"] = prompts["files_list"]
+        params.update({"iteration": self.iteration, "cache": self.cache})
+        params.update({"invigilator": self})
+        if self.key_lookup:
+            self.model.set_key_lookup(self.key_lookup)
+        return await self.model.async_get_response(**params)
+    def store_response(self, agent_response_dict: AgentResponseDict) -> None:
+        """Store the response in the invigilator, in case it is needed later because of validation failure."""
+        self.raw_model_response = agent_response_dict.model_outputs.response
+        self.generated_tokens = agent_response_dict.edsl_dict.generated_tokens
+        self.cache_key = agent_response_dict.model_outputs.cache_key
+    async def async_answer_question(self) -> EDSLResultObjectInput:
+        """Answer a question using the AI model.
+        >>> i = InvigilatorAI.example()
+        """
+        agent_response_dict: AgentResponseDict = await self.async_get_agent_response()
+        self.store_response(agent_response_dict)
+        return self._extract_edsl_result_entry_and_validate(agent_response_dict)
+    def _remove_from_cache(self, cache_key) -> None:
+        """Remove an entry from the cache."""
+        if cache_key:
+            del self.cache.data[cache_key]
+    def _determine_answer(self, raw_answer: str) -> Any:
+        """Determine the answer from the raw answer.
+        >>> i = InvigilatorAI.example()
+        >>> i._determine_answer("SPAM!")
+        'SPAM!'
+        >>> from edsl.questions import QuestionMultipleChoice
+        >>> q = QuestionMultipleChoice(question_text = "How are you?", question_name = "how_are_you", question_options = ["Good", "Bad"], use_code = True)
+        >>> i = InvigilatorAI.example(question = q)
+        >>> i._determine_answer("1")
+        'Bad'
+        >>> i._determine_answer("0")
+        'Good'
+        This shows how the answer can depend on scenario details
+        >>> from edsl import Scenario
+        >>> s = Scenario({'feeling_options':['Good', 'Bad']})
+        >>> q = QuestionMultipleChoice(question_text = "How are you?", question_name = "how_are_you", question_options = "{{ feeling_options }}", use_code = True)
+        >>> i = InvigilatorAI.example(question = q, scenario = s)
+        >>> i._determine_answer("1")
+        'Bad'
+        >>> from edsl import QuestionList, QuestionMultipleChoice, Survey
+        >>> q1 = QuestionList(question_name = "favs", question_text = "What are your top 3 colors?")
+        >>> q2 = QuestionMultipleChoice(question_text = "What is your favorite color?", question_name = "best", question_options = "{{ favs.answer }}", use_code = True)
+        >>> survey = Survey([q1, q2])
+        >>> i = InvigilatorAI.example(question = q2, scenario = s, survey = survey)
+        >>> i.current_answers = {"favs": ["Green", "Blue", "Red"]}
+        >>> i._determine_answer("2")
+        'Red'
+        """
+        substitution_dict = self._prepare_substitution_dict(
+            self.survey, self.current_answers, self.scenario
         )
-    def get_question_instructions(self) -> Prompt:
-        """Gets the instructions for the question."""
-        applicable_prompts = get_classes(
-            component_type="question_instructions",
-            question_type=self.question.question_type,
-            model=self.model.model,
+        return self.question._translate_answer_code_to_answer(
+            raw_answer, substitution_dict
         )
-        ## Get the question instructions and renders with the scenario & question.data
-        question_prompt = applicable_prompts[0]()
-        undefined_template_variables = question_prompt.undefined_template_variables(
-            self.question.data | self.scenario
-        )
-        if undefined_template_variables:
-            print(undefined_template_variables)
-            raise QuestionScenarioRenderError(
-                "Question instructions still has variables"
-            )
-        return question_prompt.render(self.question.data | self.scenario)
-    def construct_user_prompt(self) -> Prompt:
-        """Gets the user prompt for the LLM call."""
-        user_prompt = self.get_question_instructions()
-        if self.memory_plan is not None:
-            user_prompt += self.create_memory_prompt(self.question.question_name)
-        return user_prompt
-    def get_prompts(self) -> Dict[str, Prompt]:
-        """Gets the prompts for the LLM call."""
-        system_prompt = self.construct_system_prompt()
-        user_prompt = self.construct_user_prompt()
-        return {
-            "user_prompt": user_prompt,
-            "system_prompt": system_prompt,
-        }
+    @staticmethod
+    def _prepare_substitution_dict(
+        survey: "Survey", current_answers: dict, scenario: "Scenario"
+    ) -> Dict[str, Any]:
+        """Prepares a substitution dictionary for the question based on the survey, current answers, and scenario.
+        This is necessary because sometimes the model's answer to a question could depend on details in
+        the prompt that were provided by the answer to a previous question or a scenario detail.
+        Note that the question object is getting the answer & the comment appended to it, as the
+        jinja2 template might be referencing these values with a dot notation.
+        """
+        question_dict = survey.duplicate().question_names_to_questions()
+        # iterates through the current answers and updates the question_dict (which is all questions)
+        for other_question, answer in current_answers.items():
+            if other_question in question_dict:
+                question_dict[other_question].answer = answer
+            else:
+                # it might be a comment
+                if (
+                    new_question := other_question.split("_comment")[0]
+                ) in question_dict:
+                    question_dict[new_question].comment = answer
+        return {**question_dict, **scenario}
+    def _extract_edsl_result_entry_and_validate(
+        self, agent_response_dict: AgentResponseDict
+    ) -> EDSLResultObjectInput:
+        """Extract the EDSL result entry and validate it."""
+        edsl_dict = agent_response_dict.edsl_dict._asdict()
+        exception_occurred = None
+        validated = False
+        try:
+            # if the question has jinja parameters, it is easier to make a new question with the parameters
+            if self.question.parameters:
+                prior_answers_dict = self.prompt_constructor.prior_answers_dict()
+                # question options have to be treated differently because of dynamic question
+                # this logic is all in the prompt constructor
+                if "question_options" in self.question.data:
+                    new_question_options = self.prompt_constructor.get_question_options(
+                        self.question.data
+                    )
+                    if new_question_options != self.question.data["question_options"]:
+                        # I don't love this direct writing but it seems to work
+                        self.question.question_options = new_question_options
+                question_with_validators = self.question.render(
+                    self.scenario | prior_answers_dict
+                )
+                question_with_validators.use_code = self.question.use_code
+            else:
+                question_with_validators = self.question
+            validated_edsl_dict = question_with_validators._validate_answer(edsl_dict)
+            answer = self._determine_answer(validated_edsl_dict["answer"])
+            comment = validated_edsl_dict.get("comment", "")
+            validated = True
+        except QuestionAnswerValidationError as e:
+            answer = None
+            comment = "The response was not valid."
+            # if self.raise_validation_errors:
+            exception_occurred = e
+        except Exception as non_validation_error:
+            answer = None
+            comment = "Some other error occurred."
+            exception_occurred = non_validation_error
+        finally:
+            # even if validation fails, we still return the result
+            data = {
+                "answer": answer,
+                "comment": comment,
+                "generated_tokens": agent_response_dict.edsl_dict.generated_tokens,
+                "question_name": self.question.question_name,
+                "prompts": self.get_prompts(),
+                "cached_response": agent_response_dict.model_outputs.cached_response,
+                "raw_model_response": agent_response_dict.model_outputs.response,
+                "cache_used": agent_response_dict.model_outputs.cache_used,
+                "cache_key": agent_response_dict.model_outputs.cache_key,
+                "validated": validated,
+                "exception_occurred": exception_occurred,
+                "cost": agent_response_dict.model_outputs.cost,
+            }
+            result = EDSLResultObjectInput(**data)
+            return result
     answer_question = sync_wrapper(async_answer_question)
-class InvigilatorDebug(InvigilatorBase):
-    async def async_answer_question(self) -> AgentResponseDict:
-        results = self.question.simulate_answer(human_readable=True)
-        results["prompts"] = self.get_prompts()
-        results["question_name"] = self.question.question_name
-        results["comment"] = "Debug comment"
-        return AgentResponseDict(**results)
+class InvigilatorHuman(InvigilatorBase):
+    """An invigilator for when a human is answering the question."""
-    def get_prompts(self) -> Dict[str, Prompt]:
-        return {
-            "user_prompt": Prompt("NA").text,
-            "system_prompt": Prompt("NA").text,
-        }
+    validate_response: bool = False
+    translate_response: bool = False
+    async def async_answer_question(self, iteration: int = 0) -> AgentResponseDict:
+        """Return the answer to the question."""
+        comment = "This is a real survey response from a human."
-class InvigilatorHuman(InvigilatorBase):
-    async def async_answer_question(self) -> AgentResponseDict:
-        data = {
-            "comment": "This is a real survey response from a human.",
-            "answer": None,
-            "prompts": self.get_prompts(),
-            "question_name": self.question.question_name,
-        }
+        def __repr__(self):
+            return f"{self.literal}"
+        exception_occurred = None
+        validated = False
         try:
             answer = self.agent.answer_question_directly(self.question, self.scenario)
-            return AgentResponseDict(**(data | {"answer": answer}))
+            self.raw_model_response = answer
+            if self.validate_response:
+                _ = self.question._validate_answer({"answer": answer})
+            if self.translate_response:
+                answer = self.question._translate_answer_code_to_answer(
+                    answer, self.scenario
+                )
+            validated = True
+        except QuestionAnswerValidationError as e:
+            answer = None
+            if self.raise_validation_errors:
+                exception_occurred = e
         except Exception as e:
-            agent_response_dict = AgentResponseDict(
-                **(data | {"answer": None, "comment": str(e)})
-            )
-            raise FailedTaskException(
-                f"Failed to get response. The exception is {str(e)}",
-                agent_response_dict,
-            ) from e
+            answer = None
+            if self.raise_validation_errors:
+                exception_occurred = e
+        finally:
+            data = {
+                "generated_tokens": NA,  # NotApplicable(),
+                "question_name": self.question.question_name,
+                "prompts": self.get_prompts(),
+                "cached_response": NA,
+                "raw_model_response": NA,
+                "cache_used": NA,
+                "cache_key": NA,
+                "answer": answer,
+                "comment": comment,
+                "validated": validated,
+                "exception_occurred": exception_occurred,
+            }
+            return EDSLResultObjectInput(**data)
 class InvigilatorFunctional(InvigilatorBase):
-    async def async_answer_question(self) -> AgentResponseDict:
+    """An Invigilator for when the question has an answer_question_directly function."""
+    async def async_answer_question(self, iteration: int = 0) -> AgentResponseDict:
+        """Return the answer to the question."""
         func = self.question.answer_question_directly
-        data = {
-            "comment": "Functional.",
-            "prompts": self.get_prompts(),
-            "question_name": self.question.question_name,
-        }
-        try:
-            answer = func(scenario=self.scenario, agent_traits=self.agent.traits)
-            return AgentResponseDict(**(data | {"answer": answer}))
-        except Exception as e:
-            agent_response_dict = AgentResponseDict(
-                **(data | {"answer": None, "comment": str(e)})
-            )
-            raise FailedTaskException(
-                f"Failed to get response. The exception is {str(e)}",
-                agent_response_dict,
-            ) from e
-    def get_prompts(self) -> Dict[str, Prompt]:
+        answer = func(scenario=self.scenario, agent_traits=self.agent.traits)
+        return EDSLResultObjectInput(
+            generated_tokens=str(answer),
+            question_name=self.question.question_name,
+            prompts=self.get_prompts(),
+            cached_response=NA,
+            raw_model_response=NA,
+            cache_used=NA,
+            cache_key=NA,
+            answer=answer["answer"],
+            comment="This is the result of a functional question.",
+            validated=True,
+            exception_occurred=None,
+        )
+    def get_prompts(self) -> Dict[str, "Prompt"]:
+        from edsl.prompts.Prompt import Prompt
+        """Return the prompts used."""
         return {
-            "user_prompt": Prompt("NA").text,
-            "system_prompt": Prompt("NA").text,
+            "user_prompt": Prompt("NA"),
+            "system_prompt": Prompt("NA"),
         }
 if __name__ == "__main__":
-    from edsl.enums import LanguageModelType
-    from edsl.agents.Agent import Agent
-    a = Agent(
-        instruction="You are a happy-go lucky agent.",
-        traits={"feeling": "happy", "age": "Young at heart"},
-        codebook={"feeling": "Feelings right now", "age": "Age in years"},
-        trait_presentation_template="",
-    )
-    class MockModel:
-        model = LanguageModelType.GPT_4.value
-    class MockQuestion:
-        question_type = "free_text"
-        question_text = "How are you feeling?"
-        question_name = "feelings_question"
-        data = {
-            "question_name": "feelings",
-            "question_text": "How are you feeling?",
-            "question_type": "feelings_question",
-        }
+    import doctest
-    i = InvigilatorAI(
-        agent=a,
-        question=MockQuestion(),
-        scenario={},
-        model=MockModel(),
-        memory_plan=None,
-        current_answers=None,
-    )
-    print(i.get_prompts()["system_prompt"])
-    assert i.get_prompts()["system_prompt"].text == "You are a happy-go lucky agent."
-    ###############
-    ## Render one
-    ###############
-    a = Agent(
-        instruction="You are a happy-go lucky agent.",
-        traits={"feeling": "happy", "age": "Young at heart"},
-        codebook={"feeling": "Feelings right now", "age": "Age in years"},
-        trait_presentation_template="You are feeling {{ feeling }}.",
-    )
-    i = InvigilatorAI(
-        agent=a,
-        question=MockQuestion(),
-        scenario={},
-        model=MockModel(),
-        memory_plan=None,
-        current_answers=None,
-    )
-    print(i.get_prompts()["system_prompt"])
-    assert (
-        i.get_prompts()["system_prompt"].text
-        == "You are a happy-go lucky agent. You are feeling happy."
-    )
-    try:
-        assert i.get_prompts()["system_prompt"].unused_traits(a.traits) == ["age"]
-    except AssertionError:
-        unused_traits = i.get_prompts()["system_prompt"].unused_traits(a.traits)
-        print(f"System prompt: {i.get_prompts()['system_prompt']}")
-        print(f"Agent traits: {a.traits}")
-        print(f"Unused_traits: {unused_traits}")
-        # breakpoint()
-    ###############
-    ## Render one
-    ###############
-    a = Agent(
-        instruction="You are a happy-go lucky agent.",
-        traits={"feeling": "happy", "age": "Young at heart"},
-        codebook={"feeling": "Feelings right now", "age": "Age in years"},
-        trait_presentation_template="You are feeling {{ feeling }}. You eat lots of {{ food }}.",
-    )
-    i = InvigilatorAI(
-        agent=a,
-        question=MockQuestion(),
-        scenario={},
-        model=MockModel(),
-        memory_plan=None,
-        current_answers=None,
-    )
-    print(i.get_prompts()["system_prompt"])
-    ## Should raise a QuestionScenarioRenderError
-    assert (
-        i.get_prompts()["system_prompt"].text
-        == "You are a happy-go lucky agent. You are feeling happy."
-    )
+    doctest.testmod(optionflags=doctest.ELLIPSIS)

edsl 0.1.14__py3-none-any.whl → 0.1.40__py3-none-any.whl

edsl 0.1.14__py3-none-any.whl → 0.1.40__py3-none-any.whl