edsl 0.1.14__py3-none-any.whl → 0.1.40__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- edsl/Base.py +348 -38
- edsl/BaseDiff.py +260 -0
- edsl/TemplateLoader.py +24 -0
- edsl/__init__.py +46 -10
- edsl/__version__.py +1 -0
- edsl/agents/Agent.py +842 -144
- edsl/agents/AgentList.py +521 -25
- edsl/agents/Invigilator.py +250 -374
- edsl/agents/InvigilatorBase.py +257 -0
- edsl/agents/PromptConstructor.py +272 -0
- edsl/agents/QuestionInstructionPromptBuilder.py +128 -0
- edsl/agents/QuestionTemplateReplacementsBuilder.py +137 -0
- edsl/agents/descriptors.py +43 -13
- edsl/agents/prompt_helpers.py +129 -0
- edsl/agents/question_option_processor.py +172 -0
- edsl/auto/AutoStudy.py +130 -0
- edsl/auto/StageBase.py +243 -0
- edsl/auto/StageGenerateSurvey.py +178 -0
- edsl/auto/StageLabelQuestions.py +125 -0
- edsl/auto/StagePersona.py +61 -0
- edsl/auto/StagePersonaDimensionValueRanges.py +88 -0
- edsl/auto/StagePersonaDimensionValues.py +74 -0
- edsl/auto/StagePersonaDimensions.py +69 -0
- edsl/auto/StageQuestions.py +74 -0
- edsl/auto/SurveyCreatorPipeline.py +21 -0
- edsl/auto/utilities.py +218 -0
- edsl/base/Base.py +279 -0
- edsl/config.py +121 -104
- edsl/conversation/Conversation.py +290 -0
- edsl/conversation/car_buying.py +59 -0
- edsl/conversation/chips.py +95 -0
- edsl/conversation/mug_negotiation.py +81 -0
- edsl/conversation/next_speaker_utilities.py +93 -0
- edsl/coop/CoopFunctionsMixin.py +15 -0
- edsl/coop/ExpectedParrotKeyHandler.py +125 -0
- edsl/coop/PriceFetcher.py +54 -0
- edsl/coop/__init__.py +1 -0
- edsl/coop/coop.py +1029 -134
- edsl/coop/utils.py +131 -0
- edsl/data/Cache.py +560 -89
- edsl/data/CacheEntry.py +230 -0
- edsl/data/CacheHandler.py +168 -0
- edsl/data/RemoteCacheSync.py +186 -0
- edsl/data/SQLiteDict.py +292 -0
- edsl/data/__init__.py +5 -3
- edsl/data/orm.py +6 -33
- edsl/data_transfer_models.py +74 -27
- edsl/enums.py +165 -8
- edsl/exceptions/BaseException.py +21 -0
- edsl/exceptions/__init__.py +52 -46
- edsl/exceptions/agents.py +33 -15
- edsl/exceptions/cache.py +5 -0
- edsl/exceptions/coop.py +8 -0
- edsl/exceptions/general.py +34 -0
- edsl/exceptions/inference_services.py +5 -0
- edsl/exceptions/jobs.py +15 -0
- edsl/exceptions/language_models.py +46 -1
- edsl/exceptions/questions.py +80 -5
- edsl/exceptions/results.py +16 -5
- edsl/exceptions/scenarios.py +29 -0
- edsl/exceptions/surveys.py +13 -10
- edsl/inference_services/AnthropicService.py +106 -0
- edsl/inference_services/AvailableModelCacheHandler.py +184 -0
- edsl/inference_services/AvailableModelFetcher.py +215 -0
- edsl/inference_services/AwsBedrock.py +118 -0
- edsl/inference_services/AzureAI.py +215 -0
- edsl/inference_services/DeepInfraService.py +18 -0
- edsl/inference_services/GoogleService.py +143 -0
- edsl/inference_services/GroqService.py +20 -0
- edsl/inference_services/InferenceServiceABC.py +80 -0
- edsl/inference_services/InferenceServicesCollection.py +138 -0
- edsl/inference_services/MistralAIService.py +120 -0
- edsl/inference_services/OllamaService.py +18 -0
- edsl/inference_services/OpenAIService.py +236 -0
- edsl/inference_services/PerplexityService.py +160 -0
- edsl/inference_services/ServiceAvailability.py +135 -0
- edsl/inference_services/TestService.py +90 -0
- edsl/inference_services/TogetherAIService.py +172 -0
- edsl/inference_services/data_structures.py +134 -0
- edsl/inference_services/models_available_cache.py +118 -0
- edsl/inference_services/rate_limits_cache.py +25 -0
- edsl/inference_services/registry.py +41 -0
- edsl/inference_services/write_available.py +10 -0
- edsl/jobs/AnswerQuestionFunctionConstructor.py +223 -0
- edsl/jobs/Answers.py +21 -20
- edsl/jobs/FetchInvigilator.py +47 -0
- edsl/jobs/InterviewTaskManager.py +98 -0
- edsl/jobs/InterviewsConstructor.py +50 -0
- edsl/jobs/Jobs.py +684 -204
- edsl/jobs/JobsChecks.py +172 -0
- edsl/jobs/JobsComponentConstructor.py +189 -0
- edsl/jobs/JobsPrompts.py +270 -0
- edsl/jobs/JobsRemoteInferenceHandler.py +311 -0
- edsl/jobs/JobsRemoteInferenceLogger.py +239 -0
- edsl/jobs/RequestTokenEstimator.py +30 -0
- edsl/jobs/async_interview_runner.py +138 -0
- edsl/jobs/buckets/BucketCollection.py +104 -0
- edsl/jobs/buckets/ModelBuckets.py +65 -0
- edsl/jobs/buckets/TokenBucket.py +283 -0
- edsl/jobs/buckets/TokenBucketAPI.py +211 -0
- edsl/jobs/buckets/TokenBucketClient.py +191 -0
- edsl/jobs/check_survey_scenario_compatibility.py +85 -0
- edsl/jobs/data_structures.py +120 -0
- edsl/jobs/decorators.py +35 -0
- edsl/jobs/interviews/Interview.py +392 -0
- edsl/jobs/interviews/InterviewExceptionCollection.py +99 -0
- edsl/jobs/interviews/InterviewExceptionEntry.py +186 -0
- edsl/jobs/interviews/InterviewStatistic.py +63 -0
- edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -0
- edsl/jobs/interviews/InterviewStatusDictionary.py +78 -0
- edsl/jobs/interviews/InterviewStatusLog.py +92 -0
- edsl/jobs/interviews/ReportErrors.py +66 -0
- edsl/jobs/interviews/interview_status_enum.py +9 -0
- edsl/jobs/jobs_status_enums.py +9 -0
- edsl/jobs/loggers/HTMLTableJobLogger.py +304 -0
- edsl/jobs/results_exceptions_handler.py +98 -0
- edsl/jobs/runners/JobsRunnerAsyncio.py +151 -110
- edsl/jobs/runners/JobsRunnerStatus.py +298 -0
- edsl/jobs/tasks/QuestionTaskCreator.py +244 -0
- edsl/jobs/tasks/TaskCreators.py +64 -0
- edsl/jobs/tasks/TaskHistory.py +470 -0
- edsl/jobs/tasks/TaskStatusLog.py +23 -0
- edsl/jobs/tasks/task_status_enum.py +161 -0
- edsl/jobs/tokens/InterviewTokenUsage.py +27 -0
- edsl/jobs/tokens/TokenUsage.py +34 -0
- edsl/language_models/ComputeCost.py +63 -0
- edsl/language_models/LanguageModel.py +507 -386
- edsl/language_models/ModelList.py +164 -0
- edsl/language_models/PriceManager.py +127 -0
- edsl/language_models/RawResponseHandler.py +106 -0
- edsl/language_models/RegisterLanguageModelsMeta.py +184 -0
- edsl/language_models/__init__.py +1 -8
- edsl/language_models/fake_openai_call.py +15 -0
- edsl/language_models/fake_openai_service.py +61 -0
- edsl/language_models/key_management/KeyLookup.py +63 -0
- edsl/language_models/key_management/KeyLookupBuilder.py +273 -0
- edsl/language_models/key_management/KeyLookupCollection.py +38 -0
- edsl/language_models/key_management/__init__.py +0 -0
- edsl/language_models/key_management/models.py +131 -0
- edsl/language_models/model.py +256 -0
- edsl/language_models/repair.py +109 -41
- edsl/language_models/utilities.py +65 -0
- edsl/notebooks/Notebook.py +263 -0
- edsl/notebooks/NotebookToLaTeX.py +142 -0
- edsl/notebooks/__init__.py +1 -0
- edsl/prompts/Prompt.py +222 -93
- edsl/prompts/__init__.py +1 -1
- edsl/questions/ExceptionExplainer.py +77 -0
- edsl/questions/HTMLQuestion.py +103 -0
- edsl/questions/QuestionBase.py +518 -0
- edsl/questions/QuestionBasePromptsMixin.py +221 -0
- edsl/questions/QuestionBudget.py +164 -67
- edsl/questions/QuestionCheckBox.py +281 -62
- edsl/questions/QuestionDict.py +343 -0
- edsl/questions/QuestionExtract.py +136 -50
- edsl/questions/QuestionFreeText.py +79 -55
- edsl/questions/QuestionFunctional.py +138 -41
- edsl/questions/QuestionList.py +184 -57
- edsl/questions/QuestionMatrix.py +265 -0
- edsl/questions/QuestionMultipleChoice.py +293 -69
- edsl/questions/QuestionNumerical.py +109 -56
- edsl/questions/QuestionRank.py +244 -49
- edsl/questions/Quick.py +41 -0
- edsl/questions/SimpleAskMixin.py +74 -0
- edsl/questions/__init__.py +9 -6
- edsl/questions/{AnswerValidatorMixin.py → answer_validator_mixin.py} +153 -38
- edsl/questions/compose_questions.py +13 -7
- edsl/questions/data_structures.py +20 -0
- edsl/questions/decorators.py +21 -0
- edsl/questions/derived/QuestionLikertFive.py +28 -26
- edsl/questions/derived/QuestionLinearScale.py +41 -28
- edsl/questions/derived/QuestionTopK.py +34 -26
- edsl/questions/derived/QuestionYesNo.py +40 -27
- edsl/questions/descriptors.py +228 -74
- edsl/questions/loop_processor.py +149 -0
- edsl/questions/prompt_templates/question_budget.jinja +13 -0
- edsl/questions/prompt_templates/question_checkbox.jinja +32 -0
- edsl/questions/prompt_templates/question_extract.jinja +11 -0
- edsl/questions/prompt_templates/question_free_text.jinja +3 -0
- edsl/questions/prompt_templates/question_linear_scale.jinja +11 -0
- edsl/questions/prompt_templates/question_list.jinja +17 -0
- edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -0
- edsl/questions/prompt_templates/question_numerical.jinja +37 -0
- edsl/questions/question_base_gen_mixin.py +168 -0
- edsl/questions/question_registry.py +130 -46
- edsl/questions/register_questions_meta.py +71 -0
- edsl/questions/response_validator_abc.py +188 -0
- edsl/questions/response_validator_factory.py +34 -0
- edsl/questions/settings.py +5 -2
- edsl/questions/templates/__init__.py +0 -0
- edsl/questions/templates/budget/__init__.py +0 -0
- edsl/questions/templates/budget/answering_instructions.jinja +7 -0
- edsl/questions/templates/budget/question_presentation.jinja +7 -0
- edsl/questions/templates/checkbox/__init__.py +0 -0
- edsl/questions/templates/checkbox/answering_instructions.jinja +10 -0
- edsl/questions/templates/checkbox/question_presentation.jinja +22 -0
- edsl/questions/templates/dict/__init__.py +0 -0
- edsl/questions/templates/dict/answering_instructions.jinja +21 -0
- edsl/questions/templates/dict/question_presentation.jinja +1 -0
- edsl/questions/templates/extract/__init__.py +0 -0
- edsl/questions/templates/extract/answering_instructions.jinja +7 -0
- edsl/questions/templates/extract/question_presentation.jinja +1 -0
- edsl/questions/templates/free_text/__init__.py +0 -0
- edsl/questions/templates/free_text/answering_instructions.jinja +0 -0
- edsl/questions/templates/free_text/question_presentation.jinja +1 -0
- edsl/questions/templates/likert_five/__init__.py +0 -0
- edsl/questions/templates/likert_five/answering_instructions.jinja +10 -0
- edsl/questions/templates/likert_five/question_presentation.jinja +12 -0
- edsl/questions/templates/linear_scale/__init__.py +0 -0
- edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -0
- edsl/questions/templates/linear_scale/question_presentation.jinja +5 -0
- edsl/questions/templates/list/__init__.py +0 -0
- edsl/questions/templates/list/answering_instructions.jinja +4 -0
- edsl/questions/templates/list/question_presentation.jinja +5 -0
- edsl/questions/templates/matrix/__init__.py +1 -0
- edsl/questions/templates/matrix/answering_instructions.jinja +5 -0
- edsl/questions/templates/matrix/question_presentation.jinja +20 -0
- edsl/questions/templates/multiple_choice/__init__.py +0 -0
- edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -0
- edsl/questions/templates/multiple_choice/html.jinja +0 -0
- edsl/questions/templates/multiple_choice/question_presentation.jinja +12 -0
- edsl/questions/templates/numerical/__init__.py +0 -0
- edsl/questions/templates/numerical/answering_instructions.jinja +7 -0
- edsl/questions/templates/numerical/question_presentation.jinja +7 -0
- edsl/questions/templates/rank/__init__.py +0 -0
- edsl/questions/templates/rank/answering_instructions.jinja +11 -0
- edsl/questions/templates/rank/question_presentation.jinja +15 -0
- edsl/questions/templates/top_k/__init__.py +0 -0
- edsl/questions/templates/top_k/answering_instructions.jinja +8 -0
- edsl/questions/templates/top_k/question_presentation.jinja +22 -0
- edsl/questions/templates/yes_no/__init__.py +0 -0
- edsl/questions/templates/yes_no/answering_instructions.jinja +6 -0
- edsl/questions/templates/yes_no/question_presentation.jinja +12 -0
- edsl/results/CSSParameterizer.py +108 -0
- edsl/results/Dataset.py +550 -19
- edsl/results/DatasetExportMixin.py +594 -0
- edsl/results/DatasetTree.py +295 -0
- edsl/results/MarkdownToDocx.py +122 -0
- edsl/results/MarkdownToPDF.py +111 -0
- edsl/results/Result.py +477 -173
- edsl/results/Results.py +987 -269
- edsl/results/ResultsExportMixin.py +28 -125
- edsl/results/ResultsGGMixin.py +83 -15
- edsl/results/TableDisplay.py +125 -0
- edsl/results/TextEditor.py +50 -0
- edsl/results/__init__.py +1 -1
- edsl/results/file_exports.py +252 -0
- edsl/results/results_fetch_mixin.py +33 -0
- edsl/results/results_selector.py +145 -0
- edsl/results/results_tools_mixin.py +98 -0
- edsl/results/smart_objects.py +96 -0
- edsl/results/table_data_class.py +12 -0
- edsl/results/table_display.css +78 -0
- edsl/results/table_renderers.py +118 -0
- edsl/results/tree_explore.py +115 -0
- edsl/scenarios/ConstructDownloadLink.py +109 -0
- edsl/scenarios/DocumentChunker.py +102 -0
- edsl/scenarios/DocxScenario.py +16 -0
- edsl/scenarios/FileStore.py +543 -0
- edsl/scenarios/PdfExtractor.py +40 -0
- edsl/scenarios/Scenario.py +431 -62
- edsl/scenarios/ScenarioHtmlMixin.py +65 -0
- edsl/scenarios/ScenarioList.py +1415 -45
- edsl/scenarios/ScenarioListExportMixin.py +45 -0
- edsl/scenarios/ScenarioListPdfMixin.py +239 -0
- edsl/scenarios/__init__.py +2 -0
- edsl/scenarios/directory_scanner.py +96 -0
- edsl/scenarios/file_methods.py +85 -0
- edsl/scenarios/handlers/__init__.py +13 -0
- edsl/scenarios/handlers/csv.py +49 -0
- edsl/scenarios/handlers/docx.py +76 -0
- edsl/scenarios/handlers/html.py +37 -0
- edsl/scenarios/handlers/json.py +111 -0
- edsl/scenarios/handlers/latex.py +5 -0
- edsl/scenarios/handlers/md.py +51 -0
- edsl/scenarios/handlers/pdf.py +68 -0
- edsl/scenarios/handlers/png.py +39 -0
- edsl/scenarios/handlers/pptx.py +105 -0
- edsl/scenarios/handlers/py.py +294 -0
- edsl/scenarios/handlers/sql.py +313 -0
- edsl/scenarios/handlers/sqlite.py +149 -0
- edsl/scenarios/handlers/txt.py +33 -0
- edsl/scenarios/scenario_join.py +131 -0
- edsl/scenarios/scenario_selector.py +156 -0
- edsl/shared.py +1 -0
- edsl/study/ObjectEntry.py +173 -0
- edsl/study/ProofOfWork.py +113 -0
- edsl/study/SnapShot.py +80 -0
- edsl/study/Study.py +521 -0
- edsl/study/__init__.py +4 -0
- edsl/surveys/ConstructDAG.py +92 -0
- edsl/surveys/DAG.py +92 -11
- edsl/surveys/EditSurvey.py +221 -0
- edsl/surveys/InstructionHandler.py +100 -0
- edsl/surveys/Memory.py +9 -4
- edsl/surveys/MemoryManagement.py +72 -0
- edsl/surveys/MemoryPlan.py +156 -35
- edsl/surveys/Rule.py +221 -74
- edsl/surveys/RuleCollection.py +241 -61
- edsl/surveys/RuleManager.py +172 -0
- edsl/surveys/Simulator.py +75 -0
- edsl/surveys/Survey.py +1079 -339
- edsl/surveys/SurveyCSS.py +273 -0
- edsl/surveys/SurveyExportMixin.py +235 -40
- edsl/surveys/SurveyFlowVisualization.py +181 -0
- edsl/surveys/SurveyQualtricsImport.py +284 -0
- edsl/surveys/SurveyToApp.py +141 -0
- edsl/surveys/__init__.py +4 -2
- edsl/surveys/base.py +19 -3
- edsl/surveys/descriptors.py +17 -6
- edsl/surveys/instructions/ChangeInstruction.py +48 -0
- edsl/surveys/instructions/Instruction.py +56 -0
- edsl/surveys/instructions/InstructionCollection.py +82 -0
- edsl/surveys/instructions/__init__.py +0 -0
- edsl/templates/error_reporting/base.html +24 -0
- edsl/templates/error_reporting/exceptions_by_model.html +35 -0
- edsl/templates/error_reporting/exceptions_by_question_name.html +17 -0
- edsl/templates/error_reporting/exceptions_by_type.html +17 -0
- edsl/templates/error_reporting/interview_details.html +116 -0
- edsl/templates/error_reporting/interviews.html +19 -0
- edsl/templates/error_reporting/overview.html +5 -0
- edsl/templates/error_reporting/performance_plot.html +2 -0
- edsl/templates/error_reporting/report.css +74 -0
- edsl/templates/error_reporting/report.html +118 -0
- edsl/templates/error_reporting/report.js +25 -0
- edsl/tools/__init__.py +1 -0
- edsl/tools/clusters.py +192 -0
- edsl/tools/embeddings.py +27 -0
- edsl/tools/embeddings_plotting.py +118 -0
- edsl/tools/plotting.py +112 -0
- edsl/tools/summarize.py +18 -0
- edsl/utilities/PrettyList.py +56 -0
- edsl/utilities/SystemInfo.py +5 -0
- edsl/utilities/__init__.py +21 -20
- edsl/utilities/ast_utilities.py +3 -0
- edsl/utilities/data/Registry.py +2 -0
- edsl/utilities/decorators.py +41 -0
- edsl/utilities/gcp_bucket/__init__.py +0 -0
- edsl/utilities/gcp_bucket/cloud_storage.py +96 -0
- edsl/utilities/interface.py +310 -60
- edsl/utilities/is_notebook.py +18 -0
- edsl/utilities/is_valid_variable_name.py +11 -0
- edsl/utilities/naming_utilities.py +263 -0
- edsl/utilities/remove_edsl_version.py +24 -0
- edsl/utilities/repair_functions.py +28 -0
- edsl/utilities/restricted_python.py +70 -0
- edsl/utilities/utilities.py +203 -13
- edsl-0.1.40.dist-info/METADATA +111 -0
- edsl-0.1.40.dist-info/RECORD +362 -0
- {edsl-0.1.14.dist-info → edsl-0.1.40.dist-info}/WHEEL +1 -1
- edsl/agents/AgentListExportMixin.py +0 -24
- edsl/coop/old.py +0 -31
- edsl/data/Database.py +0 -141
- edsl/data/crud.py +0 -121
- edsl/jobs/Interview.py +0 -417
- edsl/jobs/JobsRunner.py +0 -63
- edsl/jobs/JobsRunnerStatusMixin.py +0 -115
- edsl/jobs/base.py +0 -47
- edsl/jobs/buckets.py +0 -166
- edsl/jobs/runners/JobsRunnerDryRun.py +0 -19
- edsl/jobs/runners/JobsRunnerStreaming.py +0 -54
- edsl/jobs/task_management.py +0 -218
- edsl/jobs/token_tracking.py +0 -78
- edsl/language_models/DeepInfra.py +0 -69
- edsl/language_models/OpenAI.py +0 -98
- edsl/language_models/model_interfaces/GeminiPro.py +0 -66
- edsl/language_models/model_interfaces/LanguageModelOpenAIFour.py +0 -8
- edsl/language_models/model_interfaces/LanguageModelOpenAIThreeFiveTurbo.py +0 -8
- edsl/language_models/model_interfaces/LlamaTwo13B.py +0 -21
- edsl/language_models/model_interfaces/LlamaTwo70B.py +0 -21
- edsl/language_models/model_interfaces/Mixtral8x7B.py +0 -24
- edsl/language_models/registry.py +0 -81
- edsl/language_models/schemas.py +0 -15
- edsl/language_models/unused/ReplicateBase.py +0 -83
- edsl/prompts/QuestionInstructionsBase.py +0 -6
- edsl/prompts/library/agent_instructions.py +0 -29
- edsl/prompts/library/agent_persona.py +0 -17
- edsl/prompts/library/question_budget.py +0 -26
- edsl/prompts/library/question_checkbox.py +0 -32
- edsl/prompts/library/question_extract.py +0 -19
- edsl/prompts/library/question_freetext.py +0 -14
- edsl/prompts/library/question_linear_scale.py +0 -20
- edsl/prompts/library/question_list.py +0 -22
- edsl/prompts/library/question_multiple_choice.py +0 -44
- edsl/prompts/library/question_numerical.py +0 -31
- edsl/prompts/library/question_rank.py +0 -21
- edsl/prompts/prompt_config.py +0 -33
- edsl/prompts/registry.py +0 -185
- edsl/questions/Question.py +0 -240
- edsl/report/InputOutputDataTypes.py +0 -134
- edsl/report/RegressionMixin.py +0 -28
- edsl/report/ReportOutputs.py +0 -1228
- edsl/report/ResultsFetchMixin.py +0 -106
- edsl/report/ResultsOutputMixin.py +0 -14
- edsl/report/demo.ipynb +0 -645
- edsl/results/ResultsDBMixin.py +0 -184
- edsl/surveys/SurveyFlowVisualizationMixin.py +0 -92
- edsl/trackers/Tracker.py +0 -91
- edsl/trackers/TrackerAPI.py +0 -196
- edsl/trackers/TrackerTasks.py +0 -70
- edsl/utilities/pastebin.py +0 -141
- edsl-0.1.14.dist-info/METADATA +0 -69
- edsl-0.1.14.dist-info/RECORD +0 -141
- /edsl/{language_models/model_interfaces → inference_services}/__init__.py +0 -0
- /edsl/{report/__init__.py → jobs/runners/JobsRunnerStatusData.py} +0 -0
- /edsl/{trackers/__init__.py → language_models/ServiceDataSources.py} +0 -0
- {edsl-0.1.14.dist-info → edsl-0.1.40.dist-info}/LICENSE +0 -0
@@ -0,0 +1,392 @@
|
|
1
|
+
"""This module contains the Interview class, which is responsible for conducting an interview asynchronously."""
|
2
|
+
|
3
|
+
from __future__ import annotations
|
4
|
+
import asyncio
|
5
|
+
from typing import Any, Type, List, Generator, Optional, Union, TYPE_CHECKING
|
6
|
+
import copy
|
7
|
+
from dataclasses import dataclass
|
8
|
+
|
9
|
+
# from edsl.jobs.Answers import Answers
|
10
|
+
from edsl.jobs.data_structures import Answers
|
11
|
+
from edsl.jobs.interviews.InterviewStatusLog import InterviewStatusLog
|
12
|
+
from edsl.jobs.interviews.InterviewStatusDictionary import InterviewStatusDictionary
|
13
|
+
from edsl.jobs.interviews.InterviewExceptionCollection import (
|
14
|
+
InterviewExceptionCollection,
|
15
|
+
)
|
16
|
+
from edsl.jobs.interviews.InterviewExceptionEntry import InterviewExceptionEntry
|
17
|
+
from edsl.jobs.buckets.ModelBuckets import ModelBuckets
|
18
|
+
from edsl.jobs.AnswerQuestionFunctionConstructor import (
|
19
|
+
AnswerQuestionFunctionConstructor,
|
20
|
+
)
|
21
|
+
from edsl.jobs.InterviewTaskManager import InterviewTaskManager
|
22
|
+
from edsl.jobs.FetchInvigilator import FetchInvigilator
|
23
|
+
from edsl.jobs.RequestTokenEstimator import RequestTokenEstimator
|
24
|
+
|
25
|
+
|
26
|
+
if TYPE_CHECKING:
|
27
|
+
from edsl.agents.Agent import Agent
|
28
|
+
from edsl.surveys.Survey import Survey
|
29
|
+
from edsl.scenarios.Scenario import Scenario
|
30
|
+
from edsl.data.Cache import Cache
|
31
|
+
from edsl.language_models.LanguageModel import LanguageModel
|
32
|
+
from edsl.jobs.tokens.InterviewTokenUsage import InterviewTokenUsage
|
33
|
+
from edsl.agents.InvigilatorBase import InvigilatorBase
|
34
|
+
from edsl.language_models.key_management.KeyLookup import KeyLookup
|
35
|
+
|
36
|
+
|
37
|
+
@dataclass
class InterviewRunningConfig:
    """Bundle of per-interview execution options.

    Every default is a plain scalar. The defaults used to be written with a
    trailing comma inside parentheses (for example ``(False,)``), which made
    each of them a one-element tuple. A non-empty tuple is truthy, so a flag
    that was left out of the constructor call evaluated as "on" in any
    boolean test, and ``cache`` defaulted to ``(None,)`` instead of ``None``.
    """

    # Cache object handed to the interview, or None when none is supplied.
    cache: Optional["Cache"] = None
    skip_retry: bool = False  # COULD BE SET WITH CONFIG
    raise_validation_errors: bool = True
    stop_on_exception: bool = False
|
43
|
+
|
44
|
+
|
45
|
+
class Interview:
|
46
|
+
"""
|
47
|
+
An 'interview' is one agent answering one survey, with one language model, for a given scenario.
|
48
|
+
|
49
|
+
The main method is `async_conduct_interview`, which conducts the interview asynchronously.
|
50
|
+
Most of the class is dedicated to creating the tasks for each question in the survey, and then running them.
|
51
|
+
"""
|
52
|
+
|
53
|
+
def __init__(
    self,
    agent: Agent,
    survey: Survey,
    scenario: Scenario,
    model: Type["LanguageModel"],
    iteration: int = 0,
    indices: dict = None,  # explain?
    cache: Optional["Cache"] = None,
    skip_retry: bool = False,  # COULD BE SET WITH CONFIG
    raise_validation_errors: bool = True,
):
    """Set up the state needed to run a single interview.

    :param agent: the agent being interviewed.
    :param survey: the survey being administered; the instance keeps a deep copy of it.
    :param scenario: the scenario that populates the survey questions.
    :param model: the language model used to answer the questions.
    :param iteration: the iteration number of the interview.
    :param indices: stored unchanged as ``self.indices``.
    :param cache: the cache used to store the answers.
    :param skip_retry: stored on the instance and in ``self.running_config``.
    :param raise_validation_errors: stored on the instance and in ``self.running_config``.

    >>> i = Interview.example()
    >>> i.task_manager.task_creators
    {}

    >>> i.exceptions
    {}

    >>> _ = asyncio.run(i.async_conduct_interview())
    >>> i.task_status_logs['q0']
    [{'log_time': ..., 'value': <TaskStatus.NOT_STARTED: 1>}, {'log_time': ..., 'value': <TaskStatus.WAITING_FOR_DEPENDENCIES: 2>}, {'log_time': ..., 'value': <TaskStatus.API_CALL_IN_PROGRESS: 7>}, {'log_time': ..., 'value': <TaskStatus.SUCCESS: 8>}]

    >>> i.to_index
    {'q0': 0, 'q1': 1, 'q2': 2}

    """
    # Participants of the interview; the survey is deep-copied so this
    # instance holds its own copy.
    self.agent = agent
    self.survey = copy.deepcopy(survey)
    self.scenario = scenario
    self.model = model
    self.iteration = iteration

    # Starts empty and is filled in as the interview progresses.
    self.answers = Answers()

    self.task_manager = InterviewTaskManager(
        survey=self.survey, iteration=iteration
    )

    self.exceptions = InterviewExceptionCollection()

    # The run options are kept both as a bundle and as individual attributes.
    self.running_config = InterviewRunningConfig(
        cache=cache,
        skip_retry=skip_retry,
        raise_validation_errors=raise_validation_errors,
    )
    self.cache = cache
    self.skip_retry = skip_retry
    self.raise_validation_errors = raise_validation_errors

    # Maps each question name to its position in the survey.
    self.to_index = {
        name: position
        for position, name in enumerate(self.survey.question_names)
    }

    self.failed_questions = []

    self.indices = indices
    # Computed last: hashing goes through to_dict(), which reads the
    # attributes assigned above.
    self.initial_hash = hash(self)
|
125
|
+
|
126
|
+
@property
|
127
|
+
def has_exceptions(self) -> bool:
|
128
|
+
"""Return True if there are exceptions."""
|
129
|
+
return len(self.exceptions) > 0
|
130
|
+
|
131
|
+
@property
|
132
|
+
def task_status_logs(self) -> InterviewStatusLog:
|
133
|
+
"""Return the task status logs for the interview.
|
134
|
+
|
135
|
+
The keys are the question names; the values are the lists of status log changes for each task.
|
136
|
+
"""
|
137
|
+
return self.task_manager.task_status_logs
|
138
|
+
|
139
|
+
@property
|
140
|
+
def token_usage(self) -> InterviewTokenUsage:
|
141
|
+
"""Determine how many tokens were used for the interview."""
|
142
|
+
return self.task_manager.token_usage # task_creators.token_usage
|
143
|
+
|
144
|
+
@property
|
145
|
+
def interview_status(self) -> InterviewStatusDictionary:
|
146
|
+
"""Return a dictionary mapping task status codes to counts."""
|
147
|
+
# return self.task_creators.interview_status
|
148
|
+
return self.task_manager.interview_status
|
149
|
+
|
150
|
+
def to_dict(self, include_exceptions=True, add_edsl_version=True) -> dict[str, Any]:
|
151
|
+
"""Return a dictionary representation of the Interview instance.
|
152
|
+
This is just for hashing purposes.
|
153
|
+
|
154
|
+
>>> i = Interview.example()
|
155
|
+
>>> hash(i)
|
156
|
+
193593189022259693
|
157
|
+
"""
|
158
|
+
d = {
|
159
|
+
"agent": self.agent.to_dict(add_edsl_version=add_edsl_version),
|
160
|
+
"survey": self.survey.to_dict(add_edsl_version=add_edsl_version),
|
161
|
+
"scenario": self.scenario.to_dict(add_edsl_version=add_edsl_version),
|
162
|
+
"model": self.model.to_dict(add_edsl_version=add_edsl_version),
|
163
|
+
"iteration": self.iteration,
|
164
|
+
"exceptions": {},
|
165
|
+
}
|
166
|
+
if include_exceptions:
|
167
|
+
d["exceptions"] = self.exceptions.to_dict()
|
168
|
+
if hasattr(self, "indices"):
|
169
|
+
d["indices"] = self.indices
|
170
|
+
return d
|
171
|
+
|
172
|
+
@classmethod
def from_dict(cls, d: dict[str, Any]) -> "Interview":
    """Rebuild an Interview from a dictionary.

    Reads the "agent", "survey", "scenario", "model" and "iteration" keys;
    "indices" and "exceptions" are used only when present.
    """

    from edsl.agents.Agent import Agent
    from edsl.surveys.Survey import Survey
    from edsl.scenarios.Scenario import Scenario
    from edsl.language_models.LanguageModel import LanguageModel

    init_kwargs = {
        "agent": Agent.from_dict(d["agent"]),
        "survey": Survey.from_dict(d["survey"]),
        "scenario": Scenario.from_dict(d["scenario"]),
        "model": LanguageModel.from_dict(d["model"]),
        "iteration": d["iteration"],
    }
    if "indices" in d:
        init_kwargs["indices"] = d["indices"]

    restored = cls(**init_kwargs)
    # Exceptions are not a constructor argument, so they are attached afterwards.
    if "exceptions" in d:
        restored.exceptions = InterviewExceptionCollection.from_dict(d["exceptions"])
    return restored
|
200
|
+
|
201
|
+
def __hash__(self) -> int:
    """Hash the dictionary form of the interview, without exceptions or the edsl version."""
    from edsl.utilities.utilities import dict_hash

    payload = self.to_dict(include_exceptions=False, add_edsl_version=False)
    return dict_hash(payload)
|
205
|
+
|
206
|
+
def __eq__(self, other: "Interview") -> bool:
|
207
|
+
"""
|
208
|
+
>>> from edsl.jobs.interviews.Interview import Interview; i = Interview.example(); d = i.to_dict(); i2 = Interview.from_dict(d); i == i2
|
209
|
+
True
|
210
|
+
"""
|
211
|
+
return hash(self) == hash(other)
|
212
|
+
|
213
|
+
async def async_conduct_interview(
    self,
    run_config: Optional["RunConfig"] = None,
) -> tuple["Answers", List[dict[str, Any]]]:
    """
    Conduct an Interview asynchronously.
    It returns a tuple with the answers and a list of valid results.

    :param run_config: run configuration; when None, a ``RunConfig`` built from ``RunParameters()`` and ``RunEnvironment()`` is used. This method reads ``parameters.stop_on_exception``, ``environment.bucket_collection`` and ``environment.key_lookup`` from it.

    Example usage:

    >>> i = Interview.example()
    >>> result, _ = asyncio.run(i.async_conduct_interview())
    >>> result['q0']
    'yes'

    >>> i = Interview.example(throw_exception = True)
    >>> result, _ = asyncio.run(i.async_conduct_interview())
    >>> i.exceptions
    {'q0': ...
    >>> i = Interview.example()
    >>> from edsl.jobs.Jobs import RunConfig, RunParameters, RunEnvironment
    >>> run_config = RunConfig(parameters = RunParameters(), environment = RunEnvironment())
    >>> run_config.parameters.stop_on_exception = True
    >>> result, _ = asyncio.run(i.async_conduct_interview(run_config))
    Traceback (most recent call last):
    ...
    asyncio.exceptions.CancelledError
    """
    from edsl.jobs.Jobs import RunConfig, RunParameters, RunEnvironment

    if run_config is None:
        run_config = RunConfig(
            parameters=RunParameters(),
            environment=RunEnvironment(),
        )
    parameters = run_config.parameters
    self.stop_on_exception = parameters.stop_on_exception

    # Look up the buckets for this model when a bucket collection was supplied.
    environment = run_config.environment
    bucket_collection = environment.bucket_collection
    model_buckets = bucket_collection.get(self.model) if bucket_collection else None

    # Fall back to an 'infinity' bucket when no bucket was found, or when the
    # agent has an `answer_question_directly` attribute.
    if model_buckets is None or hasattr(self.agent, "answer_question_directly"):
        model_buckets = ModelBuckets.infinity_bucket()

    # One task per question is built by the task manager; the tasks are kept
    # on the instance.
    self.tasks = self.task_manager.build_question_tasks(
        answer_func=AnswerQuestionFunctionConstructor(
            self, key_lookup=environment.key_lookup
        )(),
        token_estimator=RequestTokenEstimator(self),
        model_buckets=model_buckets,
    )

    # 'Invigilators' are used to administer the survey: one per question,
    # in survey order, so they line up with the tasks.
    fetch_invigilator = FetchInvigilator(
        interview=self,
        current_answers=self.answers,
        key_lookup=environment.key_lookup,
    )
    self.invigilators = [
        fetch_invigilator(question) for question in self.survey.questions
    ]

    # With stop_on_exception set, gather propagates the first exception;
    # otherwise exceptions are returned in place of results.
    await asyncio.gather(
        *self.tasks, return_exceptions=not parameters.stop_on_exception
    )
    self.answers.replace_missing_answers_with_none(self.survey)

    valid_results = list(
        self._extract_valid_results(self.tasks, self.invigilators, self.exceptions)
    )
    return self.answers, valid_results
|
292
|
+
|
293
|
+
@staticmethod
def _extract_valid_results(
    tasks: List["asyncio.Task"],
    invigilators: List["InvigilatorBase"],
    exceptions: InterviewExceptionCollection,
) -> Generator["Answers", None, None]:
    """Yield one result per task, walking tasks and invigilators in lockstep.

    For each (task, invigilator) pair:

    * a task that is not done raises ValueError;
    * a cancelled task yields the invigilator's failed-task result and is
      NOT recorded as an exception (cancellation is expected behavior);
    * a task that raised any other exception yields the invigilator's
      failed-task result and the exception is added to ``exceptions``
      under the task's name;
    * otherwise the task's own result is yielded.

    >>> i = Interview.example()
    >>> result, _ = asyncio.run(i.async_conduct_interview())
    """
    assert len(tasks) == len(invigilators)

    for task, invigilator in zip(tasks, invigilators):
        if not task.done():
            raise ValueError(f"Task {task.get_name()} is not done.")

        try:
            outcome = task.result()
        except asyncio.CancelledError:  # task was cancelled
            outcome = invigilator.get_failed_task_result(
                failure_reason="Task was cancelled."
            )
        except Exception as err:  # any other kind of exception in the task
            outcome = invigilator.get_failed_task_result(
                failure_reason=f"Task failed with exception: {str(err)}."
            )
            exceptions.add(
                task.get_name(),
                InterviewExceptionEntry(exception=err, invigilator=invigilator),
            )

        yield outcome
|
333
|
+
|
334
|
+
def __repr__(self) -> str:
    """Return a constructor-like summary of the interview's agent, survey, scenario and model."""
    fields = (
        f"agent = {self.agent!r}",
        f"survey = {self.survey!r}",
        f"scenario = {self.scenario!r}",
        f"model = {self.model!r}",
    )
    return "Interview(" + ", ".join(fields) + ")"
|
337
|
+
|
338
|
+
def duplicate(
    self, iteration: int, cache: "Cache", randomize_survey: Optional[bool] = True
) -> Interview:
    """Duplicate the interview, but with a new iteration number and cache.

    :param iteration: iteration number given to the new interview.
    :param cache: cache for the new interview. When ``None``, the cache of
        this interview's running configuration is reused.
    :param randomize_survey: when truthy, the copy uses ``self.survey.draw()``;
        otherwise it shares this interview's survey object.
    :return: a new Interview with the same agent, scenario, model, indices
        and skip_retry setting.

    >>> i = Interview.example()
    >>> i2 = i.duplicate(1, None)
    >>> i.iteration + 1 == i2.iteration
    True

    """
    new_survey = self.survey.draw() if randomize_survey else self.survey

    # Previously the ``cache`` argument was silently ignored and the running
    # cache was always used. Honour an explicit cache, keeping the old
    # behaviour as the fallback. Compare with ``is None`` rather than
    # truthiness so that a falsy-but-real cache object is still used.
    new_cache = cache if cache is not None else self.running_config.cache

    return Interview(
        agent=self.agent,
        survey=new_survey,
        scenario=self.scenario,
        model=self.model,
        iteration=iteration,
        cache=new_cache,
        skip_retry=self.running_config.skip_retry,
        indices=self.indices,
    )
|
364
|
+
|
365
|
+
@classmethod
def example(self, throw_exception: bool = False) -> Interview:
    """Build an example Interview from the example agent, survey, scenario and model.

    By default the agent is given a direct-answering method that returns
    "yes". With ``throw_exception=True`` the interview instead uses a fresh
    example agent (without that method) and a model requested via
    ``LanguageModel.example(test_model=True, throw_exception=True)``.
    """
    from edsl.agents import Agent
    from edsl.surveys import Survey
    from edsl.scenarios import Scenario
    from edsl.language_models import LanguageModel

    def f(self, question, scenario):
        return "yes"

    agent = Agent.example()
    agent.add_direct_question_answering_method(f)
    survey = Survey.example()
    scenario = Scenario.example()
    model = LanguageModel.example()

    if throw_exception:
        # Swap in the throwing test model and an agent with no direct answers.
        model = LanguageModel.example(test_model=True, throw_exception=True)
        agent = Agent.example()

    return Interview(agent=agent, survey=survey, scenario=scenario, model=model)
|
386
|
+
|
387
|
+
|
388
|
+
if __name__ == "__main__":
    # Run this module's doctests; ELLIPSIS lets "..." stand in for elided output.
    from doctest import ELLIPSIS, testmod

    testmod(optionflags=ELLIPSIS)
|
@@ -0,0 +1,99 @@
|
|
1
|
+
from collections import UserDict
|
2
|
+
|
3
|
+
from edsl.jobs.interviews.InterviewExceptionEntry import InterviewExceptionEntry
|
4
|
+
|
5
|
+
|
6
|
+
class InterviewExceptionCollection(UserDict):
    """A collection of exceptions that occurred during the interview.

    The underlying mapping goes from a question name to the list of
    exception entries recorded for that question. Question names that have
    been marked as fixed are tracked separately in ``self.fixed``.
    """

    def __init__(self):
        super().__init__()
        # Names of questions whose exceptions have been marked as fixed.
        self.fixed = set()

    def unfixed_exceptions(self) -> dict:
        """Return a dict of question name -> entries for questions not marked fixed."""
        return {
            name: entries
            for name, entries in self.data.items()
            if name not in self.fixed
        }

    def num_unfixed(self) -> int:
        """Return the number of questions with exceptions that are not marked fixed."""
        return sum(1 for name in self.data if name not in self.fixed)

    def record_fixed_question(self, question_name: str) -> None:
        """Record that a question has been fixed."""
        self.fixed.add(question_name)

    def add(self, question_name: str, entry: "InterviewExceptionEntry") -> None:
        """Append an exception entry to the list kept for ``question_name``."""
        self.data.setdefault(question_name, []).append(entry)

    def to_dict(self, include_traceback=True) -> dict:
        """Return the collection of exceptions as a dictionary.

        Each entry is converted with its own ``to_dict()``.

        NOTE: ``include_traceback`` is accepted for interface compatibility
        but is currently not used; the entries' dictionaries are returned
        unchanged either way.
        """
        return {
            name: [entry.to_dict() for entry in entries]
            for name, entries in self.data.items()
        }

    @classmethod
    def from_dict(cls, data: dict) -> "InterviewExceptionCollection":
        """Create an InterviewExceptionCollection from a dictionary.

        ``data`` maps question names to lists of serialized entries, i.e. the
        shape produced by ``to_dict``. The ``fixed`` set is not part of that
        shape, so the new collection starts with nothing marked as fixed.
        """
        collection = cls()
        for question_name, entries in data.items():
            for entry in entries:
                collection.add(question_name, InterviewExceptionEntry.from_dict(entry))
        return collection

    def _repr_html_(self) -> str:
        """Return an HTML rendering of ``to_dict()`` for notebook display."""
        from edsl.utilities.utilities import data_to_html

        return data_to_html(self.to_dict(include_traceback=True))

    def ascii_table(self, traceback: bool = False) -> None:
        """Print the exceptions as a grid table, one row per recorded exception.

        :param traceback: when True, a "Traceback" column is included.
        """
        from tabulate import tabulate

        headers = ["Question name", "Exception", "Time"]
        if traceback:
            # Only advertise the column when the rows actually carry it, so
            # the header count always matches the row width.
            headers.append("Traceback")

        data = []
        for question, exceptions in self.data.items():
            for exception in exceptions:
                row = [question, exception["exception"], exception["time"]]
                if traceback:
                    row.append(exception["traceback"])
                data.append(row)

        print(tabulate(data, headers=headers, tablefmt="grid"))

    def print(self, traceback=False):
        """Print the collection of exceptions as a rich table.

        :param traceback: when True, each row includes the entry's traceback
            (with blank lines inserted between its lines for readability);
            otherwise the traceback cell is left empty.
        """
        # Imported locally: this module does not import rich at the top
        # level, so the bare names would otherwise raise NameError.
        from rich.console import Console
        from rich.table import Table

        console = Console()
        table = Table(show_header=True, header_style="bold magenta")
        table.add_column("Question name", style="dim", width=12)
        table.add_column("Exception", width=32)
        table.add_column("Time", justify="right")
        table.add_column("Traceback", min_width=20)

        for question, exceptions in self.data.items():
            for exception in exceptions:
                if traceback:
                    # Extra newlines for better readability.
                    traceback_string = exception["traceback"].replace("\n", "\n\n")
                else:
                    traceback_string = ""
                table.add_row(
                    question,
                    exception["exception"],
                    str(exception["time"]),
                    traceback_string,
                )

        console.print(table)
|
94
|
+
|
95
|
+
|
96
|
+
if __name__ == "__main__":
    # Run this module's doctests; ELLIPSIS lets "..." stand in for elided output.
    from doctest import ELLIPSIS, testmod

    testmod(optionflags=ELLIPSIS)
|
@@ -0,0 +1,186 @@
|
|
1
|
+
import traceback
|
2
|
+
import datetime
|
3
|
+
|
4
|
+
|
5
|
+
class InterviewExceptionEntry:
    """Class to record an exception that occurred during the interview.

    An entry stores the exception, the invigilator that was handling the
    question, the creation time (ISO-8601 string) and the preferred
    traceback format. Attributes and properties can also be read with
    dict-style access (``entry["time"]``), which returns them as strings.
    """

    def __init__(
        self,
        *,
        exception: Exception,
        invigilator: "Invigilator",
        traceback_format="text",
        answers=None,
    ):
        """Record ``exception`` together with its context.

        :param exception: the exception that was raised.
        :param invigilator: the invigilator handling the failing question.
        :param traceback_format: "html" selects ``html_traceback`` for the
            ``traceback`` property; any other value selects ``text_traceback``.
        :param answers: optional answers object stored as-is on the entry.
        """
        self.time = datetime.datetime.now().isoformat()
        self.exception = exception
        self.invigilator = invigilator
        self.traceback_format = traceback_format
        self.answers = answers

    @property
    def question_type(self):
        """The question type of the invigilator's question."""
        return self.invigilator.question.question_type

    @property
    def name(self):
        """The ``repr`` of the recorded exception."""
        return repr(self.exception)

    @property
    def rendered_prompts(self):
        """The prompts as returned by the invigilator's ``get_prompts()``."""
        return self.invigilator.get_prompts()

    @property
    def key_sequence(self):
        """The ``key_sequence`` of the invigilator's model."""
        return self.invigilator.model.key_sequence

    @property
    def generated_token_string(self):
        """The generated token string extracted from the raw model response.

        Returns a fixed placeholder message when the invigilator has no raw
        model response.
        """
        if self.invigilator.raw_model_response is None:
            return "No raw model response available."
        return self.invigilator.model.get_generated_token_string(
            self.invigilator.raw_model_response
        )

    @property
    def raw_model_response(self):
        """The raw model response as indented JSON, or a placeholder message if absent."""
        import json

        if self.invigilator.raw_model_response is None:
            return "No raw model response available."
        return json.dumps(self.invigilator.raw_model_response, indent=2)

    def __getitem__(self, key):
        """Support dict-like access (``obj['a']``); the value is returned as a string."""
        return str(getattr(self, key))

    @classmethod
    def example(cls):
        """Return an example entry obtained by running a question that raises ValueError."""
        from edsl import QuestionFreeText
        from edsl.language_models import LanguageModel

        m = LanguageModel.example(test_model=True)
        q = QuestionFreeText.example(exception_to_throw=ValueError)
        results = q.by(m).run(
            skip_retry=True,
            print_exceptions=False,
            raise_validation_errors=True,
            disable_remote_cache=True,
            disable_remote_inference=True,
        )
        return results.task_history.exceptions[0]["how_are_you"][0]

    @property
    def code_to_reproduce(self):
        """Source code (as a string) that re-runs the failing question; nothing is executed."""
        return self.code(run=False)

    def code(self, run=True):
        """Build a script that re-creates and runs the failing question.

        :param run: when True the script is executed and its ``results``
            value is returned; when False the script text is returned.
        """
        lines = [
            "from edsl import Question, Model, Scenario, Agent",
            f"q = {repr(self.invigilator.question)}",
            f"scenario = {repr(self.invigilator.scenario)}",
            f"agent = {repr(self.invigilator.agent)}",
            f"m = Model('{self.invigilator.model.model}')",
            "results = q.by(m).by(agent).by(scenario).run()",
        ]
        code_str = "\n".join(lines)

        if run:
            # Create a new namespace to avoid polluting the global namespace.
            # NOTE(review): this exec()s text built from the reprs of the
            # question/scenario/agent. For entries rebuilt from untrusted
            # serialized data this is arbitrary code execution -- confirm
            # callers only use run=True on trusted entries.
            namespace = {}
            exec(code_str, namespace)
            return namespace["results"]
        return code_str

    @property
    def traceback(self):
        """Return the traceback in the configured format.

        ``html_traceback`` when ``traceback_format == "html"``, otherwise
        ``text_traceback``.
        """
        if self.traceback_format == "html":
            return self.html_traceback
        return self.text_traceback

    @property
    def text_traceback(self):
        """Return the standard formatted traceback of the exception as one string.

        >>> entry = InterviewExceptionEntry.example()
        >>> entry.text_traceback
        'Traceback (most recent call last):...'
        """
        e = self.exception
        return "".join(traceback.format_exception(type(e), e, e.__traceback__))

    @property
    def html_traceback(self):
        """Return the rich-rendered traceback (with locals) captured from a console.

        NOTE(review): the value returned is whatever rich wrote to the
        in-memory buffer, not ``console.export_html()``, even though the
        console is created with ``record=True`` -- confirm whether real HTML
        was intended before changing it.
        """
        from rich.console import Console
        from rich.traceback import Traceback

        from io import StringIO

        html_output = StringIO()
        console = Console(file=html_output, record=True)

        tb = Traceback.from_exception(
            type(self.exception),
            self.exception,
            self.exception.__traceback__,
            show_locals=True,
        )
        console.print(tb)
        return html_output.getvalue()

    @staticmethod
    def serialize_exception(exception: Exception) -> dict:
        """Return the exception's type name, message and formatted traceback as a dict."""
        return {
            "type": type(exception).__name__,
            "message": str(exception),
            "traceback": "".join(
                traceback.format_exception(
                    type(exception), exception, exception.__traceback__
                )
            ),
        }

    @staticmethod
    def deserialize_exception(data: dict) -> Exception:
        """Rebuild an exception from the output of ``serialize_exception``.

        The type name is resolved against the builtin exceptions. If the
        name is missing, is not a builtin ``Exception`` subclass, or the
        class cannot be constructed from a single message argument, a plain
        ``Exception`` carrying the message is returned instead.

        :raises KeyError: if ``data`` has no "message" key.
        """
        # The previous lookup used this module's globals(), which never
        # contain the builtin exception classes, so every type degraded to
        # Exception -- and a name colliding with a module global would have
        # been called as though it were an exception class.
        import builtins

        message = data["message"]
        candidate = getattr(builtins, str(data.get("type")), None)
        if not (isinstance(candidate, type) and issubclass(candidate, Exception)):
            return Exception(message)
        try:
            return candidate(message)
        except Exception:
            # Some builtin exceptions (e.g. UnicodeDecodeError) require more
            # than one constructor argument.
            return Exception(message)

    def to_dict(self) -> dict:
        """Return the exception as a dictionary.

        Keys: "exception" (serialized exception), "time", "traceback" (in
        the configured format) and "invigilator" (its own ``to_dict()``).

        >>> entry = InterviewExceptionEntry.example()
        >>> _ = entry.to_dict()
        """
        return {
            "exception": self.serialize_exception(self.exception),
            "time": self.time,
            "traceback": self.traceback,
            "invigilator": self.invigilator.to_dict(),
        }

    @classmethod
    def from_dict(cls, data: dict) -> "InterviewExceptionEntry":
        """Create an InterviewExceptionEntry from a dictionary.

        The invigilator is always rebuilt as an ``InvigilatorAI``. When the
        dictionary carries a "time" value it is restored, so a round trip
        through ``to_dict`` keeps the original timestamp.
        """
        from edsl.agents.Invigilator import InvigilatorAI

        exception = cls.deserialize_exception(data["exception"])
        invigilator = InvigilatorAI.from_dict(data["invigilator"])
        entry = cls(exception=exception, invigilator=invigilator)
        if "time" in data:
            entry.time = data["time"]
        return entry
|
181
|
+
|
182
|
+
|
183
|
+
if __name__ == "__main__":
    # Run this module's doctests; ELLIPSIS lets "..." stand in for elided output.
    from doctest import ELLIPSIS, testmod

    testmod(optionflags=ELLIPSIS)
|