edsl 0.1.39.dev3__py3-none-any.whl → 0.1.39.dev4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (344) hide show
  1. edsl/Base.py +413 -332
  2. edsl/BaseDiff.py +260 -260
  3. edsl/TemplateLoader.py +24 -24
  4. edsl/__init__.py +57 -49
  5. edsl/__version__.py +1 -1
  6. edsl/agents/Agent.py +1071 -867
  7. edsl/agents/AgentList.py +551 -413
  8. edsl/agents/Invigilator.py +284 -233
  9. edsl/agents/InvigilatorBase.py +257 -270
  10. edsl/agents/PromptConstructor.py +272 -354
  11. edsl/agents/QuestionInstructionPromptBuilder.py +128 -0
  12. edsl/agents/QuestionTemplateReplacementsBuilder.py +137 -0
  13. edsl/agents/__init__.py +2 -3
  14. edsl/agents/descriptors.py +99 -99
  15. edsl/agents/prompt_helpers.py +129 -129
  16. edsl/agents/question_option_processor.py +172 -0
  17. edsl/auto/AutoStudy.py +130 -117
  18. edsl/auto/StageBase.py +243 -230
  19. edsl/auto/StageGenerateSurvey.py +178 -178
  20. edsl/auto/StageLabelQuestions.py +125 -125
  21. edsl/auto/StagePersona.py +61 -61
  22. edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
  23. edsl/auto/StagePersonaDimensionValues.py +74 -74
  24. edsl/auto/StagePersonaDimensions.py +69 -69
  25. edsl/auto/StageQuestions.py +74 -73
  26. edsl/auto/SurveyCreatorPipeline.py +21 -21
  27. edsl/auto/utilities.py +218 -224
  28. edsl/base/Base.py +279 -279
  29. edsl/config.py +177 -157
  30. edsl/conversation/Conversation.py +290 -290
  31. edsl/conversation/car_buying.py +59 -58
  32. edsl/conversation/chips.py +95 -95
  33. edsl/conversation/mug_negotiation.py +81 -81
  34. edsl/conversation/next_speaker_utilities.py +93 -93
  35. edsl/coop/CoopFunctionsMixin.py +15 -0
  36. edsl/coop/ExpectedParrotKeyHandler.py +125 -0
  37. edsl/coop/PriceFetcher.py +54 -54
  38. edsl/coop/__init__.py +2 -2
  39. edsl/coop/coop.py +1106 -1028
  40. edsl/coop/utils.py +131 -131
  41. edsl/data/Cache.py +573 -555
  42. edsl/data/CacheEntry.py +230 -233
  43. edsl/data/CacheHandler.py +168 -149
  44. edsl/data/RemoteCacheSync.py +186 -78
  45. edsl/data/SQLiteDict.py +292 -292
  46. edsl/data/__init__.py +5 -4
  47. edsl/data/hack.py +10 -0
  48. edsl/data/orm.py +10 -10
  49. edsl/data_transfer_models.py +74 -73
  50. edsl/enums.py +202 -175
  51. edsl/exceptions/BaseException.py +21 -21
  52. edsl/exceptions/__init__.py +54 -54
  53. edsl/exceptions/agents.py +54 -42
  54. edsl/exceptions/cache.py +5 -5
  55. edsl/exceptions/configuration.py +16 -16
  56. edsl/exceptions/coop.py +10 -10
  57. edsl/exceptions/data.py +14 -14
  58. edsl/exceptions/general.py +34 -34
  59. edsl/exceptions/inference_services.py +5 -0
  60. edsl/exceptions/jobs.py +33 -33
  61. edsl/exceptions/language_models.py +63 -63
  62. edsl/exceptions/prompts.py +15 -15
  63. edsl/exceptions/questions.py +109 -91
  64. edsl/exceptions/results.py +29 -29
  65. edsl/exceptions/scenarios.py +29 -22
  66. edsl/exceptions/surveys.py +37 -37
  67. edsl/inference_services/AnthropicService.py +106 -87
  68. edsl/inference_services/AvailableModelCacheHandler.py +184 -0
  69. edsl/inference_services/AvailableModelFetcher.py +215 -0
  70. edsl/inference_services/AwsBedrock.py +118 -120
  71. edsl/inference_services/AzureAI.py +215 -217
  72. edsl/inference_services/DeepInfraService.py +18 -18
  73. edsl/inference_services/GoogleService.py +143 -148
  74. edsl/inference_services/GroqService.py +20 -20
  75. edsl/inference_services/InferenceServiceABC.py +80 -147
  76. edsl/inference_services/InferenceServicesCollection.py +138 -97
  77. edsl/inference_services/MistralAIService.py +120 -123
  78. edsl/inference_services/OllamaService.py +18 -18
  79. edsl/inference_services/OpenAIService.py +236 -224
  80. edsl/inference_services/PerplexityService.py +160 -163
  81. edsl/inference_services/ServiceAvailability.py +135 -0
  82. edsl/inference_services/TestService.py +90 -89
  83. edsl/inference_services/TogetherAIService.py +172 -170
  84. edsl/inference_services/data_structures.py +134 -0
  85. edsl/inference_services/models_available_cache.py +118 -118
  86. edsl/inference_services/rate_limits_cache.py +25 -25
  87. edsl/inference_services/registry.py +41 -41
  88. edsl/inference_services/write_available.py +10 -10
  89. edsl/jobs/AnswerQuestionFunctionConstructor.py +223 -0
  90. edsl/jobs/Answers.py +43 -56
  91. edsl/jobs/FetchInvigilator.py +47 -0
  92. edsl/jobs/InterviewTaskManager.py +98 -0
  93. edsl/jobs/InterviewsConstructor.py +50 -0
  94. edsl/jobs/Jobs.py +823 -898
  95. edsl/jobs/JobsChecks.py +172 -147
  96. edsl/jobs/JobsComponentConstructor.py +189 -0
  97. edsl/jobs/JobsPrompts.py +270 -268
  98. edsl/jobs/JobsRemoteInferenceHandler.py +311 -239
  99. edsl/jobs/JobsRemoteInferenceLogger.py +239 -0
  100. edsl/jobs/RequestTokenEstimator.py +30 -0
  101. edsl/jobs/__init__.py +1 -1
  102. edsl/jobs/async_interview_runner.py +138 -0
  103. edsl/jobs/buckets/BucketCollection.py +104 -63
  104. edsl/jobs/buckets/ModelBuckets.py +65 -65
  105. edsl/jobs/buckets/TokenBucket.py +283 -251
  106. edsl/jobs/buckets/TokenBucketAPI.py +211 -0
  107. edsl/jobs/buckets/TokenBucketClient.py +191 -0
  108. edsl/jobs/check_survey_scenario_compatibility.py +85 -0
  109. edsl/jobs/data_structures.py +120 -0
  110. edsl/jobs/decorators.py +35 -0
  111. edsl/jobs/interviews/Interview.py +396 -661
  112. edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
  113. edsl/jobs/interviews/InterviewExceptionEntry.py +186 -186
  114. edsl/jobs/interviews/InterviewStatistic.py +63 -63
  115. edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
  116. edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
  117. edsl/jobs/interviews/InterviewStatusLog.py +92 -92
  118. edsl/jobs/interviews/ReportErrors.py +66 -66
  119. edsl/jobs/interviews/interview_status_enum.py +9 -9
  120. edsl/jobs/jobs_status_enums.py +9 -0
  121. edsl/jobs/loggers/HTMLTableJobLogger.py +304 -0
  122. edsl/jobs/results_exceptions_handler.py +98 -0
  123. edsl/jobs/runners/JobsRunnerAsyncio.py +151 -466
  124. edsl/jobs/runners/JobsRunnerStatus.py +297 -330
  125. edsl/jobs/tasks/QuestionTaskCreator.py +244 -242
  126. edsl/jobs/tasks/TaskCreators.py +64 -64
  127. edsl/jobs/tasks/TaskHistory.py +470 -450
  128. edsl/jobs/tasks/TaskStatusLog.py +23 -23
  129. edsl/jobs/tasks/task_status_enum.py +161 -163
  130. edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
  131. edsl/jobs/tokens/TokenUsage.py +34 -34
  132. edsl/language_models/ComputeCost.py +63 -0
  133. edsl/language_models/LanguageModel.py +626 -668
  134. edsl/language_models/ModelList.py +164 -155
  135. edsl/language_models/PriceManager.py +127 -0
  136. edsl/language_models/RawResponseHandler.py +106 -0
  137. edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
  138. edsl/language_models/ServiceDataSources.py +0 -0
  139. edsl/language_models/__init__.py +2 -3
  140. edsl/language_models/fake_openai_call.py +15 -15
  141. edsl/language_models/fake_openai_service.py +61 -61
  142. edsl/language_models/key_management/KeyLookup.py +63 -0
  143. edsl/language_models/key_management/KeyLookupBuilder.py +273 -0
  144. edsl/language_models/key_management/KeyLookupCollection.py +38 -0
  145. edsl/language_models/key_management/__init__.py +0 -0
  146. edsl/language_models/key_management/models.py +131 -0
  147. edsl/language_models/model.py +256 -0
  148. edsl/language_models/repair.py +156 -156
  149. edsl/language_models/utilities.py +65 -64
  150. edsl/notebooks/Notebook.py +263 -258
  151. edsl/notebooks/NotebookToLaTeX.py +142 -0
  152. edsl/notebooks/__init__.py +1 -1
  153. edsl/prompts/Prompt.py +352 -362
  154. edsl/prompts/__init__.py +2 -2
  155. edsl/questions/ExceptionExplainer.py +77 -0
  156. edsl/questions/HTMLQuestion.py +103 -0
  157. edsl/questions/QuestionBase.py +518 -664
  158. edsl/questions/QuestionBasePromptsMixin.py +221 -217
  159. edsl/questions/QuestionBudget.py +227 -227
  160. edsl/questions/QuestionCheckBox.py +359 -359
  161. edsl/questions/QuestionExtract.py +180 -182
  162. edsl/questions/QuestionFreeText.py +113 -114
  163. edsl/questions/QuestionFunctional.py +166 -166
  164. edsl/questions/QuestionList.py +223 -231
  165. edsl/questions/QuestionMatrix.py +265 -0
  166. edsl/questions/QuestionMultipleChoice.py +330 -286
  167. edsl/questions/QuestionNumerical.py +151 -153
  168. edsl/questions/QuestionRank.py +314 -324
  169. edsl/questions/Quick.py +41 -41
  170. edsl/questions/SimpleAskMixin.py +74 -73
  171. edsl/questions/__init__.py +27 -26
  172. edsl/questions/{AnswerValidatorMixin.py → answer_validator_mixin.py} +334 -289
  173. edsl/questions/compose_questions.py +98 -98
  174. edsl/questions/data_structures.py +20 -0
  175. edsl/questions/decorators.py +21 -21
  176. edsl/questions/derived/QuestionLikertFive.py +76 -76
  177. edsl/questions/derived/QuestionLinearScale.py +90 -87
  178. edsl/questions/derived/QuestionTopK.py +93 -93
  179. edsl/questions/derived/QuestionYesNo.py +82 -82
  180. edsl/questions/descriptors.py +427 -413
  181. edsl/questions/loop_processor.py +149 -0
  182. edsl/questions/prompt_templates/question_budget.jinja +13 -13
  183. edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
  184. edsl/questions/prompt_templates/question_extract.jinja +11 -11
  185. edsl/questions/prompt_templates/question_free_text.jinja +3 -3
  186. edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
  187. edsl/questions/prompt_templates/question_list.jinja +17 -17
  188. edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
  189. edsl/questions/prompt_templates/question_numerical.jinja +36 -36
  190. edsl/questions/{QuestionBaseGenMixin.py → question_base_gen_mixin.py} +168 -161
  191. edsl/questions/question_registry.py +177 -177
  192. edsl/questions/{RegisterQuestionsMeta.py → register_questions_meta.py} +71 -71
  193. edsl/questions/{ResponseValidatorABC.py → response_validator_abc.py} +188 -174
  194. edsl/questions/response_validator_factory.py +34 -0
  195. edsl/questions/settings.py +12 -12
  196. edsl/questions/templates/budget/answering_instructions.jinja +7 -7
  197. edsl/questions/templates/budget/question_presentation.jinja +7 -7
  198. edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
  199. edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
  200. edsl/questions/templates/extract/answering_instructions.jinja +7 -7
  201. edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
  202. edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
  203. edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
  204. edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
  205. edsl/questions/templates/list/answering_instructions.jinja +3 -3
  206. edsl/questions/templates/list/question_presentation.jinja +5 -5
  207. edsl/questions/templates/matrix/__init__.py +1 -0
  208. edsl/questions/templates/matrix/answering_instructions.jinja +5 -0
  209. edsl/questions/templates/matrix/question_presentation.jinja +20 -0
  210. edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
  211. edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
  212. edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
  213. edsl/questions/templates/numerical/question_presentation.jinja +6 -6
  214. edsl/questions/templates/rank/answering_instructions.jinja +11 -11
  215. edsl/questions/templates/rank/question_presentation.jinja +15 -15
  216. edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
  217. edsl/questions/templates/top_k/question_presentation.jinja +22 -22
  218. edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
  219. edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
  220. edsl/results/CSSParameterizer.py +108 -108
  221. edsl/results/Dataset.py +587 -424
  222. edsl/results/DatasetExportMixin.py +594 -731
  223. edsl/results/DatasetTree.py +295 -275
  224. edsl/results/MarkdownToDocx.py +122 -0
  225. edsl/results/MarkdownToPDF.py +111 -0
  226. edsl/results/Result.py +557 -465
  227. edsl/results/Results.py +1183 -1165
  228. edsl/results/ResultsExportMixin.py +45 -43
  229. edsl/results/ResultsGGMixin.py +121 -121
  230. edsl/results/TableDisplay.py +125 -198
  231. edsl/results/TextEditor.py +50 -0
  232. edsl/results/__init__.py +2 -2
  233. edsl/results/file_exports.py +252 -0
  234. edsl/results/{ResultsFetchMixin.py → results_fetch_mixin.py} +33 -33
  235. edsl/results/{Selector.py → results_selector.py} +145 -135
  236. edsl/results/{ResultsToolsMixin.py → results_tools_mixin.py} +98 -98
  237. edsl/results/smart_objects.py +96 -0
  238. edsl/results/table_data_class.py +12 -0
  239. edsl/results/table_display.css +77 -77
  240. edsl/results/table_renderers.py +118 -0
  241. edsl/results/tree_explore.py +115 -115
  242. edsl/scenarios/ConstructDownloadLink.py +109 -0
  243. edsl/scenarios/DocumentChunker.py +102 -0
  244. edsl/scenarios/DocxScenario.py +16 -0
  245. edsl/scenarios/FileStore.py +511 -632
  246. edsl/scenarios/PdfExtractor.py +40 -0
  247. edsl/scenarios/Scenario.py +498 -601
  248. edsl/scenarios/ScenarioHtmlMixin.py +65 -64
  249. edsl/scenarios/ScenarioList.py +1458 -1287
  250. edsl/scenarios/ScenarioListExportMixin.py +45 -52
  251. edsl/scenarios/ScenarioListPdfMixin.py +239 -261
  252. edsl/scenarios/__init__.py +3 -4
  253. edsl/scenarios/directory_scanner.py +96 -0
  254. edsl/scenarios/file_methods.py +85 -0
  255. edsl/scenarios/handlers/__init__.py +13 -0
  256. edsl/scenarios/handlers/csv.py +38 -0
  257. edsl/scenarios/handlers/docx.py +76 -0
  258. edsl/scenarios/handlers/html.py +37 -0
  259. edsl/scenarios/handlers/json.py +111 -0
  260. edsl/scenarios/handlers/latex.py +5 -0
  261. edsl/scenarios/handlers/md.py +51 -0
  262. edsl/scenarios/handlers/pdf.py +68 -0
  263. edsl/scenarios/handlers/png.py +39 -0
  264. edsl/scenarios/handlers/pptx.py +105 -0
  265. edsl/scenarios/handlers/py.py +294 -0
  266. edsl/scenarios/handlers/sql.py +313 -0
  267. edsl/scenarios/handlers/sqlite.py +149 -0
  268. edsl/scenarios/handlers/txt.py +33 -0
  269. edsl/scenarios/{ScenarioJoin.py → scenario_join.py} +131 -127
  270. edsl/scenarios/scenario_selector.py +156 -0
  271. edsl/shared.py +1 -1
  272. edsl/study/ObjectEntry.py +173 -173
  273. edsl/study/ProofOfWork.py +113 -113
  274. edsl/study/SnapShot.py +80 -80
  275. edsl/study/Study.py +521 -528
  276. edsl/study/__init__.py +4 -4
  277. edsl/surveys/ConstructDAG.py +92 -0
  278. edsl/surveys/DAG.py +148 -148
  279. edsl/surveys/EditSurvey.py +221 -0
  280. edsl/surveys/InstructionHandler.py +100 -0
  281. edsl/surveys/Memory.py +31 -31
  282. edsl/surveys/MemoryManagement.py +72 -0
  283. edsl/surveys/MemoryPlan.py +244 -244
  284. edsl/surveys/Rule.py +327 -326
  285. edsl/surveys/RuleCollection.py +385 -387
  286. edsl/surveys/RuleManager.py +172 -0
  287. edsl/surveys/Simulator.py +75 -0
  288. edsl/surveys/Survey.py +1280 -1801
  289. edsl/surveys/SurveyCSS.py +273 -261
  290. edsl/surveys/SurveyExportMixin.py +259 -259
  291. edsl/surveys/{SurveyFlowVisualizationMixin.py → SurveyFlowVisualization.py} +181 -179
  292. edsl/surveys/SurveyQualtricsImport.py +284 -284
  293. edsl/surveys/SurveyToApp.py +141 -0
  294. edsl/surveys/__init__.py +5 -3
  295. edsl/surveys/base.py +53 -53
  296. edsl/surveys/descriptors.py +60 -56
  297. edsl/surveys/instructions/ChangeInstruction.py +48 -49
  298. edsl/surveys/instructions/Instruction.py +56 -65
  299. edsl/surveys/instructions/InstructionCollection.py +82 -77
  300. edsl/templates/error_reporting/base.html +23 -23
  301. edsl/templates/error_reporting/exceptions_by_model.html +34 -34
  302. edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
  303. edsl/templates/error_reporting/exceptions_by_type.html +16 -16
  304. edsl/templates/error_reporting/interview_details.html +115 -115
  305. edsl/templates/error_reporting/interviews.html +19 -19
  306. edsl/templates/error_reporting/overview.html +4 -4
  307. edsl/templates/error_reporting/performance_plot.html +1 -1
  308. edsl/templates/error_reporting/report.css +73 -73
  309. edsl/templates/error_reporting/report.html +117 -117
  310. edsl/templates/error_reporting/report.js +25 -25
  311. edsl/test_h +1 -0
  312. edsl/tools/__init__.py +1 -1
  313. edsl/tools/clusters.py +192 -192
  314. edsl/tools/embeddings.py +27 -27
  315. edsl/tools/embeddings_plotting.py +118 -118
  316. edsl/tools/plotting.py +112 -112
  317. edsl/tools/summarize.py +18 -18
  318. edsl/utilities/PrettyList.py +56 -0
  319. edsl/utilities/SystemInfo.py +28 -28
  320. edsl/utilities/__init__.py +22 -22
  321. edsl/utilities/ast_utilities.py +25 -25
  322. edsl/utilities/data/Registry.py +6 -6
  323. edsl/utilities/data/__init__.py +1 -1
  324. edsl/utilities/data/scooter_results.json +1 -1
  325. edsl/utilities/decorators.py +77 -77
  326. edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
  327. edsl/utilities/gcp_bucket/example.py +50 -0
  328. edsl/utilities/interface.py +627 -627
  329. edsl/utilities/is_notebook.py +18 -0
  330. edsl/utilities/is_valid_variable_name.py +11 -0
  331. edsl/utilities/naming_utilities.py +263 -263
  332. edsl/utilities/remove_edsl_version.py +24 -0
  333. edsl/utilities/repair_functions.py +28 -28
  334. edsl/utilities/restricted_python.py +70 -70
  335. edsl/utilities/utilities.py +436 -424
  336. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev4.dist-info}/LICENSE +21 -21
  337. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev4.dist-info}/METADATA +13 -11
  338. edsl-0.1.39.dev4.dist-info/RECORD +361 -0
  339. edsl/language_models/KeyLookup.py +0 -30
  340. edsl/language_models/registry.py +0 -190
  341. edsl/language_models/unused/ReplicateBase.py +0 -83
  342. edsl/results/ResultsDBMixin.py +0 -238
  343. edsl-0.1.39.dev3.dist-info/RECORD +0 -277
  344. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev4.dist-info}/WHEEL +0 -0
@@ -1,354 +1,272 @@
1
- from __future__ import annotations
2
- from typing import Dict, Any, Optional, Set
3
-
4
- from jinja2 import Environment, meta
5
-
6
- from edsl.prompts.Prompt import Prompt
7
- from edsl.agents.prompt_helpers import PromptPlan
8
-
9
-
10
- class PlaceholderAnswer:
11
- """A placeholder answer for when a question is not yet answered."""
12
-
13
- def __init__(self):
14
- self.answer = "N/A"
15
- self.comment = "Will be populated by prior answer"
16
-
17
- def __getitem__(self, index):
18
- return ""
19
-
20
- def __str__(self):
21
- return "<<PlaceholderAnswer>>"
22
-
23
- def __repr__(self):
24
- return "<<PlaceholderAnswer>>"
25
-
26
-
27
- def get_jinja2_variables(template_str: str) -> Set[str]:
28
- """
29
- Extracts all variable names from a Jinja2 template using Jinja2's built-in parsing.
30
-
31
- Args:
32
- template_str (str): The Jinja2 template string
33
-
34
- Returns:
35
- Set[str]: A set of variable names found in the template
36
- """
37
- env = Environment()
38
- ast = env.parse(template_str)
39
- return meta.find_undeclared_variables(ast)
40
-
41
-
42
- class PromptConstructor:
43
- """
44
- The pieces of a prompt are:
45
- - The agent instructions - "You are answering questions as if you were a human. Do not break character."
46
- - The persona prompt - "You are an agent with the following persona: {'age': 22, 'hair': 'brown', 'height': 5.5}"
47
- - The question instructions - "You are being asked the following question: Do you like school? The options are 0: yes 1: no Return a valid JSON formatted like this, selecting only the number of the option: {"answer": <put answer code here>, "comment": "<put explanation here>"} Only 1 option may be selected."
48
- - The memory prompt - "Before the question you are now answering, you already answered the following question(s): Question: Do you like school? Answer: Prior answer"
49
-
50
- This is mixed into the Invigilator class.
51
- """
52
-
53
- def __init__(self, invigilator, prompt_plan: Optional["PromptPlan"] = None):
54
- self.invigilator = invigilator
55
- self.agent = invigilator.agent
56
- self.question = invigilator.question
57
- self.scenario = invigilator.scenario
58
- self.survey = invigilator.survey
59
- self.model = invigilator.model
60
- self.current_answers = invigilator.current_answers
61
- self.memory_plan = invigilator.memory_plan
62
- self.prompt_plan = prompt_plan or PromptPlan()
63
-
64
- @property
65
- def scenario_file_keys(self) -> list:
66
- """We need to find all the keys in the scenario that refer to FileStore objects.
67
- These will be used to append to the prompt a list of files that are part of the scenario.
68
- """
69
- from edsl.scenarios.FileStore import FileStore
70
-
71
- file_entries = []
72
- for key, value in self.scenario.items():
73
- if isinstance(value, FileStore):
74
- file_entries.append(key)
75
- return file_entries
76
-
77
- @property
78
- def agent_instructions_prompt(self) -> Prompt:
79
- """
80
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
81
- >>> i = InvigilatorBase.example()
82
- >>> i.prompt_constructor.agent_instructions_prompt
83
- Prompt(text=\"""You are answering questions as if you were a human. Do not break character.\""")
84
- """
85
- from edsl import Agent
86
-
87
- if self.agent == Agent(): # if agent is empty, then return an empty prompt
88
- return Prompt(text="")
89
-
90
- return Prompt(text=self.agent.instruction)
91
-
92
- @property
93
- def agent_persona_prompt(self) -> Prompt:
94
- """
95
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
96
- >>> i = InvigilatorBase.example()
97
- >>> i.prompt_constructor.agent_persona_prompt
98
- Prompt(text=\"""Your traits: {'age': 22, 'hair': 'brown', 'height': 5.5}\""")
99
- """
100
- from edsl import Agent
101
-
102
- if self.agent == Agent(): # if agent is empty, then return an empty prompt
103
- return Prompt(text="")
104
-
105
- return self.agent.prompt()
106
-
107
- def prior_answers_dict(self) -> dict:
108
- # this is all questions
109
- d = self.survey.question_names_to_questions()
110
- # This attaches the answer to the question
111
- for question in d:
112
- if question in self.current_answers:
113
- d[question].answer = self.current_answers[question]
114
- else:
115
- d[question].answer = PlaceholderAnswer()
116
-
117
- # if (new_question := question.split("_comment")[0]) in d:
118
- # d[new_question].comment = answer
119
- # d[question].answer = PlaceholderAnswer()
120
-
121
- # breakpoint()
122
- return d
123
-
124
- @property
125
- def question_file_keys(self):
126
- raw_question_text = self.question.question_text
127
- variables = get_jinja2_variables(raw_question_text)
128
- question_file_keys = []
129
- for var in variables:
130
- if var in self.scenario_file_keys:
131
- question_file_keys.append(var)
132
- return question_file_keys
133
-
134
- def build_replacement_dict(self, question_data: dict):
135
- """
136
- Builds a dictionary of replacement values by combining multiple data sources.
137
- """
138
- # File references dictionary
139
- file_refs = {key: f"<see file {key}>" for key in self.scenario_file_keys}
140
-
141
- # Scenario items excluding file keys
142
- scenario_items = {
143
- k: v for k, v in self.scenario.items() if k not in self.scenario_file_keys
144
- }
145
-
146
- # Question settings with defaults
147
- question_settings = {
148
- "use_code": getattr(self.question, "_use_code", True),
149
- "include_comment": getattr(self.question, "_include_comment", False),
150
- }
151
-
152
- # Combine all dictionaries using dict.update() for clarity
153
- replacement_dict = {}
154
- for d in [
155
- file_refs,
156
- question_data,
157
- scenario_items,
158
- self.prior_answers_dict(),
159
- {"agent": self.agent},
160
- question_settings,
161
- ]:
162
- replacement_dict.update(d)
163
-
164
- return replacement_dict
165
-
166
- def _get_question_options(self, question_data):
167
- question_options_entry = question_data.get("question_options", None)
168
- question_options = question_options_entry
169
-
170
- placeholder = ["<< Option 1 - Placholder >>", "<< Option 2 - Placholder >>"]
171
-
172
- # print("Question options entry: ", question_options_entry)
173
-
174
- if isinstance(question_options_entry, str):
175
- env = Environment()
176
- parsed_content = env.parse(question_options_entry)
177
- question_option_key = list(meta.find_undeclared_variables(parsed_content))[
178
- 0
179
- ]
180
- if isinstance(self.scenario.get(question_option_key), list):
181
- question_options = self.scenario.get(question_option_key)
182
-
183
- # might be getting it from the prior answers
184
- if self.prior_answers_dict().get(question_option_key) is not None:
185
- prior_question = self.prior_answers_dict().get(question_option_key)
186
- if hasattr(prior_question, "answer"):
187
- if isinstance(prior_question.answer, list):
188
- question_options = prior_question.answer
189
- else:
190
- question_options = placeholder
191
- else:
192
- question_options = placeholder
193
-
194
- return question_options
195
-
196
- def build_question_instructions_prompt(self):
197
- """Buils the question instructions prompt."""
198
-
199
- question_prompt = Prompt(self.question.get_instructions(model=self.model.model))
200
-
201
- # Get the data for the question - this is a dictionary of the question data
202
- # e.g., {'question_text': 'Do you like school?', 'question_name': 'q0', 'question_options': ['yes', 'no']}
203
- question_data = self.question.data.copy()
204
-
205
- if (
206
- "question_options" in question_data
207
- ): # is this a question with question options?
208
- question_options = self._get_question_options(question_data)
209
- question_data["question_options"] = question_options
210
-
211
- replacement_dict = self.build_replacement_dict(question_data)
212
- rendered_instructions = question_prompt.render(replacement_dict)
213
-
214
- # is there anything left to render?
215
- undefined_template_variables = (
216
- rendered_instructions.undefined_template_variables({})
217
- )
218
-
219
- # Check if it's the name of a question in the survey
220
- for question_name in self.survey.question_names:
221
- if question_name in undefined_template_variables:
222
- print(
223
- "Question name found in undefined_template_variables: ",
224
- question_name,
225
- )
226
-
227
- if undefined_template_variables:
228
- msg = f"Question instructions still has variables: {undefined_template_variables}."
229
- import warnings
230
-
231
- warnings.warn(msg)
232
- # raise QuestionScenarioRenderError(
233
- # f"Question instructions still has variables: {undefined_template_variables}."
234
- # )
235
-
236
- # Check if question has instructions - these are instructions in a Survey that can apply to multiple follow-on questions
237
- relevant_instructions = self.survey.relevant_instructions(
238
- self.question.question_name
239
- )
240
-
241
- if relevant_instructions != []:
242
- # preamble_text = Prompt(
243
- # text="You were given the following instructions: "
244
- # )
245
- preamble_text = Prompt(text="")
246
- for instruction in relevant_instructions:
247
- preamble_text += instruction.text
248
- rendered_instructions = preamble_text + rendered_instructions
249
-
250
- return rendered_instructions
251
-
252
- @property
253
- def question_instructions_prompt(self) -> Prompt:
254
- """
255
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
256
- >>> i = InvigilatorBase.example()
257
- >>> i.prompt_constructor.question_instructions_prompt
258
- Prompt(text=\"""...
259
- ...
260
- """
261
- if not hasattr(self, "_question_instructions_prompt"):
262
- self._question_instructions_prompt = (
263
- self.build_question_instructions_prompt()
264
- )
265
-
266
- return self._question_instructions_prompt
267
-
268
- @property
269
- def prior_question_memory_prompt(self) -> Prompt:
270
- if not hasattr(self, "_prior_question_memory_prompt"):
271
- from edsl.prompts.Prompt import Prompt
272
-
273
- memory_prompt = Prompt(text="")
274
- if self.memory_plan is not None:
275
- memory_prompt += self.create_memory_prompt(
276
- self.question.question_name
277
- ).render(self.scenario | self.prior_answers_dict())
278
- self._prior_question_memory_prompt = memory_prompt
279
- return self._prior_question_memory_prompt
280
-
281
- def create_memory_prompt(self, question_name: str) -> Prompt:
282
- """Create a memory for the agent.
283
-
284
- The returns a memory prompt for the agent.
285
-
286
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
287
- >>> i = InvigilatorBase.example()
288
- >>> i.current_answers = {"q0": "Prior answer"}
289
- >>> i.memory_plan.add_single_memory("q1", "q0")
290
- >>> p = i.prompt_constructor.create_memory_prompt("q1")
291
- >>> p.text.strip().replace("\\n", " ").replace("\\t", " ")
292
- 'Before the question you are now answering, you already answered the following question(s): Question: Do you like school? Answer: Prior answer'
293
- """
294
- return self.memory_plan.get_memory_prompt_fragment(
295
- question_name, self.current_answers
296
- )
297
-
298
- def construct_system_prompt(self) -> Prompt:
299
- """Construct the system prompt for the LLM call."""
300
- import warnings
301
-
302
- warnings.warn(
303
- "This method is deprecated. Use get_prompts instead.", DeprecationWarning
304
- )
305
- return self.get_prompts()["system_prompt"]
306
-
307
- def construct_user_prompt(self) -> Prompt:
308
- """Construct the user prompt for the LLM call."""
309
- import warnings
310
-
311
- warnings.warn(
312
- "This method is deprecated. Use get_prompts instead.", DeprecationWarning
313
- )
314
- return self.get_prompts()["user_prompt"]
315
-
316
- def get_prompts(self) -> Dict[str, Prompt]:
317
- """Get both prompts for the LLM call.
318
-
319
- >>> from edsl import QuestionFreeText
320
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
321
- >>> q = QuestionFreeText(question_text="How are you today?", question_name="q_new")
322
- >>> i = InvigilatorBase.example(question = q)
323
- >>> i.get_prompts()
324
- {'user_prompt': ..., 'system_prompt': ...}
325
- """
326
- # breakpoint()
327
- prompts = self.prompt_plan.get_prompts(
328
- agent_instructions=self.agent_instructions_prompt,
329
- agent_persona=self.agent_persona_prompt,
330
- question_instructions=Prompt(self.question_instructions_prompt),
331
- prior_question_memory=self.prior_question_memory_prompt,
332
- )
333
- if self.question_file_keys:
334
- files_list = []
335
- for key in self.question_file_keys:
336
- files_list.append(self.scenario[key])
337
- prompts["files_list"] = files_list
338
- return prompts
339
-
340
- def _get_scenario_with_image(self) -> Scenario:
341
- """This is a helper function to get a scenario with an image, for testing purposes."""
342
- from edsl import Scenario
343
-
344
- try:
345
- scenario = Scenario.from_image("../../static/logo.png")
346
- except FileNotFoundError:
347
- scenario = Scenario.from_image("static/logo.png")
348
- return scenario
349
-
350
-
351
- if __name__ == "__main__":
352
- import doctest
353
-
354
- doctest.testmod(optionflags=doctest.ELLIPSIS)
1
+ from __future__ import annotations
2
+ from typing import Dict, Any, Optional, Set, Union, TYPE_CHECKING
3
+ from functools import cached_property
4
+
5
+ from edsl.prompts.Prompt import Prompt
6
+
7
+ from dataclasses import dataclass
8
+
9
+ from .prompt_helpers import PromptPlan
10
+ from .QuestionTemplateReplacementsBuilder import (
11
+ QuestionTemplateReplacementsBuilder,
12
+ )
13
+ from .question_option_processor import QuestionOptionProcessor
14
+
15
+ if TYPE_CHECKING:
16
+ from edsl.agents.InvigilatorBase import InvigilatorBase
17
+ from edsl.questions.QuestionBase import QuestionBase
18
+ from edsl.agents.Agent import Agent
19
+ from edsl.surveys.Survey import Survey
20
+ from edsl.language_models.LanguageModel import LanguageModel
21
+ from edsl.surveys.MemoryPlan import MemoryPlan
22
+ from edsl.questions.QuestionBase import QuestionBase
23
+ from edsl.scenarios.Scenario import Scenario
24
+
25
+
26
class BasePlaceholder:
    """Stand-in value used while a question has not been answered yet.

    Instances expose ``value`` and ``comment`` attributes with fixed filler
    text, return an empty string for any subscript, and render as
    ``<<ClassName:type>>``.
    """

    def __init__(self, placeholder_type: str = "answer"):
        """Store the filler text and the kind of entry being stood in for."""
        self.value = "N/A"
        self.comment = "Will be populated by prior answer"
        self._type = placeholder_type

    def __getitem__(self, index):
        # Any index or key yields an empty string.
        return ""

    def __str__(self):
        return "<<{}:{}>>".format(self.__class__.__name__, self._type)

    def __repr__(self):
        # The repr is deliberately the same text as the str form.
        return self.__str__()
42
+
43
+
44
class PlaceholderAnswer(BasePlaceholder):
    """Placeholder whose type is ``"answer"``."""

    def __init__(self):
        super().__init__(placeholder_type="answer")
47
+
48
+
49
class PlaceholderComment(BasePlaceholder):
    """Placeholder whose type is ``"comment"``."""

    def __init__(self):
        super().__init__(placeholder_type="comment")
52
+
53
+
54
class PlaceholderGeneratedTokens(BasePlaceholder):
    """Placeholder whose type is ``"generated_tokens"``."""

    def __init__(self):
        super().__init__(placeholder_type="generated_tokens")
57
+
58
+
59
class PromptConstructor:
    """
    This class constructs the prompts for the language model.

    The pieces of a prompt are:
    - The agent instructions - "You are answering questions as if you were a human. Do not break character."
    - The persona prompt - "You are an agent with the following persona: {'age': 22, 'hair': 'brown', 'height': 5.5}"
    - The question instructions - "You are being asked the following question: Do you like school? The options are 0: yes 1: no Return a valid JSON formatted like this, selecting only the number of the option: {"answer": <put answer code here>, "comment": "<put explanation here>"} Only 1 option may be selected."
    - The memory prompt - "Before the question you are now answering, you already answered the following question(s): Question: Do you like school? Answer: Prior answer"
    """

    def __init__(
        self, invigilator: "InvigilatorBase", prompt_plan: Optional["PromptPlan"] = None
    ):
        """Keep the invigilator and copy the attributes used to build prompts.

        :param invigilator: Supplies the agent, question, scenario, survey,
            model, current answers and memory plan.
        :param prompt_plan: Plan used to combine the prompt pieces; a new
            ``PromptPlan()`` is created when none (or a falsy value) is given.
        """
        self.invigilator = invigilator
        self.prompt_plan = prompt_plan or PromptPlan()

        self.agent = invigilator.agent
        self.question = invigilator.question
        self.scenario = invigilator.scenario
        self.survey = invigilator.survey
        self.model = invigilator.model
        self.current_answers = invigilator.current_answers
        self.memory_plan = invigilator.memory_plan

    def get_question_options(self, question_data):
        """Get the question options by delegating to ``QuestionOptionProcessor``."""
        return QuestionOptionProcessor(self).get_question_options(question_data)

    @cached_property
    def agent_instructions_prompt(self) -> Prompt:
        """Return the agent's instruction as a prompt (empty for an empty agent).

        >>> from edsl.agents.InvigilatorBase import InvigilatorBase
        >>> i = InvigilatorBase.example()
        >>> i.prompt_constructor.agent_instructions_prompt
        Prompt(text=\"""You are answering questions as if you were a human. Do not break character.\""")
        """
        from edsl.agents.Agent import Agent

        if self.agent == Agent():  # if agent is empty, then return an empty prompt
            return Prompt(text="")

        return Prompt(text=self.agent.instruction)

    @cached_property
    def agent_persona_prompt(self) -> Prompt:
        """Return the agent's persona prompt (empty for an empty agent).

        >>> from edsl.agents.InvigilatorBase import InvigilatorBase
        >>> i = InvigilatorBase.example()
        >>> i.prompt_constructor.agent_persona_prompt
        Prompt(text=\"""Your traits: {'age': 22, 'hair': 'brown', 'height': 5.5}\""")
        """
        from edsl.agents.Agent import Agent

        if self.agent == Agent():  # if agent is empty, then return an empty prompt
            return Prompt(text="")

        return self.agent.prompt()

    def prior_answers_dict(self) -> dict[str, "QuestionBase"]:
        """This is a dictionary of prior answers, if they exist.

        The survey's name-to-question mapping is passed through
        ``_add_answers`` together with the current answers.
        """
        return self._add_answers(
            self.survey.question_names_to_questions(), self.current_answers
        )

    @staticmethod
    def _extract_quetion_and_entry_type(key_entry) -> tuple[str, str]:
        """
        Extracts the question name and type for the current answer dictionary key entry.

        A key ending in ``_comment`` or ``_generated_tokens`` is split into
        the question name and that entry type; every other key is treated
        as the answer for a question of the same name. Only the trailing
        suffix is removed, so a question whose name merely ends in
        ``_tokens`` is still reported as an answer.

        >>> PromptConstructor._extract_quetion_and_entry_type("q0")
        ('q0', 'answer')
        >>> PromptConstructor._extract_quetion_and_entry_type("q0_comment")
        ('q0', 'comment')
        >>> PromptConstructor._extract_quetion_and_entry_type("q0_alternate_generated_tokens")
        ('q0_alternate', 'generated_tokens')
        >>> PromptConstructor._extract_quetion_and_entry_type("q0_alt_comment")
        ('q0_alt', 'comment')
        >>> PromptConstructor._extract_quetion_and_entry_type("num_tokens")
        ('num_tokens', 'answer')
        """
        for entry_type in ("generated_tokens", "comment"):
            suffix = "_" + entry_type
            if key_entry.endswith(suffix):
                # Strip only the trailing suffix, never earlier occurrences.
                return key_entry[: -len(suffix)], entry_type
        return key_entry, "answer"

    @staticmethod
    def _augmented_answers_dict(current_answers: dict) -> dict:
        """Group the flat answers dictionary by question name and entry type.

        >>> PromptConstructor._augmented_answers_dict({"q0": "LOVE IT!", "q0_comment": "I love school!"})
        {'q0': {'answer': 'LOVE IT!', 'comment': 'I love school!'}}
        """
        from collections import defaultdict

        grouped = defaultdict(dict)
        for key, value in current_answers.items():
            question_name, entry_type = (
                PromptConstructor._extract_quetion_and_entry_type(key)
            )
            grouped[question_name][entry_type] = value
        return dict(grouped)

    @staticmethod
    def _add_answers(
        answer_dict: dict, current_answers: dict
    ) -> dict[str, "QuestionBase"]:
        """Attach the current answers to the question objects in ``answer_dict``.

        Each entry found for a question (answer, comment, generated_tokens)
        is set as an attribute on that question object. Questions with no
        entry at all receive placeholder objects for all three attributes.
        The objects are modified in place and the same dictionary is returned.

        >>> from edsl import QuestionFreeText
        >>> d = {"q0": QuestionFreeText(question_text="Do you like school?", question_name = "q0")}
        >>> current_answers = {"q0": "LOVE IT!"}
        >>> PromptConstructor._add_answers(d, current_answers)['q0'].answer
        'LOVE IT!'
        """
        augmented_answers = PromptConstructor._augmented_answers_dict(current_answers)

        for question in answer_dict:
            if question in augmented_answers:
                for entry_type, value in augmented_answers[question].items():
                    setattr(answer_dict[question], entry_type, value)
            else:
                answer_dict[question].answer = PlaceholderAnswer()
                answer_dict[question].comment = PlaceholderComment()
                answer_dict[question].generated_tokens = PlaceholderGeneratedTokens()
        return answer_dict

    @cached_property
    def question_file_keys(self) -> list:
        """Extracts the file keys from the question text.
        It checks if the variables in the question text are in the scenario file keys.
        """
        return QuestionTemplateReplacementsBuilder(self).question_file_keys()

    @cached_property
    def question_instructions_prompt(self) -> Prompt:
        """Return the question instructions prompt (built once, then cached).

        >>> from edsl.agents.InvigilatorBase import InvigilatorBase
        >>> i = InvigilatorBase.example()
        >>> i.prompt_constructor.question_instructions_prompt
        Prompt(text=\"""...
        ...
        """
        return self.build_question_instructions_prompt()

    def build_question_instructions_prompt(self) -> Prompt:
        """Builds the question instructions prompt."""
        # Imported here rather than at module level, as in the original code.
        from edsl.agents.QuestionInstructionPromptBuilder import (
            QuestionInstructionPromptBuilder,
        )

        return QuestionInstructionPromptBuilder(self).build()

    @cached_property
    def prior_question_memory_prompt(self) -> Prompt:
        """Return the rendered memory prompt, or an empty prompt without a memory plan.

        The memory fragment for the current question is rendered with the
        scenario combined with the prior answers.
        """
        memory_prompt = Prompt(text="")
        if self.memory_plan is not None:
            memory_prompt += self.create_memory_prompt(
                self.question.question_name
            ).render(self.scenario | self.prior_answers_dict())
        return memory_prompt

    def create_memory_prompt(self, question_name: str) -> Prompt:
        """Create a memory for the agent.

        This returns a memory prompt for the agent.

        >>> from edsl.agents.InvigilatorBase import InvigilatorBase
        >>> i = InvigilatorBase.example()
        >>> i.current_answers = {"q0": "Prior answer"}
        >>> i.memory_plan.add_single_memory("q1", "q0")
        >>> p = i.prompt_constructor.create_memory_prompt("q1")
        >>> p.text.strip().replace("\\n", " ").replace("\\t", " ")
        'Before the question you are now answering, you already answered the following question(s): Question: Do you like school? Answer: Prior answer'
        """
        return self.memory_plan.get_memory_prompt_fragment(
            question_name, self.current_answers
        )

    def get_prompts(self) -> Dict[str, Prompt]:
        """Get both prompts for the LLM call.

        When the question has file keys, the matching scenario values are
        added to the result under ``"files_list"``.

        >>> from edsl import QuestionFreeText
        >>> from edsl.agents.InvigilatorBase import InvigilatorBase
        >>> q = QuestionFreeText(question_text="How are you today?", question_name="q_new")
        >>> i = InvigilatorBase.example(question = q)
        >>> i.get_prompts()
        {'user_prompt': ..., 'system_prompt': ...}
        """
        prompts = self.prompt_plan.get_prompts(
            agent_instructions=self.agent_instructions_prompt,
            agent_persona=self.agent_persona_prompt,
            question_instructions=Prompt(self.question_instructions_prompt),
            prior_question_memory=self.prior_question_memory_prompt,
        )
        if self.question_file_keys:
            prompts["files_list"] = [
                self.scenario[key] for key in self.question_file_keys
            ]
        return prompts
267
+
268
+
269
if __name__ == "__main__":
    # Run this module's doctests; ELLIPSIS lets "..." in expected output
    # match arbitrary text.
    from doctest import ELLIPSIS, testmod

    testmod(optionflags=ELLIPSIS)