edsl 0.1.39.dev3__py3-none-any.whl → 0.1.39.dev5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (341) hide show
  1. edsl/Base.py +413 -332
  2. edsl/BaseDiff.py +260 -260
  3. edsl/TemplateLoader.py +24 -24
  4. edsl/__init__.py +57 -49
  5. edsl/__version__.py +1 -1
  6. edsl/agents/Agent.py +1071 -867
  7. edsl/agents/AgentList.py +551 -413
  8. edsl/agents/Invigilator.py +284 -233
  9. edsl/agents/InvigilatorBase.py +257 -270
  10. edsl/agents/PromptConstructor.py +272 -354
  11. edsl/agents/QuestionInstructionPromptBuilder.py +128 -0
  12. edsl/agents/QuestionTemplateReplacementsBuilder.py +137 -0
  13. edsl/agents/__init__.py +2 -3
  14. edsl/agents/descriptors.py +99 -99
  15. edsl/agents/prompt_helpers.py +129 -129
  16. edsl/agents/question_option_processor.py +172 -0
  17. edsl/auto/AutoStudy.py +130 -117
  18. edsl/auto/StageBase.py +243 -230
  19. edsl/auto/StageGenerateSurvey.py +178 -178
  20. edsl/auto/StageLabelQuestions.py +125 -125
  21. edsl/auto/StagePersona.py +61 -61
  22. edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
  23. edsl/auto/StagePersonaDimensionValues.py +74 -74
  24. edsl/auto/StagePersonaDimensions.py +69 -69
  25. edsl/auto/StageQuestions.py +74 -73
  26. edsl/auto/SurveyCreatorPipeline.py +21 -21
  27. edsl/auto/utilities.py +218 -224
  28. edsl/base/Base.py +279 -279
  29. edsl/config.py +177 -157
  30. edsl/conversation/Conversation.py +290 -290
  31. edsl/conversation/car_buying.py +59 -58
  32. edsl/conversation/chips.py +95 -95
  33. edsl/conversation/mug_negotiation.py +81 -81
  34. edsl/conversation/next_speaker_utilities.py +93 -93
  35. edsl/coop/CoopFunctionsMixin.py +15 -0
  36. edsl/coop/ExpectedParrotKeyHandler.py +125 -0
  37. edsl/coop/PriceFetcher.py +54 -54
  38. edsl/coop/__init__.py +2 -2
  39. edsl/coop/coop.py +1106 -1028
  40. edsl/coop/utils.py +131 -131
  41. edsl/data/Cache.py +573 -555
  42. edsl/data/CacheEntry.py +230 -233
  43. edsl/data/CacheHandler.py +168 -149
  44. edsl/data/RemoteCacheSync.py +186 -78
  45. edsl/data/SQLiteDict.py +292 -292
  46. edsl/data/__init__.py +5 -4
  47. edsl/data/orm.py +10 -10
  48. edsl/data_transfer_models.py +74 -73
  49. edsl/enums.py +202 -175
  50. edsl/exceptions/BaseException.py +21 -21
  51. edsl/exceptions/__init__.py +54 -54
  52. edsl/exceptions/agents.py +54 -42
  53. edsl/exceptions/cache.py +5 -5
  54. edsl/exceptions/configuration.py +16 -16
  55. edsl/exceptions/coop.py +10 -10
  56. edsl/exceptions/data.py +14 -14
  57. edsl/exceptions/general.py +34 -34
  58. edsl/exceptions/inference_services.py +5 -0
  59. edsl/exceptions/jobs.py +33 -33
  60. edsl/exceptions/language_models.py +63 -63
  61. edsl/exceptions/prompts.py +15 -15
  62. edsl/exceptions/questions.py +109 -91
  63. edsl/exceptions/results.py +29 -29
  64. edsl/exceptions/scenarios.py +29 -22
  65. edsl/exceptions/surveys.py +37 -37
  66. edsl/inference_services/AnthropicService.py +106 -87
  67. edsl/inference_services/AvailableModelCacheHandler.py +184 -0
  68. edsl/inference_services/AvailableModelFetcher.py +215 -0
  69. edsl/inference_services/AwsBedrock.py +118 -120
  70. edsl/inference_services/AzureAI.py +215 -217
  71. edsl/inference_services/DeepInfraService.py +18 -18
  72. edsl/inference_services/GoogleService.py +143 -148
  73. edsl/inference_services/GroqService.py +20 -20
  74. edsl/inference_services/InferenceServiceABC.py +80 -147
  75. edsl/inference_services/InferenceServicesCollection.py +138 -97
  76. edsl/inference_services/MistralAIService.py +120 -123
  77. edsl/inference_services/OllamaService.py +18 -18
  78. edsl/inference_services/OpenAIService.py +236 -224
  79. edsl/inference_services/PerplexityService.py +160 -163
  80. edsl/inference_services/ServiceAvailability.py +135 -0
  81. edsl/inference_services/TestService.py +90 -89
  82. edsl/inference_services/TogetherAIService.py +172 -170
  83. edsl/inference_services/data_structures.py +134 -0
  84. edsl/inference_services/models_available_cache.py +118 -118
  85. edsl/inference_services/rate_limits_cache.py +25 -25
  86. edsl/inference_services/registry.py +41 -41
  87. edsl/inference_services/write_available.py +10 -10
  88. edsl/jobs/AnswerQuestionFunctionConstructor.py +223 -0
  89. edsl/jobs/Answers.py +43 -56
  90. edsl/jobs/FetchInvigilator.py +47 -0
  91. edsl/jobs/InterviewTaskManager.py +98 -0
  92. edsl/jobs/InterviewsConstructor.py +50 -0
  93. edsl/jobs/Jobs.py +823 -898
  94. edsl/jobs/JobsChecks.py +172 -147
  95. edsl/jobs/JobsComponentConstructor.py +189 -0
  96. edsl/jobs/JobsPrompts.py +270 -268
  97. edsl/jobs/JobsRemoteInferenceHandler.py +311 -239
  98. edsl/jobs/JobsRemoteInferenceLogger.py +239 -0
  99. edsl/jobs/RequestTokenEstimator.py +30 -0
  100. edsl/jobs/__init__.py +1 -1
  101. edsl/jobs/async_interview_runner.py +138 -0
  102. edsl/jobs/buckets/BucketCollection.py +104 -63
  103. edsl/jobs/buckets/ModelBuckets.py +65 -65
  104. edsl/jobs/buckets/TokenBucket.py +283 -251
  105. edsl/jobs/buckets/TokenBucketAPI.py +211 -0
  106. edsl/jobs/buckets/TokenBucketClient.py +191 -0
  107. edsl/jobs/check_survey_scenario_compatibility.py +85 -0
  108. edsl/jobs/data_structures.py +120 -0
  109. edsl/jobs/decorators.py +35 -0
  110. edsl/jobs/interviews/Interview.py +396 -661
  111. edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
  112. edsl/jobs/interviews/InterviewExceptionEntry.py +186 -186
  113. edsl/jobs/interviews/InterviewStatistic.py +63 -63
  114. edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
  115. edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
  116. edsl/jobs/interviews/InterviewStatusLog.py +92 -92
  117. edsl/jobs/interviews/ReportErrors.py +66 -66
  118. edsl/jobs/interviews/interview_status_enum.py +9 -9
  119. edsl/jobs/jobs_status_enums.py +9 -0
  120. edsl/jobs/loggers/HTMLTableJobLogger.py +304 -0
  121. edsl/jobs/results_exceptions_handler.py +98 -0
  122. edsl/jobs/runners/JobsRunnerAsyncio.py +151 -466
  123. edsl/jobs/runners/JobsRunnerStatus.py +297 -330
  124. edsl/jobs/tasks/QuestionTaskCreator.py +244 -242
  125. edsl/jobs/tasks/TaskCreators.py +64 -64
  126. edsl/jobs/tasks/TaskHistory.py +470 -450
  127. edsl/jobs/tasks/TaskStatusLog.py +23 -23
  128. edsl/jobs/tasks/task_status_enum.py +161 -163
  129. edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
  130. edsl/jobs/tokens/TokenUsage.py +34 -34
  131. edsl/language_models/ComputeCost.py +63 -0
  132. edsl/language_models/LanguageModel.py +626 -668
  133. edsl/language_models/ModelList.py +164 -155
  134. edsl/language_models/PriceManager.py +127 -0
  135. edsl/language_models/RawResponseHandler.py +106 -0
  136. edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
  137. edsl/language_models/ServiceDataSources.py +0 -0
  138. edsl/language_models/__init__.py +2 -3
  139. edsl/language_models/fake_openai_call.py +15 -15
  140. edsl/language_models/fake_openai_service.py +61 -61
  141. edsl/language_models/key_management/KeyLookup.py +63 -0
  142. edsl/language_models/key_management/KeyLookupBuilder.py +273 -0
  143. edsl/language_models/key_management/KeyLookupCollection.py +38 -0
  144. edsl/language_models/key_management/__init__.py +0 -0
  145. edsl/language_models/key_management/models.py +131 -0
  146. edsl/language_models/model.py +256 -0
  147. edsl/language_models/repair.py +156 -156
  148. edsl/language_models/utilities.py +65 -64
  149. edsl/notebooks/Notebook.py +263 -258
  150. edsl/notebooks/NotebookToLaTeX.py +142 -0
  151. edsl/notebooks/__init__.py +1 -1
  152. edsl/prompts/Prompt.py +352 -362
  153. edsl/prompts/__init__.py +2 -2
  154. edsl/questions/ExceptionExplainer.py +77 -0
  155. edsl/questions/HTMLQuestion.py +103 -0
  156. edsl/questions/QuestionBase.py +518 -664
  157. edsl/questions/QuestionBasePromptsMixin.py +221 -217
  158. edsl/questions/QuestionBudget.py +227 -227
  159. edsl/questions/QuestionCheckBox.py +359 -359
  160. edsl/questions/QuestionExtract.py +180 -182
  161. edsl/questions/QuestionFreeText.py +113 -114
  162. edsl/questions/QuestionFunctional.py +166 -166
  163. edsl/questions/QuestionList.py +223 -231
  164. edsl/questions/QuestionMatrix.py +265 -0
  165. edsl/questions/QuestionMultipleChoice.py +330 -286
  166. edsl/questions/QuestionNumerical.py +151 -153
  167. edsl/questions/QuestionRank.py +314 -324
  168. edsl/questions/Quick.py +41 -41
  169. edsl/questions/SimpleAskMixin.py +74 -73
  170. edsl/questions/__init__.py +27 -26
  171. edsl/questions/{AnswerValidatorMixin.py → answer_validator_mixin.py} +334 -289
  172. edsl/questions/compose_questions.py +98 -98
  173. edsl/questions/data_structures.py +20 -0
  174. edsl/questions/decorators.py +21 -21
  175. edsl/questions/derived/QuestionLikertFive.py +76 -76
  176. edsl/questions/derived/QuestionLinearScale.py +90 -87
  177. edsl/questions/derived/QuestionTopK.py +93 -93
  178. edsl/questions/derived/QuestionYesNo.py +82 -82
  179. edsl/questions/descriptors.py +427 -413
  180. edsl/questions/loop_processor.py +149 -0
  181. edsl/questions/prompt_templates/question_budget.jinja +13 -13
  182. edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
  183. edsl/questions/prompt_templates/question_extract.jinja +11 -11
  184. edsl/questions/prompt_templates/question_free_text.jinja +3 -3
  185. edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
  186. edsl/questions/prompt_templates/question_list.jinja +17 -17
  187. edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
  188. edsl/questions/prompt_templates/question_numerical.jinja +36 -36
  189. edsl/questions/{QuestionBaseGenMixin.py → question_base_gen_mixin.py} +168 -161
  190. edsl/questions/question_registry.py +177 -177
  191. edsl/questions/{RegisterQuestionsMeta.py → register_questions_meta.py} +71 -71
  192. edsl/questions/{ResponseValidatorABC.py → response_validator_abc.py} +188 -174
  193. edsl/questions/response_validator_factory.py +34 -0
  194. edsl/questions/settings.py +12 -12
  195. edsl/questions/templates/budget/answering_instructions.jinja +7 -7
  196. edsl/questions/templates/budget/question_presentation.jinja +7 -7
  197. edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
  198. edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
  199. edsl/questions/templates/extract/answering_instructions.jinja +7 -7
  200. edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
  201. edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
  202. edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
  203. edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
  204. edsl/questions/templates/list/answering_instructions.jinja +3 -3
  205. edsl/questions/templates/list/question_presentation.jinja +5 -5
  206. edsl/questions/templates/matrix/__init__.py +1 -0
  207. edsl/questions/templates/matrix/answering_instructions.jinja +5 -0
  208. edsl/questions/templates/matrix/question_presentation.jinja +20 -0
  209. edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
  210. edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
  211. edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
  212. edsl/questions/templates/numerical/question_presentation.jinja +6 -6
  213. edsl/questions/templates/rank/answering_instructions.jinja +11 -11
  214. edsl/questions/templates/rank/question_presentation.jinja +15 -15
  215. edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
  216. edsl/questions/templates/top_k/question_presentation.jinja +22 -22
  217. edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
  218. edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
  219. edsl/results/CSSParameterizer.py +108 -108
  220. edsl/results/Dataset.py +587 -424
  221. edsl/results/DatasetExportMixin.py +594 -731
  222. edsl/results/DatasetTree.py +295 -275
  223. edsl/results/MarkdownToDocx.py +122 -0
  224. edsl/results/MarkdownToPDF.py +111 -0
  225. edsl/results/Result.py +557 -465
  226. edsl/results/Results.py +1183 -1165
  227. edsl/results/ResultsExportMixin.py +45 -43
  228. edsl/results/ResultsGGMixin.py +121 -121
  229. edsl/results/TableDisplay.py +125 -198
  230. edsl/results/TextEditor.py +50 -0
  231. edsl/results/__init__.py +2 -2
  232. edsl/results/file_exports.py +252 -0
  233. edsl/results/{ResultsFetchMixin.py → results_fetch_mixin.py} +33 -33
  234. edsl/results/{Selector.py → results_selector.py} +145 -135
  235. edsl/results/{ResultsToolsMixin.py → results_tools_mixin.py} +98 -98
  236. edsl/results/smart_objects.py +96 -0
  237. edsl/results/table_data_class.py +12 -0
  238. edsl/results/table_display.css +77 -77
  239. edsl/results/table_renderers.py +118 -0
  240. edsl/results/tree_explore.py +115 -115
  241. edsl/scenarios/ConstructDownloadLink.py +109 -0
  242. edsl/scenarios/DocumentChunker.py +102 -0
  243. edsl/scenarios/DocxScenario.py +16 -0
  244. edsl/scenarios/FileStore.py +511 -632
  245. edsl/scenarios/PdfExtractor.py +40 -0
  246. edsl/scenarios/Scenario.py +498 -601
  247. edsl/scenarios/ScenarioHtmlMixin.py +65 -64
  248. edsl/scenarios/ScenarioList.py +1458 -1287
  249. edsl/scenarios/ScenarioListExportMixin.py +45 -52
  250. edsl/scenarios/ScenarioListPdfMixin.py +239 -261
  251. edsl/scenarios/__init__.py +3 -4
  252. edsl/scenarios/directory_scanner.py +96 -0
  253. edsl/scenarios/file_methods.py +85 -0
  254. edsl/scenarios/handlers/__init__.py +13 -0
  255. edsl/scenarios/handlers/csv.py +38 -0
  256. edsl/scenarios/handlers/docx.py +76 -0
  257. edsl/scenarios/handlers/html.py +37 -0
  258. edsl/scenarios/handlers/json.py +111 -0
  259. edsl/scenarios/handlers/latex.py +5 -0
  260. edsl/scenarios/handlers/md.py +51 -0
  261. edsl/scenarios/handlers/pdf.py +68 -0
  262. edsl/scenarios/handlers/png.py +39 -0
  263. edsl/scenarios/handlers/pptx.py +105 -0
  264. edsl/scenarios/handlers/py.py +294 -0
  265. edsl/scenarios/handlers/sql.py +313 -0
  266. edsl/scenarios/handlers/sqlite.py +149 -0
  267. edsl/scenarios/handlers/txt.py +33 -0
  268. edsl/scenarios/{ScenarioJoin.py → scenario_join.py} +131 -127
  269. edsl/scenarios/scenario_selector.py +156 -0
  270. edsl/shared.py +1 -1
  271. edsl/study/ObjectEntry.py +173 -173
  272. edsl/study/ProofOfWork.py +113 -113
  273. edsl/study/SnapShot.py +80 -80
  274. edsl/study/Study.py +521 -528
  275. edsl/study/__init__.py +4 -4
  276. edsl/surveys/ConstructDAG.py +92 -0
  277. edsl/surveys/DAG.py +148 -148
  278. edsl/surveys/EditSurvey.py +221 -0
  279. edsl/surveys/InstructionHandler.py +100 -0
  280. edsl/surveys/Memory.py +31 -31
  281. edsl/surveys/MemoryManagement.py +72 -0
  282. edsl/surveys/MemoryPlan.py +244 -244
  283. edsl/surveys/Rule.py +327 -326
  284. edsl/surveys/RuleCollection.py +385 -387
  285. edsl/surveys/RuleManager.py +172 -0
  286. edsl/surveys/Simulator.py +75 -0
  287. edsl/surveys/Survey.py +1280 -1801
  288. edsl/surveys/SurveyCSS.py +273 -261
  289. edsl/surveys/SurveyExportMixin.py +259 -259
  290. edsl/surveys/{SurveyFlowVisualizationMixin.py → SurveyFlowVisualization.py} +181 -179
  291. edsl/surveys/SurveyQualtricsImport.py +284 -284
  292. edsl/surveys/SurveyToApp.py +141 -0
  293. edsl/surveys/__init__.py +5 -3
  294. edsl/surveys/base.py +53 -53
  295. edsl/surveys/descriptors.py +60 -56
  296. edsl/surveys/instructions/ChangeInstruction.py +48 -49
  297. edsl/surveys/instructions/Instruction.py +56 -65
  298. edsl/surveys/instructions/InstructionCollection.py +82 -77
  299. edsl/templates/error_reporting/base.html +23 -23
  300. edsl/templates/error_reporting/exceptions_by_model.html +34 -34
  301. edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
  302. edsl/templates/error_reporting/exceptions_by_type.html +16 -16
  303. edsl/templates/error_reporting/interview_details.html +115 -115
  304. edsl/templates/error_reporting/interviews.html +19 -19
  305. edsl/templates/error_reporting/overview.html +4 -4
  306. edsl/templates/error_reporting/performance_plot.html +1 -1
  307. edsl/templates/error_reporting/report.css +73 -73
  308. edsl/templates/error_reporting/report.html +117 -117
  309. edsl/templates/error_reporting/report.js +25 -25
  310. edsl/tools/__init__.py +1 -1
  311. edsl/tools/clusters.py +192 -192
  312. edsl/tools/embeddings.py +27 -27
  313. edsl/tools/embeddings_plotting.py +118 -118
  314. edsl/tools/plotting.py +112 -112
  315. edsl/tools/summarize.py +18 -18
  316. edsl/utilities/PrettyList.py +56 -0
  317. edsl/utilities/SystemInfo.py +28 -28
  318. edsl/utilities/__init__.py +22 -22
  319. edsl/utilities/ast_utilities.py +25 -25
  320. edsl/utilities/data/Registry.py +6 -6
  321. edsl/utilities/data/__init__.py +1 -1
  322. edsl/utilities/data/scooter_results.json +1 -1
  323. edsl/utilities/decorators.py +77 -77
  324. edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
  325. edsl/utilities/interface.py +627 -627
  326. edsl/utilities/is_notebook.py +18 -0
  327. edsl/utilities/is_valid_variable_name.py +11 -0
  328. edsl/utilities/naming_utilities.py +263 -263
  329. edsl/utilities/remove_edsl_version.py +24 -0
  330. edsl/utilities/repair_functions.py +28 -28
  331. edsl/utilities/restricted_python.py +70 -70
  332. edsl/utilities/utilities.py +436 -424
  333. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev5.dist-info}/LICENSE +21 -21
  334. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev5.dist-info}/METADATA +13 -11
  335. edsl-0.1.39.dev5.dist-info/RECORD +358 -0
  336. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev5.dist-info}/WHEEL +1 -1
  337. edsl/language_models/KeyLookup.py +0 -30
  338. edsl/language_models/registry.py +0 -190
  339. edsl/language_models/unused/ReplicateBase.py +0 -83
  340. edsl/results/ResultsDBMixin.py +0 -238
  341. edsl-0.1.39.dev3.dist-info/RECORD +0 -277
@@ -1,354 +1,272 @@
1
- from __future__ import annotations
2
- from typing import Dict, Any, Optional, Set
3
-
4
- from jinja2 import Environment, meta
5
-
6
- from edsl.prompts.Prompt import Prompt
7
- from edsl.agents.prompt_helpers import PromptPlan
8
-
9
-
10
- class PlaceholderAnswer:
11
- """A placeholder answer for when a question is not yet answered."""
12
-
13
- def __init__(self):
14
- self.answer = "N/A"
15
- self.comment = "Will be populated by prior answer"
16
-
17
- def __getitem__(self, index):
18
- return ""
19
-
20
- def __str__(self):
21
- return "<<PlaceholderAnswer>>"
22
-
23
- def __repr__(self):
24
- return "<<PlaceholderAnswer>>"
25
-
26
-
27
- def get_jinja2_variables(template_str: str) -> Set[str]:
28
- """
29
- Extracts all variable names from a Jinja2 template using Jinja2's built-in parsing.
30
-
31
- Args:
32
- template_str (str): The Jinja2 template string
33
-
34
- Returns:
35
- Set[str]: A set of variable names found in the template
36
- """
37
- env = Environment()
38
- ast = env.parse(template_str)
39
- return meta.find_undeclared_variables(ast)
40
-
41
-
42
- class PromptConstructor:
43
- """
44
- The pieces of a prompt are:
45
- - The agent instructions - "You are answering questions as if you were a human. Do not break character."
46
- - The persona prompt - "You are an agent with the following persona: {'age': 22, 'hair': 'brown', 'height': 5.5}"
47
- - The question instructions - "You are being asked the following question: Do you like school? The options are 0: yes 1: no Return a valid JSON formatted like this, selecting only the number of the option: {"answer": <put answer code here>, "comment": "<put explanation here>"} Only 1 option may be selected."
48
- - The memory prompt - "Before the question you are now answering, you already answered the following question(s): Question: Do you like school? Answer: Prior answer"
49
-
50
- This is mixed into the Invigilator class.
51
- """
52
-
53
- def __init__(self, invigilator, prompt_plan: Optional["PromptPlan"] = None):
54
- self.invigilator = invigilator
55
- self.agent = invigilator.agent
56
- self.question = invigilator.question
57
- self.scenario = invigilator.scenario
58
- self.survey = invigilator.survey
59
- self.model = invigilator.model
60
- self.current_answers = invigilator.current_answers
61
- self.memory_plan = invigilator.memory_plan
62
- self.prompt_plan = prompt_plan or PromptPlan()
63
-
64
- @property
65
- def scenario_file_keys(self) -> list:
66
- """We need to find all the keys in the scenario that refer to FileStore objects.
67
- These will be used to append to the prompt a list of files that are part of the scenario.
68
- """
69
- from edsl.scenarios.FileStore import FileStore
70
-
71
- file_entries = []
72
- for key, value in self.scenario.items():
73
- if isinstance(value, FileStore):
74
- file_entries.append(key)
75
- return file_entries
76
-
77
- @property
78
- def agent_instructions_prompt(self) -> Prompt:
79
- """
80
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
81
- >>> i = InvigilatorBase.example()
82
- >>> i.prompt_constructor.agent_instructions_prompt
83
- Prompt(text=\"""You are answering questions as if you were a human. Do not break character.\""")
84
- """
85
- from edsl import Agent
86
-
87
- if self.agent == Agent(): # if agent is empty, then return an empty prompt
88
- return Prompt(text="")
89
-
90
- return Prompt(text=self.agent.instruction)
91
-
92
- @property
93
- def agent_persona_prompt(self) -> Prompt:
94
- """
95
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
96
- >>> i = InvigilatorBase.example()
97
- >>> i.prompt_constructor.agent_persona_prompt
98
- Prompt(text=\"""Your traits: {'age': 22, 'hair': 'brown', 'height': 5.5}\""")
99
- """
100
- from edsl import Agent
101
-
102
- if self.agent == Agent(): # if agent is empty, then return an empty prompt
103
- return Prompt(text="")
104
-
105
- return self.agent.prompt()
106
-
107
- def prior_answers_dict(self) -> dict:
108
- # this is all questions
109
- d = self.survey.question_names_to_questions()
110
- # This attaches the answer to the question
111
- for question in d:
112
- if question in self.current_answers:
113
- d[question].answer = self.current_answers[question]
114
- else:
115
- d[question].answer = PlaceholderAnswer()
116
-
117
- # if (new_question := question.split("_comment")[0]) in d:
118
- # d[new_question].comment = answer
119
- # d[question].answer = PlaceholderAnswer()
120
-
121
- # breakpoint()
122
- return d
123
-
124
- @property
125
- def question_file_keys(self):
126
- raw_question_text = self.question.question_text
127
- variables = get_jinja2_variables(raw_question_text)
128
- question_file_keys = []
129
- for var in variables:
130
- if var in self.scenario_file_keys:
131
- question_file_keys.append(var)
132
- return question_file_keys
133
-
134
- def build_replacement_dict(self, question_data: dict):
135
- """
136
- Builds a dictionary of replacement values by combining multiple data sources.
137
- """
138
- # File references dictionary
139
- file_refs = {key: f"<see file {key}>" for key in self.scenario_file_keys}
140
-
141
- # Scenario items excluding file keys
142
- scenario_items = {
143
- k: v for k, v in self.scenario.items() if k not in self.scenario_file_keys
144
- }
145
-
146
- # Question settings with defaults
147
- question_settings = {
148
- "use_code": getattr(self.question, "_use_code", True),
149
- "include_comment": getattr(self.question, "_include_comment", False),
150
- }
151
-
152
- # Combine all dictionaries using dict.update() for clarity
153
- replacement_dict = {}
154
- for d in [
155
- file_refs,
156
- question_data,
157
- scenario_items,
158
- self.prior_answers_dict(),
159
- {"agent": self.agent},
160
- question_settings,
161
- ]:
162
- replacement_dict.update(d)
163
-
164
- return replacement_dict
165
-
166
- def _get_question_options(self, question_data):
167
- question_options_entry = question_data.get("question_options", None)
168
- question_options = question_options_entry
169
-
170
- placeholder = ["<< Option 1 - Placholder >>", "<< Option 2 - Placholder >>"]
171
-
172
- # print("Question options entry: ", question_options_entry)
173
-
174
- if isinstance(question_options_entry, str):
175
- env = Environment()
176
- parsed_content = env.parse(question_options_entry)
177
- question_option_key = list(meta.find_undeclared_variables(parsed_content))[
178
- 0
179
- ]
180
- if isinstance(self.scenario.get(question_option_key), list):
181
- question_options = self.scenario.get(question_option_key)
182
-
183
- # might be getting it from the prior answers
184
- if self.prior_answers_dict().get(question_option_key) is not None:
185
- prior_question = self.prior_answers_dict().get(question_option_key)
186
- if hasattr(prior_question, "answer"):
187
- if isinstance(prior_question.answer, list):
188
- question_options = prior_question.answer
189
- else:
190
- question_options = placeholder
191
- else:
192
- question_options = placeholder
193
-
194
- return question_options
195
-
196
- def build_question_instructions_prompt(self):
197
- """Buils the question instructions prompt."""
198
-
199
- question_prompt = Prompt(self.question.get_instructions(model=self.model.model))
200
-
201
- # Get the data for the question - this is a dictionary of the question data
202
- # e.g., {'question_text': 'Do you like school?', 'question_name': 'q0', 'question_options': ['yes', 'no']}
203
- question_data = self.question.data.copy()
204
-
205
- if (
206
- "question_options" in question_data
207
- ): # is this a question with question options?
208
- question_options = self._get_question_options(question_data)
209
- question_data["question_options"] = question_options
210
-
211
- replacement_dict = self.build_replacement_dict(question_data)
212
- rendered_instructions = question_prompt.render(replacement_dict)
213
-
214
- # is there anything left to render?
215
- undefined_template_variables = (
216
- rendered_instructions.undefined_template_variables({})
217
- )
218
-
219
- # Check if it's the name of a question in the survey
220
- for question_name in self.survey.question_names:
221
- if question_name in undefined_template_variables:
222
- print(
223
- "Question name found in undefined_template_variables: ",
224
- question_name,
225
- )
226
-
227
- if undefined_template_variables:
228
- msg = f"Question instructions still has variables: {undefined_template_variables}."
229
- import warnings
230
-
231
- warnings.warn(msg)
232
- # raise QuestionScenarioRenderError(
233
- # f"Question instructions still has variables: {undefined_template_variables}."
234
- # )
235
-
236
- # Check if question has instructions - these are instructions in a Survey that can apply to multiple follow-on questions
237
- relevant_instructions = self.survey.relevant_instructions(
238
- self.question.question_name
239
- )
240
-
241
- if relevant_instructions != []:
242
- # preamble_text = Prompt(
243
- # text="You were given the following instructions: "
244
- # )
245
- preamble_text = Prompt(text="")
246
- for instruction in relevant_instructions:
247
- preamble_text += instruction.text
248
- rendered_instructions = preamble_text + rendered_instructions
249
-
250
- return rendered_instructions
251
-
252
- @property
253
- def question_instructions_prompt(self) -> Prompt:
254
- """
255
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
256
- >>> i = InvigilatorBase.example()
257
- >>> i.prompt_constructor.question_instructions_prompt
258
- Prompt(text=\"""...
259
- ...
260
- """
261
- if not hasattr(self, "_question_instructions_prompt"):
262
- self._question_instructions_prompt = (
263
- self.build_question_instructions_prompt()
264
- )
265
-
266
- return self._question_instructions_prompt
267
-
268
- @property
269
- def prior_question_memory_prompt(self) -> Prompt:
270
- if not hasattr(self, "_prior_question_memory_prompt"):
271
- from edsl.prompts.Prompt import Prompt
272
-
273
- memory_prompt = Prompt(text="")
274
- if self.memory_plan is not None:
275
- memory_prompt += self.create_memory_prompt(
276
- self.question.question_name
277
- ).render(self.scenario | self.prior_answers_dict())
278
- self._prior_question_memory_prompt = memory_prompt
279
- return self._prior_question_memory_prompt
280
-
281
- def create_memory_prompt(self, question_name: str) -> Prompt:
282
- """Create a memory for the agent.
283
-
284
- The returns a memory prompt for the agent.
285
-
286
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
287
- >>> i = InvigilatorBase.example()
288
- >>> i.current_answers = {"q0": "Prior answer"}
289
- >>> i.memory_plan.add_single_memory("q1", "q0")
290
- >>> p = i.prompt_constructor.create_memory_prompt("q1")
291
- >>> p.text.strip().replace("\\n", " ").replace("\\t", " ")
292
- 'Before the question you are now answering, you already answered the following question(s): Question: Do you like school? Answer: Prior answer'
293
- """
294
- return self.memory_plan.get_memory_prompt_fragment(
295
- question_name, self.current_answers
296
- )
297
-
298
- def construct_system_prompt(self) -> Prompt:
299
- """Construct the system prompt for the LLM call."""
300
- import warnings
301
-
302
- warnings.warn(
303
- "This method is deprecated. Use get_prompts instead.", DeprecationWarning
304
- )
305
- return self.get_prompts()["system_prompt"]
306
-
307
- def construct_user_prompt(self) -> Prompt:
308
- """Construct the user prompt for the LLM call."""
309
- import warnings
310
-
311
- warnings.warn(
312
- "This method is deprecated. Use get_prompts instead.", DeprecationWarning
313
- )
314
- return self.get_prompts()["user_prompt"]
315
-
316
- def get_prompts(self) -> Dict[str, Prompt]:
317
- """Get both prompts for the LLM call.
318
-
319
- >>> from edsl import QuestionFreeText
320
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
321
- >>> q = QuestionFreeText(question_text="How are you today?", question_name="q_new")
322
- >>> i = InvigilatorBase.example(question = q)
323
- >>> i.get_prompts()
324
- {'user_prompt': ..., 'system_prompt': ...}
325
- """
326
- # breakpoint()
327
- prompts = self.prompt_plan.get_prompts(
328
- agent_instructions=self.agent_instructions_prompt,
329
- agent_persona=self.agent_persona_prompt,
330
- question_instructions=Prompt(self.question_instructions_prompt),
331
- prior_question_memory=self.prior_question_memory_prompt,
332
- )
333
- if self.question_file_keys:
334
- files_list = []
335
- for key in self.question_file_keys:
336
- files_list.append(self.scenario[key])
337
- prompts["files_list"] = files_list
338
- return prompts
339
-
340
- def _get_scenario_with_image(self) -> Scenario:
341
- """This is a helper function to get a scenario with an image, for testing purposes."""
342
- from edsl import Scenario
343
-
344
- try:
345
- scenario = Scenario.from_image("../../static/logo.png")
346
- except FileNotFoundError:
347
- scenario = Scenario.from_image("static/logo.png")
348
- return scenario
349
-
350
-
351
- if __name__ == "__main__":
352
- import doctest
353
-
354
- doctest.testmod(optionflags=doctest.ELLIPSIS)
1
+ from __future__ import annotations
2
+ from typing import Dict, Any, Optional, Set, Union, TYPE_CHECKING
3
+ from functools import cached_property
4
+
5
+ from edsl.prompts.Prompt import Prompt
6
+
7
+ from dataclasses import dataclass
8
+
9
+ from .prompt_helpers import PromptPlan
10
+ from .QuestionTemplateReplacementsBuilder import (
11
+ QuestionTemplateReplacementsBuilder,
12
+ )
13
+ from .question_option_processor import QuestionOptionProcessor
14
+
15
+ if TYPE_CHECKING:
16
+ from edsl.agents.InvigilatorBase import InvigilatorBase
17
+ from edsl.questions.QuestionBase import QuestionBase
18
+ from edsl.agents.Agent import Agent
19
+ from edsl.surveys.Survey import Survey
20
+ from edsl.language_models.LanguageModel import LanguageModel
21
+ from edsl.surveys.MemoryPlan import MemoryPlan
22
+ from edsl.questions.QuestionBase import QuestionBase
23
+ from edsl.scenarios.Scenario import Scenario
24
+
25
+
26
class BasePlaceholder:
    """Stand-in value used when a question has not been answered yet.

    Instances expose the same attribute names the prompt code sets on a
    question (``value``, ``comment``), always stringify to a readable
    ``<<ClassName:type>>`` marker, and return an empty string for any
    subscript access.
    """

    def __init__(self, placeholder_type: str = "answer") -> None:
        """Create a placeholder.

        Args:
            placeholder_type: Label embedded in the string form of the
                placeholder (for example ``"answer"`` or ``"comment"``).
        """
        self.value = "N/A"
        self.comment = "Will be populated by prior answer"
        self._type = placeholder_type

    def __getitem__(self, index) -> str:
        """Return an empty string for every index or key."""
        return ""

    def __str__(self) -> str:
        """Return ``<<ClassName:type>>`` using the concrete subclass name."""
        return f"<<{self.__class__.__name__}:{self._type}>>"

    def __repr__(self) -> str:
        """Use the same text as ``__str__``."""
        return self.__str__()


class PlaceholderAnswer(BasePlaceholder):
    """Placeholder whose type label is ``"answer"``."""

    def __init__(self) -> None:
        super().__init__("answer")


class PlaceholderComment(BasePlaceholder):
    """Placeholder whose type label is ``"comment"``."""

    def __init__(self) -> None:
        super().__init__("comment")


class PlaceholderGeneratedTokens(BasePlaceholder):
    """Placeholder whose type label is ``"generated_tokens"``."""

    def __init__(self) -> None:
        super().__init__("generated_tokens")
57
+
58
+
59
class PromptConstructor:
    """
    This class constructs the prompts for the language model.

    The pieces of a prompt are:
    - The agent instructions - "You are answering questions as if you were a human. Do not break character."
    - The persona prompt - "You are an agent with the following persona: {'age': 22, 'hair': 'brown', 'height': 5.5}"
    - The question instructions - "You are being asked the following question: Do you like school? The options are 0: yes 1: no Return a valid JSON formatted like this, selecting only the number of the option: {"answer": <put answer code here>, "comment": "<put explanation here>"} Only 1 option may be selected."
    - The memory prompt - "Before the question you are now answering, you already answered the following question(s): Question: Do you like school? Answer: Prior answer"
    """

    def __init__(
        self, invigilator: "InvigilatorBase", prompt_plan: Optional["PromptPlan"] = None
    ):
        """Capture the invigilator and copy the pieces the prompts are built from.

        Args:
            invigilator: Source of the agent, question, scenario, survey,
                model, current answers and memory plan.
            prompt_plan: Plan used to assemble the final prompts; a default
                ``PromptPlan()`` is created when this is falsy.
        """
        self.invigilator = invigilator
        self.prompt_plan = prompt_plan or PromptPlan()

        self.agent = invigilator.agent
        self.question = invigilator.question
        self.scenario = invigilator.scenario
        self.survey = invigilator.survey
        self.model = invigilator.model
        self.current_answers = invigilator.current_answers
        self.memory_plan = invigilator.memory_plan

    def get_question_options(self, question_data):
        """Get the question options by delegating to ``QuestionOptionProcessor``."""
        return QuestionOptionProcessor(self).get_question_options(question_data)

    @cached_property
    def agent_instructions_prompt(self) -> "Prompt":
        """Return the agent's instruction as a prompt (empty for a default agent).

        >>> from edsl.agents.InvigilatorBase import InvigilatorBase
        >>> i = InvigilatorBase.example()
        >>> i.prompt_constructor.agent_instructions_prompt
        Prompt(text=\"""You are answering questions as if you were a human. Do not break character.\""")
        """
        # Imported here rather than at module level, as in the original code.
        from edsl.agents.Agent import Agent

        if self.agent == Agent():  # if agent is empty, then return an empty prompt
            return Prompt(text="")

        return Prompt(text=self.agent.instruction)

    @cached_property
    def agent_persona_prompt(self) -> "Prompt":
        """Return the agent's persona prompt (empty for a default agent).

        >>> from edsl.agents.InvigilatorBase import InvigilatorBase
        >>> i = InvigilatorBase.example()
        >>> i.prompt_constructor.agent_persona_prompt
        Prompt(text=\"""Your traits: {'age': 22, 'hair': 'brown', 'height': 5.5}\""")
        """
        from edsl.agents.Agent import Agent

        if self.agent == Agent():  # if agent is empty, then return an empty prompt
            return Prompt(text="")

        return self.agent.prompt()

    def prior_answers_dict(self) -> dict[str, "QuestionBase"]:
        """Return the survey's name-to-question mapping with answers attached.

        Questions without an entry in ``self.current_answers`` receive
        placeholder objects instead (see ``_add_answers``).
        """
        return self._add_answers(
            self.survey.question_names_to_questions(), self.current_answers
        )

    @staticmethod
    def _extract_quetion_and_entry_type(key_entry) -> tuple[str, str]:
        """
        Extracts the question name and type for the current answer dictionary key entry.

        A key ending in ``_comment`` or ``_generated_tokens`` is split into the
        question name and that entry type; every other key is an answer whose
        question name is the key itself. Only the trailing suffix is removed,
        so a question that merely ends in ``_tokens`` is still an answer.

        >>> PromptConstructor._extract_quetion_and_entry_type("q0")
        ('q0', 'answer')
        >>> PromptConstructor._extract_quetion_and_entry_type("q0_comment")
        ('q0', 'comment')
        >>> PromptConstructor._extract_quetion_and_entry_type("q0_alternate_generated_tokens")
        ('q0_alternate', 'generated_tokens')
        >>> PromptConstructor._extract_quetion_and_entry_type("q0_alt_comment")
        ('q0_alt', 'comment')
        >>> PromptConstructor._extract_quetion_and_entry_type("num_tokens")
        ('num_tokens', 'answer')
        """
        comment_suffix = "_comment"
        tokens_suffix = "_generated_tokens"

        if key_entry.endswith(comment_suffix):
            return key_entry[: -len(comment_suffix)], "comment"
        # Match the full suffix (not just a trailing "_tokens") and strip it
        # only at the end, so the question name is never altered elsewhere.
        if key_entry.endswith(tokens_suffix):
            return key_entry[: -len(tokens_suffix)], "generated_tokens"
        return key_entry, "answer"

    @staticmethod
    def _augmented_answers_dict(current_answers: dict) -> dict:
        """Group a flat answers dict by question name and entry type.

        >>> PromptConstructor._augmented_answers_dict({"q0": "LOVE IT!", "q0_comment": "I love school!"})
        {'q0': {'answer': 'LOVE IT!', 'comment': 'I love school!'}}
        """
        from collections import defaultdict

        grouped = defaultdict(dict)
        for key, value in current_answers.items():
            question_name, entry_type = (
                PromptConstructor._extract_quetion_and_entry_type(key)
            )
            grouped[question_name][entry_type] = value
        return dict(grouped)

    @staticmethod
    def _add_answers(
        answer_dict: dict, current_answers: dict
    ) -> dict[str, "QuestionBase"]:
        """Attach answers (or placeholders) to the questions in ``answer_dict``.

        The question objects are modified in place via attribute assignment
        and the same ``answer_dict`` is returned.

        >>> from edsl import QuestionFreeText
        >>> d = {"q0": QuestionFreeText(question_text="Do you like school?", question_name = "q0")}
        >>> current_answers = {"q0": "LOVE IT!"}
        >>> PromptConstructor._add_answers(d, current_answers)['q0'].answer
        'LOVE IT!'
        """
        augmented_answers = PromptConstructor._augmented_answers_dict(current_answers)

        for question_name, question in answer_dict.items():
            if question_name in augmented_answers:
                # Only the entry types actually present are set.
                for entry_type, value in augmented_answers[question_name].items():
                    setattr(question, entry_type, value)
            else:
                question.answer = PlaceholderAnswer()
                question.comment = PlaceholderComment()
                question.generated_tokens = PlaceholderGeneratedTokens()
        return answer_dict

    @cached_property
    def question_file_keys(self) -> list:
        """Extracts the file keys from the question text.

        It checks if the variables in the question text are in the scenario file keys.
        The work is delegated to ``QuestionTemplateReplacementsBuilder``.
        """
        return QuestionTemplateReplacementsBuilder(self).question_file_keys()

    @cached_property
    def question_instructions_prompt(self) -> "Prompt":
        """Return the cached result of ``build_question_instructions_prompt``.

        >>> from edsl.agents.InvigilatorBase import InvigilatorBase
        >>> i = InvigilatorBase.example()
        >>> i.prompt_constructor.question_instructions_prompt
        Prompt(text=\"""...
        ...
        """
        return self.build_question_instructions_prompt()

    def build_question_instructions_prompt(self) -> "Prompt":
        """Builds the question instructions prompt."""
        from edsl.agents.QuestionInstructionPromptBuilder import (
            QuestionInstructionPromptBuilder,
        )

        return QuestionInstructionPromptBuilder(self).build()

    @cached_property
    def prior_question_memory_prompt(self) -> "Prompt":
        """Return the rendered memory prompt, or an empty prompt without a memory plan."""
        memory_prompt = Prompt(text="")
        if self.memory_plan is not None:
            # Render the fragment against the scenario merged with prior answers.
            memory_prompt += self.create_memory_prompt(
                self.question.question_name
            ).render(self.scenario | self.prior_answers_dict())
        return memory_prompt

    def create_memory_prompt(self, question_name: str) -> "Prompt":
        """Create a memory for the agent.

        Returns the memory prompt fragment that the memory plan produces for
        ``question_name`` given the current answers.

        >>> from edsl.agents.InvigilatorBase import InvigilatorBase
        >>> i = InvigilatorBase.example()
        >>> i.current_answers = {"q0": "Prior answer"}
        >>> i.memory_plan.add_single_memory("q1", "q0")
        >>> p = i.prompt_constructor.create_memory_prompt("q1")
        >>> p.text.strip().replace("\\n", " ").replace("\\t", " ")
        'Before the question you are now answering, you already answered the following question(s): Question: Do you like school? Answer: Prior answer'
        """
        return self.memory_plan.get_memory_prompt_fragment(
            question_name, self.current_answers
        )

    def get_prompts(self) -> Dict[str, "Prompt"]:
        """Get both prompts for the LLM call.

        When the question references scenario file keys, the matching
        scenario values are added under the ``"files_list"`` key.

        >>> from edsl import QuestionFreeText
        >>> from edsl.agents.InvigilatorBase import InvigilatorBase
        >>> q = QuestionFreeText(question_text="How are you today?", question_name="q_new")
        >>> i = InvigilatorBase.example(question = q)
        >>> i.get_prompts()
        {'user_prompt': ..., 'system_prompt': ...}
        """
        prompts = self.prompt_plan.get_prompts(
            agent_instructions=self.agent_instructions_prompt,
            agent_persona=self.agent_persona_prompt,
            question_instructions=Prompt(self.question_instructions_prompt),
            prior_question_memory=self.prior_question_memory_prompt,
        )
        if self.question_file_keys:
            prompts["files_list"] = [
                self.scenario[key] for key in self.question_file_keys
            ]
        return prompts
267
+
268
+
269
if __name__ == "__main__":
    # When executed as a script, run the doctest examples embedded in this
    # module's docstrings. ELLIPSIS lets "..." in expected output match any text.
    import doctest

    doctest.testmod(optionflags=doctest.ELLIPSIS)