edsl 0.1.38.dev3__py3-none-any.whl → 0.1.38.dev4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (256)
  1. edsl/Base.py +332 -303
  2. edsl/BaseDiff.py +260 -260
  3. edsl/TemplateLoader.py +24 -24
  4. edsl/__init__.py +49 -49
  5. edsl/__version__.py +1 -1
  6. edsl/agents/Agent.py +867 -858
  7. edsl/agents/AgentList.py +413 -362
  8. edsl/agents/Invigilator.py +233 -222
  9. edsl/agents/InvigilatorBase.py +265 -284
  10. edsl/agents/PromptConstructor.py +354 -353
  11. edsl/agents/__init__.py +3 -3
  12. edsl/agents/descriptors.py +99 -99
  13. edsl/agents/prompt_helpers.py +129 -129
  14. edsl/auto/AutoStudy.py +117 -117
  15. edsl/auto/StageBase.py +230 -230
  16. edsl/auto/StageGenerateSurvey.py +178 -178
  17. edsl/auto/StageLabelQuestions.py +125 -125
  18. edsl/auto/StagePersona.py +61 -61
  19. edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
  20. edsl/auto/StagePersonaDimensionValues.py +74 -74
  21. edsl/auto/StagePersonaDimensions.py +69 -69
  22. edsl/auto/StageQuestions.py +73 -73
  23. edsl/auto/SurveyCreatorPipeline.py +21 -21
  24. edsl/auto/utilities.py +224 -224
  25. edsl/base/Base.py +279 -279
  26. edsl/config.py +157 -149
  27. edsl/conversation/Conversation.py +290 -290
  28. edsl/conversation/car_buying.py +58 -58
  29. edsl/conversation/chips.py +95 -95
  30. edsl/conversation/mug_negotiation.py +81 -81
  31. edsl/conversation/next_speaker_utilities.py +93 -93
  32. edsl/coop/PriceFetcher.py +54 -54
  33. edsl/coop/__init__.py +2 -2
  34. edsl/coop/coop.py +1028 -961
  35. edsl/coop/utils.py +131 -131
  36. edsl/data/Cache.py +555 -530
  37. edsl/data/CacheEntry.py +233 -228
  38. edsl/data/CacheHandler.py +149 -149
  39. edsl/data/RemoteCacheSync.py +78 -97
  40. edsl/data/SQLiteDict.py +292 -292
  41. edsl/data/__init__.py +4 -4
  42. edsl/data/orm.py +10 -10
  43. edsl/data_transfer_models.py +73 -73
  44. edsl/enums.py +175 -173
  45. edsl/exceptions/BaseException.py +21 -21
  46. edsl/exceptions/__init__.py +54 -54
  47. edsl/exceptions/agents.py +42 -42
  48. edsl/exceptions/cache.py +5 -5
  49. edsl/exceptions/configuration.py +16 -16
  50. edsl/exceptions/coop.py +10 -10
  51. edsl/exceptions/data.py +14 -14
  52. edsl/exceptions/general.py +34 -34
  53. edsl/exceptions/jobs.py +33 -33
  54. edsl/exceptions/language_models.py +63 -63
  55. edsl/exceptions/prompts.py +15 -15
  56. edsl/exceptions/questions.py +91 -91
  57. edsl/exceptions/results.py +29 -29
  58. edsl/exceptions/scenarios.py +22 -22
  59. edsl/exceptions/surveys.py +37 -37
  60. edsl/inference_services/AnthropicService.py +87 -87
  61. edsl/inference_services/AwsBedrock.py +120 -120
  62. edsl/inference_services/AzureAI.py +217 -217
  63. edsl/inference_services/DeepInfraService.py +18 -18
  64. edsl/inference_services/GoogleService.py +148 -156
  65. edsl/inference_services/GroqService.py +20 -20
  66. edsl/inference_services/InferenceServiceABC.py +147 -147
  67. edsl/inference_services/InferenceServicesCollection.py +97 -97
  68. edsl/inference_services/MistralAIService.py +123 -123
  69. edsl/inference_services/OllamaService.py +18 -18
  70. edsl/inference_services/OpenAIService.py +224 -224
  71. edsl/inference_services/PerplexityService.py +163 -0
  72. edsl/inference_services/TestService.py +89 -89
  73. edsl/inference_services/TogetherAIService.py +170 -170
  74. edsl/inference_services/models_available_cache.py +118 -118
  75. edsl/inference_services/rate_limits_cache.py +25 -25
  76. edsl/inference_services/registry.py +41 -39
  77. edsl/inference_services/write_available.py +10 -10
  78. edsl/jobs/Answers.py +56 -56
  79. edsl/jobs/Jobs.py +898 -1358
  80. edsl/jobs/JobsChecks.py +147 -0
  81. edsl/jobs/JobsPrompts.py +268 -0
  82. edsl/jobs/JobsRemoteInferenceHandler.py +239 -0
  83. edsl/jobs/__init__.py +1 -1
  84. edsl/jobs/buckets/BucketCollection.py +63 -63
  85. edsl/jobs/buckets/ModelBuckets.py +65 -65
  86. edsl/jobs/buckets/TokenBucket.py +251 -251
  87. edsl/jobs/interviews/Interview.py +661 -661
  88. edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
  89. edsl/jobs/interviews/InterviewExceptionEntry.py +186 -186
  90. edsl/jobs/interviews/InterviewStatistic.py +63 -63
  91. edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
  92. edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
  93. edsl/jobs/interviews/InterviewStatusLog.py +92 -92
  94. edsl/jobs/interviews/ReportErrors.py +66 -66
  95. edsl/jobs/interviews/interview_status_enum.py +9 -9
  96. edsl/jobs/runners/JobsRunnerAsyncio.py +466 -361
  97. edsl/jobs/runners/JobsRunnerStatus.py +330 -332
  98. edsl/jobs/tasks/QuestionTaskCreator.py +242 -242
  99. edsl/jobs/tasks/TaskCreators.py +64 -64
  100. edsl/jobs/tasks/TaskHistory.py +450 -451
  101. edsl/jobs/tasks/TaskStatusLog.py +23 -23
  102. edsl/jobs/tasks/task_status_enum.py +163 -163
  103. edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
  104. edsl/jobs/tokens/TokenUsage.py +34 -34
  105. edsl/language_models/KeyLookup.py +30 -30
  106. edsl/language_models/LanguageModel.py +668 -708
  107. edsl/language_models/ModelList.py +155 -109
  108. edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
  109. edsl/language_models/__init__.py +3 -3
  110. edsl/language_models/fake_openai_call.py +15 -15
  111. edsl/language_models/fake_openai_service.py +61 -61
  112. edsl/language_models/registry.py +190 -137
  113. edsl/language_models/repair.py +156 -156
  114. edsl/language_models/unused/ReplicateBase.py +83 -83
  115. edsl/language_models/utilities.py +64 -64
  116. edsl/notebooks/Notebook.py +258 -258
  117. edsl/notebooks/__init__.py +1 -1
  118. edsl/prompts/Prompt.py +362 -357
  119. edsl/prompts/__init__.py +2 -2
  120. edsl/questions/AnswerValidatorMixin.py +289 -289
  121. edsl/questions/QuestionBase.py +664 -660
  122. edsl/questions/QuestionBaseGenMixin.py +161 -161
  123. edsl/questions/QuestionBasePromptsMixin.py +217 -217
  124. edsl/questions/QuestionBudget.py +227 -227
  125. edsl/questions/QuestionCheckBox.py +359 -359
  126. edsl/questions/QuestionExtract.py +182 -183
  127. edsl/questions/QuestionFreeText.py +114 -114
  128. edsl/questions/QuestionFunctional.py +166 -166
  129. edsl/questions/QuestionList.py +231 -231
  130. edsl/questions/QuestionMultipleChoice.py +286 -286
  131. edsl/questions/QuestionNumerical.py +153 -153
  132. edsl/questions/QuestionRank.py +324 -324
  133. edsl/questions/Quick.py +41 -41
  134. edsl/questions/RegisterQuestionsMeta.py +71 -71
  135. edsl/questions/ResponseValidatorABC.py +174 -174
  136. edsl/questions/SimpleAskMixin.py +73 -73
  137. edsl/questions/__init__.py +26 -26
  138. edsl/questions/compose_questions.py +98 -98
  139. edsl/questions/decorators.py +21 -21
  140. edsl/questions/derived/QuestionLikertFive.py +76 -76
  141. edsl/questions/derived/QuestionLinearScale.py +87 -87
  142. edsl/questions/derived/QuestionTopK.py +93 -93
  143. edsl/questions/derived/QuestionYesNo.py +82 -82
  144. edsl/questions/descriptors.py +413 -413
  145. edsl/questions/prompt_templates/question_budget.jinja +13 -13
  146. edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
  147. edsl/questions/prompt_templates/question_extract.jinja +11 -11
  148. edsl/questions/prompt_templates/question_free_text.jinja +3 -3
  149. edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
  150. edsl/questions/prompt_templates/question_list.jinja +17 -17
  151. edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
  152. edsl/questions/prompt_templates/question_numerical.jinja +36 -36
  153. edsl/questions/question_registry.py +177 -147
  154. edsl/questions/settings.py +12 -12
  155. edsl/questions/templates/budget/answering_instructions.jinja +7 -7
  156. edsl/questions/templates/budget/question_presentation.jinja +7 -7
  157. edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
  158. edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
  159. edsl/questions/templates/extract/answering_instructions.jinja +7 -7
  160. edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
  161. edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
  162. edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
  163. edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
  164. edsl/questions/templates/list/answering_instructions.jinja +3 -3
  165. edsl/questions/templates/list/question_presentation.jinja +5 -5
  166. edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
  167. edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
  168. edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
  169. edsl/questions/templates/numerical/question_presentation.jinja +6 -6
  170. edsl/questions/templates/rank/answering_instructions.jinja +11 -11
  171. edsl/questions/templates/rank/question_presentation.jinja +15 -15
  172. edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
  173. edsl/questions/templates/top_k/question_presentation.jinja +22 -22
  174. edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
  175. edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
  176. edsl/results/CSSParameterizer.py +108 -0
  177. edsl/results/Dataset.py +424 -293
  178. edsl/results/DatasetExportMixin.py +731 -717
  179. edsl/results/DatasetTree.py +275 -145
  180. edsl/results/Result.py +465 -456
  181. edsl/results/Results.py +1165 -1071
  182. edsl/results/ResultsDBMixin.py +238 -238
  183. edsl/results/ResultsExportMixin.py +43 -43
  184. edsl/results/ResultsFetchMixin.py +33 -33
  185. edsl/results/ResultsGGMixin.py +121 -121
  186. edsl/results/ResultsToolsMixin.py +98 -98
  187. edsl/results/Selector.py +135 -135
  188. edsl/results/TableDisplay.py +198 -0
  189. edsl/results/__init__.py +2 -2
  190. edsl/results/table_display.css +78 -0
  191. edsl/results/tree_explore.py +115 -115
  192. edsl/scenarios/FileStore.py +632 -458
  193. edsl/scenarios/Scenario.py +601 -544
  194. edsl/scenarios/ScenarioHtmlMixin.py +64 -64
  195. edsl/scenarios/ScenarioJoin.py +127 -0
  196. edsl/scenarios/ScenarioList.py +1287 -1112
  197. edsl/scenarios/ScenarioListExportMixin.py +52 -52
  198. edsl/scenarios/ScenarioListPdfMixin.py +261 -261
  199. edsl/scenarios/__init__.py +4 -4
  200. edsl/shared.py +1 -1
  201. edsl/study/ObjectEntry.py +173 -173
  202. edsl/study/ProofOfWork.py +113 -113
  203. edsl/study/SnapShot.py +80 -80
  204. edsl/study/Study.py +528 -528
  205. edsl/study/__init__.py +4 -4
  206. edsl/surveys/DAG.py +148 -148
  207. edsl/surveys/Memory.py +31 -31
  208. edsl/surveys/MemoryPlan.py +244 -244
  209. edsl/surveys/Rule.py +326 -326
  210. edsl/surveys/RuleCollection.py +387 -387
  211. edsl/surveys/Survey.py +1801 -1787
  212. edsl/surveys/SurveyCSS.py +261 -261
  213. edsl/surveys/SurveyExportMixin.py +259 -259
  214. edsl/surveys/SurveyFlowVisualizationMixin.py +179 -121
  215. edsl/surveys/SurveyQualtricsImport.py +284 -284
  216. edsl/surveys/__init__.py +3 -3
  217. edsl/surveys/base.py +53 -53
  218. edsl/surveys/descriptors.py +56 -56
  219. edsl/surveys/instructions/ChangeInstruction.py +49 -49
  220. edsl/surveys/instructions/Instruction.py +65 -53
  221. edsl/surveys/instructions/InstructionCollection.py +77 -77
  222. edsl/templates/error_reporting/base.html +23 -23
  223. edsl/templates/error_reporting/exceptions_by_model.html +34 -34
  224. edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
  225. edsl/templates/error_reporting/exceptions_by_type.html +16 -16
  226. edsl/templates/error_reporting/interview_details.html +115 -115
  227. edsl/templates/error_reporting/interviews.html +19 -10
  228. edsl/templates/error_reporting/overview.html +4 -4
  229. edsl/templates/error_reporting/performance_plot.html +1 -1
  230. edsl/templates/error_reporting/report.css +73 -73
  231. edsl/templates/error_reporting/report.html +117 -117
  232. edsl/templates/error_reporting/report.js +25 -25
  233. edsl/tools/__init__.py +1 -1
  234. edsl/tools/clusters.py +192 -192
  235. edsl/tools/embeddings.py +27 -27
  236. edsl/tools/embeddings_plotting.py +118 -118
  237. edsl/tools/plotting.py +112 -112
  238. edsl/tools/summarize.py +18 -18
  239. edsl/utilities/SystemInfo.py +28 -28
  240. edsl/utilities/__init__.py +22 -22
  241. edsl/utilities/ast_utilities.py +25 -25
  242. edsl/utilities/data/Registry.py +6 -6
  243. edsl/utilities/data/__init__.py +1 -1
  244. edsl/utilities/data/scooter_results.json +1 -1
  245. edsl/utilities/decorators.py +77 -77
  246. edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
  247. edsl/utilities/interface.py +627 -627
  248. edsl/utilities/naming_utilities.py +263 -263
  249. edsl/utilities/repair_functions.py +28 -28
  250. edsl/utilities/restricted_python.py +70 -70
  251. edsl/utilities/utilities.py +424 -409
  252. {edsl-0.1.38.dev3.dist-info → edsl-0.1.38.dev4.dist-info}/LICENSE +21 -21
  253. {edsl-0.1.38.dev3.dist-info → edsl-0.1.38.dev4.dist-info}/METADATA +2 -1
  254. edsl-0.1.38.dev4.dist-info/RECORD +277 -0
  255. edsl-0.1.38.dev3.dist-info/RECORD +0 -269
  256. {edsl-0.1.38.dev3.dist-info → edsl-0.1.38.dev4.dist-info}/WHEEL +0 -0
@@ -1,353 +1,354 @@
1
- from __future__ import annotations
2
- from typing import Dict, Any, Optional, Set
3
-
4
- from jinja2 import Environment, meta
5
-
6
- from edsl.prompts.Prompt import Prompt
7
- from edsl.agents.prompt_helpers import PromptPlan
8
-
9
-
10
- class PlaceholderAnswer:
11
- """A placeholder answer for when a question is not yet answered."""
12
-
13
- def __init__(self):
14
- self.answer = "N/A"
15
- self.comment = "Will be populated by prior answer"
16
-
17
- def __getitem__(self, index):
18
- return ""
19
-
20
- def __str__(self):
21
- return "<<PlaceholderAnswer>>"
22
-
23
- def __repr__(self):
24
- return "<<PlaceholderAnswer>>"
25
-
26
-
27
- def get_jinja2_variables(template_str: str) -> Set[str]:
28
- """
29
- Extracts all variable names from a Jinja2 template using Jinja2's built-in parsing.
30
-
31
- Args:
32
- template_str (str): The Jinja2 template string
33
-
34
- Returns:
35
- Set[str]: A set of variable names found in the template
36
- """
37
- env = Environment()
38
- ast = env.parse(template_str)
39
- return meta.find_undeclared_variables(ast)
40
-
41
-
42
- class PromptConstructor:
43
- """
44
- The pieces of a prompt are:
45
- - The agent instructions - "You are answering questions as if you were a human. Do not break character."
46
- - The persona prompt - "You are an agent with the following persona: {'age': 22, 'hair': 'brown', 'height': 5.5}"
47
- - The question instructions - "You are being asked the following question: Do you like school? The options are 0: yes 1: no Return a valid JSON formatted like this, selecting only the number of the option: {"answer": <put answer code here>, "comment": "<put explanation here>"} Only 1 option may be selected."
48
- - The memory prompt - "Before the question you are now answering, you already answered the following question(s): Question: Do you like school? Answer: Prior answer"
49
-
50
- This is mixed into the Invigilator class.
51
- """
52
-
53
- def __init__(self, invigilator, prompt_plan: Optional["PromptPlan"] = None):
54
- self.invigilator = invigilator
55
- self.agent = invigilator.agent
56
- self.question = invigilator.question
57
- self.scenario = invigilator.scenario
58
- self.survey = invigilator.survey
59
- self.model = invigilator.model
60
- self.current_answers = invigilator.current_answers
61
- self.memory_plan = invigilator.memory_plan
62
- self.prompt_plan = prompt_plan or PromptPlan()
63
-
64
- @property
65
- def scenario_file_keys(self) -> list:
66
- """We need to find all the keys in the scenario that refer to FileStore objects.
67
- These will be used to append to the prompt a list of files that are part of the scenario.
68
- """
69
- from edsl.scenarios.FileStore import FileStore
70
-
71
- file_entries = []
72
- for key, value in self.scenario.items():
73
- if isinstance(value, FileStore):
74
- file_entries.append(key)
75
- return file_entries
76
-
77
- @property
78
- def agent_instructions_prompt(self) -> Prompt:
79
- """
80
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
81
- >>> i = InvigilatorBase.example()
82
- >>> i.prompt_constructor.agent_instructions_prompt
83
- Prompt(text=\"""You are answering questions as if you were a human. Do not break character.\""")
84
- """
85
- from edsl import Agent
86
-
87
- if self.agent == Agent(): # if agent is empty, then return an empty prompt
88
- return Prompt(text="")
89
-
90
- return Prompt(text=self.agent.instruction)
91
-
92
- @property
93
- def agent_persona_prompt(self) -> Prompt:
94
- """
95
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
96
- >>> i = InvigilatorBase.example()
97
- >>> i.prompt_constructor.agent_persona_prompt
98
- Prompt(text=\"""Your traits: {'age': 22, 'hair': 'brown', 'height': 5.5}\""")
99
- """
100
- from edsl import Agent
101
-
102
- if self.agent == Agent(): # if agent is empty, then return an empty prompt
103
- return Prompt(text="")
104
-
105
- return self.agent.prompt()
106
-
107
- def prior_answers_dict(self) -> dict:
108
- # this is all questions
109
- d = self.survey.question_names_to_questions()
110
- # This attaches the answer to the question
111
- for question in d:
112
- if question in self.current_answers:
113
- d[question].answer = self.current_answers[question]
114
- else:
115
- d[question].answer = PlaceholderAnswer()
116
-
117
- # if (new_question := question.split("_comment")[0]) in d:
118
- # d[new_question].comment = answer
119
- # d[question].answer = PlaceholderAnswer()
120
-
121
- # breakpoint()
122
- return d
123
-
124
- @property
125
- def question_file_keys(self):
126
- raw_question_text = self.question.question_text
127
- variables = get_jinja2_variables(raw_question_text)
128
- question_file_keys = []
129
- for var in variables:
130
- if var in self.scenario_file_keys:
131
- question_file_keys.append(var)
132
- return question_file_keys
133
-
134
- def build_replacement_dict(self, question_data: dict):
135
- """
136
- Builds a dictionary of replacement values by combining multiple data sources.
137
- """
138
- # File references dictionary
139
- file_refs = {key: f"<see file {key}>" for key in self.scenario_file_keys}
140
-
141
- # Scenario items excluding file keys
142
- scenario_items = {
143
- k: v for k, v in self.scenario.items() if k not in self.scenario_file_keys
144
- }
145
-
146
- # Question settings with defaults
147
- question_settings = {
148
- "use_code": getattr(self.question, "_use_code", True),
149
- "include_comment": getattr(self.question, "_include_comment", False),
150
- }
151
-
152
- # Combine all dictionaries using dict.update() for clarity
153
- replacement_dict = {}
154
- for d in [
155
- file_refs,
156
- question_data,
157
- scenario_items,
158
- self.prior_answers_dict(),
159
- {"agent": self.agent},
160
- question_settings,
161
- ]:
162
- replacement_dict.update(d)
163
-
164
- return replacement_dict
165
-
166
- def _get_question_options(self, question_data):
167
- question_options_entry = question_data.get("question_options", None)
168
- question_options = question_options_entry
169
-
170
- placeholder = ["<< Option 1 - Placholder >>", "<< Option 2 - Placholder >>"]
171
-
172
- if isinstance(question_options_entry, str):
173
- env = Environment()
174
- parsed_content = env.parse(question_options_entry)
175
- question_option_key = list(meta.find_undeclared_variables(parsed_content))[
176
- 0
177
- ]
178
- if isinstance(self.scenario.get(question_option_key), list):
179
- question_options = self.scenario.get(question_option_key)
180
-
181
- # might be getting it from the prior answers
182
- if self.prior_answers_dict().get(question_option_key) is not None:
183
- prior_question = self.prior_answers_dict().get(question_option_key)
184
- if hasattr(prior_question, "answer"):
185
- if isinstance(prior_question.answer, list):
186
- question_options = prior_question.answer
187
- else:
188
- question_options = placeholder
189
- else:
190
- question_options = placeholder
191
-
192
- return question_options
193
-
194
- def build_question_instructions_prompt(self):
195
- """Buils the question instructions prompt."""
196
-
197
- question_prompt = Prompt(self.question.get_instructions(model=self.model.model))
198
-
199
- # Get the data for the question - this is a dictionary of the question data
200
- # e.g., {'question_text': 'Do you like school?', 'question_name': 'q0', 'question_options': ['yes', 'no']}
201
- question_data = self.question.data.copy()
202
-
203
- if "question_options" in question_data:
204
- question_options = self._get_question_options(question_data)
205
- question_data["question_options"] = question_options
206
-
207
- # check to see if the question_options is actually a string
208
- # This is used when the user is using the question_options as a variable from a scenario
209
- # if "question_options" in question_data:
210
- replacement_dict = self.build_replacement_dict(question_data)
211
- rendered_instructions = question_prompt.render(replacement_dict)
212
-
213
- # is there anything left to render?
214
- undefined_template_variables = (
215
- rendered_instructions.undefined_template_variables({})
216
- )
217
-
218
- # Check if it's the name of a question in the survey
219
- for question_name in self.survey.question_names:
220
- if question_name in undefined_template_variables:
221
- print(
222
- "Question name found in undefined_template_variables: ",
223
- question_name,
224
- )
225
-
226
- if undefined_template_variables:
227
- msg = f"Question instructions still has variables: {undefined_template_variables}."
228
- import warnings
229
-
230
- warnings.warn(msg)
231
- # raise QuestionScenarioRenderError(
232
- # f"Question instructions still has variables: {undefined_template_variables}."
233
- # )
234
-
235
- # Check if question has instructions - these are instructions in a Survey that can apply to multiple follow-on questions
236
- relevant_instructions = self.survey.relevant_instructions(
237
- self.question.question_name
238
- )
239
-
240
- if relevant_instructions != []:
241
- # preamble_text = Prompt(
242
- # text="You were given the following instructions: "
243
- # )
244
- preamble_text = Prompt(text="")
245
- for instruction in relevant_instructions:
246
- preamble_text += instruction.text
247
- rendered_instructions = preamble_text + rendered_instructions
248
-
249
- return rendered_instructions
250
-
251
- @property
252
- def question_instructions_prompt(self) -> Prompt:
253
- """
254
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
255
- >>> i = InvigilatorBase.example()
256
- >>> i.prompt_constructor.question_instructions_prompt
257
- Prompt(text=\"""...
258
- ...
259
- """
260
- if not hasattr(self, "_question_instructions_prompt"):
261
- self._question_instructions_prompt = (
262
- self.build_question_instructions_prompt()
263
- )
264
-
265
- return self._question_instructions_prompt
266
-
267
- @property
268
- def prior_question_memory_prompt(self) -> Prompt:
269
- if not hasattr(self, "_prior_question_memory_prompt"):
270
- from edsl.prompts.Prompt import Prompt
271
-
272
- memory_prompt = Prompt(text="")
273
- if self.memory_plan is not None:
274
- memory_prompt += self.create_memory_prompt(
275
- self.question.question_name
276
- ).render(self.scenario | self.prior_answers_dict())
277
- self._prior_question_memory_prompt = memory_prompt
278
- return self._prior_question_memory_prompt
279
-
280
- def create_memory_prompt(self, question_name: str) -> Prompt:
281
- """Create a memory for the agent.
282
-
283
- The returns a memory prompt for the agent.
284
-
285
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
286
- >>> i = InvigilatorBase.example()
287
- >>> i.current_answers = {"q0": "Prior answer"}
288
- >>> i.memory_plan.add_single_memory("q1", "q0")
289
- >>> p = i.prompt_constructor.create_memory_prompt("q1")
290
- >>> p.text.strip().replace("\\n", " ").replace("\\t", " ")
291
- 'Before the question you are now answering, you already answered the following question(s): Question: Do you like school? Answer: Prior answer'
292
- """
293
- return self.memory_plan.get_memory_prompt_fragment(
294
- question_name, self.current_answers
295
- )
296
-
297
- def construct_system_prompt(self) -> Prompt:
298
- """Construct the system prompt for the LLM call."""
299
- import warnings
300
-
301
- warnings.warn(
302
- "This method is deprecated. Use get_prompts instead.", DeprecationWarning
303
- )
304
- return self.get_prompts()["system_prompt"]
305
-
306
- def construct_user_prompt(self) -> Prompt:
307
- """Construct the user prompt for the LLM call."""
308
- import warnings
309
-
310
- warnings.warn(
311
- "This method is deprecated. Use get_prompts instead.", DeprecationWarning
312
- )
313
- return self.get_prompts()["user_prompt"]
314
-
315
- def get_prompts(self) -> Dict[str, Prompt]:
316
- """Get both prompts for the LLM call.
317
-
318
- >>> from edsl import QuestionFreeText
319
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
320
- >>> q = QuestionFreeText(question_text="How are you today?", question_name="q_new")
321
- >>> i = InvigilatorBase.example(question = q)
322
- >>> i.get_prompts()
323
- {'user_prompt': ..., 'system_prompt': ...}
324
- """
325
- # breakpoint()
326
- prompts = self.prompt_plan.get_prompts(
327
- agent_instructions=self.agent_instructions_prompt,
328
- agent_persona=self.agent_persona_prompt,
329
- question_instructions=Prompt(self.question_instructions_prompt),
330
- prior_question_memory=self.prior_question_memory_prompt,
331
- )
332
- if self.question_file_keys:
333
- files_list = []
334
- for key in self.question_file_keys:
335
- files_list.append(self.scenario[key])
336
- prompts["files_list"] = files_list
337
- return prompts
338
-
339
- def _get_scenario_with_image(self) -> Scenario:
340
- """This is a helper function to get a scenario with an image, for testing purposes."""
341
- from edsl import Scenario
342
-
343
- try:
344
- scenario = Scenario.from_image("../../static/logo.png")
345
- except FileNotFoundError:
346
- scenario = Scenario.from_image("static/logo.png")
347
- return scenario
348
-
349
-
350
- if __name__ == "__main__":
351
- import doctest
352
-
353
- doctest.testmod(optionflags=doctest.ELLIPSIS)
1
+ from __future__ import annotations
2
+ from typing import Dict, Any, Optional, Set
3
+
4
+ from jinja2 import Environment, meta
5
+
6
+ from edsl.prompts.Prompt import Prompt
7
+ from edsl.agents.prompt_helpers import PromptPlan
8
+
9
+
10
+ class PlaceholderAnswer:
11
+ """A placeholder answer for when a question is not yet answered."""
12
+
13
+ def __init__(self):
14
+ self.answer = "N/A"
15
+ self.comment = "Will be populated by prior answer"
16
+
17
+ def __getitem__(self, index):
18
+ return ""
19
+
20
+ def __str__(self):
21
+ return "<<PlaceholderAnswer>>"
22
+
23
+ def __repr__(self):
24
+ return "<<PlaceholderAnswer>>"
25
+
26
+
27
+ def get_jinja2_variables(template_str: str) -> Set[str]:
28
+ """
29
+ Extracts all variable names from a Jinja2 template using Jinja2's built-in parsing.
30
+
31
+ Args:
32
+ template_str (str): The Jinja2 template string
33
+
34
+ Returns:
35
+ Set[str]: A set of variable names found in the template
36
+ """
37
+ env = Environment()
38
+ ast = env.parse(template_str)
39
+ return meta.find_undeclared_variables(ast)
40
+
41
+
42
+ class PromptConstructor:
43
+ """
44
+ The pieces of a prompt are:
45
+ - The agent instructions - "You are answering questions as if you were a human. Do not break character."
46
+ - The persona prompt - "You are an agent with the following persona: {'age': 22, 'hair': 'brown', 'height': 5.5}"
47
+ - The question instructions - "You are being asked the following question: Do you like school? The options are 0: yes 1: no Return a valid JSON formatted like this, selecting only the number of the option: {"answer": <put answer code here>, "comment": "<put explanation here>"} Only 1 option may be selected."
48
+ - The memory prompt - "Before the question you are now answering, you already answered the following question(s): Question: Do you like school? Answer: Prior answer"
49
+
50
+ This is mixed into the Invigilator class.
51
+ """
52
+
53
+ def __init__(self, invigilator, prompt_plan: Optional["PromptPlan"] = None):
54
+ self.invigilator = invigilator
55
+ self.agent = invigilator.agent
56
+ self.question = invigilator.question
57
+ self.scenario = invigilator.scenario
58
+ self.survey = invigilator.survey
59
+ self.model = invigilator.model
60
+ self.current_answers = invigilator.current_answers
61
+ self.memory_plan = invigilator.memory_plan
62
+ self.prompt_plan = prompt_plan or PromptPlan()
63
+
64
+ @property
65
+ def scenario_file_keys(self) -> list:
66
+ """We need to find all the keys in the scenario that refer to FileStore objects.
67
+ These will be used to append to the prompt a list of files that are part of the scenario.
68
+ """
69
+ from edsl.scenarios.FileStore import FileStore
70
+
71
+ file_entries = []
72
+ for key, value in self.scenario.items():
73
+ if isinstance(value, FileStore):
74
+ file_entries.append(key)
75
+ return file_entries
76
+
77
+ @property
78
+ def agent_instructions_prompt(self) -> Prompt:
79
+ """
80
+ >>> from edsl.agents.InvigilatorBase import InvigilatorBase
81
+ >>> i = InvigilatorBase.example()
82
+ >>> i.prompt_constructor.agent_instructions_prompt
83
+ Prompt(text=\"""You are answering questions as if you were a human. Do not break character.\""")
84
+ """
85
+ from edsl import Agent
86
+
87
+ if self.agent == Agent(): # if agent is empty, then return an empty prompt
88
+ return Prompt(text="")
89
+
90
+ return Prompt(text=self.agent.instruction)
91
+
92
+ @property
93
+ def agent_persona_prompt(self) -> Prompt:
94
+ """
95
+ >>> from edsl.agents.InvigilatorBase import InvigilatorBase
96
+ >>> i = InvigilatorBase.example()
97
+ >>> i.prompt_constructor.agent_persona_prompt
98
+ Prompt(text=\"""Your traits: {'age': 22, 'hair': 'brown', 'height': 5.5}\""")
99
+ """
100
+ from edsl import Agent
101
+
102
+ if self.agent == Agent(): # if agent is empty, then return an empty prompt
103
+ return Prompt(text="")
104
+
105
+ return self.agent.prompt()
106
+
107
+ def prior_answers_dict(self) -> dict:
108
+ # this is all questions
109
+ d = self.survey.question_names_to_questions()
110
+ # This attaches the answer to the question
111
+ for question in d:
112
+ if question in self.current_answers:
113
+ d[question].answer = self.current_answers[question]
114
+ else:
115
+ d[question].answer = PlaceholderAnswer()
116
+
117
+ # if (new_question := question.split("_comment")[0]) in d:
118
+ # d[new_question].comment = answer
119
+ # d[question].answer = PlaceholderAnswer()
120
+
121
+ # breakpoint()
122
+ return d
123
+
124
+ @property
125
+ def question_file_keys(self):
126
+ raw_question_text = self.question.question_text
127
+ variables = get_jinja2_variables(raw_question_text)
128
+ question_file_keys = []
129
+ for var in variables:
130
+ if var in self.scenario_file_keys:
131
+ question_file_keys.append(var)
132
+ return question_file_keys
133
+
134
def build_replacement_dict(self, question_data: dict):
    """Merge every data source used to render the question template.

    Sources are layered in this order, later ones overriding earlier ones
    on key collisions:

    1. ``"<see file KEY>"`` markers for each scenario file key,
    2. the supplied ``question_data``,
    3. scenario entries that are not file keys,
    4. the mapping returned by ``prior_answers_dict()``,
    5. the agent, under the key ``"agent"``,
    6. question settings ``use_code`` / ``include_comment`` (falling back
       to ``True`` / ``False`` when the question lacks the attribute).
    """
    file_refs = {}
    for key in self.scenario_file_keys:
        file_refs[key] = f"<see file {key}>"

    non_file_scenario_items = {
        name: value
        for name, value in self.scenario.items()
        if name not in self.scenario_file_keys
    }

    question_settings = dict(
        use_code=getattr(self.question, "_use_code", True),
        include_comment=getattr(self.question, "_include_comment", False),
    )

    # Apply the layers one by one; the order determines precedence.
    merged = {}
    merged.update(file_refs)
    merged.update(question_data)
    merged.update(non_file_scenario_items)
    merged.update(self.prior_answers_dict())
    merged.update({"agent": self.agent})
    merged.update(question_settings)
    return merged
165
+
166
+ def _get_question_options(self, question_data):
167
+ question_options_entry = question_data.get("question_options", None)
168
+ question_options = question_options_entry
169
+
170
+ placeholder = ["<< Option 1 - Placholder >>", "<< Option 2 - Placholder >>"]
171
+
172
+ # print("Question options entry: ", question_options_entry)
173
+
174
+ if isinstance(question_options_entry, str):
175
+ env = Environment()
176
+ parsed_content = env.parse(question_options_entry)
177
+ question_option_key = list(meta.find_undeclared_variables(parsed_content))[
178
+ 0
179
+ ]
180
+ if isinstance(self.scenario.get(question_option_key), list):
181
+ question_options = self.scenario.get(question_option_key)
182
+
183
+ # might be getting it from the prior answers
184
+ if self.prior_answers_dict().get(question_option_key) is not None:
185
+ prior_question = self.prior_answers_dict().get(question_option_key)
186
+ if hasattr(prior_question, "answer"):
187
+ if isinstance(prior_question.answer, list):
188
+ question_options = prior_question.answer
189
+ else:
190
+ question_options = placeholder
191
+ else:
192
+ question_options = placeholder
193
+
194
+ return question_options
195
+
196
def build_question_instructions_prompt(self):
    """Build the question instructions prompt.

    The question's instruction template (for the current model) is rendered
    with the dictionary from ``build_replacement_dict``. Any template
    variables still undefined after rendering trigger a warning rather than
    an error. Survey-level instructions relevant to this question, if any,
    are prepended to the rendered text.
    """
    instructions_template = Prompt(
        self.question.get_instructions(model=self.model.model)
    )

    # Work on a copy of the question data, e.g.
    # {'question_text': 'Do you like school?', 'question_name': 'q0',
    #  'question_options': ['yes', 'no']}
    question_data = self.question.data.copy()
    if "question_options" in question_data:
        # Options may be a template string that still needs resolving.
        question_data["question_options"] = self._get_question_options(
            question_data
        )

    rendered_instructions = instructions_template.render(
        self.build_replacement_dict(question_data)
    )

    # Is there anything left to render?
    leftover_variables = rendered_instructions.undefined_template_variables({})

    # Report leftovers that are names of questions in the survey.
    for question_name in (
        name for name in self.survey.question_names if name in leftover_variables
    ):
        print(
            "Question name found in undefined_template_variables: ",
            question_name,
        )

    if leftover_variables:
        import warnings

        warnings.warn(
            f"Question instructions still has variables: {leftover_variables}."
        )

    # Survey-level instructions can apply to multiple follow-on questions.
    relevant_instructions = self.survey.relevant_instructions(
        self.question.question_name
    )
    if relevant_instructions != []:
        preamble_text = Prompt(text="")
        for instruction in relevant_instructions:
            preamble_text += instruction.text
        rendered_instructions = preamble_text + rendered_instructions

    return rendered_instructions
251
+
252
@property
def question_instructions_prompt(self) -> Prompt:
    """Return the question instructions prompt, building it on first access.

    The result of ``build_question_instructions_prompt()`` is stored on the
    instance as ``_question_instructions_prompt`` and reused afterwards.

    >>> from edsl.agents.InvigilatorBase import InvigilatorBase
    >>> i = InvigilatorBase.example()
    >>> i.prompt_constructor.question_instructions_prompt
    Prompt(text=\"""...
    ...
    """
    if hasattr(self, "_question_instructions_prompt"):
        return self._question_instructions_prompt

    built_prompt = self.build_question_instructions_prompt()
    self._question_instructions_prompt = built_prompt
    return self._question_instructions_prompt
267
+
268
@property
def prior_question_memory_prompt(self) -> Prompt:
    """Return the prompt recalling prior questions, building it on first access.

    Without a memory plan the prompt is empty. Otherwise the memory prompt
    for the current question is rendered with the scenario merged with
    ``prior_answers_dict()``. The result is stored on the instance as
    ``_prior_question_memory_prompt`` and reused afterwards.
    """
    if hasattr(self, "_prior_question_memory_prompt"):
        return self._prior_question_memory_prompt

    from edsl.prompts.Prompt import Prompt

    memory_prompt = Prompt(text="")
    if self.memory_plan is not None:
        memory_template = self.create_memory_prompt(self.question.question_name)
        render_context = self.scenario | self.prior_answers_dict()
        memory_prompt += memory_template.render(render_context)

    self._prior_question_memory_prompt = memory_prompt
    return self._prior_question_memory_prompt
280
+
281
def create_memory_prompt(self, question_name: str) -> Prompt:
    """Create the memory prompt for the given question.

    Delegates to ``memory_plan.get_memory_prompt_fragment`` with the
    question name and the answers collected so far.

    >>> from edsl.agents.InvigilatorBase import InvigilatorBase
    >>> i = InvigilatorBase.example()
    >>> i.current_answers = {"q0": "Prior answer"}
    >>> i.memory_plan.add_single_memory("q1", "q0")
    >>> p = i.prompt_constructor.create_memory_prompt("q1")
    >>> p.text.strip().replace("\\n", " ").replace("\\t", " ")
    'Before the question you are now answering, you already answered the following question(s): Question: Do you like school? Answer: Prior answer'
    """
    answers_so_far = self.current_answers
    memory_fragment = self.memory_plan.get_memory_prompt_fragment(
        question_name, answers_so_far
    )
    return memory_fragment
297
+
298
def construct_system_prompt(self) -> Prompt:
    """Construct the system prompt for the LLM call.

    Deprecated: use ``get_prompts`` instead. Emits a ``DeprecationWarning``
    and returns the ``"system_prompt"`` entry of ``get_prompts()``.
    """
    import warnings

    warnings.warn(
        "This method is deprecated. Use get_prompts instead.",
        DeprecationWarning,
        # Attribute the warning to the caller so it points at the code that
        # needs updating rather than at this line.
        stacklevel=2,
    )
    return self.get_prompts()["system_prompt"]
306
+
307
def construct_user_prompt(self) -> Prompt:
    """Construct the user prompt for the LLM call.

    Deprecated: use ``get_prompts`` instead. Emits a ``DeprecationWarning``
    and returns the ``"user_prompt"`` entry of ``get_prompts()``.
    """
    import warnings

    warnings.warn(
        "This method is deprecated. Use get_prompts instead.",
        DeprecationWarning,
        # Attribute the warning to the caller so it points at the code that
        # needs updating rather than at this line.
        stacklevel=2,
    )
    return self.get_prompts()["user_prompt"]
315
+
316
def get_prompts(self) -> Dict[str, Prompt]:
    """Get both prompts for the LLM call.

    The prompt plan assembles the result from the agent instructions, the
    agent persona, the question instructions and the prior-question memory.
    When the question text references scenario file keys, the matching
    scenario values are added under ``"files_list"``.

    >>> from edsl import QuestionFreeText
    >>> from edsl.agents.InvigilatorBase import InvigilatorBase
    >>> q = QuestionFreeText(question_text="How are you today?", question_name="q_new")
    >>> i = InvigilatorBase.example(question = q)
    >>> i.get_prompts()
    {'user_prompt': ..., 'system_prompt': ...}
    """
    components = dict(
        agent_instructions=self.agent_instructions_prompt,
        agent_persona=self.agent_persona_prompt,
        question_instructions=Prompt(self.question_instructions_prompt),
        prior_question_memory=self.prior_question_memory_prompt,
    )
    prompts = self.prompt_plan.get_prompts(**components)

    if self.question_file_keys:
        prompts["files_list"] = [
            self.scenario[key] for key in self.question_file_keys
        ]
    return prompts
339
+
340
def _get_scenario_with_image(self) -> Scenario:
    """Return a scenario built from the logo image; a helper for testing.

    Tries ``../../static/logo.png`` first and falls back to
    ``static/logo.png`` when that file is not found.
    """
    from edsl import Scenario

    try:
        return Scenario.from_image("../../static/logo.png")
    except FileNotFoundError:
        return Scenario.from_image("static/logo.png")
349
+
350
+
351
if __name__ == "__main__":
    # Run this module's doctests; ELLIPSIS lets "..." in expected output
    # match arbitrary text.
    from doctest import ELLIPSIS, testmod

    testmod(optionflags=ELLIPSIS)