edsl 0.1.38.dev2__py3-none-any.whl → 0.1.38.dev3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (248) hide show
  1. edsl/Base.py +303 -303
  2. edsl/BaseDiff.py +260 -260
  3. edsl/TemplateLoader.py +24 -24
  4. edsl/__init__.py +49 -49
  5. edsl/__version__.py +1 -1
  6. edsl/agents/Agent.py +858 -858
  7. edsl/agents/AgentList.py +362 -362
  8. edsl/agents/Invigilator.py +222 -222
  9. edsl/agents/InvigilatorBase.py +284 -284
  10. edsl/agents/PromptConstructor.py +353 -353
  11. edsl/agents/__init__.py +3 -3
  12. edsl/agents/descriptors.py +99 -99
  13. edsl/agents/prompt_helpers.py +129 -129
  14. edsl/auto/AutoStudy.py +117 -117
  15. edsl/auto/StageBase.py +230 -230
  16. edsl/auto/StageGenerateSurvey.py +178 -178
  17. edsl/auto/StageLabelQuestions.py +125 -125
  18. edsl/auto/StagePersona.py +61 -61
  19. edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
  20. edsl/auto/StagePersonaDimensionValues.py +74 -74
  21. edsl/auto/StagePersonaDimensions.py +69 -69
  22. edsl/auto/StageQuestions.py +73 -73
  23. edsl/auto/SurveyCreatorPipeline.py +21 -21
  24. edsl/auto/utilities.py +224 -224
  25. edsl/base/Base.py +279 -279
  26. edsl/config.py +149 -149
  27. edsl/conversation/Conversation.py +290 -290
  28. edsl/conversation/car_buying.py +58 -58
  29. edsl/conversation/chips.py +95 -95
  30. edsl/conversation/mug_negotiation.py +81 -81
  31. edsl/conversation/next_speaker_utilities.py +93 -93
  32. edsl/coop/PriceFetcher.py +54 -54
  33. edsl/coop/__init__.py +2 -2
  34. edsl/coop/coop.py +961 -961
  35. edsl/coop/utils.py +131 -131
  36. edsl/data/Cache.py +530 -530
  37. edsl/data/CacheEntry.py +228 -228
  38. edsl/data/CacheHandler.py +149 -149
  39. edsl/data/RemoteCacheSync.py +97 -97
  40. edsl/data/SQLiteDict.py +292 -292
  41. edsl/data/__init__.py +4 -4
  42. edsl/data/orm.py +10 -10
  43. edsl/data_transfer_models.py +73 -73
  44. edsl/enums.py +173 -173
  45. edsl/exceptions/BaseException.py +21 -21
  46. edsl/exceptions/__init__.py +54 -54
  47. edsl/exceptions/agents.py +42 -42
  48. edsl/exceptions/cache.py +5 -5
  49. edsl/exceptions/configuration.py +16 -16
  50. edsl/exceptions/coop.py +10 -10
  51. edsl/exceptions/data.py +14 -14
  52. edsl/exceptions/general.py +34 -34
  53. edsl/exceptions/jobs.py +33 -33
  54. edsl/exceptions/language_models.py +63 -63
  55. edsl/exceptions/prompts.py +15 -15
  56. edsl/exceptions/questions.py +91 -91
  57. edsl/exceptions/results.py +29 -29
  58. edsl/exceptions/scenarios.py +22 -22
  59. edsl/exceptions/surveys.py +37 -37
  60. edsl/inference_services/AnthropicService.py +87 -87
  61. edsl/inference_services/AwsBedrock.py +120 -120
  62. edsl/inference_services/AzureAI.py +217 -217
  63. edsl/inference_services/DeepInfraService.py +18 -18
  64. edsl/inference_services/GoogleService.py +156 -156
  65. edsl/inference_services/GroqService.py +20 -20
  66. edsl/inference_services/InferenceServiceABC.py +147 -147
  67. edsl/inference_services/InferenceServicesCollection.py +97 -97
  68. edsl/inference_services/MistralAIService.py +123 -123
  69. edsl/inference_services/OllamaService.py +18 -18
  70. edsl/inference_services/OpenAIService.py +224 -224
  71. edsl/inference_services/TestService.py +89 -89
  72. edsl/inference_services/TogetherAIService.py +170 -170
  73. edsl/inference_services/models_available_cache.py +118 -118
  74. edsl/inference_services/rate_limits_cache.py +25 -25
  75. edsl/inference_services/registry.py +39 -39
  76. edsl/inference_services/write_available.py +10 -10
  77. edsl/jobs/Answers.py +56 -56
  78. edsl/jobs/Jobs.py +1358 -1358
  79. edsl/jobs/__init__.py +1 -1
  80. edsl/jobs/buckets/BucketCollection.py +63 -63
  81. edsl/jobs/buckets/ModelBuckets.py +65 -65
  82. edsl/jobs/buckets/TokenBucket.py +251 -251
  83. edsl/jobs/interviews/Interview.py +661 -661
  84. edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
  85. edsl/jobs/interviews/InterviewExceptionEntry.py +186 -186
  86. edsl/jobs/interviews/InterviewStatistic.py +63 -63
  87. edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
  88. edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
  89. edsl/jobs/interviews/InterviewStatusLog.py +92 -92
  90. edsl/jobs/interviews/ReportErrors.py +66 -66
  91. edsl/jobs/interviews/interview_status_enum.py +9 -9
  92. edsl/jobs/runners/JobsRunnerAsyncio.py +361 -361
  93. edsl/jobs/runners/JobsRunnerStatus.py +332 -332
  94. edsl/jobs/tasks/QuestionTaskCreator.py +242 -242
  95. edsl/jobs/tasks/TaskCreators.py +64 -64
  96. edsl/jobs/tasks/TaskHistory.py +451 -451
  97. edsl/jobs/tasks/TaskStatusLog.py +23 -23
  98. edsl/jobs/tasks/task_status_enum.py +163 -163
  99. edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
  100. edsl/jobs/tokens/TokenUsage.py +34 -34
  101. edsl/language_models/KeyLookup.py +30 -30
  102. edsl/language_models/LanguageModel.py +708 -708
  103. edsl/language_models/ModelList.py +109 -109
  104. edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
  105. edsl/language_models/__init__.py +3 -3
  106. edsl/language_models/fake_openai_call.py +15 -15
  107. edsl/language_models/fake_openai_service.py +61 -61
  108. edsl/language_models/registry.py +137 -137
  109. edsl/language_models/repair.py +156 -156
  110. edsl/language_models/unused/ReplicateBase.py +83 -83
  111. edsl/language_models/utilities.py +64 -64
  112. edsl/notebooks/Notebook.py +258 -258
  113. edsl/notebooks/__init__.py +1 -1
  114. edsl/prompts/Prompt.py +357 -357
  115. edsl/prompts/__init__.py +2 -2
  116. edsl/questions/AnswerValidatorMixin.py +289 -289
  117. edsl/questions/QuestionBase.py +660 -660
  118. edsl/questions/QuestionBaseGenMixin.py +161 -161
  119. edsl/questions/QuestionBasePromptsMixin.py +217 -217
  120. edsl/questions/QuestionBudget.py +227 -227
  121. edsl/questions/QuestionCheckBox.py +359 -359
  122. edsl/questions/QuestionExtract.py +183 -183
  123. edsl/questions/QuestionFreeText.py +114 -114
  124. edsl/questions/QuestionFunctional.py +166 -166
  125. edsl/questions/QuestionList.py +231 -231
  126. edsl/questions/QuestionMultipleChoice.py +286 -286
  127. edsl/questions/QuestionNumerical.py +153 -153
  128. edsl/questions/QuestionRank.py +324 -324
  129. edsl/questions/Quick.py +41 -41
  130. edsl/questions/RegisterQuestionsMeta.py +71 -71
  131. edsl/questions/ResponseValidatorABC.py +174 -174
  132. edsl/questions/SimpleAskMixin.py +73 -73
  133. edsl/questions/__init__.py +26 -26
  134. edsl/questions/compose_questions.py +98 -98
  135. edsl/questions/decorators.py +21 -21
  136. edsl/questions/derived/QuestionLikertFive.py +76 -76
  137. edsl/questions/derived/QuestionLinearScale.py +87 -87
  138. edsl/questions/derived/QuestionTopK.py +93 -93
  139. edsl/questions/derived/QuestionYesNo.py +82 -82
  140. edsl/questions/descriptors.py +413 -413
  141. edsl/questions/prompt_templates/question_budget.jinja +13 -13
  142. edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
  143. edsl/questions/prompt_templates/question_extract.jinja +11 -11
  144. edsl/questions/prompt_templates/question_free_text.jinja +3 -3
  145. edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
  146. edsl/questions/prompt_templates/question_list.jinja +17 -17
  147. edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
  148. edsl/questions/prompt_templates/question_numerical.jinja +36 -36
  149. edsl/questions/question_registry.py +147 -147
  150. edsl/questions/settings.py +12 -12
  151. edsl/questions/templates/budget/answering_instructions.jinja +7 -7
  152. edsl/questions/templates/budget/question_presentation.jinja +7 -7
  153. edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
  154. edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
  155. edsl/questions/templates/extract/answering_instructions.jinja +7 -7
  156. edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
  157. edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
  158. edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
  159. edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
  160. edsl/questions/templates/list/answering_instructions.jinja +3 -3
  161. edsl/questions/templates/list/question_presentation.jinja +5 -5
  162. edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
  163. edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
  164. edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
  165. edsl/questions/templates/numerical/question_presentation.jinja +6 -6
  166. edsl/questions/templates/rank/answering_instructions.jinja +11 -11
  167. edsl/questions/templates/rank/question_presentation.jinja +15 -15
  168. edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
  169. edsl/questions/templates/top_k/question_presentation.jinja +22 -22
  170. edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
  171. edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
  172. edsl/results/Dataset.py +293 -293
  173. edsl/results/DatasetExportMixin.py +717 -717
  174. edsl/results/DatasetTree.py +145 -145
  175. edsl/results/Result.py +456 -456
  176. edsl/results/Results.py +1071 -1071
  177. edsl/results/ResultsDBMixin.py +238 -238
  178. edsl/results/ResultsExportMixin.py +43 -43
  179. edsl/results/ResultsFetchMixin.py +33 -33
  180. edsl/results/ResultsGGMixin.py +121 -121
  181. edsl/results/ResultsToolsMixin.py +98 -98
  182. edsl/results/Selector.py +135 -135
  183. edsl/results/__init__.py +2 -2
  184. edsl/results/tree_explore.py +115 -115
  185. edsl/scenarios/FileStore.py +458 -458
  186. edsl/scenarios/Scenario.py +544 -544
  187. edsl/scenarios/ScenarioHtmlMixin.py +64 -64
  188. edsl/scenarios/ScenarioList.py +1112 -1112
  189. edsl/scenarios/ScenarioListExportMixin.py +52 -52
  190. edsl/scenarios/ScenarioListPdfMixin.py +261 -261
  191. edsl/scenarios/__init__.py +4 -4
  192. edsl/shared.py +1 -1
  193. edsl/study/ObjectEntry.py +173 -173
  194. edsl/study/ProofOfWork.py +113 -113
  195. edsl/study/SnapShot.py +80 -80
  196. edsl/study/Study.py +528 -528
  197. edsl/study/__init__.py +4 -4
  198. edsl/surveys/DAG.py +148 -148
  199. edsl/surveys/Memory.py +31 -31
  200. edsl/surveys/MemoryPlan.py +244 -244
  201. edsl/surveys/Rule.py +326 -326
  202. edsl/surveys/RuleCollection.py +387 -387
  203. edsl/surveys/Survey.py +1787 -1787
  204. edsl/surveys/SurveyCSS.py +261 -261
  205. edsl/surveys/SurveyExportMixin.py +259 -259
  206. edsl/surveys/SurveyFlowVisualizationMixin.py +121 -121
  207. edsl/surveys/SurveyQualtricsImport.py +284 -284
  208. edsl/surveys/__init__.py +3 -3
  209. edsl/surveys/base.py +53 -53
  210. edsl/surveys/descriptors.py +56 -56
  211. edsl/surveys/instructions/ChangeInstruction.py +49 -49
  212. edsl/surveys/instructions/Instruction.py +53 -53
  213. edsl/surveys/instructions/InstructionCollection.py +77 -77
  214. edsl/templates/error_reporting/base.html +23 -23
  215. edsl/templates/error_reporting/exceptions_by_model.html +34 -34
  216. edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
  217. edsl/templates/error_reporting/exceptions_by_type.html +16 -16
  218. edsl/templates/error_reporting/interview_details.html +115 -115
  219. edsl/templates/error_reporting/interviews.html +9 -9
  220. edsl/templates/error_reporting/overview.html +4 -4
  221. edsl/templates/error_reporting/performance_plot.html +1 -1
  222. edsl/templates/error_reporting/report.css +73 -73
  223. edsl/templates/error_reporting/report.html +117 -117
  224. edsl/templates/error_reporting/report.js +25 -25
  225. edsl/tools/__init__.py +1 -1
  226. edsl/tools/clusters.py +192 -192
  227. edsl/tools/embeddings.py +27 -27
  228. edsl/tools/embeddings_plotting.py +118 -118
  229. edsl/tools/plotting.py +112 -112
  230. edsl/tools/summarize.py +18 -18
  231. edsl/utilities/SystemInfo.py +28 -28
  232. edsl/utilities/__init__.py +22 -22
  233. edsl/utilities/ast_utilities.py +25 -25
  234. edsl/utilities/data/Registry.py +6 -6
  235. edsl/utilities/data/__init__.py +1 -1
  236. edsl/utilities/data/scooter_results.json +1 -1
  237. edsl/utilities/decorators.py +77 -77
  238. edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
  239. edsl/utilities/interface.py +627 -627
  240. edsl/utilities/naming_utilities.py +263 -263
  241. edsl/utilities/repair_functions.py +28 -28
  242. edsl/utilities/restricted_python.py +70 -70
  243. edsl/utilities/utilities.py +409 -409
  244. {edsl-0.1.38.dev2.dist-info → edsl-0.1.38.dev3.dist-info}/LICENSE +21 -21
  245. {edsl-0.1.38.dev2.dist-info → edsl-0.1.38.dev3.dist-info}/METADATA +1 -1
  246. edsl-0.1.38.dev3.dist-info/RECORD +269 -0
  247. edsl-0.1.38.dev2.dist-info/RECORD +0 -269
  248. {edsl-0.1.38.dev2.dist-info → edsl-0.1.38.dev3.dist-info}/WHEEL +0 -0
@@ -1,353 +1,353 @@
1
- from __future__ import annotations
2
- from typing import Dict, Any, Optional, Set
3
-
4
- from jinja2 import Environment, meta
5
-
6
- from edsl.prompts.Prompt import Prompt
7
- from edsl.agents.prompt_helpers import PromptPlan
8
-
9
-
10
- class PlaceholderAnswer:
11
- """A placeholder answer for when a question is not yet answered."""
12
-
13
- def __init__(self):
14
- self.answer = "N/A"
15
- self.comment = "Will be populated by prior answer"
16
-
17
- def __getitem__(self, index):
18
- return ""
19
-
20
- def __str__(self):
21
- return "<<PlaceholderAnswer>>"
22
-
23
- def __repr__(self):
24
- return "<<PlaceholderAnswer>>"
25
-
26
-
27
- def get_jinja2_variables(template_str: str) -> Set[str]:
28
- """
29
- Extracts all variable names from a Jinja2 template using Jinja2's built-in parsing.
30
-
31
- Args:
32
- template_str (str): The Jinja2 template string
33
-
34
- Returns:
35
- Set[str]: A set of variable names found in the template
36
- """
37
- env = Environment()
38
- ast = env.parse(template_str)
39
- return meta.find_undeclared_variables(ast)
40
-
41
-
42
- class PromptConstructor:
43
- """
44
- The pieces of a prompt are:
45
- - The agent instructions - "You are answering questions as if you were a human. Do not break character."
46
- - The persona prompt - "You are an agent with the following persona: {'age': 22, 'hair': 'brown', 'height': 5.5}"
47
- - The question instructions - "You are being asked the following question: Do you like school? The options are 0: yes 1: no Return a valid JSON formatted like this, selecting only the number of the option: {"answer": <put answer code here>, "comment": "<put explanation here>"} Only 1 option may be selected."
48
- - The memory prompt - "Before the question you are now answering, you already answered the following question(s): Question: Do you like school? Answer: Prior answer"
49
-
50
- This is mixed into the Invigilator class.
51
- """
52
-
53
- def __init__(self, invigilator, prompt_plan: Optional["PromptPlan"] = None):
54
- self.invigilator = invigilator
55
- self.agent = invigilator.agent
56
- self.question = invigilator.question
57
- self.scenario = invigilator.scenario
58
- self.survey = invigilator.survey
59
- self.model = invigilator.model
60
- self.current_answers = invigilator.current_answers
61
- self.memory_plan = invigilator.memory_plan
62
- self.prompt_plan = prompt_plan or PromptPlan()
63
-
64
- @property
65
- def scenario_file_keys(self) -> list:
66
- """We need to find all the keys in the scenario that refer to FileStore objects.
67
- These will be used to append to the prompt a list of files that are part of the scenario.
68
- """
69
- from edsl.scenarios.FileStore import FileStore
70
-
71
- file_entries = []
72
- for key, value in self.scenario.items():
73
- if isinstance(value, FileStore):
74
- file_entries.append(key)
75
- return file_entries
76
-
77
- @property
78
- def agent_instructions_prompt(self) -> Prompt:
79
- """
80
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
81
- >>> i = InvigilatorBase.example()
82
- >>> i.prompt_constructor.agent_instructions_prompt
83
- Prompt(text=\"""You are answering questions as if you were a human. Do not break character.\""")
84
- """
85
- from edsl import Agent
86
-
87
- if self.agent == Agent(): # if agent is empty, then return an empty prompt
88
- return Prompt(text="")
89
-
90
- return Prompt(text=self.agent.instruction)
91
-
92
- @property
93
- def agent_persona_prompt(self) -> Prompt:
94
- """
95
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
96
- >>> i = InvigilatorBase.example()
97
- >>> i.prompt_constructor.agent_persona_prompt
98
- Prompt(text=\"""Your traits: {'age': 22, 'hair': 'brown', 'height': 5.5}\""")
99
- """
100
- from edsl import Agent
101
-
102
- if self.agent == Agent(): # if agent is empty, then return an empty prompt
103
- return Prompt(text="")
104
-
105
- return self.agent.prompt()
106
-
107
- def prior_answers_dict(self) -> dict:
108
- # this is all questions
109
- d = self.survey.question_names_to_questions()
110
- # This attaches the answer to the question
111
- for question in d:
112
- if question in self.current_answers:
113
- d[question].answer = self.current_answers[question]
114
- else:
115
- d[question].answer = PlaceholderAnswer()
116
-
117
- # if (new_question := question.split("_comment")[0]) in d:
118
- # d[new_question].comment = answer
119
- # d[question].answer = PlaceholderAnswer()
120
-
121
- # breakpoint()
122
- return d
123
-
124
- @property
125
- def question_file_keys(self):
126
- raw_question_text = self.question.question_text
127
- variables = get_jinja2_variables(raw_question_text)
128
- question_file_keys = []
129
- for var in variables:
130
- if var in self.scenario_file_keys:
131
- question_file_keys.append(var)
132
- return question_file_keys
133
-
134
- def build_replacement_dict(self, question_data: dict):
135
- """
136
- Builds a dictionary of replacement values by combining multiple data sources.
137
- """
138
- # File references dictionary
139
- file_refs = {key: f"<see file {key}>" for key in self.scenario_file_keys}
140
-
141
- # Scenario items excluding file keys
142
- scenario_items = {
143
- k: v for k, v in self.scenario.items() if k not in self.scenario_file_keys
144
- }
145
-
146
- # Question settings with defaults
147
- question_settings = {
148
- "use_code": getattr(self.question, "_use_code", True),
149
- "include_comment": getattr(self.question, "_include_comment", False),
150
- }
151
-
152
- # Combine all dictionaries using dict.update() for clarity
153
- replacement_dict = {}
154
- for d in [
155
- file_refs,
156
- question_data,
157
- scenario_items,
158
- self.prior_answers_dict(),
159
- {"agent": self.agent},
160
- question_settings,
161
- ]:
162
- replacement_dict.update(d)
163
-
164
- return replacement_dict
165
-
166
- def _get_question_options(self, question_data):
167
- question_options_entry = question_data.get("question_options", None)
168
- question_options = question_options_entry
169
-
170
- placeholder = ["<< Option 1 - Placholder >>", "<< Option 2 - Placholder >>"]
171
-
172
- if isinstance(question_options_entry, str):
173
- env = Environment()
174
- parsed_content = env.parse(question_options_entry)
175
- question_option_key = list(meta.find_undeclared_variables(parsed_content))[
176
- 0
177
- ]
178
- if isinstance(self.scenario.get(question_option_key), list):
179
- question_options = self.scenario.get(question_option_key)
180
-
181
- # might be getting it from the prior answers
182
- if self.prior_answers_dict().get(question_option_key) is not None:
183
- prior_question = self.prior_answers_dict().get(question_option_key)
184
- if hasattr(prior_question, "answer"):
185
- if isinstance(prior_question.answer, list):
186
- question_options = prior_question.answer
187
- else:
188
- question_options = placeholder
189
- else:
190
- question_options = placeholder
191
-
192
- return question_options
193
-
194
- def build_question_instructions_prompt(self):
195
- """Buils the question instructions prompt."""
196
-
197
- question_prompt = Prompt(self.question.get_instructions(model=self.model.model))
198
-
199
- # Get the data for the question - this is a dictionary of the question data
200
- # e.g., {'question_text': 'Do you like school?', 'question_name': 'q0', 'question_options': ['yes', 'no']}
201
- question_data = self.question.data.copy()
202
-
203
- if "question_options" in question_data:
204
- question_options = self._get_question_options(question_data)
205
- question_data["question_options"] = question_options
206
-
207
- # check to see if the question_options is actually a string
208
- # This is used when the user is using the question_options as a variable from a scenario
209
- # if "question_options" in question_data:
210
- replacement_dict = self.build_replacement_dict(question_data)
211
- rendered_instructions = question_prompt.render(replacement_dict)
212
-
213
- # is there anything left to render?
214
- undefined_template_variables = (
215
- rendered_instructions.undefined_template_variables({})
216
- )
217
-
218
- # Check if it's the name of a question in the survey
219
- for question_name in self.survey.question_names:
220
- if question_name in undefined_template_variables:
221
- print(
222
- "Question name found in undefined_template_variables: ",
223
- question_name,
224
- )
225
-
226
- if undefined_template_variables:
227
- msg = f"Question instructions still has variables: {undefined_template_variables}."
228
- import warnings
229
-
230
- warnings.warn(msg)
231
- # raise QuestionScenarioRenderError(
232
- # f"Question instructions still has variables: {undefined_template_variables}."
233
- # )
234
-
235
- # Check if question has instructions - these are instructions in a Survey that can apply to multiple follow-on questions
236
- relevant_instructions = self.survey.relevant_instructions(
237
- self.question.question_name
238
- )
239
-
240
- if relevant_instructions != []:
241
- # preamble_text = Prompt(
242
- # text="You were given the following instructions: "
243
- # )
244
- preamble_text = Prompt(text="")
245
- for instruction in relevant_instructions:
246
- preamble_text += instruction.text
247
- rendered_instructions = preamble_text + rendered_instructions
248
-
249
- return rendered_instructions
250
-
251
- @property
252
- def question_instructions_prompt(self) -> Prompt:
253
- """
254
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
255
- >>> i = InvigilatorBase.example()
256
- >>> i.prompt_constructor.question_instructions_prompt
257
- Prompt(text=\"""...
258
- ...
259
- """
260
- if not hasattr(self, "_question_instructions_prompt"):
261
- self._question_instructions_prompt = (
262
- self.build_question_instructions_prompt()
263
- )
264
-
265
- return self._question_instructions_prompt
266
-
267
- @property
268
- def prior_question_memory_prompt(self) -> Prompt:
269
- if not hasattr(self, "_prior_question_memory_prompt"):
270
- from edsl.prompts.Prompt import Prompt
271
-
272
- memory_prompt = Prompt(text="")
273
- if self.memory_plan is not None:
274
- memory_prompt += self.create_memory_prompt(
275
- self.question.question_name
276
- ).render(self.scenario | self.prior_answers_dict())
277
- self._prior_question_memory_prompt = memory_prompt
278
- return self._prior_question_memory_prompt
279
-
280
- def create_memory_prompt(self, question_name: str) -> Prompt:
281
- """Create a memory for the agent.
282
-
283
- The returns a memory prompt for the agent.
284
-
285
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
286
- >>> i = InvigilatorBase.example()
287
- >>> i.current_answers = {"q0": "Prior answer"}
288
- >>> i.memory_plan.add_single_memory("q1", "q0")
289
- >>> p = i.prompt_constructor.create_memory_prompt("q1")
290
- >>> p.text.strip().replace("\\n", " ").replace("\\t", " ")
291
- 'Before the question you are now answering, you already answered the following question(s): Question: Do you like school? Answer: Prior answer'
292
- """
293
- return self.memory_plan.get_memory_prompt_fragment(
294
- question_name, self.current_answers
295
- )
296
-
297
- def construct_system_prompt(self) -> Prompt:
298
- """Construct the system prompt for the LLM call."""
299
- import warnings
300
-
301
- warnings.warn(
302
- "This method is deprecated. Use get_prompts instead.", DeprecationWarning
303
- )
304
- return self.get_prompts()["system_prompt"]
305
-
306
- def construct_user_prompt(self) -> Prompt:
307
- """Construct the user prompt for the LLM call."""
308
- import warnings
309
-
310
- warnings.warn(
311
- "This method is deprecated. Use get_prompts instead.", DeprecationWarning
312
- )
313
- return self.get_prompts()["user_prompt"]
314
-
315
- def get_prompts(self) -> Dict[str, Prompt]:
316
- """Get both prompts for the LLM call.
317
-
318
- >>> from edsl import QuestionFreeText
319
- >>> from edsl.agents.InvigilatorBase import InvigilatorBase
320
- >>> q = QuestionFreeText(question_text="How are you today?", question_name="q_new")
321
- >>> i = InvigilatorBase.example(question = q)
322
- >>> i.get_prompts()
323
- {'user_prompt': ..., 'system_prompt': ...}
324
- """
325
- # breakpoint()
326
- prompts = self.prompt_plan.get_prompts(
327
- agent_instructions=self.agent_instructions_prompt,
328
- agent_persona=self.agent_persona_prompt,
329
- question_instructions=Prompt(self.question_instructions_prompt),
330
- prior_question_memory=self.prior_question_memory_prompt,
331
- )
332
- if self.question_file_keys:
333
- files_list = []
334
- for key in self.question_file_keys:
335
- files_list.append(self.scenario[key])
336
- prompts["files_list"] = files_list
337
- return prompts
338
-
339
- def _get_scenario_with_image(self) -> Scenario:
340
- """This is a helper function to get a scenario with an image, for testing purposes."""
341
- from edsl import Scenario
342
-
343
- try:
344
- scenario = Scenario.from_image("../../static/logo.png")
345
- except FileNotFoundError:
346
- scenario = Scenario.from_image("static/logo.png")
347
- return scenario
348
-
349
-
350
- if __name__ == "__main__":
351
- import doctest
352
-
353
- doctest.testmod(optionflags=doctest.ELLIPSIS)
1
+ from __future__ import annotations
2
+ from typing import Dict, Any, Optional, Set
3
+
4
+ from jinja2 import Environment, meta
5
+
6
+ from edsl.prompts.Prompt import Prompt
7
+ from edsl.agents.prompt_helpers import PromptPlan
8
+
9
+
10
+ class PlaceholderAnswer:
11
+ """A placeholder answer for when a question is not yet answered."""
12
+
13
+ def __init__(self):
14
+ self.answer = "N/A"
15
+ self.comment = "Will be populated by prior answer"
16
+
17
+ def __getitem__(self, index):
18
+ return ""
19
+
20
+ def __str__(self):
21
+ return "<<PlaceholderAnswer>>"
22
+
23
+ def __repr__(self):
24
+ return "<<PlaceholderAnswer>>"
25
+
26
+
27
+ def get_jinja2_variables(template_str: str) -> Set[str]:
28
+ """
29
+ Extracts all variable names from a Jinja2 template using Jinja2's built-in parsing.
30
+
31
+ Args:
32
+ template_str (str): The Jinja2 template string
33
+
34
+ Returns:
35
+ Set[str]: A set of variable names found in the template
36
+ """
37
+ env = Environment()
38
+ ast = env.parse(template_str)
39
+ return meta.find_undeclared_variables(ast)
40
+
41
+
42
+ class PromptConstructor:
43
+ """
44
+ The pieces of a prompt are:
45
+ - The agent instructions - "You are answering questions as if you were a human. Do not break character."
46
+ - The persona prompt - "You are an agent with the following persona: {'age': 22, 'hair': 'brown', 'height': 5.5}"
47
+ - The question instructions - "You are being asked the following question: Do you like school? The options are 0: yes 1: no Return a valid JSON formatted like this, selecting only the number of the option: {"answer": <put answer code here>, "comment": "<put explanation here>"} Only 1 option may be selected."
48
+ - The memory prompt - "Before the question you are now answering, you already answered the following question(s): Question: Do you like school? Answer: Prior answer"
49
+
50
+ This is mixed into the Invigilator class.
51
+ """
52
+
53
+ def __init__(self, invigilator, prompt_plan: Optional["PromptPlan"] = None):
54
+ self.invigilator = invigilator
55
+ self.agent = invigilator.agent
56
+ self.question = invigilator.question
57
+ self.scenario = invigilator.scenario
58
+ self.survey = invigilator.survey
59
+ self.model = invigilator.model
60
+ self.current_answers = invigilator.current_answers
61
+ self.memory_plan = invigilator.memory_plan
62
+ self.prompt_plan = prompt_plan or PromptPlan()
63
+
64
+ @property
65
+ def scenario_file_keys(self) -> list:
66
+ """We need to find all the keys in the scenario that refer to FileStore objects.
67
+ These will be used to append to the prompt a list of files that are part of the scenario.
68
+ """
69
+ from edsl.scenarios.FileStore import FileStore
70
+
71
+ file_entries = []
72
+ for key, value in self.scenario.items():
73
+ if isinstance(value, FileStore):
74
+ file_entries.append(key)
75
+ return file_entries
76
+
77
+ @property
78
+ def agent_instructions_prompt(self) -> Prompt:
79
+ """
80
+ >>> from edsl.agents.InvigilatorBase import InvigilatorBase
81
+ >>> i = InvigilatorBase.example()
82
+ >>> i.prompt_constructor.agent_instructions_prompt
83
+ Prompt(text=\"""You are answering questions as if you were a human. Do not break character.\""")
84
+ """
85
+ from edsl import Agent
86
+
87
+ if self.agent == Agent(): # if agent is empty, then return an empty prompt
88
+ return Prompt(text="")
89
+
90
+ return Prompt(text=self.agent.instruction)
91
+
92
+ @property
93
+ def agent_persona_prompt(self) -> Prompt:
94
+ """
95
+ >>> from edsl.agents.InvigilatorBase import InvigilatorBase
96
+ >>> i = InvigilatorBase.example()
97
+ >>> i.prompt_constructor.agent_persona_prompt
98
+ Prompt(text=\"""Your traits: {'age': 22, 'hair': 'brown', 'height': 5.5}\""")
99
+ """
100
+ from edsl import Agent
101
+
102
+ if self.agent == Agent(): # if agent is empty, then return an empty prompt
103
+ return Prompt(text="")
104
+
105
+ return self.agent.prompt()
106
+
107
+ def prior_answers_dict(self) -> dict:
108
+ # this is all questions
109
+ d = self.survey.question_names_to_questions()
110
+ # This attaches the answer to the question
111
+ for question in d:
112
+ if question in self.current_answers:
113
+ d[question].answer = self.current_answers[question]
114
+ else:
115
+ d[question].answer = PlaceholderAnswer()
116
+
117
+ # if (new_question := question.split("_comment")[0]) in d:
118
+ # d[new_question].comment = answer
119
+ # d[question].answer = PlaceholderAnswer()
120
+
121
+ # breakpoint()
122
+ return d
123
+
124
+ @property
125
+ def question_file_keys(self):
126
+ raw_question_text = self.question.question_text
127
+ variables = get_jinja2_variables(raw_question_text)
128
+ question_file_keys = []
129
+ for var in variables:
130
+ if var in self.scenario_file_keys:
131
+ question_file_keys.append(var)
132
+ return question_file_keys
133
+
134
def build_replacement_dict(self, question_data: dict):
    """
    Merge every source of template values into a single replacement dictionary.

    Sources are applied in the order below; on a key collision the later
    source wins:

    1. a ``"<see file KEY>"`` placeholder for each key in ``self.scenario_file_keys``
    2. ``question_data``
    3. the items of ``self.scenario`` whose key is not a scenario file key
    4. ``self.prior_answers_dict()``
    5. ``"agent"`` -> ``self.agent``
    6. ``"use_code"`` / ``"include_comment"``, read from the question's
       ``_use_code`` / ``_include_comment`` attributes (defaults ``True`` / ``False``)
    """
    # Start from the file placeholders so everything after can override them.
    merged = {key: f"<see file {key}>" for key in self.scenario_file_keys}
    merged.update(question_data)
    merged.update(
        (key, value)
        for key, value in self.scenario.items()
        if key not in self.scenario_file_keys
    )
    merged.update(self.prior_answers_dict())
    merged["agent"] = self.agent
    merged["use_code"] = getattr(self.question, "_use_code", True)
    merged["include_comment"] = getattr(self.question, "_include_comment", False)
    return merged
165
+
166
+ def _get_question_options(self, question_data):
167
+ question_options_entry = question_data.get("question_options", None)
168
+ question_options = question_options_entry
169
+
170
+ placeholder = ["<< Option 1 - Placholder >>", "<< Option 2 - Placholder >>"]
171
+
172
+ if isinstance(question_options_entry, str):
173
+ env = Environment()
174
+ parsed_content = env.parse(question_options_entry)
175
+ question_option_key = list(meta.find_undeclared_variables(parsed_content))[
176
+ 0
177
+ ]
178
+ if isinstance(self.scenario.get(question_option_key), list):
179
+ question_options = self.scenario.get(question_option_key)
180
+
181
+ # might be getting it from the prior answers
182
+ if self.prior_answers_dict().get(question_option_key) is not None:
183
+ prior_question = self.prior_answers_dict().get(question_option_key)
184
+ if hasattr(prior_question, "answer"):
185
+ if isinstance(prior_question.answer, list):
186
+ question_options = prior_question.answer
187
+ else:
188
+ question_options = placeholder
189
+ else:
190
+ question_options = placeholder
191
+
192
+ return question_options
193
+
194
def build_question_instructions_prompt(self):
    """Build the rendered question-instructions prompt.

    Steps:

    1. wrap the question's instructions for the current model in a ``Prompt``;
    2. copy the question data and, when it has ``"question_options"``,
       replace them with the result of ``_get_question_options``;
    3. render the prompt with ``build_replacement_dict(question_data)``;
    4. report template variables that are still undefined (a line is printed
       for each one that is a survey question name, and one warning is
       issued listing all of them);
    5. prepend the text of any survey instructions relevant to this question.
    """
    import warnings

    instructions_template = Prompt(
        self.question.get_instructions(model=self.model.model)
    )

    # Question data is a plain dict, e.g.
    # {'question_text': 'Do you like school?', 'question_name': 'q0', 'question_options': ['yes', 'no']}
    question_data = self.question.data.copy()

    # The options may be a string naming a scenario variable or an earlier
    # question; swap in the concrete options before rendering.
    if "question_options" in question_data:
        question_data["question_options"] = self._get_question_options(question_data)

    rendered_instructions = instructions_template.render(
        self.build_replacement_dict(question_data)
    )

    # Is there anything left to render?
    leftover_variables = rendered_instructions.undefined_template_variables({})

    # Flag leftovers that are names of questions in the survey.
    for question_name in self.survey.question_names:
        if question_name in leftover_variables:
            print(
                "Question name found in undefined_template_variables: ",
                question_name,
            )

    if leftover_variables:
        warnings.warn(
            f"Question instructions still has variables: {leftover_variables}."
        )

    # Survey-level instructions can apply to several follow-on questions.
    relevant_instructions = self.survey.relevant_instructions(
        self.question.question_name
    )

    if relevant_instructions != []:
        preamble_text = Prompt(text="")
        for instruction in relevant_instructions:
            preamble_text += instruction.text
        rendered_instructions = preamble_text + rendered_instructions

    return rendered_instructions
250
+
251
@property
def question_instructions_prompt(self) -> Prompt:
    """
    Return the question-instructions prompt, building it on first access.

    The result of ``build_question_instructions_prompt()`` is stored on the
    instance as ``_question_instructions_prompt`` and reused afterwards.

    >>> from edsl.agents.InvigilatorBase import InvigilatorBase
    >>> i = InvigilatorBase.example()
    >>> i.prompt_constructor.question_instructions_prompt
    Prompt(text=\"""...
    ...
    """
    if hasattr(self, "_question_instructions_prompt"):
        return self._question_instructions_prompt

    built_prompt = self.build_question_instructions_prompt()
    self._question_instructions_prompt = built_prompt
    return self._question_instructions_prompt
266
+
267
@property
def prior_question_memory_prompt(self) -> Prompt:
    """Return the prompt describing prior questions, building it on first access.

    The prompt starts empty. When ``self.memory_plan`` is not ``None``, the
    memory prompt for the current question is rendered with the scenario
    merged with ``prior_answers_dict()`` and appended. The result is stored
    on the instance as ``_prior_question_memory_prompt`` and reused.
    """
    if hasattr(self, "_prior_question_memory_prompt"):
        return self._prior_question_memory_prompt

    from edsl.prompts.Prompt import Prompt

    memory_prompt = Prompt(text="")
    if self.memory_plan is not None:
        memory_fragment = self.create_memory_prompt(self.question.question_name)
        memory_prompt += memory_fragment.render(
            self.scenario | self.prior_answers_dict()
        )
    self._prior_question_memory_prompt = memory_prompt
    return self._prior_question_memory_prompt
279
+
280
def create_memory_prompt(self, question_name: str) -> Prompt:
    """Create a memory for the agent.

    This returns the memory prompt fragment that ``self.memory_plan`` produces
    for ``question_name`` given ``self.current_answers``.

    >>> from edsl.agents.InvigilatorBase import InvigilatorBase
    >>> i = InvigilatorBase.example()
    >>> i.current_answers = {"q0": "Prior answer"}
    >>> i.memory_plan.add_single_memory("q1", "q0")
    >>> p = i.prompt_constructor.create_memory_prompt("q1")
    >>> p.text.strip().replace("\\n", " ").replace("\\t", " ")
    'Before the question you are now answering, you already answered the following question(s): Question: Do you like school? Answer: Prior answer'
    """
    fragment_for = self.memory_plan.get_memory_prompt_fragment
    return fragment_for(question_name, self.current_answers)
296
+
297
def construct_system_prompt(self) -> Prompt:
    """Construct the system prompt for the LLM call.

    Deprecated: emits a ``DeprecationWarning`` and returns
    ``self.get_prompts()["system_prompt"]``. Use ``get_prompts`` instead.
    """
    import warnings

    warnings.warn(
        "This method is deprecated. Use get_prompts instead.",
        DeprecationWarning,
        # Attribute the warning to the caller's line, not to this wrapper,
        # so users can find the deprecated call site.
        stacklevel=2,
    )
    return self.get_prompts()["system_prompt"]
305
+
306
def construct_user_prompt(self) -> Prompt:
    """Construct the user prompt for the LLM call.

    Deprecated: emits a ``DeprecationWarning`` and returns
    ``self.get_prompts()["user_prompt"]``. Use ``get_prompts`` instead.
    """
    import warnings

    warnings.warn(
        "This method is deprecated. Use get_prompts instead.",
        DeprecationWarning,
        # Attribute the warning to the caller's line, not to this wrapper,
        # so users can find the deprecated call site.
        stacklevel=2,
    )
    return self.get_prompts()["user_prompt"]
314
+
315
def get_prompts(self) -> Dict[str, Prompt]:
    """Get both prompts for the LLM call.

    The four prompt components (agent instructions, agent persona, question
    instructions, prior-question memory) are handed to
    ``self.prompt_plan.get_prompts``. When the question text references
    scenario file keys, the matching scenario values are added to the result
    under ``"files_list"``.

    >>> from edsl import QuestionFreeText
    >>> from edsl.agents.InvigilatorBase import InvigilatorBase
    >>> q = QuestionFreeText(question_text="How are you today?", question_name="q_new")
    >>> i = InvigilatorBase.example(question = q)
    >>> i.get_prompts()
    {'user_prompt': ..., 'system_prompt': ...}
    """
    assemble = self.prompt_plan.get_prompts
    prompts = assemble(
        agent_instructions=self.agent_instructions_prompt,
        agent_persona=self.agent_persona_prompt,
        question_instructions=Prompt(self.question_instructions_prompt),
        prior_question_memory=self.prior_question_memory_prompt,
    )
    if self.question_file_keys:
        prompts["files_list"] = [
            self.scenario[key] for key in self.question_file_keys
        ]
    return prompts
338
+
339
def _get_scenario_with_image(self) -> Scenario:
    """This is a helper function to get a scenario with an image, for testing purposes.

    The logo is loaded from ``../../static/logo.png``; if that file is not
    found, ``static/logo.png`` is tried instead. Both paths are relative, so
    the outcome depends on the current working directory.
    """
    from edsl import Scenario

    try:
        return Scenario.from_image("../../static/logo.png")
    except FileNotFoundError:
        return Scenario.from_image("static/logo.png")
348
+
349
+
350
if __name__ == "__main__":
    # Run this module's doctests when executed as a script. ELLIPSIS lets
    # "..." in the expected output stand for arbitrary text.
    from doctest import ELLIPSIS, testmod

    testmod(optionflags=ELLIPSIS)