edsl 0.1.37.dev6__py3-none-any.whl → 0.1.38__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (271) hide show
  1. edsl/Base.py +332 -303
  2. edsl/BaseDiff.py +260 -260
  3. edsl/TemplateLoader.py +24 -24
  4. edsl/__init__.py +49 -48
  5. edsl/__version__.py +1 -1
  6. edsl/agents/Agent.py +867 -855
  7. edsl/agents/AgentList.py +413 -350
  8. edsl/agents/Invigilator.py +233 -222
  9. edsl/agents/InvigilatorBase.py +265 -284
  10. edsl/agents/PromptConstructor.py +354 -353
  11. edsl/agents/__init__.py +3 -3
  12. edsl/agents/descriptors.py +99 -99
  13. edsl/agents/prompt_helpers.py +129 -129
  14. edsl/auto/AutoStudy.py +117 -117
  15. edsl/auto/StageBase.py +230 -230
  16. edsl/auto/StageGenerateSurvey.py +178 -178
  17. edsl/auto/StageLabelQuestions.py +125 -125
  18. edsl/auto/StagePersona.py +61 -61
  19. edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
  20. edsl/auto/StagePersonaDimensionValues.py +74 -74
  21. edsl/auto/StagePersonaDimensions.py +69 -69
  22. edsl/auto/StageQuestions.py +73 -73
  23. edsl/auto/SurveyCreatorPipeline.py +21 -21
  24. edsl/auto/utilities.py +224 -224
  25. edsl/base/Base.py +279 -289
  26. edsl/config.py +157 -149
  27. edsl/conversation/Conversation.py +290 -290
  28. edsl/conversation/car_buying.py +58 -58
  29. edsl/conversation/chips.py +95 -95
  30. edsl/conversation/mug_negotiation.py +81 -81
  31. edsl/conversation/next_speaker_utilities.py +93 -93
  32. edsl/coop/PriceFetcher.py +54 -54
  33. edsl/coop/__init__.py +2 -2
  34. edsl/coop/coop.py +1028 -958
  35. edsl/coop/utils.py +131 -131
  36. edsl/data/Cache.py +555 -527
  37. edsl/data/CacheEntry.py +233 -228
  38. edsl/data/CacheHandler.py +149 -149
  39. edsl/data/RemoteCacheSync.py +78 -97
  40. edsl/data/SQLiteDict.py +292 -292
  41. edsl/data/__init__.py +4 -4
  42. edsl/data/orm.py +10 -10
  43. edsl/data_transfer_models.py +73 -73
  44. edsl/enums.py +175 -173
  45. edsl/exceptions/BaseException.py +21 -21
  46. edsl/exceptions/__init__.py +54 -54
  47. edsl/exceptions/agents.py +42 -38
  48. edsl/exceptions/cache.py +5 -0
  49. edsl/exceptions/configuration.py +16 -16
  50. edsl/exceptions/coop.py +10 -10
  51. edsl/exceptions/data.py +14 -14
  52. edsl/exceptions/general.py +34 -34
  53. edsl/exceptions/jobs.py +33 -33
  54. edsl/exceptions/language_models.py +63 -63
  55. edsl/exceptions/prompts.py +15 -15
  56. edsl/exceptions/questions.py +91 -91
  57. edsl/exceptions/results.py +29 -29
  58. edsl/exceptions/scenarios.py +22 -22
  59. edsl/exceptions/surveys.py +37 -37
  60. edsl/inference_services/AnthropicService.py +87 -87
  61. edsl/inference_services/AwsBedrock.py +120 -120
  62. edsl/inference_services/AzureAI.py +217 -217
  63. edsl/inference_services/DeepInfraService.py +18 -18
  64. edsl/inference_services/GoogleService.py +148 -156
  65. edsl/inference_services/GroqService.py +20 -20
  66. edsl/inference_services/InferenceServiceABC.py +147 -147
  67. edsl/inference_services/InferenceServicesCollection.py +97 -97
  68. edsl/inference_services/MistralAIService.py +123 -123
  69. edsl/inference_services/OllamaService.py +18 -18
  70. edsl/inference_services/OpenAIService.py +224 -224
  71. edsl/inference_services/PerplexityService.py +163 -0
  72. edsl/inference_services/TestService.py +89 -89
  73. edsl/inference_services/TogetherAIService.py +170 -170
  74. edsl/inference_services/models_available_cache.py +118 -118
  75. edsl/inference_services/rate_limits_cache.py +25 -25
  76. edsl/inference_services/registry.py +41 -39
  77. edsl/inference_services/write_available.py +10 -10
  78. edsl/jobs/Answers.py +56 -56
  79. edsl/jobs/Jobs.py +898 -1347
  80. edsl/jobs/JobsChecks.py +147 -0
  81. edsl/jobs/JobsPrompts.py +268 -0
  82. edsl/jobs/JobsRemoteInferenceHandler.py +239 -0
  83. edsl/jobs/__init__.py +1 -1
  84. edsl/jobs/buckets/BucketCollection.py +63 -63
  85. edsl/jobs/buckets/ModelBuckets.py +65 -65
  86. edsl/jobs/buckets/TokenBucket.py +251 -248
  87. edsl/jobs/interviews/Interview.py +661 -661
  88. edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
  89. edsl/jobs/interviews/InterviewExceptionEntry.py +186 -186
  90. edsl/jobs/interviews/InterviewStatistic.py +63 -63
  91. edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
  92. edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
  93. edsl/jobs/interviews/InterviewStatusLog.py +92 -92
  94. edsl/jobs/interviews/ReportErrors.py +66 -66
  95. edsl/jobs/interviews/interview_status_enum.py +9 -9
  96. edsl/jobs/runners/JobsRunnerAsyncio.py +466 -338
  97. edsl/jobs/runners/JobsRunnerStatus.py +330 -332
  98. edsl/jobs/tasks/QuestionTaskCreator.py +242 -242
  99. edsl/jobs/tasks/TaskCreators.py +64 -64
  100. edsl/jobs/tasks/TaskHistory.py +450 -442
  101. edsl/jobs/tasks/TaskStatusLog.py +23 -23
  102. edsl/jobs/tasks/task_status_enum.py +163 -163
  103. edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
  104. edsl/jobs/tokens/TokenUsage.py +34 -34
  105. edsl/language_models/KeyLookup.py +30 -30
  106. edsl/language_models/LanguageModel.py +668 -706
  107. edsl/language_models/ModelList.py +155 -102
  108. edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
  109. edsl/language_models/__init__.py +3 -3
  110. edsl/language_models/fake_openai_call.py +15 -15
  111. edsl/language_models/fake_openai_service.py +61 -61
  112. edsl/language_models/registry.py +190 -137
  113. edsl/language_models/repair.py +156 -156
  114. edsl/language_models/unused/ReplicateBase.py +83 -83
  115. edsl/language_models/utilities.py +64 -64
  116. edsl/notebooks/Notebook.py +258 -259
  117. edsl/notebooks/__init__.py +1 -1
  118. edsl/prompts/Prompt.py +362 -357
  119. edsl/prompts/__init__.py +2 -2
  120. edsl/questions/AnswerValidatorMixin.py +289 -289
  121. edsl/questions/QuestionBase.py +664 -656
  122. edsl/questions/QuestionBaseGenMixin.py +161 -161
  123. edsl/questions/QuestionBasePromptsMixin.py +217 -234
  124. edsl/questions/QuestionBudget.py +227 -227
  125. edsl/questions/QuestionCheckBox.py +359 -359
  126. edsl/questions/QuestionExtract.py +182 -183
  127. edsl/questions/QuestionFreeText.py +114 -114
  128. edsl/questions/QuestionFunctional.py +166 -159
  129. edsl/questions/QuestionList.py +231 -231
  130. edsl/questions/QuestionMultipleChoice.py +286 -286
  131. edsl/questions/QuestionNumerical.py +153 -153
  132. edsl/questions/QuestionRank.py +324 -324
  133. edsl/questions/Quick.py +41 -41
  134. edsl/questions/RegisterQuestionsMeta.py +71 -71
  135. edsl/questions/ResponseValidatorABC.py +174 -174
  136. edsl/questions/SimpleAskMixin.py +73 -73
  137. edsl/questions/__init__.py +26 -26
  138. edsl/questions/compose_questions.py +98 -98
  139. edsl/questions/decorators.py +21 -21
  140. edsl/questions/derived/QuestionLikertFive.py +76 -76
  141. edsl/questions/derived/QuestionLinearScale.py +87 -87
  142. edsl/questions/derived/QuestionTopK.py +93 -91
  143. edsl/questions/derived/QuestionYesNo.py +82 -82
  144. edsl/questions/descriptors.py +413 -413
  145. edsl/questions/prompt_templates/question_budget.jinja +13 -13
  146. edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
  147. edsl/questions/prompt_templates/question_extract.jinja +11 -11
  148. edsl/questions/prompt_templates/question_free_text.jinja +3 -3
  149. edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
  150. edsl/questions/prompt_templates/question_list.jinja +17 -17
  151. edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
  152. edsl/questions/prompt_templates/question_numerical.jinja +36 -36
  153. edsl/questions/question_registry.py +177 -147
  154. edsl/questions/settings.py +12 -12
  155. edsl/questions/templates/budget/answering_instructions.jinja +7 -7
  156. edsl/questions/templates/budget/question_presentation.jinja +7 -7
  157. edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
  158. edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
  159. edsl/questions/templates/extract/answering_instructions.jinja +7 -7
  160. edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
  161. edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
  162. edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
  163. edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
  164. edsl/questions/templates/list/answering_instructions.jinja +3 -3
  165. edsl/questions/templates/list/question_presentation.jinja +5 -5
  166. edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
  167. edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
  168. edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
  169. edsl/questions/templates/numerical/question_presentation.jinja +6 -6
  170. edsl/questions/templates/rank/answering_instructions.jinja +11 -11
  171. edsl/questions/templates/rank/question_presentation.jinja +15 -15
  172. edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
  173. edsl/questions/templates/top_k/question_presentation.jinja +22 -22
  174. edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
  175. edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
  176. edsl/results/CSSParameterizer.py +108 -0
  177. edsl/results/Dataset.py +424 -293
  178. edsl/results/DatasetExportMixin.py +731 -717
  179. edsl/results/DatasetTree.py +275 -145
  180. edsl/results/Result.py +465 -450
  181. edsl/results/Results.py +1165 -1071
  182. edsl/results/ResultsDBMixin.py +238 -238
  183. edsl/results/ResultsExportMixin.py +43 -43
  184. edsl/results/ResultsFetchMixin.py +33 -33
  185. edsl/results/ResultsGGMixin.py +121 -121
  186. edsl/results/ResultsToolsMixin.py +98 -98
  187. edsl/results/Selector.py +135 -135
  188. edsl/results/TableDisplay.py +198 -0
  189. edsl/results/__init__.py +2 -2
  190. edsl/results/table_display.css +78 -0
  191. edsl/results/tree_explore.py +115 -115
  192. edsl/scenarios/FileStore.py +632 -458
  193. edsl/scenarios/Scenario.py +601 -546
  194. edsl/scenarios/ScenarioHtmlMixin.py +64 -64
  195. edsl/scenarios/ScenarioJoin.py +127 -0
  196. edsl/scenarios/ScenarioList.py +1287 -1112
  197. edsl/scenarios/ScenarioListExportMixin.py +52 -52
  198. edsl/scenarios/ScenarioListPdfMixin.py +261 -261
  199. edsl/scenarios/__init__.py +4 -4
  200. edsl/shared.py +1 -1
  201. edsl/study/ObjectEntry.py +173 -173
  202. edsl/study/ProofOfWork.py +113 -113
  203. edsl/study/SnapShot.py +80 -80
  204. edsl/study/Study.py +528 -528
  205. edsl/study/__init__.py +4 -4
  206. edsl/surveys/DAG.py +148 -148
  207. edsl/surveys/Memory.py +31 -31
  208. edsl/surveys/MemoryPlan.py +244 -244
  209. edsl/surveys/Rule.py +326 -330
  210. edsl/surveys/RuleCollection.py +387 -387
  211. edsl/surveys/Survey.py +1801 -1795
  212. edsl/surveys/SurveyCSS.py +261 -261
  213. edsl/surveys/SurveyExportMixin.py +259 -259
  214. edsl/surveys/SurveyFlowVisualizationMixin.py +179 -121
  215. edsl/surveys/SurveyQualtricsImport.py +284 -284
  216. edsl/surveys/__init__.py +3 -3
  217. edsl/surveys/base.py +53 -53
  218. edsl/surveys/descriptors.py +56 -56
  219. edsl/surveys/instructions/ChangeInstruction.py +49 -47
  220. edsl/surveys/instructions/Instruction.py +65 -51
  221. edsl/surveys/instructions/InstructionCollection.py +77 -77
  222. edsl/templates/error_reporting/base.html +23 -23
  223. edsl/templates/error_reporting/exceptions_by_model.html +34 -34
  224. edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
  225. edsl/templates/error_reporting/exceptions_by_type.html +16 -16
  226. edsl/templates/error_reporting/interview_details.html +115 -115
  227. edsl/templates/error_reporting/interviews.html +19 -10
  228. edsl/templates/error_reporting/overview.html +4 -4
  229. edsl/templates/error_reporting/performance_plot.html +1 -1
  230. edsl/templates/error_reporting/report.css +73 -73
  231. edsl/templates/error_reporting/report.html +117 -117
  232. edsl/templates/error_reporting/report.js +25 -25
  233. edsl/tools/__init__.py +1 -1
  234. edsl/tools/clusters.py +192 -192
  235. edsl/tools/embeddings.py +27 -27
  236. edsl/tools/embeddings_plotting.py +118 -118
  237. edsl/tools/plotting.py +112 -112
  238. edsl/tools/summarize.py +18 -18
  239. edsl/utilities/SystemInfo.py +28 -28
  240. edsl/utilities/__init__.py +22 -22
  241. edsl/utilities/ast_utilities.py +25 -25
  242. edsl/utilities/data/Registry.py +6 -6
  243. edsl/utilities/data/__init__.py +1 -1
  244. edsl/utilities/data/scooter_results.json +1 -1
  245. edsl/utilities/decorators.py +77 -77
  246. edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
  247. edsl/utilities/interface.py +627 -627
  248. edsl/{conjure → utilities}/naming_utilities.py +263 -263
  249. edsl/utilities/repair_functions.py +28 -28
  250. edsl/utilities/restricted_python.py +70 -70
  251. edsl/utilities/utilities.py +424 -409
  252. {edsl-0.1.37.dev6.dist-info → edsl-0.1.38.dist-info}/LICENSE +21 -21
  253. {edsl-0.1.37.dev6.dist-info → edsl-0.1.38.dist-info}/METADATA +2 -1
  254. edsl-0.1.38.dist-info/RECORD +277 -0
  255. edsl/conjure/AgentConstructionMixin.py +0 -160
  256. edsl/conjure/Conjure.py +0 -62
  257. edsl/conjure/InputData.py +0 -659
  258. edsl/conjure/InputDataCSV.py +0 -48
  259. edsl/conjure/InputDataMixinQuestionStats.py +0 -182
  260. edsl/conjure/InputDataPyRead.py +0 -91
  261. edsl/conjure/InputDataSPSS.py +0 -8
  262. edsl/conjure/InputDataStata.py +0 -8
  263. edsl/conjure/QuestionOptionMixin.py +0 -76
  264. edsl/conjure/QuestionTypeMixin.py +0 -23
  265. edsl/conjure/RawQuestion.py +0 -65
  266. edsl/conjure/SurveyResponses.py +0 -7
  267. edsl/conjure/__init__.py +0 -9
  268. edsl/conjure/examples/placeholder.txt +0 -0
  269. edsl/conjure/utilities.py +0 -201
  270. edsl-0.1.37.dev6.dist-info/RECORD +0 -283
  271. {edsl-0.1.37.dev6.dist-info → edsl-0.1.38.dist-info}/WHEEL +0 -0
@@ -1,413 +1,413 @@
1
- """This module contains the descriptors used to validate the attributes of the question classes."""
2
-
3
- from abc import ABC, abstractmethod
4
- import re
5
- from typing import Any, Callable, List, Optional
6
- from edsl.exceptions import (
7
- QuestionCreationValidationError,
8
- QuestionAnswerValidationError,
9
- )
10
- from edsl.questions.settings import Settings
11
-
12
-
13
- ################################
14
- # Helper functions
15
- ################################
16
-
17
-
18
- def contains_single_braced_substring(s: str) -> bool:
19
- """Check if the string contains a substring in single braces."""
20
- pattern = r"(?<!\{)\{[^{}]+\}(?!\})"
21
- match = re.search(pattern, s)
22
- return bool(match)
23
-
24
-
25
- def is_number(value: Any) -> bool:
26
- """Check if an object is a number."""
27
- return isinstance(value, int) or isinstance(value, float)
28
-
29
-
30
- def is_number_or_none(value: Any) -> bool:
31
- """Check if an object is a number or None."""
32
- return value is None or is_number(value)
33
-
34
-
35
- ################################
36
- # Descriptor ABC
37
- ################################
38
-
39
-
40
- class BaseDescriptor(ABC):
41
- """ABC for something."""
42
-
43
- @abstractmethod
44
- def validate(self, value: Any) -> None:
45
- """Validate the value. If it is invalid, raises an exception. If it is valid, does nothing."""
46
- pass
47
-
48
- def __get__(self, instance, owner):
49
- """Get the value of the attribute."""
50
- if self.name not in instance.__dict__:
51
- return {}
52
- return instance.__dict__[self.name]
53
-
54
- def __set__(self, instance, value: Any) -> None:
55
- """Set the value of the attribute."""
56
- new_value = self.validate(value, instance)
57
-
58
- if new_value is not None:
59
- instance.__dict__[self.name] = new_value
60
- else:
61
- instance.__dict__[self.name] = value
62
-
63
- def __set_name__(self, owner, name: str) -> None:
64
- """Set the name of the attribute."""
65
- self.name = "_" + name
66
-
67
-
68
- ################################
69
- # General descriptors
70
- ################################
71
-
72
-
73
- class FunctionDescriptor(BaseDescriptor):
74
- """Validate that a value is a function."""
75
-
76
- def validate(self, value: Any, instance) -> Callable:
77
- """Validate the value is a function, and if so, returns it."""
78
- if not callable(value):
79
- raise QuestionCreationValidationError(
80
- f"Expected a function (got {value}).)"
81
- )
82
- return value
83
-
84
-
85
- class IntegerDescriptor(BaseDescriptor):
86
- """
87
- Validate that a value is an integer.
88
-
89
- - `none_allowed` is whether None is allowed as a value.
90
- """
91
-
92
- def __init__(self, none_allowed: bool = False):
93
- """Initialize the descriptor."""
94
- self.none_allowed = none_allowed
95
-
96
- def validate(self, value, instance):
97
- """Validate the value is an integer."""
98
- if self.none_allowed:
99
- if not (isinstance(value, int) or value is None):
100
- raise QuestionAnswerValidationError(
101
- f"Expected an integer or None (got {value})."
102
- )
103
- else:
104
- if not isinstance(value, int):
105
- raise QuestionAnswerValidationError(
106
- f"Expected an integer (got {value})."
107
- )
108
-
109
-
110
- class IntegerOrNoneDescriptor(BaseDescriptor):
111
- """Validate that a value is an integer or None."""
112
-
113
- def validate(self, value, instance):
114
- """Validate the value is an integer or None."""
115
- if not (isinstance(value, int) or value is None):
116
- raise QuestionCreationValidationError(
117
- f"Expected an integer or None (got {value})."
118
- )
119
-
120
-
121
- class NumericalOrNoneDescriptor(BaseDescriptor):
122
- """Validate that a value is a number or None."""
123
-
124
- def validate(self, value, instance):
125
- """Validate the value is a number or None."""
126
- if not is_number_or_none(value):
127
- raise QuestionAnswerValidationError(
128
- f"Expected a number or None (got {value})."
129
- )
130
-
131
-
132
- ################################
133
- # Attribute-specific descriptors
134
- ################################
135
-
136
-
137
- class AnswerTemplateDescriptor(BaseDescriptor):
138
- """Validate that the answer template is a dictionary with string keys and string values."""
139
-
140
- def validate(self, value: Any, instance) -> None:
141
- """Validate the answer template."""
142
- if not isinstance(value, dict):
143
- raise QuestionCreationValidationError(
144
- f"`answer_template` must be a dictionary (got {value}).)"
145
- )
146
- if not all(isinstance(x, str) for x in value.keys()):
147
- raise QuestionCreationValidationError(
148
- f"`answer_template` keys must be strings (got {value})."
149
- )
150
-
151
-
152
- class InstructionsDescriptor(BaseDescriptor):
153
- """Validate that the `instructions` attribute is a string."""
154
-
155
- def validate(self, value, instance):
156
- """Validate the value is a string."""
157
- # if not isinstance(value, str):
158
- # raise QuestionCreationValidationError(
159
- # f"Question `instructions` must be a string (got {value})."
160
- # )
161
- pass
162
-
163
-
164
- class NumSelectionsDescriptor(BaseDescriptor):
165
- """Validate that `num_selections` is an integer, is less than the number of options, and is positive."""
166
-
167
- def validate(self, value, instance):
168
- """Validate the value is an integer, is less than the number of options, and is positive."""
169
- if not (isinstance(value, int)):
170
- raise QuestionCreationValidationError(
171
- f"`num_selections` must be an integer (got {value})."
172
- )
173
- if value > len(instance.question_options):
174
- raise QuestionAnswerValidationError(
175
- f"`num_selections` must be less than the number of options (got {value})."
176
- )
177
- if value < 1:
178
- raise QuestionAnswerValidationError(
179
- f"`num_selections` must a positive integer (got {value})."
180
- )
181
-
182
-
183
- class OptionLabelDescriptor(BaseDescriptor):
184
- """Validate that the `option_label` attribute is a string."""
185
-
186
- def validate(self, value, instance):
187
- """Validate the value is a string."""
188
- # key_values = [int(v) for v in value.keys()]
189
-
190
- if value and (key_values := [float(v) for v in value.keys()]) != []:
191
- if min(key_values) != min(instance.question_options):
192
- raise QuestionCreationValidationError(
193
- f"First option needs a label (got {value})"
194
- )
195
- if max(key_values) != max(instance.question_options):
196
- raise QuestionCreationValidationError(
197
- f"Last option needs a label (got {value})"
198
- )
199
- if not all(isinstance(x, str) for x in value.values()):
200
- raise QuestionCreationValidationError(
201
- "Option labels must be strings (got {value})."
202
- )
203
- for key in key_values:
204
- if key not in instance.question_options:
205
- raise QuestionCreationValidationError(
206
- f"Option label key ({key}) is not in question options ({instance.question_options})."
207
- )
208
-
209
- if len(value.values()) != len(set(value.values())):
210
- raise QuestionCreationValidationError(
211
- f"Option labels must be unique (got {value})."
212
- )
213
-
214
-
215
- class QuestionNameDescriptor(BaseDescriptor):
216
- """Validate that the `question_name` attribute is a valid variable name."""
217
-
218
- def validate(self, value, instance):
219
- """Validate the value is a valid variable name."""
220
- from edsl.utilities.utilities import is_valid_variable_name
221
-
222
- if "{{" in value and "}}" in value:
223
- # they're trying to use a dynamic question name - let's let this play out
224
- return None
225
-
226
- if value.endswith("_comment") or value.endswith("_generated_tokens"):
227
- raise QuestionCreationValidationError(
228
- f"`question_name` cannot end with '_comment' or '_generated_tokens - (got {value})."
229
- )
230
-
231
- if not is_valid_variable_name(value):
232
- raise QuestionCreationValidationError(
233
- f"`question_name` is not a valid variable name (got {value})."
234
- )
235
-
236
-
237
- class QuestionOptionsDescriptor(BaseDescriptor):
238
- """Validate that `question_options` is a list, does not exceed the min/max lengths, and has unique items."""
239
-
240
- @classmethod
241
- def example(cls):
242
- class TestQuestion:
243
- question_options = QuestionOptionsDescriptor()
244
-
245
- def __init__(self, question_options: List[str]):
246
- self.question_options = question_options
247
-
248
- return TestQuestion
249
-
250
- def __init__(
251
- self,
252
- num_choices: int = None,
253
- linear_scale: bool = False,
254
- q_budget: bool = False,
255
- ):
256
- """Initialize the descriptor."""
257
- self.num_choices = num_choices
258
- self.linear_scale = linear_scale
259
- self.q_budget = q_budget
260
-
261
- def validate(self, value: Any, instance) -> None:
262
- """Validate the question options.
263
-
264
- >>> q_class = QuestionOptionsDescriptor.example()
265
- >>> _ = q_class(["a", "b", "c"])
266
- >>> _ = q_class(["a", "b", "c", "d", "d"])
267
- Traceback (most recent call last):
268
- ...
269
- edsl.exceptions.questions.QuestionCreationValidationError: Question options must be unique (got ['a', 'b', 'c', 'd', 'd']).
270
-
271
- We allow dynamic question options, which are strings of the form '{{ question_options }}'.
272
-
273
- >>> _ = q_class("{{dynamic_options}}")
274
- >>> _ = q_class("dynamic_options")
275
- Traceback (most recent call last):
276
- ...
277
- edsl.exceptions.questions.QuestionCreationValidationError: ...
278
- """
279
- if isinstance(value, str):
280
- # Check if the string is a dynamic question option
281
- if "{{" in value and "}}" in value:
282
- return None
283
- else:
284
- raise QuestionCreationValidationError(
285
- f"Dynamic question options must have jinja2 braces - instead received: {value}."
286
- )
287
- if not isinstance(value, list):
288
- raise QuestionCreationValidationError(
289
- f"Question options must be a list (got {value})."
290
- )
291
- if len(value) > Settings.MAX_NUM_OPTIONS:
292
- raise QuestionCreationValidationError(
293
- f"Too many question options (got {value})."
294
- )
295
- if len(value) < Settings.MIN_NUM_OPTIONS:
296
- raise QuestionCreationValidationError(
297
- f"Too few question options (got {value})."
298
- )
299
- # handle the case when question_options is a list of lists (a list of list can be converted to set)
300
- tmp_value = [str(x) for x in value]
301
- if len(tmp_value) != len(set(tmp_value)):
302
- raise QuestionCreationValidationError(
303
- f"Question options must be unique (got {value})."
304
- )
305
- if not self.linear_scale:
306
- if not self.q_budget:
307
- pass
308
- # if not (
309
- # value
310
- # and all(type(x) == type(value[0]) for x in value)
311
- # and isinstance(value[0], (str, list, int, float))
312
- # ):
313
- # raise QuestionCreationValidationError(
314
- # f"Question options must be all same type (got {value}).)"
315
- # )
316
- else:
317
- if not all(isinstance(x, (str)) for x in value):
318
- raise QuestionCreationValidationError(
319
- f"Question options must be strings (got {value}).)"
320
- )
321
- if not all(
322
- [
323
- type(option) != str
324
- or (len(option) >= 1 and len(option) < Settings.MAX_OPTION_LENGTH)
325
- for option in value
326
- ]
327
- ):
328
- raise QuestionCreationValidationError(
329
- f"All question options must be at least 1 character long but less than {Settings.MAX_OPTION_LENGTH} characters long (got {value})."
330
- )
331
-
332
- if hasattr(instance, "min_selections") and instance.min_selections != None:
333
- if instance.min_selections > len(value):
334
- raise QuestionCreationValidationError(
335
- f"You asked for at least {instance.min_selections} selections, but provided fewer options (got {value})."
336
- )
337
- if hasattr(instance, "max_selections") and instance.max_selections != None:
338
- if instance.max_selections > len(value):
339
- raise QuestionCreationValidationError(
340
- f"You asked for at most {instance.max_selections} selections, but provided fewer options (got {value})."
341
- )
342
- if self.num_choices is not None:
343
- if len(value) != self.num_choices:
344
- raise QuestionCreationValidationError(
345
- f"You asked for {self.num_choices} selections, but provided {len(value)} options."
346
- )
347
- if self.linear_scale:
348
- if sorted(value) != list(range(min(value), max(value) + 1)):
349
- raise QuestionCreationValidationError(
350
- f"LinearScale.question_options must be a list of successive integers, e.g. [1, 2, 3] (got {value})."
351
- )
352
-
353
-
354
- class QuestionTextDescriptor(BaseDescriptor):
355
- """Validate that the `question_text` attribute is a string.
356
-
357
-
358
- >>> class TestQuestion:
359
- ... question_text = QuestionTextDescriptor()
360
- ... def __init__(self, question_text: str):
361
- ... self.question_text = question_text
362
-
363
- >>> _ = TestQuestion("What is the capital of France?")
364
- >>> _ = TestQuestion("What is the capital of France? {{variable}}")
365
- >>> _ = TestQuestion("What is the capital of France? {{variable name}}")
366
- Traceback (most recent call last):
367
- ...
368
- edsl.exceptions.questions.QuestionCreationValidationError: Question text contains an invalid identifier: 'variable name'
369
- """
370
-
371
- def validate(self, value, instance):
372
- """Validate the value is a string."""
373
- # if len(value) > Settings.MAX_QUESTION_LENGTH:
374
- # raise Exception("Question is too long!")
375
- if len(value) < 1:
376
- raise Exception("Question is too short!")
377
- if not isinstance(value, str):
378
- raise Exception("Question must be a string!")
379
- if contains_single_braced_substring(value):
380
- import warnings
381
-
382
- # # warnings.warn(
383
- # # f"WARNING: Question text contains a single-braced substring: If you intended to parameterize the question with a Scenario this should be changed to a double-braced substring, e.g. {{variable}}.\nSee details on constructing Scenarios in the docs: https://docs.expectedparrot.com/en/latest/scenarios.html",
384
- # # UserWarning,
385
- # # )
386
- warnings.warn(
387
- "WARNING: Question text contains a single-braced substring. "
388
- "If you intended to parameterize the question with a Scenario, this will "
389
- "be changed to a double-braced substring, e.g. {{variable}}.\n"
390
- "See details on constructing Scenarios in the docs: "
391
- "https://docs.expectedparrot.com/en/latest/scenarios.html",
392
- UserWarning,
393
- )
394
- # Automatically replace single braces with double braces
395
- # This is here because if the user is using an f-string, the double brace will get converted to a single brace.
396
- # This undoes that.
397
- value = re.sub(r"\{([^\{\}]+)\}", r"{{\1}}", value)
398
- return value
399
-
400
- # iterate through all doubles braces and check if they are valid python identifiers
401
- for match in re.finditer(r"\{\{([^\{\}]+)\}\}", value):
402
- if " " in match.group(1).strip():
403
- raise QuestionCreationValidationError(
404
- f"Question text contains an invalid identifier: '{match.group(1)}'"
405
- )
406
-
407
- return None
408
-
409
-
410
- if __name__ == "__main__":
411
- import doctest
412
-
413
- doctest.testmod(optionflags=doctest.ELLIPSIS)
1
+ """This module contains the descriptors used to validate the attributes of the question classes."""
2
+
3
+ from abc import ABC, abstractmethod
4
+ import re
5
+ from typing import Any, Callable, List, Optional
6
+ from edsl.exceptions import (
7
+ QuestionCreationValidationError,
8
+ QuestionAnswerValidationError,
9
+ )
10
+ from edsl.questions.settings import Settings
11
+
12
+
13
+ ################################
14
+ # Helper functions
15
+ ################################
16
+
17
+
18
+ def contains_single_braced_substring(s: str) -> bool:
19
+ """Check if the string contains a substring in single braces."""
20
+ pattern = r"(?<!\{)\{[^{}]+\}(?!\})"
21
+ match = re.search(pattern, s)
22
+ return bool(match)
23
+
24
+
25
+ def is_number(value: Any) -> bool:
26
+ """Check if an object is a number."""
27
+ return isinstance(value, int) or isinstance(value, float)
28
+
29
+
30
+ def is_number_or_none(value: Any) -> bool:
31
+ """Check if an object is a number or None."""
32
+ return value is None or is_number(value)
33
+
34
+
35
+ ################################
36
+ # Descriptor ABC
37
+ ################################
38
+
39
+
40
+ class BaseDescriptor(ABC):
41
+ """ABC for something."""
42
+
43
+ @abstractmethod
44
+ def validate(self, value: Any) -> None:
45
+ """Validate the value. If it is invalid, raises an exception. If it is valid, does nothing."""
46
+ pass
47
+
48
+ def __get__(self, instance, owner):
49
+ """Get the value of the attribute."""
50
+ if self.name not in instance.__dict__:
51
+ return {}
52
+ return instance.__dict__[self.name]
53
+
54
+ def __set__(self, instance, value: Any) -> None:
55
+ """Set the value of the attribute."""
56
+ new_value = self.validate(value, instance)
57
+
58
+ if new_value is not None:
59
+ instance.__dict__[self.name] = new_value
60
+ else:
61
+ instance.__dict__[self.name] = value
62
+
63
+ def __set_name__(self, owner, name: str) -> None:
64
+ """Set the name of the attribute."""
65
+ self.name = "_" + name
66
+
67
+
68
+ ################################
69
+ # General descriptors
70
+ ################################
71
+
72
+
73
+ class FunctionDescriptor(BaseDescriptor):
74
+ """Validate that a value is a function."""
75
+
76
+ def validate(self, value: Any, instance) -> Callable:
77
+ """Validate the value is a function, and if so, returns it."""
78
+ if not callable(value):
79
+ raise QuestionCreationValidationError(
80
+ f"Expected a function (got {value}).)"
81
+ )
82
+ return value
83
+
84
+
85
class IntegerDescriptor(BaseDescriptor):
    """
    Descriptor that accepts integers, and optionally None.

    - `none_allowed` controls whether None is accepted in addition to integers.
    """

    def __init__(self, none_allowed: bool = False):
        """Store whether None is an acceptable value."""
        self.none_allowed = none_allowed

    def validate(self, value, instance):
        """Raise QuestionAnswerValidationError unless `value` is acceptable.

        Integers always pass; None passes only when `none_allowed` is set.
        """
        if isinstance(value, int):
            return None
        if not self.none_allowed:
            raise QuestionAnswerValidationError(f"Expected an integer (got {value}).")
        if value is not None:
            raise QuestionAnswerValidationError(
                f"Expected an integer or None (got {value})."
            )
        return None
108
+
109
+
110
class IntegerOrNoneDescriptor(BaseDescriptor):
    """Descriptor that accepts an integer or None."""

    def validate(self, value, instance):
        """Raise QuestionCreationValidationError unless `value` is an int or None."""
        if value is None or isinstance(value, int):
            return None
        raise QuestionCreationValidationError(
            f"Expected an integer or None (got {value})."
        )
119
+
120
+
121
class NumericalOrNoneDescriptor(BaseDescriptor):
    """Descriptor that accepts a number or None."""

    def validate(self, value, instance):
        """Raise QuestionAnswerValidationError unless `is_number_or_none(value)` holds."""
        if is_number_or_none(value):
            return None
        raise QuestionAnswerValidationError(
            f"Expected a number or None (got {value})."
        )
130
+
131
+
132
+ ################################
133
+ # Attribute-specific descriptors
134
+ ################################
135
+
136
+
137
class AnswerTemplateDescriptor(BaseDescriptor):
    """Descriptor for `answer_template`: requires a dictionary whose keys are all strings."""

    def validate(self, value: Any, instance) -> None:
        """Check the container type and the key types of the answer template.

        Raises QuestionCreationValidationError when `value` is not a dict or
        when any key is not a string. The dictionary's values are not inspected.
        """
        if not isinstance(value, dict):
            raise QuestionCreationValidationError(
                f"`answer_template` must be a dictionary (got {value}).)"
            )
        for key in value.keys():
            if not isinstance(key, str):
                raise QuestionCreationValidationError(
                    f"`answer_template` keys must be strings (got {value})."
                )
150
+
151
+
152
class InstructionsDescriptor(BaseDescriptor):
    """Descriptor for the `instructions` attribute; currently accepts any value."""

    def validate(self, value, instance):
        """Accept `value` without checking it.

        The string-type check that was written for this attribute is disabled,
        so nothing is raised and no replacement value is returned.
        """
        return None
162
+
163
+
164
class NumSelectionsDescriptor(BaseDescriptor):
    """Descriptor for `num_selections`: an integer between 1 and the number of options."""

    def validate(self, value, instance):
        """Check `value` against the instance's `question_options`.

        Raises QuestionCreationValidationError when `value` is not an integer,
        and QuestionAnswerValidationError when it exceeds the number of options
        or is smaller than 1.
        """
        is_integer = isinstance(value, int)
        if not is_integer:
            raise QuestionCreationValidationError(
                f"`num_selections` must be an integer (got {value})."
            )

        option_count = len(instance.question_options)
        if option_count < value:
            raise QuestionAnswerValidationError(
                f"`num_selections` must be less than the number of options (got {value})."
            )
        if value < 1:
            raise QuestionAnswerValidationError(
                f"`num_selections` must a positive integer (got {value})."
            )
181
+
182
+
183
class OptionLabelDescriptor(BaseDescriptor):
    """Validate the option-label mapping against the instance's `question_options`."""

    def validate(self, value, instance):
        """Validate a mapping from option value to label.

        An empty or None mapping is accepted without further checks. Otherwise:

        - keys are converted with `float()` and compared to `question_options`;
        - the smallest and the largest option must each have a label;
        - every label must be a string;
        - every key must be one of the question options;
        - labels must be unique.

        Raises QuestionCreationValidationError when any check fails.
        """
        if not value:
            return None

        key_values = [float(key) for key in value.keys()]
        if key_values == []:
            return None

        if min(key_values) != min(instance.question_options):
            raise QuestionCreationValidationError(
                f"First option needs a label (got {value})"
            )
        if max(key_values) != max(instance.question_options):
            raise QuestionCreationValidationError(
                f"Last option needs a label (got {value})"
            )
        if not all(isinstance(label, str) for label in value.values()):
            # This message was a plain string before, so it printed a literal
            # "{value}"; the f-prefix makes it show the offending mapping.
            raise QuestionCreationValidationError(
                f"Option labels must be strings (got {value})."
            )
        for key in key_values:
            if key not in instance.question_options:
                raise QuestionCreationValidationError(
                    f"Option label key ({key}) is not in question options ({instance.question_options})."
                )

        if len(value.values()) != len(set(value.values())):
            raise QuestionCreationValidationError(
                f"Option labels must be unique (got {value})."
            )
        return None
213
+
214
+
215
class QuestionNameDescriptor(BaseDescriptor):
    """Descriptor for `question_name`: must be usable as a variable name."""

    def validate(self, value, instance):
        """Check that `value` is an acceptable question name.

        Names containing both "{{" and "}}" are treated as dynamic and accepted
        as-is. Otherwise the name must not end with a reserved suffix and must
        pass `is_valid_variable_name`; QuestionCreationValidationError is raised
        when either condition fails.
        """
        from edsl.utilities.utilities import is_valid_variable_name

        # Dynamic (templated) names are resolved later, so skip the checks.
        is_templated = "{{" in value and "}}" in value
        if is_templated:
            return None

        reserved_suffixes = ("_comment", "_generated_tokens")
        if value.endswith(reserved_suffixes):
            raise QuestionCreationValidationError(
                f"`question_name` cannot end with '_comment' or '_generated_tokens - (got {value})."
            )

        if is_valid_variable_name(value):
            return None
        raise QuestionCreationValidationError(
            f"`question_name` is not a valid variable name (got {value})."
        )
235
+
236
+
237
class QuestionOptionsDescriptor(BaseDescriptor):
    """Validate that `question_options` is a list, does not exceed the min/max lengths, and has unique items.

    A string is also accepted when it contains both "{{" and "}}" (dynamic options).
    Constructor flags enable extra checks: an exact option count (`num_choices`),
    successive-integer options (`linear_scale`), and string-only options (`q_budget`).
    """

    # NOTE(review): the indentation of this class was reconstructed from a
    # flattened diff; confirm the nesting inside `validate` against the file.

    @classmethod
    def example(cls):
        """Return a minimal class that uses this descriptor (used by the doctests)."""

        class TestQuestion:
            question_options = QuestionOptionsDescriptor()

            def __init__(self, question_options: List[str]):
                self.question_options = question_options

        return TestQuestion

    def __init__(
        self,
        num_choices: int = None,
        linear_scale: bool = False,
        q_budget: bool = False,
    ):
        """Initialize the descriptor.

        - `num_choices`: when not None, the exact number of options required.
        - `linear_scale`: when True, options must be successive integers.
        - `q_budget`: when True (and `linear_scale` is False), options must be strings.
        """
        self.num_choices = num_choices
        self.linear_scale = linear_scale
        self.q_budget = q_budget

    def validate(self, value: Any, instance) -> None:
        """Validate the question options.

        Raises QuestionCreationValidationError when any check fails.

        >>> q_class = QuestionOptionsDescriptor.example()
        >>> _ = q_class(["a", "b", "c"])
        >>> _ = q_class(["a", "b", "c", "d", "d"])
        Traceback (most recent call last):
        ...
        edsl.exceptions.questions.QuestionCreationValidationError: Question options must be unique (got ['a', 'b', 'c', 'd', 'd']).

        We allow dynamic question options, which are strings of the form '{{ question_options }}'.

        >>> _ = q_class("{{dynamic_options}}")
        >>> _ = q_class("dynamic_options")
        Traceback (most recent call last):
        ...
        edsl.exceptions.questions.QuestionCreationValidationError: ...
        """
        if isinstance(value, str):
            # Check if the string is a dynamic question option
            if "{{" in value and "}}" in value:
                return None
            else:
                raise QuestionCreationValidationError(
                    f"Dynamic question options must have jinja2 braces - instead received: {value}."
                )
        if not isinstance(value, list):
            raise QuestionCreationValidationError(
                f"Question options must be a list (got {value})."
            )
        # The allowed number of options is bounded by the Settings constants.
        if len(value) > Settings.MAX_NUM_OPTIONS:
            raise QuestionCreationValidationError(
                f"Too many question options (got {value})."
            )
        if len(value) < Settings.MIN_NUM_OPTIONS:
            raise QuestionCreationValidationError(
                f"Too few question options (got {value})."
            )
        # Uniqueness is checked on the string form of each option, so that
        # unhashable options (e.g. lists) can still be compared through a set.
        tmp_value = [str(x) for x in value]
        if len(tmp_value) != len(set(tmp_value)):
            raise QuestionCreationValidationError(
                f"Question options must be unique (got {value})."
            )
        if not self.linear_scale:
            if not self.q_budget:
                # The "all options share one type" check is currently disabled.
                pass
                # if not (
                #     value
                #     and all(type(x) == type(value[0]) for x in value)
                #     and isinstance(value[0], (str, list, int, float))
                # ):
                #     raise QuestionCreationValidationError(
                #         f"Question options must be all same type (got {value}).)"
                #     )
            else:
                if not all(isinstance(x, (str)) for x in value):
                    raise QuestionCreationValidationError(
                        f"Question options must be strings (got {value}).)"
                    )
            # Only options whose type is exactly `str` are length-checked;
            # every other option passes this test unconditionally.
            if not all(
                [
                    type(option) != str
                    or (len(option) >= 1 and len(option) < Settings.MAX_OPTION_LENGTH)
                    for option in value
                ]
            ):
                raise QuestionCreationValidationError(
                    f"All question options must be at least 1 character long but less than {Settings.MAX_OPTION_LENGTH} characters long (got {value})."
                )

        # Cross-check against selection bounds when the instance defines them.
        if hasattr(instance, "min_selections") and instance.min_selections != None:
            if instance.min_selections > len(value):
                raise QuestionCreationValidationError(
                    f"You asked for at least {instance.min_selections} selections, but provided fewer options (got {value})."
                )
        if hasattr(instance, "max_selections") and instance.max_selections != None:
            if instance.max_selections > len(value):
                raise QuestionCreationValidationError(
                    f"You asked for at most {instance.max_selections} selections, but provided fewer options (got {value})."
                )
        if self.num_choices is not None:
            if len(value) != self.num_choices:
                raise QuestionCreationValidationError(
                    f"You asked for {self.num_choices} selections, but provided {len(value)} options."
                )
        if self.linear_scale:
            # The sorted options must equal the full integer range min..max.
            if sorted(value) != list(range(min(value), max(value) + 1)):
                raise QuestionCreationValidationError(
                    f"LinearScale.question_options must be a list of successive integers, e.g. [1, 2, 3] (got {value})."
                )
352
+
353
+
354
class QuestionTextDescriptor(BaseDescriptor):
    """Validate that the `question_text` attribute is a string.


    >>> class TestQuestion:
    ...     question_text = QuestionTextDescriptor()
    ...     def __init__(self, question_text: str):
    ...         self.question_text = question_text

    >>> _ = TestQuestion("What is the capital of France?")
    >>> _ = TestQuestion("What is the capital of France? {{variable}}")
    >>> _ = TestQuestion("What is the capital of France? {{variable name}}")
    Traceback (most recent call last):
    ...
    edsl.exceptions.questions.QuestionCreationValidationError: Question text contains an invalid identifier: 'variable name'
    """

    def validate(self, value, instance):
        """Validate the question text and normalize single-braced placeholders.

        Returns the rewritten text when single-braced placeholders were
        converted to double braces (a UserWarning is emitted in that case), and
        None when the text is stored unchanged.

        Raises Exception when `value` is not a string or is empty, and
        QuestionCreationValidationError when a double-braced placeholder
        contains a space after stripping.
        """
        # Check the type before calling len(), so that non-string input gets
        # the intended message and not a TypeError from len().
        if not isinstance(value, str):
            raise Exception("Question must be a string!")
        if len(value) < 1:
            raise Exception("Question is too short!")

        if contains_single_braced_substring(value):
            import warnings

            warnings.warn(
                "WARNING: Question text contains a single-braced substring. "
                "If you intended to parameterize the question with a Scenario, this will "
                "be changed to a double-braced substring, e.g. {{variable}}.\n"
                "See details on constructing Scenarios in the docs: "
                "https://docs.expectedparrot.com/en/latest/scenarios.html",
                UserWarning,
            )
            # Automatically replace single braces with double braces.
            # This is here because if the user is using an f-string, the double
            # brace will get converted to a single brace. This undoes that.
            # The lookarounds restrict the rewrite to genuinely single-braced
            # spans, so an existing "{{x}}" is not turned into "{{{x}}}".
            value = re.sub(r"(?<!\{)\{([^{}]+)\}(?!\})", r"{{\1}}", value)
            return value

        # Iterate through all double-braced spans and reject names with spaces.
        for match in re.finditer(r"\{\{([^\{\}]+)\}\}", value):
            if " " in match.group(1).strip():
                raise QuestionCreationValidationError(
                    f"Question text contains an invalid identifier: '{match.group(1)}'"
                )

        return None
408
+
409
+
410
if __name__ == "__main__":
    # Run the doctests embedded in this module; ELLIPSIS lets "..." in the
    # expected output stand in for arbitrary text.
    from doctest import ELLIPSIS, testmod

    testmod(optionflags=ELLIPSIS)