edsl 0.1.36.dev6__py3-none-any.whl → 0.1.37__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (261) hide show
  1. edsl/Base.py +303 -303
  2. edsl/BaseDiff.py +260 -260
  3. edsl/TemplateLoader.py +24 -24
  4. edsl/__init__.py +48 -47
  5. edsl/__version__.py +1 -1
  6. edsl/agents/Agent.py +855 -804
  7. edsl/agents/AgentList.py +350 -337
  8. edsl/agents/Invigilator.py +222 -222
  9. edsl/agents/InvigilatorBase.py +284 -294
  10. edsl/agents/PromptConstructor.py +353 -312
  11. edsl/agents/__init__.py +3 -3
  12. edsl/agents/descriptors.py +99 -86
  13. edsl/agents/prompt_helpers.py +129 -129
  14. edsl/auto/AutoStudy.py +117 -117
  15. edsl/auto/StageBase.py +230 -230
  16. edsl/auto/StageGenerateSurvey.py +178 -178
  17. edsl/auto/StageLabelQuestions.py +125 -125
  18. edsl/auto/StagePersona.py +61 -61
  19. edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
  20. edsl/auto/StagePersonaDimensionValues.py +74 -74
  21. edsl/auto/StagePersonaDimensions.py +69 -69
  22. edsl/auto/StageQuestions.py +73 -73
  23. edsl/auto/SurveyCreatorPipeline.py +21 -21
  24. edsl/auto/utilities.py +224 -224
  25. edsl/base/Base.py +289 -289
  26. edsl/config.py +149 -149
  27. edsl/conjure/AgentConstructionMixin.py +160 -152
  28. edsl/conjure/Conjure.py +62 -62
  29. edsl/conjure/InputData.py +659 -659
  30. edsl/conjure/InputDataCSV.py +48 -48
  31. edsl/conjure/InputDataMixinQuestionStats.py +182 -182
  32. edsl/conjure/InputDataPyRead.py +91 -91
  33. edsl/conjure/InputDataSPSS.py +8 -8
  34. edsl/conjure/InputDataStata.py +8 -8
  35. edsl/conjure/QuestionOptionMixin.py +76 -76
  36. edsl/conjure/QuestionTypeMixin.py +23 -23
  37. edsl/conjure/RawQuestion.py +65 -65
  38. edsl/conjure/SurveyResponses.py +7 -7
  39. edsl/conjure/__init__.py +9 -9
  40. edsl/conjure/naming_utilities.py +263 -263
  41. edsl/conjure/utilities.py +201 -201
  42. edsl/conversation/Conversation.py +290 -238
  43. edsl/conversation/car_buying.py +58 -58
  44. edsl/conversation/chips.py +95 -0
  45. edsl/conversation/mug_negotiation.py +81 -81
  46. edsl/conversation/next_speaker_utilities.py +93 -93
  47. edsl/coop/PriceFetcher.py +54 -54
  48. edsl/coop/__init__.py +2 -2
  49. edsl/coop/coop.py +958 -849
  50. edsl/coop/utils.py +131 -131
  51. edsl/data/Cache.py +527 -527
  52. edsl/data/CacheEntry.py +228 -228
  53. edsl/data/CacheHandler.py +149 -149
  54. edsl/data/RemoteCacheSync.py +97 -84
  55. edsl/data/SQLiteDict.py +292 -292
  56. edsl/data/__init__.py +4 -4
  57. edsl/data/orm.py +10 -10
  58. edsl/data_transfer_models.py +73 -73
  59. edsl/enums.py +173 -173
  60. edsl/exceptions/BaseException.py +21 -0
  61. edsl/exceptions/__init__.py +54 -50
  62. edsl/exceptions/agents.py +38 -40
  63. edsl/exceptions/configuration.py +16 -16
  64. edsl/exceptions/coop.py +10 -10
  65. edsl/exceptions/data.py +14 -14
  66. edsl/exceptions/general.py +34 -34
  67. edsl/exceptions/jobs.py +33 -33
  68. edsl/exceptions/language_models.py +63 -63
  69. edsl/exceptions/prompts.py +15 -15
  70. edsl/exceptions/questions.py +91 -91
  71. edsl/exceptions/results.py +29 -26
  72. edsl/exceptions/scenarios.py +22 -0
  73. edsl/exceptions/surveys.py +37 -34
  74. edsl/inference_services/AnthropicService.py +87 -87
  75. edsl/inference_services/AwsBedrock.py +120 -115
  76. edsl/inference_services/AzureAI.py +217 -217
  77. edsl/inference_services/DeepInfraService.py +18 -18
  78. edsl/inference_services/GoogleService.py +156 -156
  79. edsl/inference_services/GroqService.py +20 -20
  80. edsl/inference_services/InferenceServiceABC.py +147 -147
  81. edsl/inference_services/InferenceServicesCollection.py +97 -72
  82. edsl/inference_services/MistralAIService.py +123 -123
  83. edsl/inference_services/OllamaService.py +18 -18
  84. edsl/inference_services/OpenAIService.py +224 -224
  85. edsl/inference_services/TestService.py +89 -89
  86. edsl/inference_services/TogetherAIService.py +170 -170
  87. edsl/inference_services/models_available_cache.py +118 -118
  88. edsl/inference_services/rate_limits_cache.py +25 -25
  89. edsl/inference_services/registry.py +39 -39
  90. edsl/inference_services/write_available.py +10 -10
  91. edsl/jobs/Answers.py +56 -56
  92. edsl/jobs/Jobs.py +1347 -1112
  93. edsl/jobs/__init__.py +1 -1
  94. edsl/jobs/buckets/BucketCollection.py +63 -63
  95. edsl/jobs/buckets/ModelBuckets.py +65 -65
  96. edsl/jobs/buckets/TokenBucket.py +248 -248
  97. edsl/jobs/interviews/Interview.py +661 -651
  98. edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
  99. edsl/jobs/interviews/InterviewExceptionEntry.py +186 -182
  100. edsl/jobs/interviews/InterviewStatistic.py +63 -63
  101. edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
  102. edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
  103. edsl/jobs/interviews/InterviewStatusLog.py +92 -92
  104. edsl/jobs/interviews/ReportErrors.py +66 -66
  105. edsl/jobs/interviews/interview_status_enum.py +9 -9
  106. edsl/jobs/runners/JobsRunnerAsyncio.py +338 -337
  107. edsl/jobs/runners/JobsRunnerStatus.py +332 -332
  108. edsl/jobs/tasks/QuestionTaskCreator.py +242 -242
  109. edsl/jobs/tasks/TaskCreators.py +64 -64
  110. edsl/jobs/tasks/TaskHistory.py +442 -441
  111. edsl/jobs/tasks/TaskStatusLog.py +23 -23
  112. edsl/jobs/tasks/task_status_enum.py +163 -163
  113. edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
  114. edsl/jobs/tokens/TokenUsage.py +34 -34
  115. edsl/language_models/KeyLookup.py +30 -0
  116. edsl/language_models/LanguageModel.py +706 -718
  117. edsl/language_models/ModelList.py +102 -102
  118. edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
  119. edsl/language_models/__init__.py +3 -2
  120. edsl/language_models/fake_openai_call.py +15 -15
  121. edsl/language_models/fake_openai_service.py +61 -61
  122. edsl/language_models/registry.py +137 -137
  123. edsl/language_models/repair.py +156 -156
  124. edsl/language_models/unused/ReplicateBase.py +83 -83
  125. edsl/language_models/utilities.py +64 -64
  126. edsl/notebooks/Notebook.py +259 -259
  127. edsl/notebooks/__init__.py +1 -1
  128. edsl/prompts/Prompt.py +357 -358
  129. edsl/prompts/__init__.py +2 -2
  130. edsl/questions/AnswerValidatorMixin.py +289 -289
  131. edsl/questions/QuestionBase.py +656 -616
  132. edsl/questions/QuestionBaseGenMixin.py +161 -161
  133. edsl/questions/QuestionBasePromptsMixin.py +234 -266
  134. edsl/questions/QuestionBudget.py +227 -227
  135. edsl/questions/QuestionCheckBox.py +359 -359
  136. edsl/questions/QuestionExtract.py +183 -183
  137. edsl/questions/QuestionFreeText.py +114 -113
  138. edsl/questions/QuestionFunctional.py +159 -159
  139. edsl/questions/QuestionList.py +231 -231
  140. edsl/questions/QuestionMultipleChoice.py +286 -286
  141. edsl/questions/QuestionNumerical.py +153 -153
  142. edsl/questions/QuestionRank.py +324 -324
  143. edsl/questions/Quick.py +41 -41
  144. edsl/questions/RegisterQuestionsMeta.py +71 -71
  145. edsl/questions/ResponseValidatorABC.py +174 -174
  146. edsl/questions/SimpleAskMixin.py +73 -73
  147. edsl/questions/__init__.py +26 -26
  148. edsl/questions/compose_questions.py +98 -98
  149. edsl/questions/decorators.py +21 -21
  150. edsl/questions/derived/QuestionLikertFive.py +76 -76
  151. edsl/questions/derived/QuestionLinearScale.py +87 -87
  152. edsl/questions/derived/QuestionTopK.py +91 -91
  153. edsl/questions/derived/QuestionYesNo.py +82 -82
  154. edsl/questions/descriptors.py +413 -418
  155. edsl/questions/prompt_templates/question_budget.jinja +13 -13
  156. edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
  157. edsl/questions/prompt_templates/question_extract.jinja +11 -11
  158. edsl/questions/prompt_templates/question_free_text.jinja +3 -3
  159. edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
  160. edsl/questions/prompt_templates/question_list.jinja +17 -17
  161. edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
  162. edsl/questions/prompt_templates/question_numerical.jinja +36 -36
  163. edsl/questions/question_registry.py +147 -147
  164. edsl/questions/settings.py +12 -12
  165. edsl/questions/templates/budget/answering_instructions.jinja +7 -7
  166. edsl/questions/templates/budget/question_presentation.jinja +7 -7
  167. edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
  168. edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
  169. edsl/questions/templates/extract/answering_instructions.jinja +7 -7
  170. edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
  171. edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
  172. edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
  173. edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
  174. edsl/questions/templates/list/answering_instructions.jinja +3 -3
  175. edsl/questions/templates/list/question_presentation.jinja +5 -5
  176. edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
  177. edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
  178. edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
  179. edsl/questions/templates/numerical/question_presentation.jinja +6 -6
  180. edsl/questions/templates/rank/answering_instructions.jinja +11 -11
  181. edsl/questions/templates/rank/question_presentation.jinja +15 -15
  182. edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
  183. edsl/questions/templates/top_k/question_presentation.jinja +22 -22
  184. edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
  185. edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
  186. edsl/results/Dataset.py +293 -293
  187. edsl/results/DatasetExportMixin.py +717 -693
  188. edsl/results/DatasetTree.py +145 -145
  189. edsl/results/Result.py +450 -433
  190. edsl/results/Results.py +1071 -1158
  191. edsl/results/ResultsDBMixin.py +238 -238
  192. edsl/results/ResultsExportMixin.py +43 -43
  193. edsl/results/ResultsFetchMixin.py +33 -33
  194. edsl/results/ResultsGGMixin.py +121 -121
  195. edsl/results/ResultsToolsMixin.py +98 -98
  196. edsl/results/Selector.py +135 -118
  197. edsl/results/__init__.py +2 -2
  198. edsl/results/tree_explore.py +115 -115
  199. edsl/scenarios/FileStore.py +458 -443
  200. edsl/scenarios/Scenario.py +546 -507
  201. edsl/scenarios/ScenarioHtmlMixin.py +64 -59
  202. edsl/scenarios/ScenarioList.py +1112 -1101
  203. edsl/scenarios/ScenarioListExportMixin.py +52 -52
  204. edsl/scenarios/ScenarioListPdfMixin.py +261 -261
  205. edsl/scenarios/__init__.py +4 -2
  206. edsl/shared.py +1 -1
  207. edsl/study/ObjectEntry.py +173 -173
  208. edsl/study/ProofOfWork.py +113 -113
  209. edsl/study/SnapShot.py +80 -80
  210. edsl/study/Study.py +528 -528
  211. edsl/study/__init__.py +4 -4
  212. edsl/surveys/DAG.py +148 -148
  213. edsl/surveys/Memory.py +31 -31
  214. edsl/surveys/MemoryPlan.py +244 -244
  215. edsl/surveys/Rule.py +330 -324
  216. edsl/surveys/RuleCollection.py +387 -387
  217. edsl/surveys/Survey.py +1795 -1772
  218. edsl/surveys/SurveyCSS.py +261 -261
  219. edsl/surveys/SurveyExportMixin.py +259 -259
  220. edsl/surveys/SurveyFlowVisualizationMixin.py +121 -121
  221. edsl/surveys/SurveyQualtricsImport.py +284 -284
  222. edsl/surveys/__init__.py +3 -3
  223. edsl/surveys/base.py +53 -53
  224. edsl/surveys/descriptors.py +56 -56
  225. edsl/surveys/instructions/ChangeInstruction.py +47 -47
  226. edsl/surveys/instructions/Instruction.py +51 -51
  227. edsl/surveys/instructions/InstructionCollection.py +77 -77
  228. edsl/templates/error_reporting/base.html +23 -23
  229. edsl/templates/error_reporting/exceptions_by_model.html +34 -34
  230. edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
  231. edsl/templates/error_reporting/exceptions_by_type.html +16 -16
  232. edsl/templates/error_reporting/interview_details.html +115 -115
  233. edsl/templates/error_reporting/interviews.html +9 -9
  234. edsl/templates/error_reporting/overview.html +4 -4
  235. edsl/templates/error_reporting/performance_plot.html +1 -1
  236. edsl/templates/error_reporting/report.css +73 -73
  237. edsl/templates/error_reporting/report.html +117 -117
  238. edsl/templates/error_reporting/report.js +25 -25
  239. edsl/tools/__init__.py +1 -1
  240. edsl/tools/clusters.py +192 -192
  241. edsl/tools/embeddings.py +27 -27
  242. edsl/tools/embeddings_plotting.py +118 -118
  243. edsl/tools/plotting.py +112 -112
  244. edsl/tools/summarize.py +18 -18
  245. edsl/utilities/SystemInfo.py +28 -28
  246. edsl/utilities/__init__.py +22 -22
  247. edsl/utilities/ast_utilities.py +25 -25
  248. edsl/utilities/data/Registry.py +6 -6
  249. edsl/utilities/data/__init__.py +1 -1
  250. edsl/utilities/data/scooter_results.json +1 -1
  251. edsl/utilities/decorators.py +77 -77
  252. edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
  253. edsl/utilities/interface.py +627 -627
  254. edsl/utilities/repair_functions.py +28 -28
  255. edsl/utilities/restricted_python.py +70 -70
  256. edsl/utilities/utilities.py +409 -391
  257. {edsl-0.1.36.dev6.dist-info → edsl-0.1.37.dist-info}/LICENSE +21 -21
  258. {edsl-0.1.36.dev6.dist-info → edsl-0.1.37.dist-info}/METADATA +1 -1
  259. edsl-0.1.37.dist-info/RECORD +283 -0
  260. edsl-0.1.36.dev6.dist-info/RECORD +0 -279
  261. {edsl-0.1.36.dev6.dist-info → edsl-0.1.37.dist-info}/WHEEL +0 -0
@@ -1,387 +1,387 @@
1
- """A collection of rules for a survey."""
2
-
3
- from typing import List, Union, Any, Optional
4
- from collections import defaultdict, UserList
5
-
6
- from edsl.exceptions import (
7
- SurveyRuleCannotEvaluateError,
8
- SurveyRuleCollectionHasNoRulesAtNodeError,
9
- )
10
- from edsl.utilities.interface import print_table_with_rich
11
- from edsl.surveys.Rule import Rule
12
- from edsl.surveys.base import EndOfSurvey
13
- from edsl.surveys.DAG import DAG
14
-
15
- # from graphlib import TopologicalSorter
16
-
17
- from collections import namedtuple
18
-
19
- NextQuestion = namedtuple(
20
- "NextQuestion", "next_q, num_rules_found, expressions_evaluating_to_true, priority"
21
- )
22
-
23
-
24
- class RuleCollection(UserList):
25
- """A collection of rules for a particular survey."""
26
-
27
- def __init__(self, num_questions: Optional[int] = None, rules: List[Rule] = None):
28
- """Initialize the RuleCollection object.
29
-
30
- :param num_questions: The number of questions in the survey.
31
- :param rules: A list of Rule objects.
32
- """
33
- super().__init__(rules or [])
34
- self.num_questions = num_questions
35
-
36
- def __repr__(self):
37
- """Return a string representation of the RuleCollection object.
38
-
39
- Example usage:
40
-
41
- .. code-block:: python
42
-
43
- rule_collection = RuleCollection.example()
44
- _ = eval(repr(rule_collection))
45
-
46
- """
47
- return f"RuleCollection(rules={self.data}, num_questions={self.num_questions})"
48
-
49
- def to_dict(self):
50
- """Create a dictionary representation of the RuleCollection object."""
51
- return {
52
- "rules": [rule.to_dict() for rule in self],
53
- "num_questions": self.num_questions,
54
- }
55
-
56
- @classmethod
57
- def from_dict(cls, rule_collection_dict):
58
- """Create a RuleCollection object from a dictionary.
59
-
60
- >>> rule_collection = RuleCollection.example()
61
- >>> rule_collection_dict = rule_collection.to_dict()
62
- >>> new_rule_collection = RuleCollection.from_dict(rule_collection_dict)
63
- >>> repr(new_rule_collection) == repr(rule_collection)
64
- True
65
- """
66
- rules = [
67
- Rule.from_dict(rule_dict) for rule_dict in rule_collection_dict["rules"]
68
- ]
69
- num_questions = rule_collection_dict["num_questions"]
70
- new_rc = cls(rules=rules)
71
- new_rc.num_questions = num_questions
72
- return new_rc
73
-
74
- def add_rule(self, rule: Rule) -> None:
75
- """Add a rule to a survey.
76
-
77
- >>> rule_collection = RuleCollection()
78
- >>> rule_collection.add_rule(Rule(current_q=1, expression="q1 == 'yes'", next_q=3, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}))
79
- >>> len(rule_collection)
80
- 1
81
-
82
- >>> rule_collection = RuleCollection()
83
- >>> r = Rule(current_q=1, expression="True", next_q=3, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}, before_rule = True)
84
- >>> rule_collection.add_rule(r)
85
- >>> rule_collection[0] == r
86
- True
87
- >>> len(rule_collection.applicable_rules(1, before_rule=True))
88
- 1
89
- >>> len(rule_collection.applicable_rules(1, before_rule=False))
90
- 0
91
- """
92
- self.append(rule)
93
-
94
- def show_rules(self) -> None:
95
- """Print the rules in a table.
96
-
97
-
98
- .. code-block:: python
99
-
100
- rule_collection = RuleCollection.example()
101
- rule_collection.show_rules()
102
- ┏━━━━━━━━━━━┳━━━━━━━━━━━━━┳━━━━━━━━┳━━━━━━━━━━┳━━━━━━━━━━━━━┓
103
- ┃ current_q ┃ expression ┃ next_q ┃ priority ┃ before_rule ┃
104
- ┡━━━━━━━━━━━╇━━━━━━━━━━━━━╇━━━━━━━━╇━━━━━━━━━━╇━━━━━━━━━━━━━┩
105
- │ 1 │ q1 == 'yes' │ 3 │ 1 │ False │
106
- │ 1 │ q1 == 'no' │ 2 │ 1 │ False │
107
- └───────────┴─────────────┴────────┴──────────┴─────────────┘
108
- """
109
- keys = ["current_q", "expression", "next_q", "priority", "before_rule"]
110
- rule_list = []
111
- for rule in sorted(self, key=lambda r: r.current_q):
112
- rule_list.append({k: getattr(rule, k) for k in keys})
113
-
114
- print_table_with_rich(rule_list)
115
-
116
- def skip_question_before_running(self, q_now: int, answers: dict[str, Any]) -> bool:
117
- """Determine if a question should be skipped before running the question.
118
-
119
- :param q_now: The current question index.
120
- :param answers: The answers to the survey questions.
121
-
122
- >>> rule_collection = RuleCollection()
123
- >>> r = Rule(current_q=1, expression="True", next_q=2, priority=1, question_name_to_index={}, before_rule = True)
124
- >>> rule_collection.add_rule(r)
125
- >>> rule_collection.skip_question_before_running(1, {})
126
- True
127
-
128
- >>> rule_collection = RuleCollection()
129
- >>> r = Rule(current_q=1, expression="False", next_q=2, priority=1, question_name_to_index={}, before_rule = True)
130
- >>> rule_collection.add_rule(r)
131
- >>> rule_collection.skip_question_before_running(1, {})
132
- False
133
-
134
- """
135
- for rule in self.applicable_rules(q_now, before_rule=True):
136
- if rule.evaluate(answers):
137
- return True
138
- return False
139
-
140
- def applicable_rules(self, q_now: int, before_rule: bool = False) -> list:
141
- """Show the rules that apply at the current node.
142
-
143
- :param q_now: The current question index.
144
- :param before_rule: If True, return rules that are of the type that apply before the question is asked.
145
-
146
- Example usage:
147
-
148
- >>> rule_collection = RuleCollection.example()
149
- >>> rule_collection.applicable_rules(1)
150
- [Rule(current_q=1, expression="q1 == 'yes'", next_q=3, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}, before_rule=False), Rule(current_q=1, expression="q1 == 'no'", next_q=2, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}, before_rule=False)]
151
-
152
- The default is that the rule is applied after the question is asked.
153
- If we want to see the rules that apply before the question is asked, we can set before_rule=True.
154
-
155
- .. code-block:: python
156
-
157
- rule_collection = RuleCollection.example()
158
- rule_collection.applicable_rules(1)
159
- [Rule(current_q=1, expression="q1 == 'yes'", next_q=3, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}), Rule(current_q=1, expression="q1 == 'no'", next_q=2, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4})]
160
-
161
- More than one rule can apply. For example, suppose we are at node 1.
162
- We could have three rules:
163
- 1. "q1 == 'a' ==> 3
164
- 2. "q1 == 'b' ==> 4
165
- 3. "q1 == 'c' ==> 5
166
- """
167
- return [
168
- rule
169
- for rule in self
170
- if rule.current_q == q_now and rule.before_rule == before_rule
171
- ]
172
-
173
- def next_question(self, q_now: int, answers: dict[str, Any]) -> NextQuestion:
174
- """Find the next question by index, given the rule collection.
175
-
176
- This rule is applied after the question is answered.
177
-
178
- :param q_now: The current question index.
179
- :param answers: The answers to the survey questions so far, including the current question.
180
-
181
- >>> rule_collection = RuleCollection.example()
182
- >>> rule_collection.next_question(1, {'q1': 'yes'})
183
- NextQuestion(next_q=3, num_rules_found=2, expressions_evaluating_to_true=1, priority=1)
184
-
185
- """
186
- # # is this the first question? If it is, we need to check if it should be skipped.
187
- # if q_now == 0:
188
- # if self.skip_question_before_running(q_now, answers):
189
- # return NextQuestion(
190
- # next_q=q_now + 1,
191
- # num_rules_found=0,
192
- # expressions_evaluating_to_true=0,
193
- # priority=-1,
194
- # )
195
-
196
- # breakpoint()
197
- expressions_evaluating_to_true = 0
198
- next_q = None
199
- highest_priority = -2 # start with -2 to 'pick up' the default rule added
200
- num_rules_found = 0
201
-
202
- for rule in self.applicable_rules(q_now, before_rule=False):
203
- num_rules_found += 1
204
- try:
205
- if rule.evaluate(answers): # evaluates to True
206
- expressions_evaluating_to_true += 1
207
- if rule.priority > highest_priority: # higher priority
208
- # we have a new champ!
209
- next_q, highest_priority = rule.next_q, rule.priority
210
- except SurveyRuleCannotEvaluateError:
211
- raise
212
-
213
- if num_rules_found == 0:
214
- raise SurveyRuleCollectionHasNoRulesAtNodeError(
215
- f"No rules found for question {q_now}"
216
- )
217
-
218
- # breakpoint()
219
- ## Now we need to check if the *next question* has any 'before; rules that we should follow
220
- for rule in self.applicable_rules(next_q, before_rule=True):
221
- if rule.evaluate(answers): # rule evaluates to True
222
- return self.next_question(next_q, answers)
223
-
224
- return NextQuestion(
225
- next_q, num_rules_found, expressions_evaluating_to_true, highest_priority
226
- )
227
-
228
- @property
229
- def non_default_rules(self) -> List[Rule]:
230
- """Return all rules that are not the default rule.
231
-
232
- >>> rule_collection = RuleCollection.example()
233
- >>> len(rule_collection.non_default_rules)
234
- 2
235
-
236
- Example usage:
237
-
238
- .. code-block:: python
239
-
240
- rule_collection = RuleCollection.example()
241
- len(rule_collection.non_default_rules)
242
- 2
243
-
244
- """
245
- return [rule for rule in self if rule.priority > -1]
246
-
247
- def keys_between(self, start_q, end_q, right_inclusive=True):
248
- """Return a list of all question indices between start_q and end_q.
249
-
250
- Example usage:
251
-
252
- .. code-block:: python
253
-
254
- rule_collection = RuleCollection(num_questions=5)
255
- rule_collection.keys_between(1, 3)
256
- [2, 3]
257
- rule_collection.keys_between(1, 4)
258
- [2, 3, 4]
259
- rule_collection.keys_between(1, EndOfSurvey, right_inclusive=False)
260
- [2, 3]
261
-
262
- """
263
- # If it's the end of the survey, all questions between the start_q and the end of the survey
264
- # now depend on the start_q
265
- if end_q == EndOfSurvey:
266
- if self.num_questions is None:
267
- raise ValueError(
268
- "Cannot determine DAG when EndOfSurvey and when num_questions is not known."
269
- )
270
- end_q = self.num_questions - 1
271
-
272
- question_range = list(range(start_q + 1, end_q + int(right_inclusive)))
273
-
274
- return question_range
275
-
276
- @property
277
- def dag(self) -> dict:
278
- """
279
- Find the DAG of the survey, based on the skip logic.
280
-
281
- Keys are children questions; the list of values are nodes that must be answered first
282
-
283
- Rules are designated at the current question and then direct where
284
- control goes next. As such, the destination nodes are the keys
285
- and the current nodes are the values. Furthermore, all questions between
286
- the current and destination nodes are also included as keys, as they will depend
287
- on the answer to the focal node as well.
288
-
289
- For exmaple, if we have a rule that says "if q1 == 'yes', go to q3", then q3 depends on q1, but so does q2.
290
- So the DAG would be {3: [1], 2: [1]}.
291
-
292
- Example usage:
293
-
294
- .. code-block:: python
295
-
296
- rule_collection = RuleCollection(num_questions=5)
297
- qn2i = {'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}
298
- rule_collection.add_rule(Rule(current_q=1, expression="q1 == 'yes'", next_q=3, priority=1, question_name_to_index = qn2i))
299
- rule_collection.add_rule(Rule(current_q=1, expression="q1 == 'no'", next_q=2, priority=1, question_name_to_index = qn2i))
300
- rule_collection.dag
301
- {2: {1}, 3: {1}}
302
-
303
- """
304
- children_to_parents = defaultdict(set)
305
- # We are only interested in non-default rules. Default rules are those
306
- # that just go to the next question, so they don't add any dependencies
307
-
308
- ## I think for a skip-question, the potenially-skippable question
309
- ## depends on all the other questions bein answered first.
310
- for rule in self.non_default_rules:
311
- if not rule.before_rule:
312
- # for a regular rule, the next question depends on the current question answer
313
- current_q, next_q = rule.current_q, rule.next_q
314
- for q in self.keys_between(current_q, next_q):
315
- children_to_parents[q].add(current_q)
316
- else:
317
- # for the 'before rule' skipping depends on all previous answers.
318
- focal_q = rule.current_q
319
- for q in range(0, focal_q):
320
- children_to_parents[focal_q].add(q)
321
-
322
- return DAG(dict(sorted(children_to_parents.items())))
323
-
324
- def detect_cycles(self):
325
- """
326
- Detect cycles in the survey rules using depth-first search.
327
-
328
- :return: A list of cycles if any are found, otherwise an empty list.
329
- """
330
- dag = self.dag
331
- visited = set()
332
- path = []
333
- cycles = []
334
-
335
- def dfs(node):
336
- if node in path:
337
- cycle = path[path.index(node) :]
338
- cycles.append(cycle + [node])
339
- return
340
-
341
- if node in visited:
342
- return
343
-
344
- visited.add(node)
345
- path.append(node)
346
-
347
- for child in dag.get(node, []):
348
- dfs(child)
349
-
350
- path.pop()
351
-
352
- for node in dag:
353
- if node not in visited:
354
- dfs(node)
355
-
356
- return cycles
357
-
358
- @classmethod
359
- def example(cls):
360
- """Create an example RuleCollection object."""
361
- qn2i = {"q1": 1, "q2": 2, "q3": 3, "q4": 4}
362
- return cls(
363
- num_questions=5,
364
- rules=[
365
- Rule(
366
- current_q=1,
367
- expression="q1 == 'yes'",
368
- next_q=3,
369
- priority=1,
370
- question_name_to_index=qn2i,
371
- ),
372
- Rule(
373
- current_q=1,
374
- expression="q1 == 'no'",
375
- next_q=2,
376
- priority=1,
377
- question_name_to_index=qn2i,
378
- ),
379
- ],
380
- )
381
-
382
-
383
- if __name__ == "__main__":
384
- # pass
385
- import doctest
386
-
387
- doctest.testmod(optionflags=doctest.ELLIPSIS)
1
+ """A collection of rules for a survey."""
2
+
3
+ from typing import List, Union, Any, Optional
4
+ from collections import defaultdict, UserList
5
+
6
+ from edsl.exceptions import (
7
+ SurveyRuleCannotEvaluateError,
8
+ SurveyRuleCollectionHasNoRulesAtNodeError,
9
+ )
10
+ from edsl.utilities.interface import print_table_with_rich
11
+ from edsl.surveys.Rule import Rule
12
+ from edsl.surveys.base import EndOfSurvey
13
+ from edsl.surveys.DAG import DAG
14
+
15
+ # from graphlib import TopologicalSorter
16
+
17
+ from collections import namedtuple
18
+
19
+ NextQuestion = namedtuple(
20
+ "NextQuestion", "next_q, num_rules_found, expressions_evaluating_to_true, priority"
21
+ )
22
+
23
+
24
+ class RuleCollection(UserList):
25
+ """A collection of rules for a particular survey."""
26
+
27
+ def __init__(self, num_questions: Optional[int] = None, rules: List[Rule] = None):
28
+ """Initialize the RuleCollection object.
29
+
30
+ :param num_questions: The number of questions in the survey.
31
+ :param rules: A list of Rule objects.
32
+ """
33
+ super().__init__(rules or [])
34
+ self.num_questions = num_questions
35
+
36
+ def __repr__(self):
37
+ """Return a string representation of the RuleCollection object.
38
+
39
+ Example usage:
40
+
41
+ .. code-block:: python
42
+
43
+ rule_collection = RuleCollection.example()
44
+ _ = eval(repr(rule_collection))
45
+
46
+ """
47
+ return f"RuleCollection(rules={self.data}, num_questions={self.num_questions})"
48
+
49
+ def to_dict(self):
50
+ """Create a dictionary representation of the RuleCollection object."""
51
+ return {
52
+ "rules": [rule.to_dict() for rule in self],
53
+ "num_questions": self.num_questions,
54
+ }
55
+
56
+ @classmethod
57
+ def from_dict(cls, rule_collection_dict):
58
+ """Create a RuleCollection object from a dictionary.
59
+
60
+ >>> rule_collection = RuleCollection.example()
61
+ >>> rule_collection_dict = rule_collection.to_dict()
62
+ >>> new_rule_collection = RuleCollection.from_dict(rule_collection_dict)
63
+ >>> repr(new_rule_collection) == repr(rule_collection)
64
+ True
65
+ """
66
+ rules = [
67
+ Rule.from_dict(rule_dict) for rule_dict in rule_collection_dict["rules"]
68
+ ]
69
+ num_questions = rule_collection_dict["num_questions"]
70
+ new_rc = cls(rules=rules)
71
+ new_rc.num_questions = num_questions
72
+ return new_rc
73
+
74
+ def add_rule(self, rule: Rule) -> None:
75
+ """Add a rule to a survey.
76
+
77
+ >>> rule_collection = RuleCollection()
78
+ >>> rule_collection.add_rule(Rule(current_q=1, expression="q1 == 'yes'", next_q=3, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}))
79
+ >>> len(rule_collection)
80
+ 1
81
+
82
+ >>> rule_collection = RuleCollection()
83
+ >>> r = Rule(current_q=1, expression="True", next_q=3, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}, before_rule = True)
84
+ >>> rule_collection.add_rule(r)
85
+ >>> rule_collection[0] == r
86
+ True
87
+ >>> len(rule_collection.applicable_rules(1, before_rule=True))
88
+ 1
89
+ >>> len(rule_collection.applicable_rules(1, before_rule=False))
90
+ 0
91
+ """
92
+ self.append(rule)
93
+
94
+ def show_rules(self) -> None:
95
+ """Print the rules in a table.
96
+
97
+
98
+ .. code-block:: python
99
+
100
+ rule_collection = RuleCollection.example()
101
+ rule_collection.show_rules()
102
+ ┏━━━━━━━━━━━┳━━━━━━━━━━━━━┳━━━━━━━━┳━━━━━━━━━━┳━━━━━━━━━━━━━┓
103
+ ┃ current_q ┃ expression ┃ next_q ┃ priority ┃ before_rule ┃
104
+ ┡━━━━━━━━━━━╇━━━━━━━━━━━━━╇━━━━━━━━╇━━━━━━━━━━╇━━━━━━━━━━━━━┩
105
+ │ 1 │ q1 == 'yes' │ 3 │ 1 │ False │
106
+ │ 1 │ q1 == 'no' │ 2 │ 1 │ False │
107
+ └───────────┴─────────────┴────────┴──────────┴─────────────┘
108
+ """
109
+ keys = ["current_q", "expression", "next_q", "priority", "before_rule"]
110
+ rule_list = []
111
+ for rule in sorted(self, key=lambda r: r.current_q):
112
+ rule_list.append({k: getattr(rule, k) for k in keys})
113
+
114
+ print_table_with_rich(rule_list)
115
+
116
def skip_question_before_running(self, q_now: int, answers: dict[str, Any]) -> bool:
    """Tell whether question ``q_now`` should be skipped before it is asked.

    The question is skipped as soon as one of its "before" rules evaluates
    to a truthy value against ``answers``; later rules are not evaluated.

    :param q_now: The current question index.
    :param answers: The answers to the survey questions.
    :return: True if any before-rule at ``q_now`` holds, otherwise False.

    >>> rule_collection = RuleCollection()
    >>> r = Rule(current_q=1, expression="True", next_q=2, priority=1, question_name_to_index={}, before_rule = True)
    >>> rule_collection.add_rule(r)
    >>> rule_collection.skip_question_before_running(1, {})
    True

    >>> rule_collection = RuleCollection()
    >>> r = Rule(current_q=1, expression="False", next_q=2, priority=1, question_name_to_index={}, before_rule = True)
    >>> rule_collection.add_rule(r)
    >>> rule_collection.skip_question_before_running(1, {})
    False

    """
    before_rules = self.applicable_rules(q_now, before_rule=True)
    # any() short-circuits on the first rule that holds.
    return any(rule.evaluate(answers) for rule in before_rules)
139
+
140
def applicable_rules(self, q_now: int, before_rule: bool = False) -> list:
    """Return the rules attached to question ``q_now``.

    :param q_now: The current question index.
    :param before_rule: If True, return rules that are of the type that apply before the question is asked.

    Example usage:

    >>> rule_collection = RuleCollection.example()
    >>> rule_collection.applicable_rules(1)
    [Rule(current_q=1, expression="q1 == 'yes'", next_q=3, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}, before_rule=False), Rule(current_q=1, expression="q1 == 'no'", next_q=2, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}, before_rule=False)]

    By default only rules applied *after* the question is asked are returned.
    To see the rules that apply *before* the question is asked, pass
    ``before_rule=True``:

    .. code-block:: python

        rule_collection = RuleCollection.example()
        rule_collection.applicable_rules(1, before_rule=True)

    More than one rule can apply. For example, suppose we are at node 1.
    We could have three rules:

    1. "q1 == 'a'" ==> 3
    2. "q1 == 'b'" ==> 4
    3. "q1 == 'c'" ==> 5
    """

    def _matches(candidate) -> bool:
        # A rule applies when both its node and its before/after kind match.
        return candidate.current_q == q_now and candidate.before_rule == before_rule

    return list(filter(_matches, self))
172
+
173
def next_question(self, q_now: int, answers: dict[str, Any]) -> NextQuestion:
    """Find the next question by index, given the rule collection.

    The "after" rules attached to ``q_now`` are evaluated against ``answers``;
    among those that hold, the one with the highest priority decides the
    destination. If the destination itself has a "before" rule that holds,
    that question is skipped and the search continues from it.

    :param q_now: The current question index.
    :param answers: The answers to the survey questions so far, including the current question.
    :return: A ``NextQuestion`` with the destination, the number of rules
        found at the final node, how many of them evaluated to true, and the
        winning priority. ``next_q`` is None when no rule evaluated to true.
    :raises SurveyRuleCollectionHasNoRulesAtNodeError: If no "after" rule is
        attached to ``q_now``.

    Any exception raised while evaluating a rule (for example
    ``SurveyRuleCannotEvaluateError``) propagates to the caller unchanged.

    >>> rule_collection = RuleCollection.example()
    >>> rule_collection.next_question(1, {'q1': 'yes'})
    NextQuestion(next_q=3, num_rules_found=2, expressions_evaluating_to_true=1, priority=1)

    """
    expressions_evaluating_to_true = 0
    next_q = None
    # Start at -2 so that even the lowest-priority rules (non_default_rules
    # treats priority -1 and below as defaults) can be picked up.
    highest_priority = -2
    num_rules_found = 0

    for rule in self.applicable_rules(q_now, before_rule=False):
        num_rules_found += 1
        if rule.evaluate(answers):
            expressions_evaluating_to_true += 1
            # Strict comparison: on a priority tie the earlier rule wins.
            if rule.priority > highest_priority:
                next_q, highest_priority = rule.next_q, rule.priority

    if num_rules_found == 0:
        raise SurveyRuleCollectionHasNoRulesAtNodeError(
            f"No rules found for question {q_now}"
        )

    # If the chosen destination has a "before" rule that holds, it must be
    # skipped: resolve where to go from that question instead.
    if self.skip_question_before_running(next_q, answers):
        return self.next_question(next_q, answers)

    return NextQuestion(
        next_q, num_rules_found, expressions_evaluating_to_true, highest_priority
    )
227
+
228
@property
def non_default_rules(self) -> List[Rule]:
    """Return the rules whose priority is greater than -1.

    Rules with priority -1 or lower are treated as default rules and are
    left out.

    >>> rule_collection = RuleCollection.example()
    >>> len(rule_collection.non_default_rules)
    2

    Example usage:

    .. code-block:: python

        rule_collection = RuleCollection.example()
        len(rule_collection.non_default_rules)
        2

    """
    explicit_rules = []
    for rule in self:
        if rule.priority > -1:
            explicit_rules.append(rule)
    return explicit_rules
246
+
247
def keys_between(self, start_q, end_q, right_inclusive=True):
    """List the question indices after ``start_q`` up to ``end_q``.

    ``start_q`` itself is never included; ``end_q`` is included only when
    ``right_inclusive`` is true. When ``end_q`` is ``EndOfSurvey`` it is
    replaced by the index of the last question (``num_questions - 1``).

    :raises ValueError: If ``end_q`` is ``EndOfSurvey`` and ``num_questions``
        is None.

    Example usage:

    .. code-block:: python

        rule_collection = RuleCollection(num_questions=5)
        rule_collection.keys_between(1, 3)
        [2, 3]
        rule_collection.keys_between(1, 4)
        [2, 3, 4]
        rule_collection.keys_between(1, EndOfSurvey, right_inclusive=False)
        [2, 3]

    """
    if end_q == EndOfSurvey:
        # Every question from start_q to the end of the survey depends on
        # start_q, so the survey length is needed to resolve the upper bound.
        total_questions = self.num_questions
        if total_questions is None:
            raise ValueError(
                "Cannot determine DAG when EndOfSurvey and when num_questions is not known."
            )
        end_q = total_questions - 1

    first = start_q + 1
    stop = end_q + int(right_inclusive)
    return list(range(first, stop))
275
+
276
@property
def dag(self) -> dict:
    """
    Find the DAG of the survey, based on the skip logic.

    Keys are child questions; each value is the set of questions that must
    be answered first.

    Rules are attached to the current question and direct where control goes
    next. As such, the destination nodes are the keys and the current nodes
    are the values. Furthermore, all questions between the current and
    destination nodes are also included as keys, as they depend on the
    answer to the focal node as well.

    For example, if we have a rule that says "if q1 == 'yes', go to q3",
    then q3 depends on q1, but so does q2.
    So the DAG would be {2: {1}, 3: {1}}.

    A "before" rule makes its own question depend on every earlier question.

    Example usage:

    .. code-block:: python

        rule_collection = RuleCollection(num_questions=5)
        qn2i = {'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}
        rule_collection.add_rule(Rule(current_q=1, expression="q1 == 'yes'", next_q=3, priority=1, question_name_to_index = qn2i))
        rule_collection.add_rule(Rule(current_q=1, expression="q1 == 'no'", next_q=2, priority=1, question_name_to_index = qn2i))
        rule_collection.dag
        {2: {1}, 3: {1}}

    """
    parents_of = defaultdict(set)

    # Only non-default rules are considered: default rules just move on to
    # the next question, so they add no dependencies.
    for rule in self.non_default_rules:
        origin = rule.current_q

        if rule.before_rule:
            # Skipping a question up front depends on all previous answers.
            for earlier in range(origin):
                parents_of[origin].add(earlier)
            continue

        # Regular rule: the destination, and everything jumped over on the
        # way there, depends on the answer to the current question.
        for dependent in self.keys_between(origin, rule.next_q):
            parents_of[dependent].add(origin)

    ordered_items = sorted(parents_of.items())
    return DAG(dict(ordered_items))
323
+
324
def detect_cycles(self):
    """
    Detect cycles in the survey rules using depth-first search.

    The search walks ``self.dag``, following each node to the nodes listed
    under it (for the DAG built by this class, from a question to the
    questions it depends on).

    :return: A list of cycles if any are found, otherwise an empty list.
        Each cycle is a list of nodes that starts and ends with the same node.
    """
    graph = self.dag
    seen = set()
    trail = []  # nodes on the current DFS path, in visiting order
    found = []

    def _walk(current):
        if current in trail:
            # Back on a node of the active path: everything from its first
            # occurrence onwards forms a cycle.
            start = trail.index(current)
            found.append([*trail[start:], current])
            return

        if current in seen:
            return

        seen.add(current)
        trail.append(current)

        for neighbour in graph.get(current, []):
            _walk(neighbour)

        trail.pop()

    for root in graph:
        if root in seen:
            continue
        _walk(root)

    return found
357
+
358
@classmethod
def example(cls):
    """Create an example RuleCollection object.

    The example has five questions and two priority-1 rules at question 1:
    answering 'yes' jumps to question 3, answering 'no' goes to question 2.
    """
    name_to_index = {"q1": 1, "q2": 2, "q3": 3, "q4": 4}
    # (expression, destination) pairs; both rules share the same name mapping.
    branches = [("q1 == 'yes'", 3), ("q1 == 'no'", 2)]
    rules = [
        Rule(
            current_q=1,
            expression=expression,
            next_q=destination,
            priority=1,
            question_name_to_index=name_to_index,
        )
        for expression, destination in branches
    ]
    return cls(num_questions=5, rules=rules)
381
+
382
+
383
if __name__ == "__main__":
    # Run this module's doctests when it is executed as a script.
    from doctest import ELLIPSIS, testmod

    testmod(optionflags=ELLIPSIS)