edsl 0.1.37__py3-none-any.whl → 0.1.37.dev3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (261):
  1. edsl/Base.py +303 -303
  2. edsl/BaseDiff.py +260 -260
  3. edsl/TemplateLoader.py +24 -24
  4. edsl/__init__.py +48 -48
  5. edsl/__version__.py +1 -1
  6. edsl/agents/Agent.py +804 -855
  7. edsl/agents/AgentList.py +345 -350
  8. edsl/agents/Invigilator.py +222 -222
  9. edsl/agents/InvigilatorBase.py +305 -284
  10. edsl/agents/PromptConstructor.py +312 -353
  11. edsl/agents/__init__.py +3 -3
  12. edsl/agents/descriptors.py +86 -99
  13. edsl/agents/prompt_helpers.py +129 -129
  14. edsl/auto/AutoStudy.py +117 -117
  15. edsl/auto/StageBase.py +230 -230
  16. edsl/auto/StageGenerateSurvey.py +178 -178
  17. edsl/auto/StageLabelQuestions.py +125 -125
  18. edsl/auto/StagePersona.py +61 -61
  19. edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
  20. edsl/auto/StagePersonaDimensionValues.py +74 -74
  21. edsl/auto/StagePersonaDimensions.py +69 -69
  22. edsl/auto/StageQuestions.py +73 -73
  23. edsl/auto/SurveyCreatorPipeline.py +21 -21
  24. edsl/auto/utilities.py +224 -224
  25. edsl/base/Base.py +289 -289
  26. edsl/config.py +149 -149
  27. edsl/conjure/AgentConstructionMixin.py +152 -160
  28. edsl/conjure/Conjure.py +62 -62
  29. edsl/conjure/InputData.py +659 -659
  30. edsl/conjure/InputDataCSV.py +48 -48
  31. edsl/conjure/InputDataMixinQuestionStats.py +182 -182
  32. edsl/conjure/InputDataPyRead.py +91 -91
  33. edsl/conjure/InputDataSPSS.py +8 -8
  34. edsl/conjure/InputDataStata.py +8 -8
  35. edsl/conjure/QuestionOptionMixin.py +76 -76
  36. edsl/conjure/QuestionTypeMixin.py +23 -23
  37. edsl/conjure/RawQuestion.py +65 -65
  38. edsl/conjure/SurveyResponses.py +7 -7
  39. edsl/conjure/__init__.py +9 -9
  40. edsl/conjure/naming_utilities.py +263 -263
  41. edsl/conjure/utilities.py +201 -201
  42. edsl/conversation/Conversation.py +238 -290
  43. edsl/conversation/car_buying.py +58 -58
  44. edsl/conversation/mug_negotiation.py +81 -81
  45. edsl/conversation/next_speaker_utilities.py +93 -93
  46. edsl/coop/PriceFetcher.py +54 -54
  47. edsl/coop/__init__.py +2 -2
  48. edsl/coop/coop.py +824 -958
  49. edsl/coop/utils.py +131 -131
  50. edsl/data/Cache.py +527 -527
  51. edsl/data/CacheEntry.py +228 -228
  52. edsl/data/CacheHandler.py +149 -149
  53. edsl/data/RemoteCacheSync.py +97 -97
  54. edsl/data/SQLiteDict.py +292 -292
  55. edsl/data/__init__.py +4 -4
  56. edsl/data/orm.py +10 -10
  57. edsl/data_transfer_models.py +73 -73
  58. edsl/enums.py +173 -173
  59. edsl/exceptions/__init__.py +50 -54
  60. edsl/exceptions/agents.py +40 -38
  61. edsl/exceptions/configuration.py +16 -16
  62. edsl/exceptions/coop.py +10 -10
  63. edsl/exceptions/data.py +14 -14
  64. edsl/exceptions/general.py +34 -34
  65. edsl/exceptions/jobs.py +33 -33
  66. edsl/exceptions/language_models.py +63 -63
  67. edsl/exceptions/prompts.py +15 -15
  68. edsl/exceptions/questions.py +91 -91
  69. edsl/exceptions/results.py +26 -29
  70. edsl/exceptions/surveys.py +34 -37
  71. edsl/inference_services/AnthropicService.py +87 -87
  72. edsl/inference_services/AwsBedrock.py +115 -120
  73. edsl/inference_services/AzureAI.py +217 -217
  74. edsl/inference_services/DeepInfraService.py +18 -18
  75. edsl/inference_services/GoogleService.py +156 -156
  76. edsl/inference_services/GroqService.py +20 -20
  77. edsl/inference_services/InferenceServiceABC.py +147 -147
  78. edsl/inference_services/InferenceServicesCollection.py +74 -97
  79. edsl/inference_services/MistralAIService.py +123 -123
  80. edsl/inference_services/OllamaService.py +18 -18
  81. edsl/inference_services/OpenAIService.py +224 -224
  82. edsl/inference_services/TestService.py +89 -89
  83. edsl/inference_services/TogetherAIService.py +170 -170
  84. edsl/inference_services/models_available_cache.py +118 -118
  85. edsl/inference_services/rate_limits_cache.py +25 -25
  86. edsl/inference_services/registry.py +39 -39
  87. edsl/inference_services/write_available.py +10 -10
  88. edsl/jobs/Answers.py +56 -56
  89. edsl/jobs/Jobs.py +1121 -1347
  90. edsl/jobs/__init__.py +1 -1
  91. edsl/jobs/buckets/BucketCollection.py +63 -63
  92. edsl/jobs/buckets/ModelBuckets.py +65 -65
  93. edsl/jobs/buckets/TokenBucket.py +248 -248
  94. edsl/jobs/interviews/Interview.py +661 -661
  95. edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
  96. edsl/jobs/interviews/InterviewExceptionEntry.py +182 -186
  97. edsl/jobs/interviews/InterviewStatistic.py +63 -63
  98. edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
  99. edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
  100. edsl/jobs/interviews/InterviewStatusLog.py +92 -92
  101. edsl/jobs/interviews/ReportErrors.py +66 -66
  102. edsl/jobs/interviews/interview_status_enum.py +9 -9
  103. edsl/jobs/runners/JobsRunnerAsyncio.py +338 -338
  104. edsl/jobs/runners/JobsRunnerStatus.py +332 -332
  105. edsl/jobs/tasks/QuestionTaskCreator.py +242 -242
  106. edsl/jobs/tasks/TaskCreators.py +64 -64
  107. edsl/jobs/tasks/TaskHistory.py +441 -442
  108. edsl/jobs/tasks/TaskStatusLog.py +23 -23
  109. edsl/jobs/tasks/task_status_enum.py +163 -163
  110. edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
  111. edsl/jobs/tokens/TokenUsage.py +34 -34
  112. edsl/language_models/LanguageModel.py +718 -706
  113. edsl/language_models/ModelList.py +102 -102
  114. edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
  115. edsl/language_models/__init__.py +2 -3
  116. edsl/language_models/fake_openai_call.py +15 -15
  117. edsl/language_models/fake_openai_service.py +61 -61
  118. edsl/language_models/registry.py +137 -137
  119. edsl/language_models/repair.py +156 -156
  120. edsl/language_models/unused/ReplicateBase.py +83 -83
  121. edsl/language_models/utilities.py +64 -64
  122. edsl/notebooks/Notebook.py +259 -259
  123. edsl/notebooks/__init__.py +1 -1
  124. edsl/prompts/Prompt.py +353 -357
  125. edsl/prompts/__init__.py +2 -2
  126. edsl/questions/AnswerValidatorMixin.py +289 -289
  127. edsl/questions/QuestionBase.py +616 -656
  128. edsl/questions/QuestionBaseGenMixin.py +161 -161
  129. edsl/questions/QuestionBasePromptsMixin.py +266 -234
  130. edsl/questions/QuestionBudget.py +227 -227
  131. edsl/questions/QuestionCheckBox.py +359 -359
  132. edsl/questions/QuestionExtract.py +183 -183
  133. edsl/questions/QuestionFreeText.py +114 -114
  134. edsl/questions/QuestionFunctional.py +159 -159
  135. edsl/questions/QuestionList.py +231 -231
  136. edsl/questions/QuestionMultipleChoice.py +286 -286
  137. edsl/questions/QuestionNumerical.py +153 -153
  138. edsl/questions/QuestionRank.py +324 -324
  139. edsl/questions/Quick.py +41 -41
  140. edsl/questions/RegisterQuestionsMeta.py +71 -71
  141. edsl/questions/ResponseValidatorABC.py +174 -174
  142. edsl/questions/SimpleAskMixin.py +73 -73
  143. edsl/questions/__init__.py +26 -26
  144. edsl/questions/compose_questions.py +98 -98
  145. edsl/questions/decorators.py +21 -21
  146. edsl/questions/derived/QuestionLikertFive.py +76 -76
  147. edsl/questions/derived/QuestionLinearScale.py +87 -87
  148. edsl/questions/derived/QuestionTopK.py +91 -91
  149. edsl/questions/derived/QuestionYesNo.py +82 -82
  150. edsl/questions/descriptors.py +418 -413
  151. edsl/questions/prompt_templates/question_budget.jinja +13 -13
  152. edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
  153. edsl/questions/prompt_templates/question_extract.jinja +11 -11
  154. edsl/questions/prompt_templates/question_free_text.jinja +3 -3
  155. edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
  156. edsl/questions/prompt_templates/question_list.jinja +17 -17
  157. edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
  158. edsl/questions/prompt_templates/question_numerical.jinja +36 -36
  159. edsl/questions/question_registry.py +147 -147
  160. edsl/questions/settings.py +12 -12
  161. edsl/questions/templates/budget/answering_instructions.jinja +7 -7
  162. edsl/questions/templates/budget/question_presentation.jinja +7 -7
  163. edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
  164. edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
  165. edsl/questions/templates/extract/answering_instructions.jinja +7 -7
  166. edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
  167. edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
  168. edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
  169. edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
  170. edsl/questions/templates/list/answering_instructions.jinja +3 -3
  171. edsl/questions/templates/list/question_presentation.jinja +5 -5
  172. edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
  173. edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
  174. edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
  175. edsl/questions/templates/numerical/question_presentation.jinja +6 -6
  176. edsl/questions/templates/rank/answering_instructions.jinja +11 -11
  177. edsl/questions/templates/rank/question_presentation.jinja +15 -15
  178. edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
  179. edsl/questions/templates/top_k/question_presentation.jinja +22 -22
  180. edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
  181. edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
  182. edsl/results/Dataset.py +293 -293
  183. edsl/results/DatasetExportMixin.py +693 -717
  184. edsl/results/DatasetTree.py +145 -145
  185. edsl/results/Result.py +435 -450
  186. edsl/results/Results.py +1160 -1071
  187. edsl/results/ResultsDBMixin.py +238 -238
  188. edsl/results/ResultsExportMixin.py +43 -43
  189. edsl/results/ResultsFetchMixin.py +33 -33
  190. edsl/results/ResultsGGMixin.py +121 -121
  191. edsl/results/ResultsToolsMixin.py +98 -98
  192. edsl/results/Selector.py +118 -135
  193. edsl/results/__init__.py +2 -2
  194. edsl/results/tree_explore.py +115 -115
  195. edsl/scenarios/FileStore.py +458 -458
  196. edsl/scenarios/Scenario.py +510 -546
  197. edsl/scenarios/ScenarioHtmlMixin.py +59 -64
  198. edsl/scenarios/ScenarioList.py +1101 -1112
  199. edsl/scenarios/ScenarioListExportMixin.py +52 -52
  200. edsl/scenarios/ScenarioListPdfMixin.py +261 -261
  201. edsl/scenarios/__init__.py +4 -4
  202. edsl/shared.py +1 -1
  203. edsl/study/ObjectEntry.py +173 -173
  204. edsl/study/ProofOfWork.py +113 -113
  205. edsl/study/SnapShot.py +80 -80
  206. edsl/study/Study.py +528 -528
  207. edsl/study/__init__.py +4 -4
  208. edsl/surveys/DAG.py +148 -148
  209. edsl/surveys/Memory.py +31 -31
  210. edsl/surveys/MemoryPlan.py +244 -244
  211. edsl/surveys/Rule.py +324 -330
  212. edsl/surveys/RuleCollection.py +387 -387
  213. edsl/surveys/Survey.py +1772 -1795
  214. edsl/surveys/SurveyCSS.py +261 -261
  215. edsl/surveys/SurveyExportMixin.py +259 -259
  216. edsl/surveys/SurveyFlowVisualizationMixin.py +121 -121
  217. edsl/surveys/SurveyQualtricsImport.py +284 -284
  218. edsl/surveys/__init__.py +3 -3
  219. edsl/surveys/base.py +53 -53
  220. edsl/surveys/descriptors.py +56 -56
  221. edsl/surveys/instructions/ChangeInstruction.py +47 -47
  222. edsl/surveys/instructions/Instruction.py +51 -51
  223. edsl/surveys/instructions/InstructionCollection.py +77 -77
  224. edsl/templates/error_reporting/base.html +23 -23
  225. edsl/templates/error_reporting/exceptions_by_model.html +34 -34
  226. edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
  227. edsl/templates/error_reporting/exceptions_by_type.html +16 -16
  228. edsl/templates/error_reporting/interview_details.html +115 -115
  229. edsl/templates/error_reporting/interviews.html +9 -9
  230. edsl/templates/error_reporting/overview.html +4 -4
  231. edsl/templates/error_reporting/performance_plot.html +1 -1
  232. edsl/templates/error_reporting/report.css +73 -73
  233. edsl/templates/error_reporting/report.html +117 -117
  234. edsl/templates/error_reporting/report.js +25 -25
  235. edsl/tools/__init__.py +1 -1
  236. edsl/tools/clusters.py +192 -192
  237. edsl/tools/embeddings.py +27 -27
  238. edsl/tools/embeddings_plotting.py +118 -118
  239. edsl/tools/plotting.py +112 -112
  240. edsl/tools/summarize.py +18 -18
  241. edsl/utilities/SystemInfo.py +28 -28
  242. edsl/utilities/__init__.py +22 -22
  243. edsl/utilities/ast_utilities.py +25 -25
  244. edsl/utilities/data/Registry.py +6 -6
  245. edsl/utilities/data/__init__.py +1 -1
  246. edsl/utilities/data/scooter_results.json +1 -1
  247. edsl/utilities/decorators.py +77 -77
  248. edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
  249. edsl/utilities/interface.py +627 -627
  250. edsl/utilities/repair_functions.py +28 -28
  251. edsl/utilities/restricted_python.py +70 -70
  252. edsl/utilities/utilities.py +391 -409
  253. {edsl-0.1.37.dist-info → edsl-0.1.37.dev3.dist-info}/LICENSE +21 -21
  254. {edsl-0.1.37.dist-info → edsl-0.1.37.dev3.dist-info}/METADATA +1 -1
  255. edsl-0.1.37.dev3.dist-info/RECORD +279 -0
  256. edsl/conversation/chips.py +0 -95
  257. edsl/exceptions/BaseException.py +0 -21
  258. edsl/exceptions/scenarios.py +0 -22
  259. edsl/language_models/KeyLookup.py +0 -30
  260. edsl-0.1.37.dist-info/RECORD +0 -283
  261. {edsl-0.1.37.dist-info → edsl-0.1.37.dev3.dist-info}/WHEEL +0 -0
@@ -1,387 +1,387 @@
1
- """A collection of rules for a survey."""
2
-
3
- from typing import List, Union, Any, Optional
4
- from collections import defaultdict, UserList
5
-
6
- from edsl.exceptions import (
7
- SurveyRuleCannotEvaluateError,
8
- SurveyRuleCollectionHasNoRulesAtNodeError,
9
- )
10
- from edsl.utilities.interface import print_table_with_rich
11
- from edsl.surveys.Rule import Rule
12
- from edsl.surveys.base import EndOfSurvey
13
- from edsl.surveys.DAG import DAG
14
-
15
- # from graphlib import TopologicalSorter
16
-
17
- from collections import namedtuple
18
-
19
- NextQuestion = namedtuple(
20
- "NextQuestion", "next_q, num_rules_found, expressions_evaluating_to_true, priority"
21
- )
22
-
23
-
24
- class RuleCollection(UserList):
25
- """A collection of rules for a particular survey."""
26
-
27
- def __init__(self, num_questions: Optional[int] = None, rules: List[Rule] = None):
28
- """Initialize the RuleCollection object.
29
-
30
- :param num_questions: The number of questions in the survey.
31
- :param rules: A list of Rule objects.
32
- """
33
- super().__init__(rules or [])
34
- self.num_questions = num_questions
35
-
36
- def __repr__(self):
37
- """Return a string representation of the RuleCollection object.
38
-
39
- Example usage:
40
-
41
- .. code-block:: python
42
-
43
- rule_collection = RuleCollection.example()
44
- _ = eval(repr(rule_collection))
45
-
46
- """
47
- return f"RuleCollection(rules={self.data}, num_questions={self.num_questions})"
48
-
49
- def to_dict(self):
50
- """Create a dictionary representation of the RuleCollection object."""
51
- return {
52
- "rules": [rule.to_dict() for rule in self],
53
- "num_questions": self.num_questions,
54
- }
55
-
56
- @classmethod
57
- def from_dict(cls, rule_collection_dict):
58
- """Create a RuleCollection object from a dictionary.
59
-
60
- >>> rule_collection = RuleCollection.example()
61
- >>> rule_collection_dict = rule_collection.to_dict()
62
- >>> new_rule_collection = RuleCollection.from_dict(rule_collection_dict)
63
- >>> repr(new_rule_collection) == repr(rule_collection)
64
- True
65
- """
66
- rules = [
67
- Rule.from_dict(rule_dict) for rule_dict in rule_collection_dict["rules"]
68
- ]
69
- num_questions = rule_collection_dict["num_questions"]
70
- new_rc = cls(rules=rules)
71
- new_rc.num_questions = num_questions
72
- return new_rc
73
-
74
- def add_rule(self, rule: Rule) -> None:
75
- """Add a rule to a survey.
76
-
77
- >>> rule_collection = RuleCollection()
78
- >>> rule_collection.add_rule(Rule(current_q=1, expression="q1 == 'yes'", next_q=3, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}))
79
- >>> len(rule_collection)
80
- 1
81
-
82
- >>> rule_collection = RuleCollection()
83
- >>> r = Rule(current_q=1, expression="True", next_q=3, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}, before_rule = True)
84
- >>> rule_collection.add_rule(r)
85
- >>> rule_collection[0] == r
86
- True
87
- >>> len(rule_collection.applicable_rules(1, before_rule=True))
88
- 1
89
- >>> len(rule_collection.applicable_rules(1, before_rule=False))
90
- 0
91
- """
92
- self.append(rule)
93
-
94
- def show_rules(self) -> None:
95
- """Print the rules in a table.
96
-
97
-
98
- .. code-block:: python
99
-
100
- rule_collection = RuleCollection.example()
101
- rule_collection.show_rules()
102
- ┏━━━━━━━━━━━┳━━━━━━━━━━━━━┳━━━━━━━━┳━━━━━━━━━━┳━━━━━━━━━━━━━┓
103
- ┃ current_q ┃ expression ┃ next_q ┃ priority ┃ before_rule ┃
104
- ┡━━━━━━━━━━━╇━━━━━━━━━━━━━╇━━━━━━━━╇━━━━━━━━━━╇━━━━━━━━━━━━━┩
105
- │ 1 │ q1 == 'yes' │ 3 │ 1 │ False │
106
- │ 1 │ q1 == 'no' │ 2 │ 1 │ False │
107
- └───────────┴─────────────┴────────┴──────────┴─────────────┘
108
- """
109
- keys = ["current_q", "expression", "next_q", "priority", "before_rule"]
110
- rule_list = []
111
- for rule in sorted(self, key=lambda r: r.current_q):
112
- rule_list.append({k: getattr(rule, k) for k in keys})
113
-
114
- print_table_with_rich(rule_list)
115
-
116
- def skip_question_before_running(self, q_now: int, answers: dict[str, Any]) -> bool:
117
- """Determine if a question should be skipped before running the question.
118
-
119
- :param q_now: The current question index.
120
- :param answers: The answers to the survey questions.
121
-
122
- >>> rule_collection = RuleCollection()
123
- >>> r = Rule(current_q=1, expression="True", next_q=2, priority=1, question_name_to_index={}, before_rule = True)
124
- >>> rule_collection.add_rule(r)
125
- >>> rule_collection.skip_question_before_running(1, {})
126
- True
127
-
128
- >>> rule_collection = RuleCollection()
129
- >>> r = Rule(current_q=1, expression="False", next_q=2, priority=1, question_name_to_index={}, before_rule = True)
130
- >>> rule_collection.add_rule(r)
131
- >>> rule_collection.skip_question_before_running(1, {})
132
- False
133
-
134
- """
135
- for rule in self.applicable_rules(q_now, before_rule=True):
136
- if rule.evaluate(answers):
137
- return True
138
- return False
139
-
140
- def applicable_rules(self, q_now: int, before_rule: bool = False) -> list:
141
- """Show the rules that apply at the current node.
142
-
143
- :param q_now: The current question index.
144
- :param before_rule: If True, return rules that are of the type that apply before the question is asked.
145
-
146
- Example usage:
147
-
148
- >>> rule_collection = RuleCollection.example()
149
- >>> rule_collection.applicable_rules(1)
150
- [Rule(current_q=1, expression="q1 == 'yes'", next_q=3, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}, before_rule=False), Rule(current_q=1, expression="q1 == 'no'", next_q=2, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}, before_rule=False)]
151
-
152
- The default is that the rule is applied after the question is asked.
153
- If we want to see the rules that apply before the question is asked, we can set before_rule=True.
154
-
155
- .. code-block:: python
156
-
157
- rule_collection = RuleCollection.example()
158
- rule_collection.applicable_rules(1)
159
- [Rule(current_q=1, expression="q1 == 'yes'", next_q=3, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}), Rule(current_q=1, expression="q1 == 'no'", next_q=2, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4})]
160
-
161
- More than one rule can apply. For example, suppose we are at node 1.
162
- We could have three rules:
163
- 1. "q1 == 'a' ==> 3
164
- 2. "q1 == 'b' ==> 4
165
- 3. "q1 == 'c' ==> 5
166
- """
167
- return [
168
- rule
169
- for rule in self
170
- if rule.current_q == q_now and rule.before_rule == before_rule
171
- ]
172
-
173
- def next_question(self, q_now: int, answers: dict[str, Any]) -> NextQuestion:
174
- """Find the next question by index, given the rule collection.
175
-
176
- This rule is applied after the question is answered.
177
-
178
- :param q_now: The current question index.
179
- :param answers: The answers to the survey questions so far, including the current question.
180
-
181
- >>> rule_collection = RuleCollection.example()
182
- >>> rule_collection.next_question(1, {'q1': 'yes'})
183
- NextQuestion(next_q=3, num_rules_found=2, expressions_evaluating_to_true=1, priority=1)
184
-
185
- """
186
- # # is this the first question? If it is, we need to check if it should be skipped.
187
- # if q_now == 0:
188
- # if self.skip_question_before_running(q_now, answers):
189
- # return NextQuestion(
190
- # next_q=q_now + 1,
191
- # num_rules_found=0,
192
- # expressions_evaluating_to_true=0,
193
- # priority=-1,
194
- # )
195
-
196
- # breakpoint()
197
- expressions_evaluating_to_true = 0
198
- next_q = None
199
- highest_priority = -2 # start with -2 to 'pick up' the default rule added
200
- num_rules_found = 0
201
-
202
- for rule in self.applicable_rules(q_now, before_rule=False):
203
- num_rules_found += 1
204
- try:
205
- if rule.evaluate(answers): # evaluates to True
206
- expressions_evaluating_to_true += 1
207
- if rule.priority > highest_priority: # higher priority
208
- # we have a new champ!
209
- next_q, highest_priority = rule.next_q, rule.priority
210
- except SurveyRuleCannotEvaluateError:
211
- raise
212
-
213
- if num_rules_found == 0:
214
- raise SurveyRuleCollectionHasNoRulesAtNodeError(
215
- f"No rules found for question {q_now}"
216
- )
217
-
218
- # breakpoint()
219
- ## Now we need to check if the *next question* has any 'before; rules that we should follow
220
- for rule in self.applicable_rules(next_q, before_rule=True):
221
- if rule.evaluate(answers): # rule evaluates to True
222
- return self.next_question(next_q, answers)
223
-
224
- return NextQuestion(
225
- next_q, num_rules_found, expressions_evaluating_to_true, highest_priority
226
- )
227
-
228
- @property
229
- def non_default_rules(self) -> List[Rule]:
230
- """Return all rules that are not the default rule.
231
-
232
- >>> rule_collection = RuleCollection.example()
233
- >>> len(rule_collection.non_default_rules)
234
- 2
235
-
236
- Example usage:
237
-
238
- .. code-block:: python
239
-
240
- rule_collection = RuleCollection.example()
241
- len(rule_collection.non_default_rules)
242
- 2
243
-
244
- """
245
- return [rule for rule in self if rule.priority > -1]
246
-
247
- def keys_between(self, start_q, end_q, right_inclusive=True):
248
- """Return a list of all question indices between start_q and end_q.
249
-
250
- Example usage:
251
-
252
- .. code-block:: python
253
-
254
- rule_collection = RuleCollection(num_questions=5)
255
- rule_collection.keys_between(1, 3)
256
- [2, 3]
257
- rule_collection.keys_between(1, 4)
258
- [2, 3, 4]
259
- rule_collection.keys_between(1, EndOfSurvey, right_inclusive=False)
260
- [2, 3]
261
-
262
- """
263
- # If it's the end of the survey, all questions between the start_q and the end of the survey
264
- # now depend on the start_q
265
- if end_q == EndOfSurvey:
266
- if self.num_questions is None:
267
- raise ValueError(
268
- "Cannot determine DAG when EndOfSurvey and when num_questions is not known."
269
- )
270
- end_q = self.num_questions - 1
271
-
272
- question_range = list(range(start_q + 1, end_q + int(right_inclusive)))
273
-
274
- return question_range
275
-
276
- @property
277
- def dag(self) -> dict:
278
- """
279
- Find the DAG of the survey, based on the skip logic.
280
-
281
- Keys are children questions; the list of values are nodes that must be answered first
282
-
283
- Rules are designated at the current question and then direct where
284
- control goes next. As such, the destination nodes are the keys
285
- and the current nodes are the values. Furthermore, all questions between
286
- the current and destination nodes are also included as keys, as they will depend
287
- on the answer to the focal node as well.
288
-
289
- For exmaple, if we have a rule that says "if q1 == 'yes', go to q3", then q3 depends on q1, but so does q2.
290
- So the DAG would be {3: [1], 2: [1]}.
291
-
292
- Example usage:
293
-
294
- .. code-block:: python
295
-
296
- rule_collection = RuleCollection(num_questions=5)
297
- qn2i = {'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}
298
- rule_collection.add_rule(Rule(current_q=1, expression="q1 == 'yes'", next_q=3, priority=1, question_name_to_index = qn2i))
299
- rule_collection.add_rule(Rule(current_q=1, expression="q1 == 'no'", next_q=2, priority=1, question_name_to_index = qn2i))
300
- rule_collection.dag
301
- {2: {1}, 3: {1}}
302
-
303
- """
304
- children_to_parents = defaultdict(set)
305
- # We are only interested in non-default rules. Default rules are those
306
- # that just go to the next question, so they don't add any dependencies
307
-
308
- ## I think for a skip-question, the potenially-skippable question
309
- ## depends on all the other questions bein answered first.
310
- for rule in self.non_default_rules:
311
- if not rule.before_rule:
312
- # for a regular rule, the next question depends on the current question answer
313
- current_q, next_q = rule.current_q, rule.next_q
314
- for q in self.keys_between(current_q, next_q):
315
- children_to_parents[q].add(current_q)
316
- else:
317
- # for the 'before rule' skipping depends on all previous answers.
318
- focal_q = rule.current_q
319
- for q in range(0, focal_q):
320
- children_to_parents[focal_q].add(q)
321
-
322
- return DAG(dict(sorted(children_to_parents.items())))
323
-
324
- def detect_cycles(self):
325
- """
326
- Detect cycles in the survey rules using depth-first search.
327
-
328
- :return: A list of cycles if any are found, otherwise an empty list.
329
- """
330
- dag = self.dag
331
- visited = set()
332
- path = []
333
- cycles = []
334
-
335
- def dfs(node):
336
- if node in path:
337
- cycle = path[path.index(node) :]
338
- cycles.append(cycle + [node])
339
- return
340
-
341
- if node in visited:
342
- return
343
-
344
- visited.add(node)
345
- path.append(node)
346
-
347
- for child in dag.get(node, []):
348
- dfs(child)
349
-
350
- path.pop()
351
-
352
- for node in dag:
353
- if node not in visited:
354
- dfs(node)
355
-
356
- return cycles
357
-
358
- @classmethod
359
- def example(cls):
360
- """Create an example RuleCollection object."""
361
- qn2i = {"q1": 1, "q2": 2, "q3": 3, "q4": 4}
362
- return cls(
363
- num_questions=5,
364
- rules=[
365
- Rule(
366
- current_q=1,
367
- expression="q1 == 'yes'",
368
- next_q=3,
369
- priority=1,
370
- question_name_to_index=qn2i,
371
- ),
372
- Rule(
373
- current_q=1,
374
- expression="q1 == 'no'",
375
- next_q=2,
376
- priority=1,
377
- question_name_to_index=qn2i,
378
- ),
379
- ],
380
- )
381
-
382
-
383
- if __name__ == "__main__":
384
- # pass
385
- import doctest
386
-
387
- doctest.testmod(optionflags=doctest.ELLIPSIS)
1
+ """A collection of rules for a survey."""
2
+
3
+ from typing import List, Union, Any, Optional
4
+ from collections import defaultdict, UserList
5
+
6
+ from edsl.exceptions import (
7
+ SurveyRuleCannotEvaluateError,
8
+ SurveyRuleCollectionHasNoRulesAtNodeError,
9
+ )
10
+ from edsl.utilities.interface import print_table_with_rich
11
+ from edsl.surveys.Rule import Rule
12
+ from edsl.surveys.base import EndOfSurvey
13
+ from edsl.surveys.DAG import DAG
14
+
15
+ # from graphlib import TopologicalSorter
16
+
17
+ from collections import namedtuple
18
+
19
+ NextQuestion = namedtuple(
20
+ "NextQuestion", "next_q, num_rules_found, expressions_evaluating_to_true, priority"
21
+ )
22
+
23
+
24
+ class RuleCollection(UserList):
25
+ """A collection of rules for a particular survey."""
26
+
27
+ def __init__(self, num_questions: Optional[int] = None, rules: List[Rule] = None):
28
+ """Initialize the RuleCollection object.
29
+
30
+ :param num_questions: The number of questions in the survey.
31
+ :param rules: A list of Rule objects.
32
+ """
33
+ super().__init__(rules or [])
34
+ self.num_questions = num_questions
35
+
36
+ def __repr__(self):
37
+ """Return a string representation of the RuleCollection object.
38
+
39
+ Example usage:
40
+
41
+ .. code-block:: python
42
+
43
+ rule_collection = RuleCollection.example()
44
+ _ = eval(repr(rule_collection))
45
+
46
+ """
47
+ return f"RuleCollection(rules={self.data}, num_questions={self.num_questions})"
48
+
49
+ def to_dict(self):
50
+ """Create a dictionary representation of the RuleCollection object."""
51
+ return {
52
+ "rules": [rule.to_dict() for rule in self],
53
+ "num_questions": self.num_questions,
54
+ }
55
+
56
+ @classmethod
57
+ def from_dict(cls, rule_collection_dict):
58
+ """Create a RuleCollection object from a dictionary.
59
+
60
+ >>> rule_collection = RuleCollection.example()
61
+ >>> rule_collection_dict = rule_collection.to_dict()
62
+ >>> new_rule_collection = RuleCollection.from_dict(rule_collection_dict)
63
+ >>> repr(new_rule_collection) == repr(rule_collection)
64
+ True
65
+ """
66
+ rules = [
67
+ Rule.from_dict(rule_dict) for rule_dict in rule_collection_dict["rules"]
68
+ ]
69
+ num_questions = rule_collection_dict["num_questions"]
70
+ new_rc = cls(rules=rules)
71
+ new_rc.num_questions = num_questions
72
+ return new_rc
73
+
74
+ def add_rule(self, rule: Rule) -> None:
75
+ """Add a rule to a survey.
76
+
77
+ >>> rule_collection = RuleCollection()
78
+ >>> rule_collection.add_rule(Rule(current_q=1, expression="q1 == 'yes'", next_q=3, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}))
79
+ >>> len(rule_collection)
80
+ 1
81
+
82
+ >>> rule_collection = RuleCollection()
83
+ >>> r = Rule(current_q=1, expression="True", next_q=3, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}, before_rule = True)
84
+ >>> rule_collection.add_rule(r)
85
+ >>> rule_collection[0] == r
86
+ True
87
+ >>> len(rule_collection.applicable_rules(1, before_rule=True))
88
+ 1
89
+ >>> len(rule_collection.applicable_rules(1, before_rule=False))
90
+ 0
91
+ """
92
+ self.append(rule)
93
+
94
+ def show_rules(self) -> None:
95
+ """Print the rules in a table.
96
+
97
+
98
+ .. code-block:: python
99
+
100
+ rule_collection = RuleCollection.example()
101
+ rule_collection.show_rules()
102
+ ┏━━━━━━━━━━━┳━━━━━━━━━━━━━┳━━━━━━━━┳━━━━━━━━━━┳━━━━━━━━━━━━━┓
103
+ ┃ current_q ┃ expression ┃ next_q ┃ priority ┃ before_rule ┃
104
+ ┡━━━━━━━━━━━╇━━━━━━━━━━━━━╇━━━━━━━━╇━━━━━━━━━━╇━━━━━━━━━━━━━┩
105
+ │ 1 │ q1 == 'yes' │ 3 │ 1 │ False │
106
+ │ 1 │ q1 == 'no' │ 2 │ 1 │ False │
107
+ └───────────┴─────────────┴────────┴──────────┴─────────────┘
108
+ """
109
+ keys = ["current_q", "expression", "next_q", "priority", "before_rule"]
110
+ rule_list = []
111
+ for rule in sorted(self, key=lambda r: r.current_q):
112
+ rule_list.append({k: getattr(rule, k) for k in keys})
113
+
114
+ print_table_with_rich(rule_list)
115
+
116
def skip_question_before_running(self, q_now: int, answers: dict[str, Any]) -> bool:
    """Tell whether question ``q_now`` should be skipped without being asked.

    The question is skipped as soon as one of the "before" rules attached
    to it evaluates to a true value for ``answers``.

    :param q_now: The current question index.
    :param answers: The answers to the survey questions.
    :return: ``True`` if at least one before-rule fires, ``False`` otherwise
        (including when the question has no before-rules).

    >>> rule_collection = RuleCollection()
    >>> r = Rule(current_q=1, expression="True", next_q=2, priority=1, question_name_to_index={}, before_rule = True)
    >>> rule_collection.add_rule(r)
    >>> rule_collection.skip_question_before_running(1, {})
    True

    >>> rule_collection = RuleCollection()
    >>> r = Rule(current_q=1, expression="False", next_q=2, priority=1, question_name_to_index={}, before_rule = True)
    >>> rule_collection.add_rule(r)
    >>> rule_collection.skip_question_before_running(1, {})
    False

    """
    before_rules = self.applicable_rules(q_now, before_rule=True)
    # any() stops at the first rule that fires, so later rules are not evaluated.
    return any(rule.evaluate(answers) for rule in before_rules)
139
+
140
def applicable_rules(self, q_now: int, before_rule: bool = False) -> list:
    """Return the rules attached to question ``q_now``.

    :param q_now: The current question index.
    :param before_rule: If True, return the rules that apply before the
        question is asked; otherwise (the default) return the rules that
        apply after the question has been asked.

    Rules are returned in the order in which they are stored in the
    collection.

    Example usage:

    >>> rule_collection = RuleCollection.example()
    >>> rule_collection.applicable_rules(1)
    [Rule(current_q=1, expression="q1 == 'yes'", next_q=3, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}, before_rule=False), Rule(current_q=1, expression="q1 == 'no'", next_q=2, priority=1, question_name_to_index={'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}, before_rule=False)]

    More than one rule can apply. For example, suppose we are at node 1.
    We could have three rules:

    1. "q1 == 'a'" ==> 3
    2. "q1 == 'b'" ==> 4
    3. "q1 == 'c'" ==> 5
    """

    def _applies_here(rule) -> bool:
        # A rule matches on both the question index and the before/after kind.
        return rule.current_q == q_now and rule.before_rule == before_rule

    return list(filter(_applies_here, self))
172
+
173
def next_question(self, q_now: int, answers: dict[str, Any]) -> NextQuestion:
    """Find the next question by index, given the rule collection.

    This is applied after question ``q_now`` has been answered. Among the
    "after" rules of ``q_now`` whose expression evaluates to true, the one
    with the highest priority decides the destination; on equal priority
    the rule encountered first wins. If the chosen destination has a
    "before" rule that evaluates to true, that question is skipped and the
    search continues from it.

    :param q_now: The current question index.
    :param answers: The answers to the survey questions so far, including the current question.
    :raises SurveyRuleCollectionHasNoRulesAtNodeError: if no "after" rule
        is attached to ``q_now``.

    >>> rule_collection = RuleCollection.example()
    >>> rule_collection.next_question(1, {'q1': 'yes'})
    NextQuestion(next_q=3, num_rules_found=2, expressions_evaluating_to_true=1, priority=1)

    """
    after_rules = self.applicable_rules(q_now, before_rule=False)
    if not after_rules:
        raise SurveyRuleCollectionHasNoRulesAtNodeError(
            f"No rules found for question {q_now}"
        )

    next_q = None
    # Start at -2 so that the default rule can still be picked up.
    highest_priority = -2
    expressions_evaluating_to_true = 0

    for rule in after_rules:
        # Errors raised while evaluating a rule propagate to the caller.
        if not rule.evaluate(answers):
            continue
        expressions_evaluating_to_true += 1
        if rule.priority > highest_priority:
            # Strictly higher priority only: ties keep the earlier rule.
            next_q, highest_priority = rule.next_q, rule.priority

    # The chosen destination may itself carry 'before' rules; if one fires,
    # that question is skipped and we move on from it.
    destination_before_rules = self.applicable_rules(next_q, before_rule=True)
    if any(rule.evaluate(answers) for rule in destination_before_rules):
        return self.next_question(next_q, answers)

    return NextQuestion(
        next_q, len(after_rules), expressions_evaluating_to_true, highest_priority
    )
227
+
228
@property
def non_default_rules(self) -> List[Rule]:
    """Return all rules that are not the default rule.

    A rule counts as non-default when its priority is greater than -1.

    >>> rule_collection = RuleCollection.example()
    >>> len(rule_collection.non_default_rules)
    2

    Example usage:

    .. code-block:: python

        rule_collection = RuleCollection.example()
        len(rule_collection.non_default_rules)
        2

    """
    return list(filter(lambda rule: rule.priority > -1, self))
246
+
247
def keys_between(self, start_q, end_q, right_inclusive=True):
    """Return a list of all question indices between start_q and end_q.

    ``start_q`` itself is never included; ``end_q`` is included only when
    ``right_inclusive`` is true. When ``end_q`` is ``EndOfSurvey`` it is
    replaced by the index of the last question, ``num_questions - 1``.

    :raises ValueError: if ``end_q`` is ``EndOfSurvey`` and
        ``num_questions`` is ``None``.

    Example usage:

    .. code-block:: python

        rule_collection = RuleCollection(num_questions=5)
        rule_collection.keys_between(1, 3)
        [2, 3]
        rule_collection.keys_between(1, 4)
        [2, 3, 4]
        rule_collection.keys_between(1, EndOfSurvey, right_inclusive=False)
        [2, 3]

    """
    last_q = end_q
    if last_q == EndOfSurvey:
        # Jumping to the end of the survey makes every remaining question
        # depend on start_q, so the range runs to the last question index.
        if self.num_questions is None:
            raise ValueError(
                "Cannot determine DAG when EndOfSurvey and when num_questions is not known."
            )
        last_q = self.num_questions - 1

    first_q = start_q + 1
    stop = last_q + int(right_inclusive)
    return list(range(first_q, stop))
275
+
276
@property
def dag(self) -> dict:
    """
    Find the DAG of the survey, based on the skip logic.

    Keys are child questions; each value is the set of questions that must
    be answered first.

    Rules are attached to the current question and direct where control
    goes next. As such, the destination nodes are the keys and the current
    nodes are the values. Furthermore, all questions between the current
    and destination nodes are also included as keys, as they depend on the
    answer to the focal node as well.

    For example, if we have a rule that says "if q1 == 'yes', go to q3",
    then q3 depends on q1, but so does q2.
    So the DAG would be {2: {1}, 3: {1}}.

    Example usage:

    .. code-block:: python

        rule_collection = RuleCollection(num_questions=5)
        qn2i = {'q1': 1, 'q2': 2, 'q3': 3, 'q4': 4}
        rule_collection.add_rule(Rule(current_q=1, expression="q1 == 'yes'", next_q=3, priority=1, question_name_to_index = qn2i))
        rule_collection.add_rule(Rule(current_q=1, expression="q1 == 'no'", next_q=2, priority=1, question_name_to_index = qn2i))
        rule_collection.dag
        {2: {1}, 3: {1}}

    """
    parents_of = defaultdict(set)

    # Only non-default rules matter here: default rules just go to the next
    # question, so they do not add any dependencies.
    for rule in self.non_default_rules:
        source_q = rule.current_q

        if rule.before_rule:
            # A question that may be skipped up front is treated as
            # depending on every question that precedes it.
            for earlier_q in range(source_q):
                parents_of[source_q].add(earlier_q)
            continue

        # Regular rule: the destination, and every question between the
        # source and the destination, depends on the source's answer.
        for dependent_q in self.keys_between(source_q, rule.next_q):
            parents_of[dependent_q].add(source_q)

    ordered = {child: parents_of[child] for child in sorted(parents_of)}
    return DAG(ordered)
323
+
324
def detect_cycles(self):
    """
    Detect cycles in the survey rules using depth-first search.

    The search walks the mapping returned by ``self.dag``, following each
    node to the nodes listed under it.

    :return: A list of cycles if any are found, otherwise an empty list.
        Each cycle is a list of nodes that starts and ends with the same
        node.
    """
    graph = self.dag
    seen = set()
    trail = []  # nodes on the current search path, in visiting order
    found = []

    def walk(current):
        # Reaching a node that is already on the current path closes a cycle.
        if current in trail:
            loop_start = trail.index(current)
            found.append(trail[loop_start:] + [current])
            return

        # Already fully explored from another starting point.
        if current in seen:
            return

        seen.add(current)
        trail.append(current)
        for neighbour in graph.get(current, []):
            walk(neighbour)
        trail.pop()

    for root in graph:
        if root not in seen:
            walk(root)

    return found
357
+
358
@classmethod
def example(cls):
    """Create an example RuleCollection object.

    The example has five questions and two priority-1 rules on question 1:
    ``q1 == 'yes'`` leads to question 3 and ``q1 == 'no'`` leads to
    question 2.
    """
    qn2i = {"q1": 1, "q2": 2, "q3": 3, "q4": 4}
    # (expression, destination) for each rule attached to question 1.
    branches = (("q1 == 'yes'", 3), ("q1 == 'no'", 2))
    rules = [
        Rule(
            current_q=1,
            expression=expression,
            next_q=destination,
            priority=1,
            question_name_to_index=qn2i,
        )
        for expression, destination in branches
    ]
    return cls(num_questions=5, rules=rules)
381
+
382
+
383
if __name__ == "__main__":
    # Running this module directly executes the doctests in its docstrings.
    import doctest

    doctest_flags = doctest.ELLIPSIS
    doctest.testmod(optionflags=doctest_flags)