edsl 0.1.36.dev6__py3-none-any.whl → 0.1.37__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (261) hide show
  1. edsl/Base.py +303 -303
  2. edsl/BaseDiff.py +260 -260
  3. edsl/TemplateLoader.py +24 -24
  4. edsl/__init__.py +48 -47
  5. edsl/__version__.py +1 -1
  6. edsl/agents/Agent.py +855 -804
  7. edsl/agents/AgentList.py +350 -337
  8. edsl/agents/Invigilator.py +222 -222
  9. edsl/agents/InvigilatorBase.py +284 -294
  10. edsl/agents/PromptConstructor.py +353 -312
  11. edsl/agents/__init__.py +3 -3
  12. edsl/agents/descriptors.py +99 -86
  13. edsl/agents/prompt_helpers.py +129 -129
  14. edsl/auto/AutoStudy.py +117 -117
  15. edsl/auto/StageBase.py +230 -230
  16. edsl/auto/StageGenerateSurvey.py +178 -178
  17. edsl/auto/StageLabelQuestions.py +125 -125
  18. edsl/auto/StagePersona.py +61 -61
  19. edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
  20. edsl/auto/StagePersonaDimensionValues.py +74 -74
  21. edsl/auto/StagePersonaDimensions.py +69 -69
  22. edsl/auto/StageQuestions.py +73 -73
  23. edsl/auto/SurveyCreatorPipeline.py +21 -21
  24. edsl/auto/utilities.py +224 -224
  25. edsl/base/Base.py +289 -289
  26. edsl/config.py +149 -149
  27. edsl/conjure/AgentConstructionMixin.py +160 -152
  28. edsl/conjure/Conjure.py +62 -62
  29. edsl/conjure/InputData.py +659 -659
  30. edsl/conjure/InputDataCSV.py +48 -48
  31. edsl/conjure/InputDataMixinQuestionStats.py +182 -182
  32. edsl/conjure/InputDataPyRead.py +91 -91
  33. edsl/conjure/InputDataSPSS.py +8 -8
  34. edsl/conjure/InputDataStata.py +8 -8
  35. edsl/conjure/QuestionOptionMixin.py +76 -76
  36. edsl/conjure/QuestionTypeMixin.py +23 -23
  37. edsl/conjure/RawQuestion.py +65 -65
  38. edsl/conjure/SurveyResponses.py +7 -7
  39. edsl/conjure/__init__.py +9 -9
  40. edsl/conjure/naming_utilities.py +263 -263
  41. edsl/conjure/utilities.py +201 -201
  42. edsl/conversation/Conversation.py +290 -238
  43. edsl/conversation/car_buying.py +58 -58
  44. edsl/conversation/chips.py +95 -0
  45. edsl/conversation/mug_negotiation.py +81 -81
  46. edsl/conversation/next_speaker_utilities.py +93 -93
  47. edsl/coop/PriceFetcher.py +54 -54
  48. edsl/coop/__init__.py +2 -2
  49. edsl/coop/coop.py +958 -849
  50. edsl/coop/utils.py +131 -131
  51. edsl/data/Cache.py +527 -527
  52. edsl/data/CacheEntry.py +228 -228
  53. edsl/data/CacheHandler.py +149 -149
  54. edsl/data/RemoteCacheSync.py +97 -84
  55. edsl/data/SQLiteDict.py +292 -292
  56. edsl/data/__init__.py +4 -4
  57. edsl/data/orm.py +10 -10
  58. edsl/data_transfer_models.py +73 -73
  59. edsl/enums.py +173 -173
  60. edsl/exceptions/BaseException.py +21 -0
  61. edsl/exceptions/__init__.py +54 -50
  62. edsl/exceptions/agents.py +38 -40
  63. edsl/exceptions/configuration.py +16 -16
  64. edsl/exceptions/coop.py +10 -10
  65. edsl/exceptions/data.py +14 -14
  66. edsl/exceptions/general.py +34 -34
  67. edsl/exceptions/jobs.py +33 -33
  68. edsl/exceptions/language_models.py +63 -63
  69. edsl/exceptions/prompts.py +15 -15
  70. edsl/exceptions/questions.py +91 -91
  71. edsl/exceptions/results.py +29 -26
  72. edsl/exceptions/scenarios.py +22 -0
  73. edsl/exceptions/surveys.py +37 -34
  74. edsl/inference_services/AnthropicService.py +87 -87
  75. edsl/inference_services/AwsBedrock.py +120 -115
  76. edsl/inference_services/AzureAI.py +217 -217
  77. edsl/inference_services/DeepInfraService.py +18 -18
  78. edsl/inference_services/GoogleService.py +156 -156
  79. edsl/inference_services/GroqService.py +20 -20
  80. edsl/inference_services/InferenceServiceABC.py +147 -147
  81. edsl/inference_services/InferenceServicesCollection.py +97 -72
  82. edsl/inference_services/MistralAIService.py +123 -123
  83. edsl/inference_services/OllamaService.py +18 -18
  84. edsl/inference_services/OpenAIService.py +224 -224
  85. edsl/inference_services/TestService.py +89 -89
  86. edsl/inference_services/TogetherAIService.py +170 -170
  87. edsl/inference_services/models_available_cache.py +118 -118
  88. edsl/inference_services/rate_limits_cache.py +25 -25
  89. edsl/inference_services/registry.py +39 -39
  90. edsl/inference_services/write_available.py +10 -10
  91. edsl/jobs/Answers.py +56 -56
  92. edsl/jobs/Jobs.py +1347 -1112
  93. edsl/jobs/__init__.py +1 -1
  94. edsl/jobs/buckets/BucketCollection.py +63 -63
  95. edsl/jobs/buckets/ModelBuckets.py +65 -65
  96. edsl/jobs/buckets/TokenBucket.py +248 -248
  97. edsl/jobs/interviews/Interview.py +661 -651
  98. edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
  99. edsl/jobs/interviews/InterviewExceptionEntry.py +186 -182
  100. edsl/jobs/interviews/InterviewStatistic.py +63 -63
  101. edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
  102. edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
  103. edsl/jobs/interviews/InterviewStatusLog.py +92 -92
  104. edsl/jobs/interviews/ReportErrors.py +66 -66
  105. edsl/jobs/interviews/interview_status_enum.py +9 -9
  106. edsl/jobs/runners/JobsRunnerAsyncio.py +338 -337
  107. edsl/jobs/runners/JobsRunnerStatus.py +332 -332
  108. edsl/jobs/tasks/QuestionTaskCreator.py +242 -242
  109. edsl/jobs/tasks/TaskCreators.py +64 -64
  110. edsl/jobs/tasks/TaskHistory.py +442 -441
  111. edsl/jobs/tasks/TaskStatusLog.py +23 -23
  112. edsl/jobs/tasks/task_status_enum.py +163 -163
  113. edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
  114. edsl/jobs/tokens/TokenUsage.py +34 -34
  115. edsl/language_models/KeyLookup.py +30 -0
  116. edsl/language_models/LanguageModel.py +706 -718
  117. edsl/language_models/ModelList.py +102 -102
  118. edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
  119. edsl/language_models/__init__.py +3 -2
  120. edsl/language_models/fake_openai_call.py +15 -15
  121. edsl/language_models/fake_openai_service.py +61 -61
  122. edsl/language_models/registry.py +137 -137
  123. edsl/language_models/repair.py +156 -156
  124. edsl/language_models/unused/ReplicateBase.py +83 -83
  125. edsl/language_models/utilities.py +64 -64
  126. edsl/notebooks/Notebook.py +259 -259
  127. edsl/notebooks/__init__.py +1 -1
  128. edsl/prompts/Prompt.py +357 -358
  129. edsl/prompts/__init__.py +2 -2
  130. edsl/questions/AnswerValidatorMixin.py +289 -289
  131. edsl/questions/QuestionBase.py +656 -616
  132. edsl/questions/QuestionBaseGenMixin.py +161 -161
  133. edsl/questions/QuestionBasePromptsMixin.py +234 -266
  134. edsl/questions/QuestionBudget.py +227 -227
  135. edsl/questions/QuestionCheckBox.py +359 -359
  136. edsl/questions/QuestionExtract.py +183 -183
  137. edsl/questions/QuestionFreeText.py +114 -113
  138. edsl/questions/QuestionFunctional.py +159 -159
  139. edsl/questions/QuestionList.py +231 -231
  140. edsl/questions/QuestionMultipleChoice.py +286 -286
  141. edsl/questions/QuestionNumerical.py +153 -153
  142. edsl/questions/QuestionRank.py +324 -324
  143. edsl/questions/Quick.py +41 -41
  144. edsl/questions/RegisterQuestionsMeta.py +71 -71
  145. edsl/questions/ResponseValidatorABC.py +174 -174
  146. edsl/questions/SimpleAskMixin.py +73 -73
  147. edsl/questions/__init__.py +26 -26
  148. edsl/questions/compose_questions.py +98 -98
  149. edsl/questions/decorators.py +21 -21
  150. edsl/questions/derived/QuestionLikertFive.py +76 -76
  151. edsl/questions/derived/QuestionLinearScale.py +87 -87
  152. edsl/questions/derived/QuestionTopK.py +91 -91
  153. edsl/questions/derived/QuestionYesNo.py +82 -82
  154. edsl/questions/descriptors.py +413 -418
  155. edsl/questions/prompt_templates/question_budget.jinja +13 -13
  156. edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
  157. edsl/questions/prompt_templates/question_extract.jinja +11 -11
  158. edsl/questions/prompt_templates/question_free_text.jinja +3 -3
  159. edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
  160. edsl/questions/prompt_templates/question_list.jinja +17 -17
  161. edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
  162. edsl/questions/prompt_templates/question_numerical.jinja +36 -36
  163. edsl/questions/question_registry.py +147 -147
  164. edsl/questions/settings.py +12 -12
  165. edsl/questions/templates/budget/answering_instructions.jinja +7 -7
  166. edsl/questions/templates/budget/question_presentation.jinja +7 -7
  167. edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
  168. edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
  169. edsl/questions/templates/extract/answering_instructions.jinja +7 -7
  170. edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
  171. edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
  172. edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
  173. edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
  174. edsl/questions/templates/list/answering_instructions.jinja +3 -3
  175. edsl/questions/templates/list/question_presentation.jinja +5 -5
  176. edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
  177. edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
  178. edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
  179. edsl/questions/templates/numerical/question_presentation.jinja +6 -6
  180. edsl/questions/templates/rank/answering_instructions.jinja +11 -11
  181. edsl/questions/templates/rank/question_presentation.jinja +15 -15
  182. edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
  183. edsl/questions/templates/top_k/question_presentation.jinja +22 -22
  184. edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
  185. edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
  186. edsl/results/Dataset.py +293 -293
  187. edsl/results/DatasetExportMixin.py +717 -693
  188. edsl/results/DatasetTree.py +145 -145
  189. edsl/results/Result.py +450 -433
  190. edsl/results/Results.py +1071 -1158
  191. edsl/results/ResultsDBMixin.py +238 -238
  192. edsl/results/ResultsExportMixin.py +43 -43
  193. edsl/results/ResultsFetchMixin.py +33 -33
  194. edsl/results/ResultsGGMixin.py +121 -121
  195. edsl/results/ResultsToolsMixin.py +98 -98
  196. edsl/results/Selector.py +135 -118
  197. edsl/results/__init__.py +2 -2
  198. edsl/results/tree_explore.py +115 -115
  199. edsl/scenarios/FileStore.py +458 -443
  200. edsl/scenarios/Scenario.py +546 -507
  201. edsl/scenarios/ScenarioHtmlMixin.py +64 -59
  202. edsl/scenarios/ScenarioList.py +1112 -1101
  203. edsl/scenarios/ScenarioListExportMixin.py +52 -52
  204. edsl/scenarios/ScenarioListPdfMixin.py +261 -261
  205. edsl/scenarios/__init__.py +4 -2
  206. edsl/shared.py +1 -1
  207. edsl/study/ObjectEntry.py +173 -173
  208. edsl/study/ProofOfWork.py +113 -113
  209. edsl/study/SnapShot.py +80 -80
  210. edsl/study/Study.py +528 -528
  211. edsl/study/__init__.py +4 -4
  212. edsl/surveys/DAG.py +148 -148
  213. edsl/surveys/Memory.py +31 -31
  214. edsl/surveys/MemoryPlan.py +244 -244
  215. edsl/surveys/Rule.py +330 -324
  216. edsl/surveys/RuleCollection.py +387 -387
  217. edsl/surveys/Survey.py +1795 -1772
  218. edsl/surveys/SurveyCSS.py +261 -261
  219. edsl/surveys/SurveyExportMixin.py +259 -259
  220. edsl/surveys/SurveyFlowVisualizationMixin.py +121 -121
  221. edsl/surveys/SurveyQualtricsImport.py +284 -284
  222. edsl/surveys/__init__.py +3 -3
  223. edsl/surveys/base.py +53 -53
  224. edsl/surveys/descriptors.py +56 -56
  225. edsl/surveys/instructions/ChangeInstruction.py +47 -47
  226. edsl/surveys/instructions/Instruction.py +51 -51
  227. edsl/surveys/instructions/InstructionCollection.py +77 -77
  228. edsl/templates/error_reporting/base.html +23 -23
  229. edsl/templates/error_reporting/exceptions_by_model.html +34 -34
  230. edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
  231. edsl/templates/error_reporting/exceptions_by_type.html +16 -16
  232. edsl/templates/error_reporting/interview_details.html +115 -115
  233. edsl/templates/error_reporting/interviews.html +9 -9
  234. edsl/templates/error_reporting/overview.html +4 -4
  235. edsl/templates/error_reporting/performance_plot.html +1 -1
  236. edsl/templates/error_reporting/report.css +73 -73
  237. edsl/templates/error_reporting/report.html +117 -117
  238. edsl/templates/error_reporting/report.js +25 -25
  239. edsl/tools/__init__.py +1 -1
  240. edsl/tools/clusters.py +192 -192
  241. edsl/tools/embeddings.py +27 -27
  242. edsl/tools/embeddings_plotting.py +118 -118
  243. edsl/tools/plotting.py +112 -112
  244. edsl/tools/summarize.py +18 -18
  245. edsl/utilities/SystemInfo.py +28 -28
  246. edsl/utilities/__init__.py +22 -22
  247. edsl/utilities/ast_utilities.py +25 -25
  248. edsl/utilities/data/Registry.py +6 -6
  249. edsl/utilities/data/__init__.py +1 -1
  250. edsl/utilities/data/scooter_results.json +1 -1
  251. edsl/utilities/decorators.py +77 -77
  252. edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
  253. edsl/utilities/interface.py +627 -627
  254. edsl/utilities/repair_functions.py +28 -28
  255. edsl/utilities/restricted_python.py +70 -70
  256. edsl/utilities/utilities.py +409 -391
  257. {edsl-0.1.36.dev6.dist-info → edsl-0.1.37.dist-info}/LICENSE +21 -21
  258. {edsl-0.1.36.dev6.dist-info → edsl-0.1.37.dist-info}/METADATA +1 -1
  259. edsl-0.1.37.dist-info/RECORD +283 -0
  260. edsl-0.1.36.dev6.dist-info/RECORD +0 -279
  261. {edsl-0.1.36.dev6.dist-info → edsl-0.1.37.dist-info}/WHEEL +0 -0
@@ -1,118 +1,118 @@
1
- import json
2
- import numpy as np
3
- from sklearn.manifold import TSNE
4
- from IPython.display import display_html
5
-
6
-
7
- def compute_tsne(embeddings, labels):
8
- embeddings_np = np.array(embeddings)
9
- tsne = TSNE(n_components=2, random_state=42)
10
- tsne_results = tsne.fit_transform(embeddings_np)
11
- data = [
12
- {
13
- "x": float(tsne_results[i, 0]),
14
- "y": float(tsne_results[i, 1]),
15
- "label": labels[i],
16
- }
17
- for i in range(len(labels))
18
- ]
19
- return data
20
-
21
-
22
- def plot_tsne_in_notebook(embeddings, labels):
23
- # Compute t-SNE
24
- data = compute_tsne(embeddings, labels)
25
-
26
- # Convert data to JSON
27
- data_json = json.dumps(data)
28
-
29
- # HTML content with embedded data
30
- html_content = f"""
31
- <!DOCTYPE html>
32
- <html lang="en">
33
- <head>
34
- <meta charset="UTF-8">
35
- <title>t-SNE Plot with D3.js</title>
36
- <script src="https://d3js.org/d3.v6.min.js"></script>
37
- <style>
38
- .tooltip {{
39
- position: absolute;
40
- text-align: center;
41
- width: 80px;
42
- height: 28px;
43
- padding: 2px;
44
- font: 12px sans-serif;
45
- background: lightsteelblue;
46
- border: 0px;
47
- border-radius: 8px;
48
- pointer-events: none;
49
- }}
50
- </style>
51
- </head>
52
- <body>
53
- <svg width="600" height="600"></svg>
54
-
55
- <script>
56
- // Embedded data
57
- const data = {data_json};
58
-
59
- const svg = d3.select("svg"),
60
- width = +svg.attr("width"),
61
- height = +svg.attr("height");
62
-
63
- // Set up scales
64
- const x = d3.scaleLinear()
65
- .domain(d3.extent(data, d => d.x))
66
- .range([0, width]);
67
-
68
- const y = d3.scaleLinear()
69
- .domain(d3.extent(data, d => d.y))
70
- .range([height, 0]);
71
-
72
- // Create tooltip
73
- const tooltip = d3.select("body").append("div")
74
- .attr("class", "tooltip")
75
- .style("opacity", 0);
76
-
77
- // Create circles for each point
78
- svg.selectAll("circle")
79
- .data(data)
80
- .enter().append("circle")
81
- .attr("cx", d => x(d.x))
82
- .attr("cy", d => y(d.y))
83
- .attr("r", 5)
84
- .style("fill", "steelblue")
85
- .on("mouseover", function(event, d) {{
86
- tooltip.transition()
87
- .duration(200)
88
- .style("opacity", .9);
89
- tooltip.html(d.label)
90
- .style("left", (event.pageX + 5) + "px")
91
- .style("top", (event.pageY - 28) + "px");
92
- }})
93
- .on("mouseout", function(d) {{
94
- tooltip.transition()
95
- .duration(500)
96
- .style("opacity", 0);
97
- }});
98
- </script>
99
- </body>
100
- </html>
101
- """
102
-
103
- # Write HTML content to a temporary file
104
- html_file = "tsne_plot.html"
105
- with open(html_file, "w") as file:
106
- file.write(html_content)
107
-
108
- # Display the HTML content in an iframe within a Jupyter notebook
109
- display_html(
110
- f'<iframe src="{html_file}" width="600" height="600"></iframe>', raw=True
111
- )
112
-
113
-
114
- # Example usage
115
- if __name__ == "__main__":
116
- embeddings = [[0.1, 0.2, 0.3], [0.4, 0.5, 0.6], [0.7, 0.8, 0.9]]
117
- labels = ["String 1", "String 2", "String 3"]
118
- plot_tsne_in_notebook(embeddings, labels)
1
+ import json
2
+ import numpy as np
3
+ from sklearn.manifold import TSNE
4
+ from IPython.display import display_html
5
+
6
+
7
+ def compute_tsne(embeddings, labels):
8
+ embeddings_np = np.array(embeddings)
9
+ tsne = TSNE(n_components=2, random_state=42)
10
+ tsne_results = tsne.fit_transform(embeddings_np)
11
+ data = [
12
+ {
13
+ "x": float(tsne_results[i, 0]),
14
+ "y": float(tsne_results[i, 1]),
15
+ "label": labels[i],
16
+ }
17
+ for i in range(len(labels))
18
+ ]
19
+ return data
20
+
21
+
22
+ def plot_tsne_in_notebook(embeddings, labels):
23
+ # Compute t-SNE
24
+ data = compute_tsne(embeddings, labels)
25
+
26
+ # Convert data to JSON
27
+ data_json = json.dumps(data)
28
+
29
+ # HTML content with embedded data
30
+ html_content = f"""
31
+ <!DOCTYPE html>
32
+ <html lang="en">
33
+ <head>
34
+ <meta charset="UTF-8">
35
+ <title>t-SNE Plot with D3.js</title>
36
+ <script src="https://d3js.org/d3.v6.min.js"></script>
37
+ <style>
38
+ .tooltip {{
39
+ position: absolute;
40
+ text-align: center;
41
+ width: 80px;
42
+ height: 28px;
43
+ padding: 2px;
44
+ font: 12px sans-serif;
45
+ background: lightsteelblue;
46
+ border: 0px;
47
+ border-radius: 8px;
48
+ pointer-events: none;
49
+ }}
50
+ </style>
51
+ </head>
52
+ <body>
53
+ <svg width="600" height="600"></svg>
54
+
55
+ <script>
56
+ // Embedded data
57
+ const data = {data_json};
58
+
59
+ const svg = d3.select("svg"),
60
+ width = +svg.attr("width"),
61
+ height = +svg.attr("height");
62
+
63
+ // Set up scales
64
+ const x = d3.scaleLinear()
65
+ .domain(d3.extent(data, d => d.x))
66
+ .range([0, width]);
67
+
68
+ const y = d3.scaleLinear()
69
+ .domain(d3.extent(data, d => d.y))
70
+ .range([height, 0]);
71
+
72
+ // Create tooltip
73
+ const tooltip = d3.select("body").append("div")
74
+ .attr("class", "tooltip")
75
+ .style("opacity", 0);
76
+
77
+ // Create circles for each point
78
+ svg.selectAll("circle")
79
+ .data(data)
80
+ .enter().append("circle")
81
+ .attr("cx", d => x(d.x))
82
+ .attr("cy", d => y(d.y))
83
+ .attr("r", 5)
84
+ .style("fill", "steelblue")
85
+ .on("mouseover", function(event, d) {{
86
+ tooltip.transition()
87
+ .duration(200)
88
+ .style("opacity", .9);
89
+ tooltip.html(d.label)
90
+ .style("left", (event.pageX + 5) + "px")
91
+ .style("top", (event.pageY - 28) + "px");
92
+ }})
93
+ .on("mouseout", function(d) {{
94
+ tooltip.transition()
95
+ .duration(500)
96
+ .style("opacity", 0);
97
+ }});
98
+ </script>
99
+ </body>
100
+ </html>
101
+ """
102
+
103
+ # Write HTML content to a temporary file
104
+ html_file = "tsne_plot.html"
105
+ with open(html_file, "w") as file:
106
+ file.write(html_content)
107
+
108
+ # Display the HTML content in an iframe within a Jupyter notebook
109
+ display_html(
110
+ f'<iframe src="{html_file}" width="600" height="600"></iframe>', raw=True
111
+ )
112
+
113
+
114
+ # Example usage
115
+ if __name__ == "__main__":
116
+ embeddings = [[0.1, 0.2, 0.3], [0.4, 0.5, 0.6], [0.7, 0.8, 0.9]]
117
+ labels = ["String 1", "String 2", "String 3"]
118
+ plot_tsne_in_notebook(embeddings, labels)
edsl/tools/plotting.py CHANGED
@@ -1,112 +1,112 @@
1
- from typing import Optional
2
-
3
-
4
- def count_query(field):
5
- return f"""SELECT
6
- {field},
7
- COUNT(*) as number
8
- FROM self
9
- GROUP BY {field}
10
- """
11
-
12
-
13
- def get_options(results, field):
14
- question_type = results.survey.get_question(field).question_type
15
- if question_type in ["multiple_choice", "checkbox"]:
16
- return results.select(f"{field}_question_options").first()
17
- else:
18
- return None
19
-
20
-
21
- def interpret_image(path, analysis):
22
- from edsl import QuestionFreeText
23
- from edsl import Model
24
- from edsl import Scenario
25
-
26
- s = Scenario.from_image(path)
27
- if isinstance(analysis, str):
28
- plot_question_texts = [analysis]
29
- elif isinstance(analysis, list):
30
- plot_question_texts = analysis
31
-
32
- scenario_list = s.replicate(len(plot_question_texts))
33
- scenario_list.add_list("plot_question_text", plot_question_texts)
34
-
35
- m = Model("gpt-4o")
36
- q = QuestionFreeText(
37
- question_text="{{ plot_question_text }}", question_name="interpretation"
38
- )
39
- results = q.by(m).by(scenario_list).run()
40
- return results.select("plot_question_text", "interpretation").print(
41
- format="rich",
42
- pretty_labels={
43
- "scenario.plot_question_text": "Question to the model",
44
- "answer.interpretation": "Model answer",
45
- },
46
- )
47
-
48
-
49
- def barchart(
50
- results,
51
- field: str,
52
- fetch_options=True,
53
- xlab: Optional[str] = None,
54
- ylab: Optional[str] = None,
55
- analysis: Optional[str] = None,
56
- format: str = "png",
57
- ):
58
- labels = ""
59
- if xlab:
60
- labels += f"+ xlab('{xlab}')"
61
- if ylab:
62
- labels += f"+ ylab('{ylab}')"
63
-
64
- if fetch_options:
65
- factor_orders = {field: get_options(results, field)}
66
- else:
67
- factor_orders = None
68
-
69
- plot = results.ggplot2(
70
- f"""ggplot(data = self, aes(x = {field}, y = number)) +
71
- geom_bar(stat = "identity") +
72
- theme_bw() +
73
- theme(axis.text.x = element_text(angle = 45, hjust = 1)) {labels}""",
74
- sql=count_query(field),
75
- factor_orders=factor_orders,
76
- format=format,
77
- filename=f"barchart_{field}.{format}",
78
- )
79
- if analysis:
80
- interpret_image(f"barchart_{field}.{format}", analysis)
81
-
82
- return plot
83
-
84
-
85
- def theme_plot(results, field, context, themes=None, progress_bar=False):
86
- _, themes = results.auto_theme(
87
- field=field, context=context, themes=themes, progress_bar=progress_bar
88
- )
89
-
90
- themes_query = f"""
91
- SELECT theme, COUNT(*) AS mentions
92
- FROM (
93
- SELECT json_each.value AS theme
94
- FROM self,
95
- json_each({ field }_themes)
96
- )
97
- GROUP BY theme
98
- HAVING theme <> 'Other'
99
- ORDER BY mentions DESC
100
- """
101
- themes = results.sql(themes_query, to_list=True)
102
-
103
- (
104
- results.filter(f"{field} != ''").ggplot2(
105
- """ggplot(data = self, aes(x = theme, y = mentions)) +
106
- geom_bar(stat = "identity") +
107
- coord_flip() +
108
- theme_bw()""",
109
- sql=themes_query,
110
- factor_orders={"theme": [t[0] for t in themes]},
111
- )
112
- )
1
+ from typing import Optional
2
+
3
+
4
+ def count_query(field):
5
+ return f"""SELECT
6
+ {field},
7
+ COUNT(*) as number
8
+ FROM self
9
+ GROUP BY {field}
10
+ """
11
+
12
+
13
+ def get_options(results, field):
14
+ question_type = results.survey.get_question(field).question_type
15
+ if question_type in ["multiple_choice", "checkbox"]:
16
+ return results.select(f"{field}_question_options").first()
17
+ else:
18
+ return None
19
+
20
+
21
+ def interpret_image(path, analysis):
22
+ from edsl import QuestionFreeText
23
+ from edsl import Model
24
+ from edsl import Scenario
25
+
26
+ s = Scenario.from_image(path)
27
+ if isinstance(analysis, str):
28
+ plot_question_texts = [analysis]
29
+ elif isinstance(analysis, list):
30
+ plot_question_texts = analysis
31
+
32
+ scenario_list = s.replicate(len(plot_question_texts))
33
+ scenario_list.add_list("plot_question_text", plot_question_texts)
34
+
35
+ m = Model("gpt-4o")
36
+ q = QuestionFreeText(
37
+ question_text="{{ plot_question_text }}", question_name="interpretation"
38
+ )
39
+ results = q.by(m).by(scenario_list).run()
40
+ return results.select("plot_question_text", "interpretation").print(
41
+ format="rich",
42
+ pretty_labels={
43
+ "scenario.plot_question_text": "Question to the model",
44
+ "answer.interpretation": "Model answer",
45
+ },
46
+ )
47
+
48
+
49
+ def barchart(
50
+ results,
51
+ field: str,
52
+ fetch_options=True,
53
+ xlab: Optional[str] = None,
54
+ ylab: Optional[str] = None,
55
+ analysis: Optional[str] = None,
56
+ format: str = "png",
57
+ ):
58
+ labels = ""
59
+ if xlab:
60
+ labels += f"+ xlab('{xlab}')"
61
+ if ylab:
62
+ labels += f"+ ylab('{ylab}')"
63
+
64
+ if fetch_options:
65
+ factor_orders = {field: get_options(results, field)}
66
+ else:
67
+ factor_orders = None
68
+
69
+ plot = results.ggplot2(
70
+ f"""ggplot(data = self, aes(x = {field}, y = number)) +
71
+ geom_bar(stat = "identity") +
72
+ theme_bw() +
73
+ theme(axis.text.x = element_text(angle = 45, hjust = 1)) {labels}""",
74
+ sql=count_query(field),
75
+ factor_orders=factor_orders,
76
+ format=format,
77
+ filename=f"barchart_{field}.{format}",
78
+ )
79
+ if analysis:
80
+ interpret_image(f"barchart_{field}.{format}", analysis)
81
+
82
+ return plot
83
+
84
+
85
+ def theme_plot(results, field, context, themes=None, progress_bar=False):
86
+ _, themes = results.auto_theme(
87
+ field=field, context=context, themes=themes, progress_bar=progress_bar
88
+ )
89
+
90
+ themes_query = f"""
91
+ SELECT theme, COUNT(*) AS mentions
92
+ FROM (
93
+ SELECT json_each.value AS theme
94
+ FROM self,
95
+ json_each({ field }_themes)
96
+ )
97
+ GROUP BY theme
98
+ HAVING theme <> 'Other'
99
+ ORDER BY mentions DESC
100
+ """
101
+ themes = results.sql(themes_query, to_list=True)
102
+
103
+ (
104
+ results.filter(f"{field} != ''").ggplot2(
105
+ """ggplot(data = self, aes(x = theme, y = mentions)) +
106
+ geom_bar(stat = "identity") +
107
+ coord_flip() +
108
+ theme_bw()""",
109
+ sql=themes_query,
110
+ factor_orders={"theme": [t[0] for t in themes]},
111
+ )
112
+ )
edsl/tools/summarize.py CHANGED
@@ -1,18 +1,18 @@
1
- from edsl import QuestionList, Scenario, Model
2
-
3
-
4
- def summarize(texts, seed_phrase, n_bullets, n_words, models=None):
5
- if models is None:
6
- models = Model()
7
- s = Scenario(
8
- text=texts, seed_phrase=seed_phrase, n_bullets=n_bullets, n_words=n_words
9
- ).expand("text")
10
- QuestionList(
11
- question_text="""
12
- I have the following TEXT EXAMPLE :
13
- {{ text_example_json }}
14
- Please summarize the main point of this EXAMPLE {{seed_phrase }} into {{ n_bullets }} bullet points, where
15
- each bullet point is a {{ n_words }} word phrase.
16
- """,
17
- question_name="summarize",
18
- ).by(s).by(models).run()
1
+ from edsl import QuestionList, Scenario, Model
2
+
3
+
4
+ def summarize(texts, seed_phrase, n_bullets, n_words, models=None):
5
+ if models is None:
6
+ models = Model()
7
+ s = Scenario(
8
+ text=texts, seed_phrase=seed_phrase, n_bullets=n_bullets, n_words=n_words
9
+ ).expand("text")
10
+ QuestionList(
11
+ question_text="""
12
+ I have the following TEXT EXAMPLE :
13
+ {{ text_example_json }}
14
+ Please summarize the main point of this EXAMPLE {{seed_phrase }} into {{ n_bullets }} bullet points, where
15
+ each bullet point is a {{ n_words }} word phrase.
16
+ """,
17
+ question_name="summarize",
18
+ ).by(s).by(models).run()
@@ -1,28 +1,28 @@
1
- """Module to store system information."""
2
-
3
- from dataclasses import dataclass
4
- import getpass
5
- import platform
6
- import pkg_resources
7
-
8
-
9
- @dataclass
10
- class SystemInfo:
11
- """Dataclass to store system information."""
12
-
13
- username: str
14
- system_info: str
15
- release_info: str
16
- package_name: str
17
- package_version: str
18
-
19
- def __init__(self, package_name: str):
20
- """Initialize the dataclass with system."""
21
- self.username = getpass.getuser()
22
- self.system_info = platform.system()
23
- self.release_info = platform.release()
24
- self.package_name = package_name
25
- try:
26
- self.package_version = pkg_resources.get_distribution(package_name).version
27
- except pkg_resources.DistributionNotFound:
28
- self.package_version = "Not installed"
1
+ """Module to store system information."""
2
+
3
+ from dataclasses import dataclass
4
+ import getpass
5
+ import platform
6
+ import pkg_resources
7
+
8
+
9
+ @dataclass
10
+ class SystemInfo:
11
+ """Dataclass to store system information."""
12
+
13
+ username: str
14
+ system_info: str
15
+ release_info: str
16
+ package_name: str
17
+ package_version: str
18
+
19
+ def __init__(self, package_name: str):
20
+ """Initialize the dataclass with system."""
21
+ self.username = getpass.getuser()
22
+ self.system_info = platform.system()
23
+ self.release_info = platform.release()
24
+ self.package_name = package_name
25
+ try:
26
+ self.package_version = pkg_resources.get_distribution(package_name).version
27
+ except pkg_resources.DistributionNotFound:
28
+ self.package_version = "Not installed"
@@ -1,22 +1,22 @@
1
- # from edsl.utilities.interface import (
2
- # print_dict_as_html_table,
3
- # print_dict_with_rich,
4
- # print_list_of_dicts_as_html_table,
5
- # print_table_with_rich,
6
- # print_public_methods_with_doc,
7
- # print_list_of_dicts_as_markdown_table,
8
- # )
9
-
10
- # from edsl.utilities.utilities import (
11
- # create_valid_var_name,
12
- # dict_to_html,
13
- # hash_value,
14
- # HTMLSnippet,
15
- # is_notebook,
16
- # is_gzipped,
17
- # is_valid_variable_name,
18
- # random_string,
19
- # repair_json,
20
- # shorten_string,
21
- # time_all_functions,
22
- # )
1
+ # from edsl.utilities.interface import (
2
+ # print_dict_as_html_table,
3
+ # print_dict_with_rich,
4
+ # print_list_of_dicts_as_html_table,
5
+ # print_table_with_rich,
6
+ # print_public_methods_with_doc,
7
+ # print_list_of_dicts_as_markdown_table,
8
+ # )
9
+
10
+ # from edsl.utilities.utilities import (
11
+ # create_valid_var_name,
12
+ # dict_to_html,
13
+ # hash_value,
14
+ # HTMLSnippet,
15
+ # is_notebook,
16
+ # is_gzipped,
17
+ # is_valid_variable_name,
18
+ # random_string,
19
+ # repair_json,
20
+ # shorten_string,
21
+ # time_all_functions,
22
+ # )
@@ -1,25 +1,25 @@
1
- """Utilities for working with abstract syntax trees (ASTs)."""
2
-
3
- import ast
4
-
5
-
6
- def extract_variable_names(node):
7
- """Extract variable names from an abstract syntax tree (AST) node."""
8
- if isinstance(node, ast.Name):
9
- return [node.id] # Extract variable name
10
- elif isinstance(node, ast.BinOp):
11
- left_names = extract_variable_names(node.left)
12
- right_names = extract_variable_names(node.right)
13
- return left_names + right_names
14
- elif isinstance(node, ast.UnaryOp):
15
- return extract_variable_names(node.operand)
16
- elif isinstance(node, ast.Call):
17
- names = []
18
- for arg in node.args:
19
- names.extend(extract_variable_names(arg))
20
- return names
21
- else:
22
- names = []
23
- for child in ast.iter_child_nodes(node):
24
- names.extend(extract_variable_names(child))
25
- return names
1
+ """Utilities for working with abstract syntax trees (ASTs)."""
2
+
3
+ import ast
4
+
5
+
6
+ def extract_variable_names(node):
7
+ """Extract variable names from an abstract syntax tree (AST) node."""
8
+ if isinstance(node, ast.Name):
9
+ return [node.id] # Extract variable name
10
+ elif isinstance(node, ast.BinOp):
11
+ left_names = extract_variable_names(node.left)
12
+ right_names = extract_variable_names(node.right)
13
+ return left_names + right_names
14
+ elif isinstance(node, ast.UnaryOp):
15
+ return extract_variable_names(node.operand)
16
+ elif isinstance(node, ast.Call):
17
+ names = []
18
+ for arg in node.args:
19
+ names.extend(extract_variable_names(arg))
20
+ return names
21
+ else:
22
+ names = []
23
+ for child in ast.iter_child_nodes(node):
24
+ names.extend(extract_variable_names(child))
25
+ return names
@@ -1,6 +1,6 @@
1
- """This file contains the path to a results file."""
2
-
3
- import os
4
- from edsl import BASE_DIR
5
-
6
- SCOOTER_RESULTS_PATH = os.path.join(BASE_DIR, "utilities/data/scooter_results.json")
1
+ """This file contains the path to a results file."""
2
+
3
+ import os
4
+ from edsl import BASE_DIR
5
+
6
+ SCOOTER_RESULTS_PATH = os.path.join(BASE_DIR, "utilities/data/scooter_results.json")
@@ -1 +1 @@
1
- from edsl.utilities.data.Registry import SCOOTER_RESULTS_PATH
1
+ from edsl.utilities.data.Registry import SCOOTER_RESULTS_PATH