edsl 0.1.38.dev3__py3-none-any.whl → 0.1.38.dev4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (256) hide show
  1. edsl/Base.py +332 -303
  2. edsl/BaseDiff.py +260 -260
  3. edsl/TemplateLoader.py +24 -24
  4. edsl/__init__.py +49 -49
  5. edsl/__version__.py +1 -1
  6. edsl/agents/Agent.py +867 -858
  7. edsl/agents/AgentList.py +413 -362
  8. edsl/agents/Invigilator.py +233 -222
  9. edsl/agents/InvigilatorBase.py +265 -284
  10. edsl/agents/PromptConstructor.py +354 -353
  11. edsl/agents/__init__.py +3 -3
  12. edsl/agents/descriptors.py +99 -99
  13. edsl/agents/prompt_helpers.py +129 -129
  14. edsl/auto/AutoStudy.py +117 -117
  15. edsl/auto/StageBase.py +230 -230
  16. edsl/auto/StageGenerateSurvey.py +178 -178
  17. edsl/auto/StageLabelQuestions.py +125 -125
  18. edsl/auto/StagePersona.py +61 -61
  19. edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
  20. edsl/auto/StagePersonaDimensionValues.py +74 -74
  21. edsl/auto/StagePersonaDimensions.py +69 -69
  22. edsl/auto/StageQuestions.py +73 -73
  23. edsl/auto/SurveyCreatorPipeline.py +21 -21
  24. edsl/auto/utilities.py +224 -224
  25. edsl/base/Base.py +279 -279
  26. edsl/config.py +157 -149
  27. edsl/conversation/Conversation.py +290 -290
  28. edsl/conversation/car_buying.py +58 -58
  29. edsl/conversation/chips.py +95 -95
  30. edsl/conversation/mug_negotiation.py +81 -81
  31. edsl/conversation/next_speaker_utilities.py +93 -93
  32. edsl/coop/PriceFetcher.py +54 -54
  33. edsl/coop/__init__.py +2 -2
  34. edsl/coop/coop.py +1028 -961
  35. edsl/coop/utils.py +131 -131
  36. edsl/data/Cache.py +555 -530
  37. edsl/data/CacheEntry.py +233 -228
  38. edsl/data/CacheHandler.py +149 -149
  39. edsl/data/RemoteCacheSync.py +78 -97
  40. edsl/data/SQLiteDict.py +292 -292
  41. edsl/data/__init__.py +4 -4
  42. edsl/data/orm.py +10 -10
  43. edsl/data_transfer_models.py +73 -73
  44. edsl/enums.py +175 -173
  45. edsl/exceptions/BaseException.py +21 -21
  46. edsl/exceptions/__init__.py +54 -54
  47. edsl/exceptions/agents.py +42 -42
  48. edsl/exceptions/cache.py +5 -5
  49. edsl/exceptions/configuration.py +16 -16
  50. edsl/exceptions/coop.py +10 -10
  51. edsl/exceptions/data.py +14 -14
  52. edsl/exceptions/general.py +34 -34
  53. edsl/exceptions/jobs.py +33 -33
  54. edsl/exceptions/language_models.py +63 -63
  55. edsl/exceptions/prompts.py +15 -15
  56. edsl/exceptions/questions.py +91 -91
  57. edsl/exceptions/results.py +29 -29
  58. edsl/exceptions/scenarios.py +22 -22
  59. edsl/exceptions/surveys.py +37 -37
  60. edsl/inference_services/AnthropicService.py +87 -87
  61. edsl/inference_services/AwsBedrock.py +120 -120
  62. edsl/inference_services/AzureAI.py +217 -217
  63. edsl/inference_services/DeepInfraService.py +18 -18
  64. edsl/inference_services/GoogleService.py +148 -156
  65. edsl/inference_services/GroqService.py +20 -20
  66. edsl/inference_services/InferenceServiceABC.py +147 -147
  67. edsl/inference_services/InferenceServicesCollection.py +97 -97
  68. edsl/inference_services/MistralAIService.py +123 -123
  69. edsl/inference_services/OllamaService.py +18 -18
  70. edsl/inference_services/OpenAIService.py +224 -224
  71. edsl/inference_services/PerplexityService.py +163 -0
  72. edsl/inference_services/TestService.py +89 -89
  73. edsl/inference_services/TogetherAIService.py +170 -170
  74. edsl/inference_services/models_available_cache.py +118 -118
  75. edsl/inference_services/rate_limits_cache.py +25 -25
  76. edsl/inference_services/registry.py +41 -39
  77. edsl/inference_services/write_available.py +10 -10
  78. edsl/jobs/Answers.py +56 -56
  79. edsl/jobs/Jobs.py +898 -1358
  80. edsl/jobs/JobsChecks.py +147 -0
  81. edsl/jobs/JobsPrompts.py +268 -0
  82. edsl/jobs/JobsRemoteInferenceHandler.py +239 -0
  83. edsl/jobs/__init__.py +1 -1
  84. edsl/jobs/buckets/BucketCollection.py +63 -63
  85. edsl/jobs/buckets/ModelBuckets.py +65 -65
  86. edsl/jobs/buckets/TokenBucket.py +251 -251
  87. edsl/jobs/interviews/Interview.py +661 -661
  88. edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
  89. edsl/jobs/interviews/InterviewExceptionEntry.py +186 -186
  90. edsl/jobs/interviews/InterviewStatistic.py +63 -63
  91. edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
  92. edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
  93. edsl/jobs/interviews/InterviewStatusLog.py +92 -92
  94. edsl/jobs/interviews/ReportErrors.py +66 -66
  95. edsl/jobs/interviews/interview_status_enum.py +9 -9
  96. edsl/jobs/runners/JobsRunnerAsyncio.py +466 -361
  97. edsl/jobs/runners/JobsRunnerStatus.py +330 -332
  98. edsl/jobs/tasks/QuestionTaskCreator.py +242 -242
  99. edsl/jobs/tasks/TaskCreators.py +64 -64
  100. edsl/jobs/tasks/TaskHistory.py +450 -451
  101. edsl/jobs/tasks/TaskStatusLog.py +23 -23
  102. edsl/jobs/tasks/task_status_enum.py +163 -163
  103. edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
  104. edsl/jobs/tokens/TokenUsage.py +34 -34
  105. edsl/language_models/KeyLookup.py +30 -30
  106. edsl/language_models/LanguageModel.py +668 -708
  107. edsl/language_models/ModelList.py +155 -109
  108. edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
  109. edsl/language_models/__init__.py +3 -3
  110. edsl/language_models/fake_openai_call.py +15 -15
  111. edsl/language_models/fake_openai_service.py +61 -61
  112. edsl/language_models/registry.py +190 -137
  113. edsl/language_models/repair.py +156 -156
  114. edsl/language_models/unused/ReplicateBase.py +83 -83
  115. edsl/language_models/utilities.py +64 -64
  116. edsl/notebooks/Notebook.py +258 -258
  117. edsl/notebooks/__init__.py +1 -1
  118. edsl/prompts/Prompt.py +362 -357
  119. edsl/prompts/__init__.py +2 -2
  120. edsl/questions/AnswerValidatorMixin.py +289 -289
  121. edsl/questions/QuestionBase.py +664 -660
  122. edsl/questions/QuestionBaseGenMixin.py +161 -161
  123. edsl/questions/QuestionBasePromptsMixin.py +217 -217
  124. edsl/questions/QuestionBudget.py +227 -227
  125. edsl/questions/QuestionCheckBox.py +359 -359
  126. edsl/questions/QuestionExtract.py +182 -183
  127. edsl/questions/QuestionFreeText.py +114 -114
  128. edsl/questions/QuestionFunctional.py +166 -166
  129. edsl/questions/QuestionList.py +231 -231
  130. edsl/questions/QuestionMultipleChoice.py +286 -286
  131. edsl/questions/QuestionNumerical.py +153 -153
  132. edsl/questions/QuestionRank.py +324 -324
  133. edsl/questions/Quick.py +41 -41
  134. edsl/questions/RegisterQuestionsMeta.py +71 -71
  135. edsl/questions/ResponseValidatorABC.py +174 -174
  136. edsl/questions/SimpleAskMixin.py +73 -73
  137. edsl/questions/__init__.py +26 -26
  138. edsl/questions/compose_questions.py +98 -98
  139. edsl/questions/decorators.py +21 -21
  140. edsl/questions/derived/QuestionLikertFive.py +76 -76
  141. edsl/questions/derived/QuestionLinearScale.py +87 -87
  142. edsl/questions/derived/QuestionTopK.py +93 -93
  143. edsl/questions/derived/QuestionYesNo.py +82 -82
  144. edsl/questions/descriptors.py +413 -413
  145. edsl/questions/prompt_templates/question_budget.jinja +13 -13
  146. edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
  147. edsl/questions/prompt_templates/question_extract.jinja +11 -11
  148. edsl/questions/prompt_templates/question_free_text.jinja +3 -3
  149. edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
  150. edsl/questions/prompt_templates/question_list.jinja +17 -17
  151. edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
  152. edsl/questions/prompt_templates/question_numerical.jinja +36 -36
  153. edsl/questions/question_registry.py +177 -147
  154. edsl/questions/settings.py +12 -12
  155. edsl/questions/templates/budget/answering_instructions.jinja +7 -7
  156. edsl/questions/templates/budget/question_presentation.jinja +7 -7
  157. edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
  158. edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
  159. edsl/questions/templates/extract/answering_instructions.jinja +7 -7
  160. edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
  161. edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
  162. edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
  163. edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
  164. edsl/questions/templates/list/answering_instructions.jinja +3 -3
  165. edsl/questions/templates/list/question_presentation.jinja +5 -5
  166. edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
  167. edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
  168. edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
  169. edsl/questions/templates/numerical/question_presentation.jinja +6 -6
  170. edsl/questions/templates/rank/answering_instructions.jinja +11 -11
  171. edsl/questions/templates/rank/question_presentation.jinja +15 -15
  172. edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
  173. edsl/questions/templates/top_k/question_presentation.jinja +22 -22
  174. edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
  175. edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
  176. edsl/results/CSSParameterizer.py +108 -0
  177. edsl/results/Dataset.py +424 -293
  178. edsl/results/DatasetExportMixin.py +731 -717
  179. edsl/results/DatasetTree.py +275 -145
  180. edsl/results/Result.py +465 -456
  181. edsl/results/Results.py +1165 -1071
  182. edsl/results/ResultsDBMixin.py +238 -238
  183. edsl/results/ResultsExportMixin.py +43 -43
  184. edsl/results/ResultsFetchMixin.py +33 -33
  185. edsl/results/ResultsGGMixin.py +121 -121
  186. edsl/results/ResultsToolsMixin.py +98 -98
  187. edsl/results/Selector.py +135 -135
  188. edsl/results/TableDisplay.py +198 -0
  189. edsl/results/__init__.py +2 -2
  190. edsl/results/table_display.css +78 -0
  191. edsl/results/tree_explore.py +115 -115
  192. edsl/scenarios/FileStore.py +632 -458
  193. edsl/scenarios/Scenario.py +601 -544
  194. edsl/scenarios/ScenarioHtmlMixin.py +64 -64
  195. edsl/scenarios/ScenarioJoin.py +127 -0
  196. edsl/scenarios/ScenarioList.py +1287 -1112
  197. edsl/scenarios/ScenarioListExportMixin.py +52 -52
  198. edsl/scenarios/ScenarioListPdfMixin.py +261 -261
  199. edsl/scenarios/__init__.py +4 -4
  200. edsl/shared.py +1 -1
  201. edsl/study/ObjectEntry.py +173 -173
  202. edsl/study/ProofOfWork.py +113 -113
  203. edsl/study/SnapShot.py +80 -80
  204. edsl/study/Study.py +528 -528
  205. edsl/study/__init__.py +4 -4
  206. edsl/surveys/DAG.py +148 -148
  207. edsl/surveys/Memory.py +31 -31
  208. edsl/surveys/MemoryPlan.py +244 -244
  209. edsl/surveys/Rule.py +326 -326
  210. edsl/surveys/RuleCollection.py +387 -387
  211. edsl/surveys/Survey.py +1801 -1787
  212. edsl/surveys/SurveyCSS.py +261 -261
  213. edsl/surveys/SurveyExportMixin.py +259 -259
  214. edsl/surveys/SurveyFlowVisualizationMixin.py +179 -121
  215. edsl/surveys/SurveyQualtricsImport.py +284 -284
  216. edsl/surveys/__init__.py +3 -3
  217. edsl/surveys/base.py +53 -53
  218. edsl/surveys/descriptors.py +56 -56
  219. edsl/surveys/instructions/ChangeInstruction.py +49 -49
  220. edsl/surveys/instructions/Instruction.py +65 -53
  221. edsl/surveys/instructions/InstructionCollection.py +77 -77
  222. edsl/templates/error_reporting/base.html +23 -23
  223. edsl/templates/error_reporting/exceptions_by_model.html +34 -34
  224. edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
  225. edsl/templates/error_reporting/exceptions_by_type.html +16 -16
  226. edsl/templates/error_reporting/interview_details.html +115 -115
  227. edsl/templates/error_reporting/interviews.html +19 -10
  228. edsl/templates/error_reporting/overview.html +4 -4
  229. edsl/templates/error_reporting/performance_plot.html +1 -1
  230. edsl/templates/error_reporting/report.css +73 -73
  231. edsl/templates/error_reporting/report.html +117 -117
  232. edsl/templates/error_reporting/report.js +25 -25
  233. edsl/tools/__init__.py +1 -1
  234. edsl/tools/clusters.py +192 -192
  235. edsl/tools/embeddings.py +27 -27
  236. edsl/tools/embeddings_plotting.py +118 -118
  237. edsl/tools/plotting.py +112 -112
  238. edsl/tools/summarize.py +18 -18
  239. edsl/utilities/SystemInfo.py +28 -28
  240. edsl/utilities/__init__.py +22 -22
  241. edsl/utilities/ast_utilities.py +25 -25
  242. edsl/utilities/data/Registry.py +6 -6
  243. edsl/utilities/data/__init__.py +1 -1
  244. edsl/utilities/data/scooter_results.json +1 -1
  245. edsl/utilities/decorators.py +77 -77
  246. edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
  247. edsl/utilities/interface.py +627 -627
  248. edsl/utilities/naming_utilities.py +263 -263
  249. edsl/utilities/repair_functions.py +28 -28
  250. edsl/utilities/restricted_python.py +70 -70
  251. edsl/utilities/utilities.py +424 -409
  252. {edsl-0.1.38.dev3.dist-info → edsl-0.1.38.dev4.dist-info}/LICENSE +21 -21
  253. {edsl-0.1.38.dev3.dist-info → edsl-0.1.38.dev4.dist-info}/METADATA +2 -1
  254. edsl-0.1.38.dev4.dist-info/RECORD +277 -0
  255. edsl-0.1.38.dev3.dist-info/RECORD +0 -269
  256. {edsl-0.1.38.dev3.dist-info → edsl-0.1.38.dev4.dist-info}/WHEEL +0 -0
@@ -1,258 +1,258 @@
1
- """A Notebook is a utility class that allows you to easily share/pull ipynbs from Coop."""
2
-
3
- from __future__ import annotations
4
- import json
5
- from typing import Dict, List, Optional, Union
6
- from uuid import uuid4
7
- from edsl.Base import Base
8
- from edsl.utilities.decorators import add_edsl_version, remove_edsl_version
9
-
10
-
11
- class Notebook(Base):
12
- """
13
- A Notebook is a utility class that allows you to easily share/pull ipynbs from Coop.
14
- """
15
-
16
- default_name = "notebook"
17
-
18
- def __init__(
19
- self,
20
- data: Optional[Dict] = None,
21
- path: Optional[str] = None,
22
- name: Optional[str] = None,
23
- ):
24
- """
25
- Initialize a new Notebook.
26
-
27
- :param data: A dictionary representing the notebook data.
28
- This dictionary must conform to the official Jupyter Notebook format, as defined by nbformat.
29
- :param path: A filepath from which to load the notebook.
30
- If no path is provided, assume this code is run in a notebook and try to load the current notebook from file.
31
- :param name: A name for the Notebook.
32
- """
33
- import nbformat
34
-
35
- # Load current notebook path as fallback (VS Code only)
36
- path = path or globals().get("__vsc_ipynb_file__")
37
- if data is not None:
38
- nbformat.validate(data)
39
- self.data = data
40
- elif path is not None:
41
- with open(path, mode="r", encoding="utf-8") as f:
42
- data = nbformat.read(f, as_version=4)
43
- self.data = json.loads(json.dumps(data))
44
- else:
45
- # TODO: Support for IDEs other than VSCode
46
- raise NotImplementedError(
47
- "Cannot create a notebook from within itself in this development environment"
48
- )
49
-
50
- # TODO: perhaps add sanity check function
51
- # 1. could check if the notebook is a valid notebook
52
- # 2. could check notebook uses EDSL
53
- # ....
54
-
55
- self.name = name or self.default_name
56
-
57
- @classmethod
58
- def from_script(cls, path: str, name: Optional[str] = None) -> "Notebook":
59
- import nbformat
60
-
61
- # Read the script file
62
- with open(path, "r") as script_file:
63
- script_content = script_file.read()
64
-
65
- # Create a new Jupyter notebook
66
- nb = nbformat.v4.new_notebook()
67
-
68
- # Add the script content to the first cell
69
- first_cell = nbformat.v4.new_code_cell(script_content)
70
- nb.cells.append(first_cell)
71
-
72
- # Create a Notebook instance with the notebook data
73
- notebook_instance = cls(nb)
74
-
75
- return notebook_instance
76
-
77
- @classmethod
78
- def from_current_script(cls) -> "Notebook":
79
- import inspect
80
- import os
81
-
82
- # Get the path to the current file
83
- current_frame = inspect.currentframe()
84
- caller_frame = inspect.getouterframes(current_frame, 2)
85
- current_file_path = os.path.abspath(caller_frame[1].filename)
86
-
87
- # Use from_script to create the notebook
88
- return cls.from_script(current_file_path)
89
-
90
- def __eq__(self, other):
91
- """
92
- Check if two Notebooks are equal.
93
- This only checks the notebook data.
94
- """
95
- return self.data == other.data
96
-
97
- def __hash__(self) -> int:
98
- """
99
- Allow the model to be used as a key in a dictionary.
100
- """
101
- from edsl.utilities.utilities import dict_hash
102
-
103
- return dict_hash(self.data["cells"])
104
-
105
- def to_dict(self, add_edsl_version=False) -> dict:
106
- """
107
- Serialize to a dictionary.
108
- """
109
- d = {"name": self.name, "data": self.data}
110
- if add_edsl_version:
111
- from edsl import __version__
112
-
113
- d["edsl_version"] = __version__
114
- d["edsl_class_name"] = self.__class__.__name__
115
- return d
116
-
117
- @classmethod
118
- @remove_edsl_version
119
- def from_dict(cls, d: Dict) -> "Notebook":
120
- """
121
- Convert a dictionary representation of a Notebook to a Notebook object.
122
- """
123
- return cls(data=d["data"], name=d["name"])
124
-
125
- def to_file(self, path: str):
126
- """
127
- Save the notebook at the specified filepath.
128
- """
129
- import nbformat
130
-
131
- nbformat.write(nbformat.from_dict(self.data), fp=path)
132
-
133
- def print(self):
134
- """
135
- Print the notebook.
136
- """
137
- from rich import print_json
138
- import json
139
-
140
- print_json(json.dumps(self.to_dict()))
141
-
142
- def __repr__(self):
143
- """
144
- Return representation of Notebook.
145
- """
146
- return f'Notebook(data={self.data}, name="""{self.name}""")'
147
-
148
- def _repr_html_(self):
149
- """
150
- Return HTML representation of Notebook.
151
- """
152
- from nbconvert import HTMLExporter
153
- import nbformat
154
-
155
- notebook = nbformat.from_dict(self.data)
156
- html_exporter = HTMLExporter(template_name="basic")
157
- (body, _) = html_exporter.from_notebook_node(notebook)
158
- return body
159
-
160
- def _table(self) -> tuple[dict, list]:
161
- """
162
- Prepare generic table data.
163
- """
164
- table_data = []
165
-
166
- notebook_preview = ""
167
- for cell in self.data["cells"]:
168
- if "source" in cell:
169
- notebook_preview += f"{cell['source']}\n"
170
- if len(notebook_preview) > 1000:
171
- notebook_preview = f"{notebook_preview[:1000]} [...]"
172
- break
173
- notebook_preview = notebook_preview.rstrip()
174
-
175
- table_data.append(
176
- {
177
- "Attribute": "name",
178
- "Value": repr(self.name),
179
- }
180
- )
181
- table_data.append(
182
- {
183
- "Attribute": "notebook_preview",
184
- "Value": notebook_preview,
185
- }
186
- )
187
-
188
- column_names = ["Attribute", "Value"]
189
- return table_data, column_names
190
-
191
- def rich_print(self) -> "Table":
192
- """
193
- Display a Notebook as a rich table.
194
- """
195
- from rich.table import Table
196
-
197
- table_data, column_names = self._table()
198
- table = Table(title=f"{self.__class__.__name__} Attributes")
199
- for column in column_names:
200
- table.add_column(column, style="bold")
201
-
202
- for row in table_data:
203
- row_data = [row[column] for column in column_names]
204
- table.add_row(*row_data)
205
-
206
- return table
207
-
208
- @classmethod
209
- def example(cls, randomize: bool = False) -> Notebook:
210
- """
211
- Returns an example Notebook instance.
212
-
213
- :param randomize: If True, adds a random string one of the cells' output.
214
- """
215
- addition = "" if not randomize else str(uuid4())
216
- cells = [
217
- {
218
- "cell_type": "markdown",
219
- "metadata": dict(),
220
- "source": "# Test notebook",
221
- },
222
- {
223
- "cell_type": "code",
224
- "execution_count": 1,
225
- "metadata": dict(),
226
- "outputs": [
227
- {
228
- "name": "stdout",
229
- "output_type": "stream",
230
- "text": f"Hello world!\n{addition}",
231
- }
232
- ],
233
- "source": 'print("Hello world!")',
234
- },
235
- ]
236
- data = {
237
- "metadata": dict(),
238
- "nbformat": 4,
239
- "nbformat_minor": 4,
240
- "cells": cells,
241
- }
242
- return cls(data=data)
243
-
244
- def code(self) -> List[str]:
245
- """
246
- Return the code that could be used to create this Notebook.
247
- """
248
- lines = []
249
- lines.append("from edsl import Notebook")
250
- lines.append(f'nb = Notebook(data={self.data}, name="""{self.name}""")')
251
- return lines
252
-
253
-
254
- if __name__ == "__main__":
255
- from edsl import Notebook
256
-
257
- notebook = Notebook.example()
258
- assert notebook == notebook.from_dict(notebook.to_dict())
1
+ """A Notebook is a utility class that allows you to easily share/pull ipynbs from Coop."""
2
+
3
+ from __future__ import annotations
4
+ import json
5
+ from typing import Dict, List, Optional, Union
6
+ from uuid import uuid4
7
+ from edsl.Base import Base
8
+ from edsl.utilities.decorators import add_edsl_version, remove_edsl_version
9
+
10
+
11
+ class Notebook(Base):
12
+ """
13
+ A Notebook is a utility class that allows you to easily share/pull ipynbs from Coop.
14
+ """
15
+
16
+ default_name = "notebook"
17
+
18
+ def __init__(
19
+ self,
20
+ data: Optional[Dict] = None,
21
+ path: Optional[str] = None,
22
+ name: Optional[str] = None,
23
+ ):
24
+ """
25
+ Initialize a new Notebook.
26
+
27
+ :param data: A dictionary representing the notebook data.
28
+ This dictionary must conform to the official Jupyter Notebook format, as defined by nbformat.
29
+ :param path: A filepath from which to load the notebook.
30
+ If no path is provided, assume this code is run in a notebook and try to load the current notebook from file.
31
+ :param name: A name for the Notebook.
32
+ """
33
+ import nbformat
34
+
35
+ # Load current notebook path as fallback (VS Code only)
36
+ path = path or globals().get("__vsc_ipynb_file__")
37
+ if data is not None:
38
+ nbformat.validate(data)
39
+ self.data = data
40
+ elif path is not None:
41
+ with open(path, mode="r", encoding="utf-8") as f:
42
+ data = nbformat.read(f, as_version=4)
43
+ self.data = json.loads(json.dumps(data))
44
+ else:
45
+ # TODO: Support for IDEs other than VSCode
46
+ raise NotImplementedError(
47
+ "Cannot create a notebook from within itself in this development environment"
48
+ )
49
+
50
+ # TODO: perhaps add sanity check function
51
+ # 1. could check if the notebook is a valid notebook
52
+ # 2. could check notebook uses EDSL
53
+ # ....
54
+
55
+ self.name = name or self.default_name
56
+
57
+ @classmethod
58
+ def from_script(cls, path: str, name: Optional[str] = None) -> "Notebook":
59
+ import nbformat
60
+
61
+ # Read the script file
62
+ with open(path, "r") as script_file:
63
+ script_content = script_file.read()
64
+
65
+ # Create a new Jupyter notebook
66
+ nb = nbformat.v4.new_notebook()
67
+
68
+ # Add the script content to the first cell
69
+ first_cell = nbformat.v4.new_code_cell(script_content)
70
+ nb.cells.append(first_cell)
71
+
72
+ # Create a Notebook instance with the notebook data
73
+ notebook_instance = cls(nb)
74
+
75
+ return notebook_instance
76
+
77
+ @classmethod
78
+ def from_current_script(cls) -> "Notebook":
79
+ import inspect
80
+ import os
81
+
82
+ # Get the path to the current file
83
+ current_frame = inspect.currentframe()
84
+ caller_frame = inspect.getouterframes(current_frame, 2)
85
+ current_file_path = os.path.abspath(caller_frame[1].filename)
86
+
87
+ # Use from_script to create the notebook
88
+ return cls.from_script(current_file_path)
89
+
90
+ def __eq__(self, other):
91
+ """
92
+ Check if two Notebooks are equal.
93
+ This only checks the notebook data.
94
+ """
95
+ return self.data == other.data
96
+
97
+ def __hash__(self) -> int:
98
+ """
99
+ Allow the model to be used as a key in a dictionary.
100
+ """
101
+ from edsl.utilities.utilities import dict_hash
102
+
103
+ return dict_hash(self.data["cells"])
104
+
105
+ def to_dict(self, add_edsl_version=False) -> dict:
106
+ """
107
+ Serialize to a dictionary.
108
+ """
109
+ d = {"name": self.name, "data": self.data}
110
+ if add_edsl_version:
111
+ from edsl import __version__
112
+
113
+ d["edsl_version"] = __version__
114
+ d["edsl_class_name"] = self.__class__.__name__
115
+ return d
116
+
117
+ @classmethod
118
+ @remove_edsl_version
119
+ def from_dict(cls, d: Dict) -> "Notebook":
120
+ """
121
+ Convert a dictionary representation of a Notebook to a Notebook object.
122
+ """
123
+ return cls(data=d["data"], name=d["name"])
124
+
125
+ def to_file(self, path: str):
126
+ """
127
+ Save the notebook at the specified filepath.
128
+ """
129
+ import nbformat
130
+
131
+ nbformat.write(nbformat.from_dict(self.data), fp=path)
132
+
133
+ def print(self):
134
+ """
135
+ Print the notebook.
136
+ """
137
+ from rich import print_json
138
+ import json
139
+
140
+ print_json(json.dumps(self.to_dict()))
141
+
142
+ def __repr__(self):
143
+ """
144
+ Return representation of Notebook.
145
+ """
146
+ return f'Notebook(data={self.data}, name="""{self.name}""")'
147
+
148
+ def _repr_html_(self):
149
+ """
150
+ Return HTML representation of Notebook.
151
+ """
152
+ from nbconvert import HTMLExporter
153
+ import nbformat
154
+
155
+ notebook = nbformat.from_dict(self.data)
156
+ html_exporter = HTMLExporter(template_name="basic")
157
+ (body, _) = html_exporter.from_notebook_node(notebook)
158
+ return body
159
+
160
+ def _table(self) -> tuple[dict, list]:
161
+ """
162
+ Prepare generic table data.
163
+ """
164
+ table_data = []
165
+
166
+ notebook_preview = ""
167
+ for cell in self.data["cells"]:
168
+ if "source" in cell:
169
+ notebook_preview += f"{cell['source']}\n"
170
+ if len(notebook_preview) > 1000:
171
+ notebook_preview = f"{notebook_preview[:1000]} [...]"
172
+ break
173
+ notebook_preview = notebook_preview.rstrip()
174
+
175
+ table_data.append(
176
+ {
177
+ "Attribute": "name",
178
+ "Value": repr(self.name),
179
+ }
180
+ )
181
+ table_data.append(
182
+ {
183
+ "Attribute": "notebook_preview",
184
+ "Value": notebook_preview,
185
+ }
186
+ )
187
+
188
+ column_names = ["Attribute", "Value"]
189
+ return table_data, column_names
190
+
191
+ def rich_print(self) -> "Table":
192
+ """
193
+ Display a Notebook as a rich table.
194
+ """
195
+ from rich.table import Table
196
+
197
+ table_data, column_names = self._table()
198
+ table = Table(title=f"{self.__class__.__name__} Attributes")
199
+ for column in column_names:
200
+ table.add_column(column, style="bold")
201
+
202
+ for row in table_data:
203
+ row_data = [row[column] for column in column_names]
204
+ table.add_row(*row_data)
205
+
206
+ return table
207
+
208
+ @classmethod
209
+ def example(cls, randomize: bool = False) -> Notebook:
210
+ """
211
+ Returns an example Notebook instance.
212
+
213
+ :param randomize: If True, adds a random string one of the cells' output.
214
+ """
215
+ addition = "" if not randomize else str(uuid4())
216
+ cells = [
217
+ {
218
+ "cell_type": "markdown",
219
+ "metadata": dict(),
220
+ "source": "# Test notebook",
221
+ },
222
+ {
223
+ "cell_type": "code",
224
+ "execution_count": 1,
225
+ "metadata": dict(),
226
+ "outputs": [
227
+ {
228
+ "name": "stdout",
229
+ "output_type": "stream",
230
+ "text": f"Hello world!\n{addition}",
231
+ }
232
+ ],
233
+ "source": 'print("Hello world!")',
234
+ },
235
+ ]
236
+ data = {
237
+ "metadata": dict(),
238
+ "nbformat": 4,
239
+ "nbformat_minor": 4,
240
+ "cells": cells,
241
+ }
242
+ return cls(data=data)
243
+
244
+ def code(self) -> List[str]:
245
+ """
246
+ Return the code that could be used to create this Notebook.
247
+ """
248
+ lines = []
249
+ lines.append("from edsl import Notebook")
250
+ lines.append(f'nb = Notebook(data={self.data}, name="""{self.name}""")')
251
+ return lines
252
+
253
+
254
+ if __name__ == "__main__":
255
+ from edsl import Notebook
256
+
257
+ notebook = Notebook.example()
258
+ assert notebook == notebook.from_dict(notebook.to_dict())
@@ -1 +1 @@
1
- from edsl.notebooks.Notebook import Notebook
1
+ from edsl.notebooks.Notebook import Notebook