edsl 0.1.39.dev3__py3-none-any.whl → 0.1.39.dev4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (344) hide show
  1. edsl/Base.py +413 -332
  2. edsl/BaseDiff.py +260 -260
  3. edsl/TemplateLoader.py +24 -24
  4. edsl/__init__.py +57 -49
  5. edsl/__version__.py +1 -1
  6. edsl/agents/Agent.py +1071 -867
  7. edsl/agents/AgentList.py +551 -413
  8. edsl/agents/Invigilator.py +284 -233
  9. edsl/agents/InvigilatorBase.py +257 -270
  10. edsl/agents/PromptConstructor.py +272 -354
  11. edsl/agents/QuestionInstructionPromptBuilder.py +128 -0
  12. edsl/agents/QuestionTemplateReplacementsBuilder.py +137 -0
  13. edsl/agents/__init__.py +2 -3
  14. edsl/agents/descriptors.py +99 -99
  15. edsl/agents/prompt_helpers.py +129 -129
  16. edsl/agents/question_option_processor.py +172 -0
  17. edsl/auto/AutoStudy.py +130 -117
  18. edsl/auto/StageBase.py +243 -230
  19. edsl/auto/StageGenerateSurvey.py +178 -178
  20. edsl/auto/StageLabelQuestions.py +125 -125
  21. edsl/auto/StagePersona.py +61 -61
  22. edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
  23. edsl/auto/StagePersonaDimensionValues.py +74 -74
  24. edsl/auto/StagePersonaDimensions.py +69 -69
  25. edsl/auto/StageQuestions.py +74 -73
  26. edsl/auto/SurveyCreatorPipeline.py +21 -21
  27. edsl/auto/utilities.py +218 -224
  28. edsl/base/Base.py +279 -279
  29. edsl/config.py +177 -157
  30. edsl/conversation/Conversation.py +290 -290
  31. edsl/conversation/car_buying.py +59 -58
  32. edsl/conversation/chips.py +95 -95
  33. edsl/conversation/mug_negotiation.py +81 -81
  34. edsl/conversation/next_speaker_utilities.py +93 -93
  35. edsl/coop/CoopFunctionsMixin.py +15 -0
  36. edsl/coop/ExpectedParrotKeyHandler.py +125 -0
  37. edsl/coop/PriceFetcher.py +54 -54
  38. edsl/coop/__init__.py +2 -2
  39. edsl/coop/coop.py +1106 -1028
  40. edsl/coop/utils.py +131 -131
  41. edsl/data/Cache.py +573 -555
  42. edsl/data/CacheEntry.py +230 -233
  43. edsl/data/CacheHandler.py +168 -149
  44. edsl/data/RemoteCacheSync.py +186 -78
  45. edsl/data/SQLiteDict.py +292 -292
  46. edsl/data/__init__.py +5 -4
  47. edsl/data/hack.py +10 -0
  48. edsl/data/orm.py +10 -10
  49. edsl/data_transfer_models.py +74 -73
  50. edsl/enums.py +202 -175
  51. edsl/exceptions/BaseException.py +21 -21
  52. edsl/exceptions/__init__.py +54 -54
  53. edsl/exceptions/agents.py +54 -42
  54. edsl/exceptions/cache.py +5 -5
  55. edsl/exceptions/configuration.py +16 -16
  56. edsl/exceptions/coop.py +10 -10
  57. edsl/exceptions/data.py +14 -14
  58. edsl/exceptions/general.py +34 -34
  59. edsl/exceptions/inference_services.py +5 -0
  60. edsl/exceptions/jobs.py +33 -33
  61. edsl/exceptions/language_models.py +63 -63
  62. edsl/exceptions/prompts.py +15 -15
  63. edsl/exceptions/questions.py +109 -91
  64. edsl/exceptions/results.py +29 -29
  65. edsl/exceptions/scenarios.py +29 -22
  66. edsl/exceptions/surveys.py +37 -37
  67. edsl/inference_services/AnthropicService.py +106 -87
  68. edsl/inference_services/AvailableModelCacheHandler.py +184 -0
  69. edsl/inference_services/AvailableModelFetcher.py +215 -0
  70. edsl/inference_services/AwsBedrock.py +118 -120
  71. edsl/inference_services/AzureAI.py +215 -217
  72. edsl/inference_services/DeepInfraService.py +18 -18
  73. edsl/inference_services/GoogleService.py +143 -148
  74. edsl/inference_services/GroqService.py +20 -20
  75. edsl/inference_services/InferenceServiceABC.py +80 -147
  76. edsl/inference_services/InferenceServicesCollection.py +138 -97
  77. edsl/inference_services/MistralAIService.py +120 -123
  78. edsl/inference_services/OllamaService.py +18 -18
  79. edsl/inference_services/OpenAIService.py +236 -224
  80. edsl/inference_services/PerplexityService.py +160 -163
  81. edsl/inference_services/ServiceAvailability.py +135 -0
  82. edsl/inference_services/TestService.py +90 -89
  83. edsl/inference_services/TogetherAIService.py +172 -170
  84. edsl/inference_services/data_structures.py +134 -0
  85. edsl/inference_services/models_available_cache.py +118 -118
  86. edsl/inference_services/rate_limits_cache.py +25 -25
  87. edsl/inference_services/registry.py +41 -41
  88. edsl/inference_services/write_available.py +10 -10
  89. edsl/jobs/AnswerQuestionFunctionConstructor.py +223 -0
  90. edsl/jobs/Answers.py +43 -56
  91. edsl/jobs/FetchInvigilator.py +47 -0
  92. edsl/jobs/InterviewTaskManager.py +98 -0
  93. edsl/jobs/InterviewsConstructor.py +50 -0
  94. edsl/jobs/Jobs.py +823 -898
  95. edsl/jobs/JobsChecks.py +172 -147
  96. edsl/jobs/JobsComponentConstructor.py +189 -0
  97. edsl/jobs/JobsPrompts.py +270 -268
  98. edsl/jobs/JobsRemoteInferenceHandler.py +311 -239
  99. edsl/jobs/JobsRemoteInferenceLogger.py +239 -0
  100. edsl/jobs/RequestTokenEstimator.py +30 -0
  101. edsl/jobs/__init__.py +1 -1
  102. edsl/jobs/async_interview_runner.py +138 -0
  103. edsl/jobs/buckets/BucketCollection.py +104 -63
  104. edsl/jobs/buckets/ModelBuckets.py +65 -65
  105. edsl/jobs/buckets/TokenBucket.py +283 -251
  106. edsl/jobs/buckets/TokenBucketAPI.py +211 -0
  107. edsl/jobs/buckets/TokenBucketClient.py +191 -0
  108. edsl/jobs/check_survey_scenario_compatibility.py +85 -0
  109. edsl/jobs/data_structures.py +120 -0
  110. edsl/jobs/decorators.py +35 -0
  111. edsl/jobs/interviews/Interview.py +396 -661
  112. edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
  113. edsl/jobs/interviews/InterviewExceptionEntry.py +186 -186
  114. edsl/jobs/interviews/InterviewStatistic.py +63 -63
  115. edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
  116. edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
  117. edsl/jobs/interviews/InterviewStatusLog.py +92 -92
  118. edsl/jobs/interviews/ReportErrors.py +66 -66
  119. edsl/jobs/interviews/interview_status_enum.py +9 -9
  120. edsl/jobs/jobs_status_enums.py +9 -0
  121. edsl/jobs/loggers/HTMLTableJobLogger.py +304 -0
  122. edsl/jobs/results_exceptions_handler.py +98 -0
  123. edsl/jobs/runners/JobsRunnerAsyncio.py +151 -466
  124. edsl/jobs/runners/JobsRunnerStatus.py +297 -330
  125. edsl/jobs/tasks/QuestionTaskCreator.py +244 -242
  126. edsl/jobs/tasks/TaskCreators.py +64 -64
  127. edsl/jobs/tasks/TaskHistory.py +470 -450
  128. edsl/jobs/tasks/TaskStatusLog.py +23 -23
  129. edsl/jobs/tasks/task_status_enum.py +161 -163
  130. edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
  131. edsl/jobs/tokens/TokenUsage.py +34 -34
  132. edsl/language_models/ComputeCost.py +63 -0
  133. edsl/language_models/LanguageModel.py +626 -668
  134. edsl/language_models/ModelList.py +164 -155
  135. edsl/language_models/PriceManager.py +127 -0
  136. edsl/language_models/RawResponseHandler.py +106 -0
  137. edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
  138. edsl/language_models/ServiceDataSources.py +0 -0
  139. edsl/language_models/__init__.py +2 -3
  140. edsl/language_models/fake_openai_call.py +15 -15
  141. edsl/language_models/fake_openai_service.py +61 -61
  142. edsl/language_models/key_management/KeyLookup.py +63 -0
  143. edsl/language_models/key_management/KeyLookupBuilder.py +273 -0
  144. edsl/language_models/key_management/KeyLookupCollection.py +38 -0
  145. edsl/language_models/key_management/__init__.py +0 -0
  146. edsl/language_models/key_management/models.py +131 -0
  147. edsl/language_models/model.py +256 -0
  148. edsl/language_models/repair.py +156 -156
  149. edsl/language_models/utilities.py +65 -64
  150. edsl/notebooks/Notebook.py +263 -258
  151. edsl/notebooks/NotebookToLaTeX.py +142 -0
  152. edsl/notebooks/__init__.py +1 -1
  153. edsl/prompts/Prompt.py +352 -362
  154. edsl/prompts/__init__.py +2 -2
  155. edsl/questions/ExceptionExplainer.py +77 -0
  156. edsl/questions/HTMLQuestion.py +103 -0
  157. edsl/questions/QuestionBase.py +518 -664
  158. edsl/questions/QuestionBasePromptsMixin.py +221 -217
  159. edsl/questions/QuestionBudget.py +227 -227
  160. edsl/questions/QuestionCheckBox.py +359 -359
  161. edsl/questions/QuestionExtract.py +180 -182
  162. edsl/questions/QuestionFreeText.py +113 -114
  163. edsl/questions/QuestionFunctional.py +166 -166
  164. edsl/questions/QuestionList.py +223 -231
  165. edsl/questions/QuestionMatrix.py +265 -0
  166. edsl/questions/QuestionMultipleChoice.py +330 -286
  167. edsl/questions/QuestionNumerical.py +151 -153
  168. edsl/questions/QuestionRank.py +314 -324
  169. edsl/questions/Quick.py +41 -41
  170. edsl/questions/SimpleAskMixin.py +74 -73
  171. edsl/questions/__init__.py +27 -26
  172. edsl/questions/{AnswerValidatorMixin.py → answer_validator_mixin.py} +334 -289
  173. edsl/questions/compose_questions.py +98 -98
  174. edsl/questions/data_structures.py +20 -0
  175. edsl/questions/decorators.py +21 -21
  176. edsl/questions/derived/QuestionLikertFive.py +76 -76
  177. edsl/questions/derived/QuestionLinearScale.py +90 -87
  178. edsl/questions/derived/QuestionTopK.py +93 -93
  179. edsl/questions/derived/QuestionYesNo.py +82 -82
  180. edsl/questions/descriptors.py +427 -413
  181. edsl/questions/loop_processor.py +149 -0
  182. edsl/questions/prompt_templates/question_budget.jinja +13 -13
  183. edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
  184. edsl/questions/prompt_templates/question_extract.jinja +11 -11
  185. edsl/questions/prompt_templates/question_free_text.jinja +3 -3
  186. edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
  187. edsl/questions/prompt_templates/question_list.jinja +17 -17
  188. edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
  189. edsl/questions/prompt_templates/question_numerical.jinja +36 -36
  190. edsl/questions/{QuestionBaseGenMixin.py → question_base_gen_mixin.py} +168 -161
  191. edsl/questions/question_registry.py +177 -177
  192. edsl/questions/{RegisterQuestionsMeta.py → register_questions_meta.py} +71 -71
  193. edsl/questions/{ResponseValidatorABC.py → response_validator_abc.py} +188 -174
  194. edsl/questions/response_validator_factory.py +34 -0
  195. edsl/questions/settings.py +12 -12
  196. edsl/questions/templates/budget/answering_instructions.jinja +7 -7
  197. edsl/questions/templates/budget/question_presentation.jinja +7 -7
  198. edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
  199. edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
  200. edsl/questions/templates/extract/answering_instructions.jinja +7 -7
  201. edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
  202. edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
  203. edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
  204. edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
  205. edsl/questions/templates/list/answering_instructions.jinja +3 -3
  206. edsl/questions/templates/list/question_presentation.jinja +5 -5
  207. edsl/questions/templates/matrix/__init__.py +1 -0
  208. edsl/questions/templates/matrix/answering_instructions.jinja +5 -0
  209. edsl/questions/templates/matrix/question_presentation.jinja +20 -0
  210. edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
  211. edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
  212. edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
  213. edsl/questions/templates/numerical/question_presentation.jinja +6 -6
  214. edsl/questions/templates/rank/answering_instructions.jinja +11 -11
  215. edsl/questions/templates/rank/question_presentation.jinja +15 -15
  216. edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
  217. edsl/questions/templates/top_k/question_presentation.jinja +22 -22
  218. edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
  219. edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
  220. edsl/results/CSSParameterizer.py +108 -108
  221. edsl/results/Dataset.py +587 -424
  222. edsl/results/DatasetExportMixin.py +594 -731
  223. edsl/results/DatasetTree.py +295 -275
  224. edsl/results/MarkdownToDocx.py +122 -0
  225. edsl/results/MarkdownToPDF.py +111 -0
  226. edsl/results/Result.py +557 -465
  227. edsl/results/Results.py +1183 -1165
  228. edsl/results/ResultsExportMixin.py +45 -43
  229. edsl/results/ResultsGGMixin.py +121 -121
  230. edsl/results/TableDisplay.py +125 -198
  231. edsl/results/TextEditor.py +50 -0
  232. edsl/results/__init__.py +2 -2
  233. edsl/results/file_exports.py +252 -0
  234. edsl/results/{ResultsFetchMixin.py → results_fetch_mixin.py} +33 -33
  235. edsl/results/{Selector.py → results_selector.py} +145 -135
  236. edsl/results/{ResultsToolsMixin.py → results_tools_mixin.py} +98 -98
  237. edsl/results/smart_objects.py +96 -0
  238. edsl/results/table_data_class.py +12 -0
  239. edsl/results/table_display.css +77 -77
  240. edsl/results/table_renderers.py +118 -0
  241. edsl/results/tree_explore.py +115 -115
  242. edsl/scenarios/ConstructDownloadLink.py +109 -0
  243. edsl/scenarios/DocumentChunker.py +102 -0
  244. edsl/scenarios/DocxScenario.py +16 -0
  245. edsl/scenarios/FileStore.py +511 -632
  246. edsl/scenarios/PdfExtractor.py +40 -0
  247. edsl/scenarios/Scenario.py +498 -601
  248. edsl/scenarios/ScenarioHtmlMixin.py +65 -64
  249. edsl/scenarios/ScenarioList.py +1458 -1287
  250. edsl/scenarios/ScenarioListExportMixin.py +45 -52
  251. edsl/scenarios/ScenarioListPdfMixin.py +239 -261
  252. edsl/scenarios/__init__.py +3 -4
  253. edsl/scenarios/directory_scanner.py +96 -0
  254. edsl/scenarios/file_methods.py +85 -0
  255. edsl/scenarios/handlers/__init__.py +13 -0
  256. edsl/scenarios/handlers/csv.py +38 -0
  257. edsl/scenarios/handlers/docx.py +76 -0
  258. edsl/scenarios/handlers/html.py +37 -0
  259. edsl/scenarios/handlers/json.py +111 -0
  260. edsl/scenarios/handlers/latex.py +5 -0
  261. edsl/scenarios/handlers/md.py +51 -0
  262. edsl/scenarios/handlers/pdf.py +68 -0
  263. edsl/scenarios/handlers/png.py +39 -0
  264. edsl/scenarios/handlers/pptx.py +105 -0
  265. edsl/scenarios/handlers/py.py +294 -0
  266. edsl/scenarios/handlers/sql.py +313 -0
  267. edsl/scenarios/handlers/sqlite.py +149 -0
  268. edsl/scenarios/handlers/txt.py +33 -0
  269. edsl/scenarios/{ScenarioJoin.py → scenario_join.py} +131 -127
  270. edsl/scenarios/scenario_selector.py +156 -0
  271. edsl/shared.py +1 -1
  272. edsl/study/ObjectEntry.py +173 -173
  273. edsl/study/ProofOfWork.py +113 -113
  274. edsl/study/SnapShot.py +80 -80
  275. edsl/study/Study.py +521 -528
  276. edsl/study/__init__.py +4 -4
  277. edsl/surveys/ConstructDAG.py +92 -0
  278. edsl/surveys/DAG.py +148 -148
  279. edsl/surveys/EditSurvey.py +221 -0
  280. edsl/surveys/InstructionHandler.py +100 -0
  281. edsl/surveys/Memory.py +31 -31
  282. edsl/surveys/MemoryManagement.py +72 -0
  283. edsl/surveys/MemoryPlan.py +244 -244
  284. edsl/surveys/Rule.py +327 -326
  285. edsl/surveys/RuleCollection.py +385 -387
  286. edsl/surveys/RuleManager.py +172 -0
  287. edsl/surveys/Simulator.py +75 -0
  288. edsl/surveys/Survey.py +1280 -1801
  289. edsl/surveys/SurveyCSS.py +273 -261
  290. edsl/surveys/SurveyExportMixin.py +259 -259
  291. edsl/surveys/{SurveyFlowVisualizationMixin.py → SurveyFlowVisualization.py} +181 -179
  292. edsl/surveys/SurveyQualtricsImport.py +284 -284
  293. edsl/surveys/SurveyToApp.py +141 -0
  294. edsl/surveys/__init__.py +5 -3
  295. edsl/surveys/base.py +53 -53
  296. edsl/surveys/descriptors.py +60 -56
  297. edsl/surveys/instructions/ChangeInstruction.py +48 -49
  298. edsl/surveys/instructions/Instruction.py +56 -65
  299. edsl/surveys/instructions/InstructionCollection.py +82 -77
  300. edsl/templates/error_reporting/base.html +23 -23
  301. edsl/templates/error_reporting/exceptions_by_model.html +34 -34
  302. edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
  303. edsl/templates/error_reporting/exceptions_by_type.html +16 -16
  304. edsl/templates/error_reporting/interview_details.html +115 -115
  305. edsl/templates/error_reporting/interviews.html +19 -19
  306. edsl/templates/error_reporting/overview.html +4 -4
  307. edsl/templates/error_reporting/performance_plot.html +1 -1
  308. edsl/templates/error_reporting/report.css +73 -73
  309. edsl/templates/error_reporting/report.html +117 -117
  310. edsl/templates/error_reporting/report.js +25 -25
  311. edsl/test_h +1 -0
  312. edsl/tools/__init__.py +1 -1
  313. edsl/tools/clusters.py +192 -192
  314. edsl/tools/embeddings.py +27 -27
  315. edsl/tools/embeddings_plotting.py +118 -118
  316. edsl/tools/plotting.py +112 -112
  317. edsl/tools/summarize.py +18 -18
  318. edsl/utilities/PrettyList.py +56 -0
  319. edsl/utilities/SystemInfo.py +28 -28
  320. edsl/utilities/__init__.py +22 -22
  321. edsl/utilities/ast_utilities.py +25 -25
  322. edsl/utilities/data/Registry.py +6 -6
  323. edsl/utilities/data/__init__.py +1 -1
  324. edsl/utilities/data/scooter_results.json +1 -1
  325. edsl/utilities/decorators.py +77 -77
  326. edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
  327. edsl/utilities/gcp_bucket/example.py +50 -0
  328. edsl/utilities/interface.py +627 -627
  329. edsl/utilities/is_notebook.py +18 -0
  330. edsl/utilities/is_valid_variable_name.py +11 -0
  331. edsl/utilities/naming_utilities.py +263 -263
  332. edsl/utilities/remove_edsl_version.py +24 -0
  333. edsl/utilities/repair_functions.py +28 -28
  334. edsl/utilities/restricted_python.py +70 -70
  335. edsl/utilities/utilities.py +436 -424
  336. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev4.dist-info}/LICENSE +21 -21
  337. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev4.dist-info}/METADATA +13 -11
  338. edsl-0.1.39.dev4.dist-info/RECORD +361 -0
  339. edsl/language_models/KeyLookup.py +0 -30
  340. edsl/language_models/registry.py +0 -190
  341. edsl/language_models/unused/ReplicateBase.py +0 -83
  342. edsl/results/ResultsDBMixin.py +0 -238
  343. edsl-0.1.39.dev3.dist-info/RECORD +0 -277
  344. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev4.dist-info}/WHEEL +0 -0
@@ -1,63 +1,63 @@
1
- import asyncio
2
- from enum import Enum
3
- from typing import Literal, List, Type, DefaultDict
4
- from collections import UserDict, defaultdict
5
-
6
- from edsl.jobs.interviews.InterviewStatusDictionary import InterviewStatusDictionary
7
- from edsl.jobs.tokens.InterviewTokenUsage import InterviewTokenUsage
8
- from edsl.enums import pricing, TokenPricing
9
- from edsl.jobs.tasks.task_status_enum import TaskStatus
10
-
11
- InterviewTokenUsageMapping = DefaultDict[str, InterviewTokenUsage]
12
-
13
-
14
- class InterviewStatistic(UserDict):
15
- @staticmethod
16
- def _format_number(number, digits=0, units=""):
17
- """Format a number.
18
-
19
- :param number: the number to format
20
- :param digits: the number of digits to display
21
- :param units: the units to display
22
-
23
- Example usage:
24
-
25
- >>> InterviewStatistic._format_number(1000, 1, "sec.")
26
- '1,000.0 sec.'
27
- """
28
- if type(number) == str:
29
- return number
30
- else:
31
- return f"{number:,.{digits}f}" + " " + units
32
-
33
- @property
34
- def _pretty_name(self):
35
- """Return a pretty name for the statistic.
36
-
37
- Example usage:
38
-
39
- >>> InterviewStatistic("elapsed_time", value=100, digits=1, units="sec.").pretty_name
40
- 'Elapsed time'
41
- """
42
- return self.name.replace("_", " ").capitalize()
43
-
44
- def __init__(
45
- self,
46
- name: str,
47
- value: float,
48
- digits: int = 0,
49
- units: str = "",
50
- pretty_name: str = None,
51
- ):
52
- """Create a new InterviewStatistic object."""
53
- self.name = name
54
- self.value = value
55
- self.digits = digits
56
- self.units = units
57
- self.pretty_name = pretty_name or self._pretty_name
58
-
59
- super().__init__(
60
- {self.pretty_name: self._format_number(self.value, self.digits, self.units)}
61
- )
62
-
63
- self.raw: dict = {self.name: self.value}
1
+ import asyncio
2
+ from enum import Enum
3
+ from typing import Literal, List, Type, DefaultDict
4
+ from collections import UserDict, defaultdict
5
+
6
+ from edsl.jobs.interviews.InterviewStatusDictionary import InterviewStatusDictionary
7
+ from edsl.jobs.tokens.InterviewTokenUsage import InterviewTokenUsage
8
+ from edsl.enums import pricing, TokenPricing
9
+ from edsl.jobs.tasks.task_status_enum import TaskStatus
10
+
11
+ InterviewTokenUsageMapping = DefaultDict[str, InterviewTokenUsage]
12
+
13
+
14
+ class InterviewStatistic(UserDict):
15
+ @staticmethod
16
+ def _format_number(number, digits=0, units=""):
17
+ """Format a number.
18
+
19
+ :param number: the number to format
20
+ :param digits: the number of digits to display
21
+ :param units: the units to display
22
+
23
+ Example usage:
24
+
25
+ >>> InterviewStatistic._format_number(1000, 1, "sec.")
26
+ '1,000.0 sec.'
27
+ """
28
+ if type(number) == str:
29
+ return number
30
+ else:
31
+ return f"{number:,.{digits}f}" + " " + units
32
+
33
+ @property
34
+ def _pretty_name(self):
35
+ """Return a pretty name for the statistic.
36
+
37
+ Example usage:
38
+
39
+ >>> InterviewStatistic("elapsed_time", value=100, digits=1, units="sec.").pretty_name
40
+ 'Elapsed time'
41
+ """
42
+ return self.name.replace("_", " ").capitalize()
43
+
44
+ def __init__(
45
+ self,
46
+ name: str,
47
+ value: float,
48
+ digits: int = 0,
49
+ units: str = "",
50
+ pretty_name: str = None,
51
+ ):
52
+ """Create a new InterviewStatistic object."""
53
+ self.name = name
54
+ self.value = value
55
+ self.digits = digits
56
+ self.units = units
57
+ self.pretty_name = pretty_name or self._pretty_name
58
+
59
+ super().__init__(
60
+ {self.pretty_name: self._format_number(self.value, self.digits, self.units)}
61
+ )
62
+
63
+ self.raw: dict = {self.name: self.value}
@@ -1,25 +1,25 @@
1
- from collections import UserDict
2
- from edsl.jobs.interviews.InterviewStatistic import InterviewStatistic
3
-
4
-
5
- class InterviewStatisticsCollection(UserDict):
6
- """A collection of interview statistics."""
7
-
8
- def __init__(self, *args, **kwargs):
9
- super().__init__(*args, **kwargs)
10
- self.raw: dict = {}
11
-
12
- def add_stat(self, statistic: InterviewStatistic):
13
- """Add a statistic to the collection.
14
-
15
- Each statistic is a dictionary with a single key-value pair.
16
-
17
- Example usage:
18
-
19
- >>> isc = InterviewStatisticsCollection()
20
- >>> isc.add_stat(InterviewStatistic("elapsed_time", value=100, digits=1, units="sec."))
21
- >>> isc.raw
22
- {'elapsed_time': 100}
23
- """
24
- self.update(statistic)
25
- self.raw.update(statistic.raw)
1
+ from collections import UserDict
2
+ from edsl.jobs.interviews.InterviewStatistic import InterviewStatistic
3
+
4
+
5
+ class InterviewStatisticsCollection(UserDict):
6
+ """A collection of interview statistics."""
7
+
8
+ def __init__(self, *args, **kwargs):
9
+ super().__init__(*args, **kwargs)
10
+ self.raw: dict = {}
11
+
12
+ def add_stat(self, statistic: InterviewStatistic):
13
+ """Add a statistic to the collection.
14
+
15
+ Each statistic is a dictionary with a single key-value pair.
16
+
17
+ Example usage:
18
+
19
+ >>> isc = InterviewStatisticsCollection()
20
+ >>> isc.add_stat(InterviewStatistic("elapsed_time", value=100, digits=1, units="sec."))
21
+ >>> isc.raw
22
+ {'elapsed_time': 100}
23
+ """
24
+ self.update(statistic)
25
+ self.raw.update(statistic.raw)
@@ -1,78 +1,78 @@
1
- from __future__ import annotations
2
- import json
3
- from collections import UserDict
4
- from typing import Union, Dict
5
-
6
- from edsl.jobs.tasks.task_status_enum import TaskStatus, get_enum_from_string
7
-
8
-
9
- class InterviewStatusDictionary(UserDict):
10
- """A dictionary that keeps track of the status of all the tasks in an interview."""
11
-
12
- def __init__(self, data: Union[Dict[TaskStatus, int], None] = None):
13
- if data:
14
- # checks to make sure every task status is in the enum
15
- assert all([task_status in data for task_status in TaskStatus])
16
- super().__init__(data)
17
- else:
18
- # sets all the task statuses to 0
19
- d = {}
20
- for task_status in TaskStatus:
21
- d[task_status] = 0
22
- d["number_from_cache"] = 0
23
- super().__init__(d)
24
-
25
- def __add__(
26
- self, other: "InterviewStatusDictionary"
27
- ) -> "InterviewStatusDictionary":
28
- """Adds two InterviewStatusDictionaries together."""
29
- if not isinstance(other, InterviewStatusDictionary):
30
- raise ValueError(f"Can't add {type(other)} to InterviewStatusDictionary")
31
- new_dict = {}
32
- for key in self.keys():
33
- new_dict[key] = self[key] + other[key]
34
- return InterviewStatusDictionary(new_dict)
35
-
36
- @property
37
- def waiting(self) -> int:
38
- """Return the number of tasks that are in a waiting status of some kind."""
39
-
40
- waiting_status_list = [
41
- TaskStatus.WAITING_FOR_REQUEST_CAPACITY,
42
- TaskStatus.WAITING_FOR_TOKEN_CAPACITY,
43
- TaskStatus.WAITING_FOR_DEPENDENCIES,
44
- ]
45
-
46
- return sum([self[status] for status in waiting_status_list])
47
-
48
- def __repr__(self):
49
- return f"InterviewStatusDictionary({self.data})"
50
-
51
- def to_dict(self):
52
- new_data = {str(key): value for key, value in self.data.items()}
53
- return new_data
54
-
55
- def print(self):
56
- d = {}
57
- for key, value in self.data.items():
58
- d[str(key)] = value
59
- from edsl.utilities.interface import print_dict_with_rich
60
-
61
- print_dict_with_rich(d)
62
-
63
- @classmethod
64
- def from_dict(cls, data):
65
- new_data = {get_enum_from_string(key): value for key, value in data.items()}
66
- return cls(new_data)
67
-
68
- def to_json(self):
69
- import json
70
-
71
- return json.dumps(self.to_dict())
72
-
73
- @classmethod
74
- def from_json(cls, data):
75
- import json
76
-
77
- data = json.loads(data)
78
- return cls.from_dict(data)
1
+ from __future__ import annotations
2
+ import json
3
+ from collections import UserDict
4
+ from typing import Union, Dict
5
+
6
+ from edsl.jobs.tasks.task_status_enum import TaskStatus, get_enum_from_string
7
+
8
+
9
+ class InterviewStatusDictionary(UserDict):
10
+ """A dictionary that keeps track of the status of all the tasks in an interview."""
11
+
12
+ def __init__(self, data: Union[Dict[TaskStatus, int], None] = None):
13
+ if data:
14
+ # checks to make sure every task status is in the enum
15
+ assert all([task_status in data for task_status in TaskStatus])
16
+ super().__init__(data)
17
+ else:
18
+ # sets all the task statuses to 0
19
+ d = {}
20
+ for task_status in TaskStatus:
21
+ d[task_status] = 0
22
+ d["number_from_cache"] = 0
23
+ super().__init__(d)
24
+
25
+ def __add__(
26
+ self, other: "InterviewStatusDictionary"
27
+ ) -> "InterviewStatusDictionary":
28
+ """Adds two InterviewStatusDictionaries together."""
29
+ if not isinstance(other, InterviewStatusDictionary):
30
+ raise ValueError(f"Can't add {type(other)} to InterviewStatusDictionary")
31
+ new_dict = {}
32
+ for key in self.keys():
33
+ new_dict[key] = self[key] + other[key]
34
+ return InterviewStatusDictionary(new_dict)
35
+
36
+ @property
37
+ def waiting(self) -> int:
38
+ """Return the number of tasks that are in a waiting status of some kind."""
39
+
40
+ waiting_status_list = [
41
+ TaskStatus.WAITING_FOR_REQUEST_CAPACITY,
42
+ TaskStatus.WAITING_FOR_TOKEN_CAPACITY,
43
+ TaskStatus.WAITING_FOR_DEPENDENCIES,
44
+ ]
45
+
46
+ return sum([self[status] for status in waiting_status_list])
47
+
48
+ def __repr__(self):
49
+ return f"InterviewStatusDictionary({self.data})"
50
+
51
+ def to_dict(self):
52
+ new_data = {str(key): value for key, value in self.data.items()}
53
+ return new_data
54
+
55
+ def print(self):
56
+ d = {}
57
+ for key, value in self.data.items():
58
+ d[str(key)] = value
59
+ from edsl.utilities.interface import print_dict_with_rich
60
+
61
+ print_dict_with_rich(d)
62
+
63
+ @classmethod
64
+ def from_dict(cls, data):
65
+ new_data = {get_enum_from_string(key): value for key, value in data.items()}
66
+ return cls(new_data)
67
+
68
+ def to_json(self):
69
+ import json
70
+
71
+ return json.dumps(self.to_dict())
72
+
73
+ @classmethod
74
+ def from_json(cls, data):
75
+ import json
76
+
77
+ data = json.loads(data)
78
+ return cls.from_dict(data)
@@ -1,92 +1,92 @@
1
- from collections import UserDict
2
-
3
- from edsl.jobs.tasks.task_status_enum import TaskStatus, status_colors
4
-
5
-
6
- class InterviewStatusLog(UserDict):
7
- """A dictionary of TaskStatusLog objects.
8
-
9
- The key is the name of the task.
10
- """
11
-
12
- @property
13
- def min_time(self):
14
- return min([log.min_time for log in self.values()])
15
-
16
- @property
17
- def max_time(self):
18
- return max([log.max_time for log in self.values()])
19
-
20
- def status_matrix(self, num_periods):
21
- """Return a matrix of status values."""
22
- start_time = self.min_time
23
- end_time = self.max_time
24
- time_increment = (end_time - start_time) / num_periods
25
- status_matrix = {}
26
- time_periods = [start_time + i * time_increment for i in range(num_periods)]
27
- for task_name, log in self.items():
28
- status_matrix[task_name] = [log.status_at_time(t) for t in time_periods]
29
- return status_matrix
30
-
31
- def numerical_matrix(self, num_periods):
32
- """Return a numerical matrix of status values."""
33
- status_dicts = self.status_matrix(num_periods)
34
-
35
- num_cols = num_periods
36
- num_rows = len(status_dicts)
37
- matrix = [[0 for _ in range(num_cols)] for _ in range(num_rows)]
38
-
39
- for row_index, (task_name, status_list) in enumerate(status_dicts.items()):
40
- matrix[row_index] = [
41
- list(status_colors.keys()).index(status) for status in status_list
42
- ]
43
-
44
- index_to_names = {i: name for i, name in enumerate(status_dicts.keys())}
45
- return matrix, index_to_names
46
-
47
- def visualize(self, num_periods=10):
48
- """Visualize the status matrix with outlined squares."""
49
- import matplotlib.pyplot as plt
50
- from matplotlib.colors import ListedColormap
51
- import numpy as np
52
- from matplotlib.patches import Rectangle
53
-
54
- # Define your custom colormap
55
- custom_cmap = ListedColormap(list(status_colors.values()))
56
-
57
- # Generate the matrix
58
- matrix, index_to_names = self.numerical_matrix(num_periods)
59
-
60
- # Create the figure and axes
61
- plt.figure(figsize=(10, 5))
62
- ax = plt.gca()
63
-
64
- # Display the matrix and keep a reference to the imshow object
65
- im = ax.imshow(matrix, aspect="auto", cmap=custom_cmap)
66
-
67
- # Adding color bar, now correctly associating it with 'im'
68
- cbar = plt.colorbar(im, ticks=range(len(status_colors)), label="Task Status")
69
-
70
- cbar_labels = [status.name for status in status_colors.keys()]
71
- # breakpoint()
72
- cbar.set_ticklabels(cbar_labels) # Setting the custom labels for the colorbar
73
-
74
- im.set_clim(
75
- -0.5, len(status_colors) - 0.5
76
- ) # Setting color limits directly on the imshow object
77
-
78
- # Outline each cell by drawing rectangles
79
- for (j, i), val in np.ndenumerate(matrix):
80
- ax.add_patch(
81
- Rectangle(
82
- (i - 0.5, j - 0.5), 1, 1, fill=False, edgecolor="black", lw=0.5
83
- )
84
- )
85
-
86
- # Set custom y-axis ticks and labels
87
- yticks = list(index_to_names.keys())
88
- yticklabels = list(index_to_names.values())
89
- plt.yticks(ticks=yticks, labels=yticklabels)
90
-
91
- # Show the plot
92
- plt.show()
1
+ from collections import UserDict
2
+
3
+ from edsl.jobs.tasks.task_status_enum import TaskStatus, status_colors
4
+
5
+
6
+ class InterviewStatusLog(UserDict):
7
+ """A dictionary of TaskStatusLog objects.
8
+
9
+ The key is the name of the task.
10
+ """
11
+
12
+ @property
13
+ def min_time(self):
14
+ return min([log.min_time for log in self.values()])
15
+
16
+ @property
17
+ def max_time(self):
18
+ return max([log.max_time for log in self.values()])
19
+
20
+ def status_matrix(self, num_periods):
21
+ """Return a matrix of status values."""
22
+ start_time = self.min_time
23
+ end_time = self.max_time
24
+ time_increment = (end_time - start_time) / num_periods
25
+ status_matrix = {}
26
+ time_periods = [start_time + i * time_increment for i in range(num_periods)]
27
+ for task_name, log in self.items():
28
+ status_matrix[task_name] = [log.status_at_time(t) for t in time_periods]
29
+ return status_matrix
30
+
31
+ def numerical_matrix(self, num_periods):
32
+ """Return a numerical matrix of status values."""
33
+ status_dicts = self.status_matrix(num_periods)
34
+
35
+ num_cols = num_periods
36
+ num_rows = len(status_dicts)
37
+ matrix = [[0 for _ in range(num_cols)] for _ in range(num_rows)]
38
+
39
+ for row_index, (task_name, status_list) in enumerate(status_dicts.items()):
40
+ matrix[row_index] = [
41
+ list(status_colors.keys()).index(status) for status in status_list
42
+ ]
43
+
44
+ index_to_names = {i: name for i, name in enumerate(status_dicts.keys())}
45
+ return matrix, index_to_names
46
+
47
+ def visualize(self, num_periods=10):
48
+ """Visualize the status matrix with outlined squares."""
49
+ import matplotlib.pyplot as plt
50
+ from matplotlib.colors import ListedColormap
51
+ import numpy as np
52
+ from matplotlib.patches import Rectangle
53
+
54
+ # Define your custom colormap
55
+ custom_cmap = ListedColormap(list(status_colors.values()))
56
+
57
+ # Generate the matrix
58
+ matrix, index_to_names = self.numerical_matrix(num_periods)
59
+
60
+ # Create the figure and axes
61
+ plt.figure(figsize=(10, 5))
62
+ ax = plt.gca()
63
+
64
+ # Display the matrix and keep a reference to the imshow object
65
+ im = ax.imshow(matrix, aspect="auto", cmap=custom_cmap)
66
+
67
+ # Adding color bar, now correctly associating it with 'im'
68
+ cbar = plt.colorbar(im, ticks=range(len(status_colors)), label="Task Status")
69
+
70
+ cbar_labels = [status.name for status in status_colors.keys()]
71
+ # breakpoint()
72
+ cbar.set_ticklabels(cbar_labels) # Setting the custom labels for the colorbar
73
+
74
+ im.set_clim(
75
+ -0.5, len(status_colors) - 0.5
76
+ ) # Setting color limits directly on the imshow object
77
+
78
+ # Outline each cell by drawing rectangles
79
+ for (j, i), val in np.ndenumerate(matrix):
80
+ ax.add_patch(
81
+ Rectangle(
82
+ (i - 0.5, j - 0.5), 1, 1, fill=False, edgecolor="black", lw=0.5
83
+ )
84
+ )
85
+
86
+ # Set custom y-axis ticks and labels
87
+ yticks = list(index_to_names.keys())
88
+ yticklabels = list(index_to_names.values())
89
+ plt.yticks(ticks=yticks, labels=yticklabels)
90
+
91
+ # Show the plot
92
+ plt.show()
@@ -1,66 +1,66 @@
1
- import json
2
- import requests
3
- import threading
4
- from edsl.coop import Coop
5
-
6
-
7
- class ReportErrors:
8
- def __init__(self, task_history):
9
- self.task_history = task_history
10
- self.email = None
11
-
12
- @property
13
- def data(self):
14
- return {
15
- "text": self.task_history.to_dict(),
16
- "email": self.email,
17
- }
18
-
19
- def get_email(self, timeout=10):
20
- """Helper method to get user input with a timeout."""
21
- input_queue = []
22
-
23
- def input_thread_method():
24
- email_input = input(
25
- "Please enter your email address (if you want us to get in touch): "
26
- )
27
- input_queue.append(email_input)
28
-
29
- input_thread = threading.Thread(target=input_thread_method)
30
- input_thread.start()
31
- input_thread.join(timeout=timeout)
32
-
33
- if input_queue:
34
- self.email = input_queue[0]
35
- else:
36
- print("No input received within the timeout period.")
37
-
38
- def upload(self):
39
- # The previous implementation was removed because it relied on the old Coop ErrorModel
40
- pass
41
-
42
-
43
- def main():
44
- from edsl.jobs.interviews.ReportErrors import ReportErrors
45
-
46
- class TaskHistory:
47
- def __init__(self, data):
48
- self.data = data
49
-
50
- def to_dict(self):
51
- """Converts the internal data of the task history to a dictionary format."""
52
- return self.data
53
-
54
- task_history_data = {
55
- "task": "Example Task",
56
- "status": "Completed",
57
- "details": "This is an example of a task history.",
58
- }
59
- task_history = TaskHistory(task_history_data)
60
-
61
- reporter = ReportErrors(task_history)
62
- # one without email
63
- reporter.upload()
64
- # one with email
65
- reporter.email = "fake@gmail.com"
66
- reporter.upload()
1
+ import json
2
+ import requests
3
+ import threading
4
+ from edsl.coop import Coop
5
+
6
+
7
+ class ReportErrors:
8
+ def __init__(self, task_history):
9
+ self.task_history = task_history
10
+ self.email = None
11
+
12
+ @property
13
+ def data(self):
14
+ return {
15
+ "text": self.task_history.to_dict(),
16
+ "email": self.email,
17
+ }
18
+
19
+ def get_email(self, timeout=10):
20
+ """Helper method to get user input with a timeout."""
21
+ input_queue = []
22
+
23
+ def input_thread_method():
24
+ email_input = input(
25
+ "Please enter your email address (if you want us to get in touch): "
26
+ )
27
+ input_queue.append(email_input)
28
+
29
+ input_thread = threading.Thread(target=input_thread_method)
30
+ input_thread.start()
31
+ input_thread.join(timeout=timeout)
32
+
33
+ if input_queue:
34
+ self.email = input_queue[0]
35
+ else:
36
+ print("No input received within the timeout period.")
37
+
38
+ def upload(self):
39
+ # The previous implementation was removed because it relied on the old Coop ErrorModel
40
+ pass
41
+
42
+
43
+ def main():
44
+ from edsl.jobs.interviews.ReportErrors import ReportErrors
45
+
46
+ class TaskHistory:
47
+ def __init__(self, data):
48
+ self.data = data
49
+
50
+ def to_dict(self):
51
+ """Converts the internal data of the task history to a dictionary format."""
52
+ return self.data
53
+
54
+ task_history_data = {
55
+ "task": "Example Task",
56
+ "status": "Completed",
57
+ "details": "This is an example of a task history.",
58
+ }
59
+ task_history = TaskHistory(task_history_data)
60
+
61
+ reporter = ReportErrors(task_history)
62
+ # one without email
63
+ reporter.upload()
64
+ # one with email
65
+ reporter.email = "fake@gmail.com"
66
+ reporter.upload()
@@ -1,9 +1,9 @@
1
- import enum
2
-
3
-
4
- class InterviewStatus(enum.Enum):
5
- "These are the possible states an interview can be in."
6
- NOT_STARTED = enum.auto()
7
- SUCCESS = enum.auto()
8
- WAITING_FOR_RESOURCES = enum.auto()
9
- FAILED = enum.auto()
1
+ import enum
2
+
3
+
4
+ class InterviewStatus(enum.Enum):
5
+ "These are the possible states an interview can be in."
6
+ NOT_STARTED = enum.auto()
7
+ SUCCESS = enum.auto()
8
+ WAITING_FOR_RESOURCES = enum.auto()
9
+ FAILED = enum.auto()