edsl 0.1.39.dev3__py3-none-any.whl → 0.1.39.dev5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (341) hide show
  1. edsl/Base.py +413 -332
  2. edsl/BaseDiff.py +260 -260
  3. edsl/TemplateLoader.py +24 -24
  4. edsl/__init__.py +57 -49
  5. edsl/__version__.py +1 -1
  6. edsl/agents/Agent.py +1071 -867
  7. edsl/agents/AgentList.py +551 -413
  8. edsl/agents/Invigilator.py +284 -233
  9. edsl/agents/InvigilatorBase.py +257 -270
  10. edsl/agents/PromptConstructor.py +272 -354
  11. edsl/agents/QuestionInstructionPromptBuilder.py +128 -0
  12. edsl/agents/QuestionTemplateReplacementsBuilder.py +137 -0
  13. edsl/agents/__init__.py +2 -3
  14. edsl/agents/descriptors.py +99 -99
  15. edsl/agents/prompt_helpers.py +129 -129
  16. edsl/agents/question_option_processor.py +172 -0
  17. edsl/auto/AutoStudy.py +130 -117
  18. edsl/auto/StageBase.py +243 -230
  19. edsl/auto/StageGenerateSurvey.py +178 -178
  20. edsl/auto/StageLabelQuestions.py +125 -125
  21. edsl/auto/StagePersona.py +61 -61
  22. edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
  23. edsl/auto/StagePersonaDimensionValues.py +74 -74
  24. edsl/auto/StagePersonaDimensions.py +69 -69
  25. edsl/auto/StageQuestions.py +74 -73
  26. edsl/auto/SurveyCreatorPipeline.py +21 -21
  27. edsl/auto/utilities.py +218 -224
  28. edsl/base/Base.py +279 -279
  29. edsl/config.py +177 -157
  30. edsl/conversation/Conversation.py +290 -290
  31. edsl/conversation/car_buying.py +59 -58
  32. edsl/conversation/chips.py +95 -95
  33. edsl/conversation/mug_negotiation.py +81 -81
  34. edsl/conversation/next_speaker_utilities.py +93 -93
  35. edsl/coop/CoopFunctionsMixin.py +15 -0
  36. edsl/coop/ExpectedParrotKeyHandler.py +125 -0
  37. edsl/coop/PriceFetcher.py +54 -54
  38. edsl/coop/__init__.py +2 -2
  39. edsl/coop/coop.py +1106 -1028
  40. edsl/coop/utils.py +131 -131
  41. edsl/data/Cache.py +573 -555
  42. edsl/data/CacheEntry.py +230 -233
  43. edsl/data/CacheHandler.py +168 -149
  44. edsl/data/RemoteCacheSync.py +186 -78
  45. edsl/data/SQLiteDict.py +292 -292
  46. edsl/data/__init__.py +5 -4
  47. edsl/data/orm.py +10 -10
  48. edsl/data_transfer_models.py +74 -73
  49. edsl/enums.py +202 -175
  50. edsl/exceptions/BaseException.py +21 -21
  51. edsl/exceptions/__init__.py +54 -54
  52. edsl/exceptions/agents.py +54 -42
  53. edsl/exceptions/cache.py +5 -5
  54. edsl/exceptions/configuration.py +16 -16
  55. edsl/exceptions/coop.py +10 -10
  56. edsl/exceptions/data.py +14 -14
  57. edsl/exceptions/general.py +34 -34
  58. edsl/exceptions/inference_services.py +5 -0
  59. edsl/exceptions/jobs.py +33 -33
  60. edsl/exceptions/language_models.py +63 -63
  61. edsl/exceptions/prompts.py +15 -15
  62. edsl/exceptions/questions.py +109 -91
  63. edsl/exceptions/results.py +29 -29
  64. edsl/exceptions/scenarios.py +29 -22
  65. edsl/exceptions/surveys.py +37 -37
  66. edsl/inference_services/AnthropicService.py +106 -87
  67. edsl/inference_services/AvailableModelCacheHandler.py +184 -0
  68. edsl/inference_services/AvailableModelFetcher.py +215 -0
  69. edsl/inference_services/AwsBedrock.py +118 -120
  70. edsl/inference_services/AzureAI.py +215 -217
  71. edsl/inference_services/DeepInfraService.py +18 -18
  72. edsl/inference_services/GoogleService.py +143 -148
  73. edsl/inference_services/GroqService.py +20 -20
  74. edsl/inference_services/InferenceServiceABC.py +80 -147
  75. edsl/inference_services/InferenceServicesCollection.py +138 -97
  76. edsl/inference_services/MistralAIService.py +120 -123
  77. edsl/inference_services/OllamaService.py +18 -18
  78. edsl/inference_services/OpenAIService.py +236 -224
  79. edsl/inference_services/PerplexityService.py +160 -163
  80. edsl/inference_services/ServiceAvailability.py +135 -0
  81. edsl/inference_services/TestService.py +90 -89
  82. edsl/inference_services/TogetherAIService.py +172 -170
  83. edsl/inference_services/data_structures.py +134 -0
  84. edsl/inference_services/models_available_cache.py +118 -118
  85. edsl/inference_services/rate_limits_cache.py +25 -25
  86. edsl/inference_services/registry.py +41 -41
  87. edsl/inference_services/write_available.py +10 -10
  88. edsl/jobs/AnswerQuestionFunctionConstructor.py +223 -0
  89. edsl/jobs/Answers.py +43 -56
  90. edsl/jobs/FetchInvigilator.py +47 -0
  91. edsl/jobs/InterviewTaskManager.py +98 -0
  92. edsl/jobs/InterviewsConstructor.py +50 -0
  93. edsl/jobs/Jobs.py +823 -898
  94. edsl/jobs/JobsChecks.py +172 -147
  95. edsl/jobs/JobsComponentConstructor.py +189 -0
  96. edsl/jobs/JobsPrompts.py +270 -268
  97. edsl/jobs/JobsRemoteInferenceHandler.py +311 -239
  98. edsl/jobs/JobsRemoteInferenceLogger.py +239 -0
  99. edsl/jobs/RequestTokenEstimator.py +30 -0
  100. edsl/jobs/__init__.py +1 -1
  101. edsl/jobs/async_interview_runner.py +138 -0
  102. edsl/jobs/buckets/BucketCollection.py +104 -63
  103. edsl/jobs/buckets/ModelBuckets.py +65 -65
  104. edsl/jobs/buckets/TokenBucket.py +283 -251
  105. edsl/jobs/buckets/TokenBucketAPI.py +211 -0
  106. edsl/jobs/buckets/TokenBucketClient.py +191 -0
  107. edsl/jobs/check_survey_scenario_compatibility.py +85 -0
  108. edsl/jobs/data_structures.py +120 -0
  109. edsl/jobs/decorators.py +35 -0
  110. edsl/jobs/interviews/Interview.py +396 -661
  111. edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
  112. edsl/jobs/interviews/InterviewExceptionEntry.py +186 -186
  113. edsl/jobs/interviews/InterviewStatistic.py +63 -63
  114. edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
  115. edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
  116. edsl/jobs/interviews/InterviewStatusLog.py +92 -92
  117. edsl/jobs/interviews/ReportErrors.py +66 -66
  118. edsl/jobs/interviews/interview_status_enum.py +9 -9
  119. edsl/jobs/jobs_status_enums.py +9 -0
  120. edsl/jobs/loggers/HTMLTableJobLogger.py +304 -0
  121. edsl/jobs/results_exceptions_handler.py +98 -0
  122. edsl/jobs/runners/JobsRunnerAsyncio.py +151 -466
  123. edsl/jobs/runners/JobsRunnerStatus.py +297 -330
  124. edsl/jobs/tasks/QuestionTaskCreator.py +244 -242
  125. edsl/jobs/tasks/TaskCreators.py +64 -64
  126. edsl/jobs/tasks/TaskHistory.py +470 -450
  127. edsl/jobs/tasks/TaskStatusLog.py +23 -23
  128. edsl/jobs/tasks/task_status_enum.py +161 -163
  129. edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
  130. edsl/jobs/tokens/TokenUsage.py +34 -34
  131. edsl/language_models/ComputeCost.py +63 -0
  132. edsl/language_models/LanguageModel.py +626 -668
  133. edsl/language_models/ModelList.py +164 -155
  134. edsl/language_models/PriceManager.py +127 -0
  135. edsl/language_models/RawResponseHandler.py +106 -0
  136. edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
  137. edsl/language_models/ServiceDataSources.py +0 -0
  138. edsl/language_models/__init__.py +2 -3
  139. edsl/language_models/fake_openai_call.py +15 -15
  140. edsl/language_models/fake_openai_service.py +61 -61
  141. edsl/language_models/key_management/KeyLookup.py +63 -0
  142. edsl/language_models/key_management/KeyLookupBuilder.py +273 -0
  143. edsl/language_models/key_management/KeyLookupCollection.py +38 -0
  144. edsl/language_models/key_management/__init__.py +0 -0
  145. edsl/language_models/key_management/models.py +131 -0
  146. edsl/language_models/model.py +256 -0
  147. edsl/language_models/repair.py +156 -156
  148. edsl/language_models/utilities.py +65 -64
  149. edsl/notebooks/Notebook.py +263 -258
  150. edsl/notebooks/NotebookToLaTeX.py +142 -0
  151. edsl/notebooks/__init__.py +1 -1
  152. edsl/prompts/Prompt.py +352 -362
  153. edsl/prompts/__init__.py +2 -2
  154. edsl/questions/ExceptionExplainer.py +77 -0
  155. edsl/questions/HTMLQuestion.py +103 -0
  156. edsl/questions/QuestionBase.py +518 -664
  157. edsl/questions/QuestionBasePromptsMixin.py +221 -217
  158. edsl/questions/QuestionBudget.py +227 -227
  159. edsl/questions/QuestionCheckBox.py +359 -359
  160. edsl/questions/QuestionExtract.py +180 -182
  161. edsl/questions/QuestionFreeText.py +113 -114
  162. edsl/questions/QuestionFunctional.py +166 -166
  163. edsl/questions/QuestionList.py +223 -231
  164. edsl/questions/QuestionMatrix.py +265 -0
  165. edsl/questions/QuestionMultipleChoice.py +330 -286
  166. edsl/questions/QuestionNumerical.py +151 -153
  167. edsl/questions/QuestionRank.py +314 -324
  168. edsl/questions/Quick.py +41 -41
  169. edsl/questions/SimpleAskMixin.py +74 -73
  170. edsl/questions/__init__.py +27 -26
  171. edsl/questions/{AnswerValidatorMixin.py → answer_validator_mixin.py} +334 -289
  172. edsl/questions/compose_questions.py +98 -98
  173. edsl/questions/data_structures.py +20 -0
  174. edsl/questions/decorators.py +21 -21
  175. edsl/questions/derived/QuestionLikertFive.py +76 -76
  176. edsl/questions/derived/QuestionLinearScale.py +90 -87
  177. edsl/questions/derived/QuestionTopK.py +93 -93
  178. edsl/questions/derived/QuestionYesNo.py +82 -82
  179. edsl/questions/descriptors.py +427 -413
  180. edsl/questions/loop_processor.py +149 -0
  181. edsl/questions/prompt_templates/question_budget.jinja +13 -13
  182. edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
  183. edsl/questions/prompt_templates/question_extract.jinja +11 -11
  184. edsl/questions/prompt_templates/question_free_text.jinja +3 -3
  185. edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
  186. edsl/questions/prompt_templates/question_list.jinja +17 -17
  187. edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
  188. edsl/questions/prompt_templates/question_numerical.jinja +36 -36
  189. edsl/questions/{QuestionBaseGenMixin.py → question_base_gen_mixin.py} +168 -161
  190. edsl/questions/question_registry.py +177 -177
  191. edsl/questions/{RegisterQuestionsMeta.py → register_questions_meta.py} +71 -71
  192. edsl/questions/{ResponseValidatorABC.py → response_validator_abc.py} +188 -174
  193. edsl/questions/response_validator_factory.py +34 -0
  194. edsl/questions/settings.py +12 -12
  195. edsl/questions/templates/budget/answering_instructions.jinja +7 -7
  196. edsl/questions/templates/budget/question_presentation.jinja +7 -7
  197. edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
  198. edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
  199. edsl/questions/templates/extract/answering_instructions.jinja +7 -7
  200. edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
  201. edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
  202. edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
  203. edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
  204. edsl/questions/templates/list/answering_instructions.jinja +3 -3
  205. edsl/questions/templates/list/question_presentation.jinja +5 -5
  206. edsl/questions/templates/matrix/__init__.py +1 -0
  207. edsl/questions/templates/matrix/answering_instructions.jinja +5 -0
  208. edsl/questions/templates/matrix/question_presentation.jinja +20 -0
  209. edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
  210. edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
  211. edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
  212. edsl/questions/templates/numerical/question_presentation.jinja +6 -6
  213. edsl/questions/templates/rank/answering_instructions.jinja +11 -11
  214. edsl/questions/templates/rank/question_presentation.jinja +15 -15
  215. edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
  216. edsl/questions/templates/top_k/question_presentation.jinja +22 -22
  217. edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
  218. edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
  219. edsl/results/CSSParameterizer.py +108 -108
  220. edsl/results/Dataset.py +587 -424
  221. edsl/results/DatasetExportMixin.py +594 -731
  222. edsl/results/DatasetTree.py +295 -275
  223. edsl/results/MarkdownToDocx.py +122 -0
  224. edsl/results/MarkdownToPDF.py +111 -0
  225. edsl/results/Result.py +557 -465
  226. edsl/results/Results.py +1183 -1165
  227. edsl/results/ResultsExportMixin.py +45 -43
  228. edsl/results/ResultsGGMixin.py +121 -121
  229. edsl/results/TableDisplay.py +125 -198
  230. edsl/results/TextEditor.py +50 -0
  231. edsl/results/__init__.py +2 -2
  232. edsl/results/file_exports.py +252 -0
  233. edsl/results/{ResultsFetchMixin.py → results_fetch_mixin.py} +33 -33
  234. edsl/results/{Selector.py → results_selector.py} +145 -135
  235. edsl/results/{ResultsToolsMixin.py → results_tools_mixin.py} +98 -98
  236. edsl/results/smart_objects.py +96 -0
  237. edsl/results/table_data_class.py +12 -0
  238. edsl/results/table_display.css +77 -77
  239. edsl/results/table_renderers.py +118 -0
  240. edsl/results/tree_explore.py +115 -115
  241. edsl/scenarios/ConstructDownloadLink.py +109 -0
  242. edsl/scenarios/DocumentChunker.py +102 -0
  243. edsl/scenarios/DocxScenario.py +16 -0
  244. edsl/scenarios/FileStore.py +511 -632
  245. edsl/scenarios/PdfExtractor.py +40 -0
  246. edsl/scenarios/Scenario.py +498 -601
  247. edsl/scenarios/ScenarioHtmlMixin.py +65 -64
  248. edsl/scenarios/ScenarioList.py +1458 -1287
  249. edsl/scenarios/ScenarioListExportMixin.py +45 -52
  250. edsl/scenarios/ScenarioListPdfMixin.py +239 -261
  251. edsl/scenarios/__init__.py +3 -4
  252. edsl/scenarios/directory_scanner.py +96 -0
  253. edsl/scenarios/file_methods.py +85 -0
  254. edsl/scenarios/handlers/__init__.py +13 -0
  255. edsl/scenarios/handlers/csv.py +38 -0
  256. edsl/scenarios/handlers/docx.py +76 -0
  257. edsl/scenarios/handlers/html.py +37 -0
  258. edsl/scenarios/handlers/json.py +111 -0
  259. edsl/scenarios/handlers/latex.py +5 -0
  260. edsl/scenarios/handlers/md.py +51 -0
  261. edsl/scenarios/handlers/pdf.py +68 -0
  262. edsl/scenarios/handlers/png.py +39 -0
  263. edsl/scenarios/handlers/pptx.py +105 -0
  264. edsl/scenarios/handlers/py.py +294 -0
  265. edsl/scenarios/handlers/sql.py +313 -0
  266. edsl/scenarios/handlers/sqlite.py +149 -0
  267. edsl/scenarios/handlers/txt.py +33 -0
  268. edsl/scenarios/{ScenarioJoin.py → scenario_join.py} +131 -127
  269. edsl/scenarios/scenario_selector.py +156 -0
  270. edsl/shared.py +1 -1
  271. edsl/study/ObjectEntry.py +173 -173
  272. edsl/study/ProofOfWork.py +113 -113
  273. edsl/study/SnapShot.py +80 -80
  274. edsl/study/Study.py +521 -528
  275. edsl/study/__init__.py +4 -4
  276. edsl/surveys/ConstructDAG.py +92 -0
  277. edsl/surveys/DAG.py +148 -148
  278. edsl/surveys/EditSurvey.py +221 -0
  279. edsl/surveys/InstructionHandler.py +100 -0
  280. edsl/surveys/Memory.py +31 -31
  281. edsl/surveys/MemoryManagement.py +72 -0
  282. edsl/surveys/MemoryPlan.py +244 -244
  283. edsl/surveys/Rule.py +327 -326
  284. edsl/surveys/RuleCollection.py +385 -387
  285. edsl/surveys/RuleManager.py +172 -0
  286. edsl/surveys/Simulator.py +75 -0
  287. edsl/surveys/Survey.py +1280 -1801
  288. edsl/surveys/SurveyCSS.py +273 -261
  289. edsl/surveys/SurveyExportMixin.py +259 -259
  290. edsl/surveys/{SurveyFlowVisualizationMixin.py → SurveyFlowVisualization.py} +181 -179
  291. edsl/surveys/SurveyQualtricsImport.py +284 -284
  292. edsl/surveys/SurveyToApp.py +141 -0
  293. edsl/surveys/__init__.py +5 -3
  294. edsl/surveys/base.py +53 -53
  295. edsl/surveys/descriptors.py +60 -56
  296. edsl/surveys/instructions/ChangeInstruction.py +48 -49
  297. edsl/surveys/instructions/Instruction.py +56 -65
  298. edsl/surveys/instructions/InstructionCollection.py +82 -77
  299. edsl/templates/error_reporting/base.html +23 -23
  300. edsl/templates/error_reporting/exceptions_by_model.html +34 -34
  301. edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
  302. edsl/templates/error_reporting/exceptions_by_type.html +16 -16
  303. edsl/templates/error_reporting/interview_details.html +115 -115
  304. edsl/templates/error_reporting/interviews.html +19 -19
  305. edsl/templates/error_reporting/overview.html +4 -4
  306. edsl/templates/error_reporting/performance_plot.html +1 -1
  307. edsl/templates/error_reporting/report.css +73 -73
  308. edsl/templates/error_reporting/report.html +117 -117
  309. edsl/templates/error_reporting/report.js +25 -25
  310. edsl/tools/__init__.py +1 -1
  311. edsl/tools/clusters.py +192 -192
  312. edsl/tools/embeddings.py +27 -27
  313. edsl/tools/embeddings_plotting.py +118 -118
  314. edsl/tools/plotting.py +112 -112
  315. edsl/tools/summarize.py +18 -18
  316. edsl/utilities/PrettyList.py +56 -0
  317. edsl/utilities/SystemInfo.py +28 -28
  318. edsl/utilities/__init__.py +22 -22
  319. edsl/utilities/ast_utilities.py +25 -25
  320. edsl/utilities/data/Registry.py +6 -6
  321. edsl/utilities/data/__init__.py +1 -1
  322. edsl/utilities/data/scooter_results.json +1 -1
  323. edsl/utilities/decorators.py +77 -77
  324. edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
  325. edsl/utilities/interface.py +627 -627
  326. edsl/utilities/is_notebook.py +18 -0
  327. edsl/utilities/is_valid_variable_name.py +11 -0
  328. edsl/utilities/naming_utilities.py +263 -263
  329. edsl/utilities/remove_edsl_version.py +24 -0
  330. edsl/utilities/repair_functions.py +28 -28
  331. edsl/utilities/restricted_python.py +70 -70
  332. edsl/utilities/utilities.py +436 -424
  333. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev5.dist-info}/LICENSE +21 -21
  334. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev5.dist-info}/METADATA +13 -11
  335. edsl-0.1.39.dev5.dist-info/RECORD +358 -0
  336. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev5.dist-info}/WHEEL +1 -1
  337. edsl/language_models/KeyLookup.py +0 -30
  338. edsl/language_models/registry.py +0 -190
  339. edsl/language_models/unused/ReplicateBase.py +0 -83
  340. edsl/results/ResultsDBMixin.py +0 -238
  341. edsl-0.1.39.dev3.dist-info/RECORD +0 -277
@@ -1,63 +1,63 @@
1
- import asyncio
2
- from enum import Enum
3
- from typing import Literal, List, Type, DefaultDict
4
- from collections import UserDict, defaultdict
5
-
6
- from edsl.jobs.interviews.InterviewStatusDictionary import InterviewStatusDictionary
7
- from edsl.jobs.tokens.InterviewTokenUsage import InterviewTokenUsage
8
- from edsl.enums import pricing, TokenPricing
9
- from edsl.jobs.tasks.task_status_enum import TaskStatus
10
-
11
- InterviewTokenUsageMapping = DefaultDict[str, InterviewTokenUsage]
12
-
13
-
14
- class InterviewStatistic(UserDict):
15
- @staticmethod
16
- def _format_number(number, digits=0, units=""):
17
- """Format a number.
18
-
19
- :param number: the number to format
20
- :param digits: the number of digits to display
21
- :param units: the units to display
22
-
23
- Example usage:
24
-
25
- >>> InterviewStatistic._format_number(1000, 1, "sec.")
26
- '1,000.0 sec.'
27
- """
28
- if type(number) == str:
29
- return number
30
- else:
31
- return f"{number:,.{digits}f}" + " " + units
32
-
33
- @property
34
- def _pretty_name(self):
35
- """Return a pretty name for the statistic.
36
-
37
- Example usage:
38
-
39
- >>> InterviewStatistic("elapsed_time", value=100, digits=1, units="sec.").pretty_name
40
- 'Elapsed time'
41
- """
42
- return self.name.replace("_", " ").capitalize()
43
-
44
- def __init__(
45
- self,
46
- name: str,
47
- value: float,
48
- digits: int = 0,
49
- units: str = "",
50
- pretty_name: str = None,
51
- ):
52
- """Create a new InterviewStatistic object."""
53
- self.name = name
54
- self.value = value
55
- self.digits = digits
56
- self.units = units
57
- self.pretty_name = pretty_name or self._pretty_name
58
-
59
- super().__init__(
60
- {self.pretty_name: self._format_number(self.value, self.digits, self.units)}
61
- )
62
-
63
- self.raw: dict = {self.name: self.value}
1
+ import asyncio
2
+ from enum import Enum
3
+ from typing import Literal, List, Type, DefaultDict
4
+ from collections import UserDict, defaultdict
5
+
6
+ from edsl.jobs.interviews.InterviewStatusDictionary import InterviewStatusDictionary
7
+ from edsl.jobs.tokens.InterviewTokenUsage import InterviewTokenUsage
8
+ from edsl.enums import pricing, TokenPricing
9
+ from edsl.jobs.tasks.task_status_enum import TaskStatus
10
+
11
+ InterviewTokenUsageMapping = DefaultDict[str, InterviewTokenUsage]
12
+
13
+
14
+ class InterviewStatistic(UserDict):
15
+ @staticmethod
16
+ def _format_number(number, digits=0, units=""):
17
+ """Format a number.
18
+
19
+ :param number: the number to format
20
+ :param digits: the number of digits to display
21
+ :param units: the units to display
22
+
23
+ Example usage:
24
+
25
+ >>> InterviewStatistic._format_number(1000, 1, "sec.")
26
+ '1,000.0 sec.'
27
+ """
28
+ if type(number) == str:
29
+ return number
30
+ else:
31
+ return f"{number:,.{digits}f}" + " " + units
32
+
33
+ @property
34
+ def _pretty_name(self):
35
+ """Return a pretty name for the statistic.
36
+
37
+ Example usage:
38
+
39
+ >>> InterviewStatistic("elapsed_time", value=100, digits=1, units="sec.").pretty_name
40
+ 'Elapsed time'
41
+ """
42
+ return self.name.replace("_", " ").capitalize()
43
+
44
+ def __init__(
45
+ self,
46
+ name: str,
47
+ value: float,
48
+ digits: int = 0,
49
+ units: str = "",
50
+ pretty_name: str = None,
51
+ ):
52
+ """Create a new InterviewStatistic object."""
53
+ self.name = name
54
+ self.value = value
55
+ self.digits = digits
56
+ self.units = units
57
+ self.pretty_name = pretty_name or self._pretty_name
58
+
59
+ super().__init__(
60
+ {self.pretty_name: self._format_number(self.value, self.digits, self.units)}
61
+ )
62
+
63
+ self.raw: dict = {self.name: self.value}
@@ -1,25 +1,25 @@
1
- from collections import UserDict
2
- from edsl.jobs.interviews.InterviewStatistic import InterviewStatistic
3
-
4
-
5
- class InterviewStatisticsCollection(UserDict):
6
- """A collection of interview statistics."""
7
-
8
- def __init__(self, *args, **kwargs):
9
- super().__init__(*args, **kwargs)
10
- self.raw: dict = {}
11
-
12
- def add_stat(self, statistic: InterviewStatistic):
13
- """Add a statistic to the collection.
14
-
15
- Each statistic is a dictionary with a single key-value pair.
16
-
17
- Example usage:
18
-
19
- >>> isc = InterviewStatisticsCollection()
20
- >>> isc.add_stat(InterviewStatistic("elapsed_time", value=100, digits=1, units="sec."))
21
- >>> isc.raw
22
- {'elapsed_time': 100}
23
- """
24
- self.update(statistic)
25
- self.raw.update(statistic.raw)
1
+ from collections import UserDict
2
+ from edsl.jobs.interviews.InterviewStatistic import InterviewStatistic
3
+
4
+
5
+ class InterviewStatisticsCollection(UserDict):
6
+ """A collection of interview statistics."""
7
+
8
+ def __init__(self, *args, **kwargs):
9
+ super().__init__(*args, **kwargs)
10
+ self.raw: dict = {}
11
+
12
+ def add_stat(self, statistic: InterviewStatistic):
13
+ """Add a statistic to the collection.
14
+
15
+ Each statistic is a dictionary with a single key-value pair.
16
+
17
+ Example usage:
18
+
19
+ >>> isc = InterviewStatisticsCollection()
20
+ >>> isc.add_stat(InterviewStatistic("elapsed_time", value=100, digits=1, units="sec."))
21
+ >>> isc.raw
22
+ {'elapsed_time': 100}
23
+ """
24
+ self.update(statistic)
25
+ self.raw.update(statistic.raw)
@@ -1,78 +1,78 @@
1
- from __future__ import annotations
2
- import json
3
- from collections import UserDict
4
- from typing import Union, Dict
5
-
6
- from edsl.jobs.tasks.task_status_enum import TaskStatus, get_enum_from_string
7
-
8
-
9
- class InterviewStatusDictionary(UserDict):
10
- """A dictionary that keeps track of the status of all the tasks in an interview."""
11
-
12
- def __init__(self, data: Union[Dict[TaskStatus, int], None] = None):
13
- if data:
14
- # checks to make sure every task status is in the enum
15
- assert all([task_status in data for task_status in TaskStatus])
16
- super().__init__(data)
17
- else:
18
- # sets all the task statuses to 0
19
- d = {}
20
- for task_status in TaskStatus:
21
- d[task_status] = 0
22
- d["number_from_cache"] = 0
23
- super().__init__(d)
24
-
25
- def __add__(
26
- self, other: "InterviewStatusDictionary"
27
- ) -> "InterviewStatusDictionary":
28
- """Adds two InterviewStatusDictionaries together."""
29
- if not isinstance(other, InterviewStatusDictionary):
30
- raise ValueError(f"Can't add {type(other)} to InterviewStatusDictionary")
31
- new_dict = {}
32
- for key in self.keys():
33
- new_dict[key] = self[key] + other[key]
34
- return InterviewStatusDictionary(new_dict)
35
-
36
- @property
37
- def waiting(self) -> int:
38
- """Return the number of tasks that are in a waiting status of some kind."""
39
-
40
- waiting_status_list = [
41
- TaskStatus.WAITING_FOR_REQUEST_CAPACITY,
42
- TaskStatus.WAITING_FOR_TOKEN_CAPACITY,
43
- TaskStatus.WAITING_FOR_DEPENDENCIES,
44
- ]
45
-
46
- return sum([self[status] for status in waiting_status_list])
47
-
48
- def __repr__(self):
49
- return f"InterviewStatusDictionary({self.data})"
50
-
51
- def to_dict(self):
52
- new_data = {str(key): value for key, value in self.data.items()}
53
- return new_data
54
-
55
- def print(self):
56
- d = {}
57
- for key, value in self.data.items():
58
- d[str(key)] = value
59
- from edsl.utilities.interface import print_dict_with_rich
60
-
61
- print_dict_with_rich(d)
62
-
63
- @classmethod
64
- def from_dict(cls, data):
65
- new_data = {get_enum_from_string(key): value for key, value in data.items()}
66
- return cls(new_data)
67
-
68
- def to_json(self):
69
- import json
70
-
71
- return json.dumps(self.to_dict())
72
-
73
- @classmethod
74
- def from_json(cls, data):
75
- import json
76
-
77
- data = json.loads(data)
78
- return cls.from_dict(data)
1
+ from __future__ import annotations
2
+ import json
3
+ from collections import UserDict
4
+ from typing import Union, Dict
5
+
6
+ from edsl.jobs.tasks.task_status_enum import TaskStatus, get_enum_from_string
7
+
8
+
9
+ class InterviewStatusDictionary(UserDict):
10
+ """A dictionary that keeps track of the status of all the tasks in an interview."""
11
+
12
+ def __init__(self, data: Union[Dict[TaskStatus, int], None] = None):
13
+ if data:
14
+ # checks to make sure every task status is in the enum
15
+ assert all([task_status in data for task_status in TaskStatus])
16
+ super().__init__(data)
17
+ else:
18
+ # sets all the task statuses to 0
19
+ d = {}
20
+ for task_status in TaskStatus:
21
+ d[task_status] = 0
22
+ d["number_from_cache"] = 0
23
+ super().__init__(d)
24
+
25
+ def __add__(
26
+ self, other: "InterviewStatusDictionary"
27
+ ) -> "InterviewStatusDictionary":
28
+ """Adds two InterviewStatusDictionaries together."""
29
+ if not isinstance(other, InterviewStatusDictionary):
30
+ raise ValueError(f"Can't add {type(other)} to InterviewStatusDictionary")
31
+ new_dict = {}
32
+ for key in self.keys():
33
+ new_dict[key] = self[key] + other[key]
34
+ return InterviewStatusDictionary(new_dict)
35
+
36
+ @property
37
+ def waiting(self) -> int:
38
+ """Return the number of tasks that are in a waiting status of some kind."""
39
+
40
+ waiting_status_list = [
41
+ TaskStatus.WAITING_FOR_REQUEST_CAPACITY,
42
+ TaskStatus.WAITING_FOR_TOKEN_CAPACITY,
43
+ TaskStatus.WAITING_FOR_DEPENDENCIES,
44
+ ]
45
+
46
+ return sum([self[status] for status in waiting_status_list])
47
+
48
+ def __repr__(self):
49
+ return f"InterviewStatusDictionary({self.data})"
50
+
51
+ def to_dict(self):
52
+ new_data = {str(key): value for key, value in self.data.items()}
53
+ return new_data
54
+
55
+ def print(self):
56
+ d = {}
57
+ for key, value in self.data.items():
58
+ d[str(key)] = value
59
+ from edsl.utilities.interface import print_dict_with_rich
60
+
61
+ print_dict_with_rich(d)
62
+
63
+ @classmethod
64
+ def from_dict(cls, data):
65
+ new_data = {get_enum_from_string(key): value for key, value in data.items()}
66
+ return cls(new_data)
67
+
68
+ def to_json(self):
69
+ import json
70
+
71
+ return json.dumps(self.to_dict())
72
+
73
+ @classmethod
74
+ def from_json(cls, data):
75
+ import json
76
+
77
+ data = json.loads(data)
78
+ return cls.from_dict(data)
@@ -1,92 +1,92 @@
1
- from collections import UserDict
2
-
3
- from edsl.jobs.tasks.task_status_enum import TaskStatus, status_colors
4
-
5
-
6
- class InterviewStatusLog(UserDict):
7
- """A dictionary of TaskStatusLog objects.
8
-
9
- The key is the name of the task.
10
- """
11
-
12
- @property
13
- def min_time(self):
14
- return min([log.min_time for log in self.values()])
15
-
16
- @property
17
- def max_time(self):
18
- return max([log.max_time for log in self.values()])
19
-
20
- def status_matrix(self, num_periods):
21
- """Return a matrix of status values."""
22
- start_time = self.min_time
23
- end_time = self.max_time
24
- time_increment = (end_time - start_time) / num_periods
25
- status_matrix = {}
26
- time_periods = [start_time + i * time_increment for i in range(num_periods)]
27
- for task_name, log in self.items():
28
- status_matrix[task_name] = [log.status_at_time(t) for t in time_periods]
29
- return status_matrix
30
-
31
- def numerical_matrix(self, num_periods):
32
- """Return a numerical matrix of status values."""
33
- status_dicts = self.status_matrix(num_periods)
34
-
35
- num_cols = num_periods
36
- num_rows = len(status_dicts)
37
- matrix = [[0 for _ in range(num_cols)] for _ in range(num_rows)]
38
-
39
- for row_index, (task_name, status_list) in enumerate(status_dicts.items()):
40
- matrix[row_index] = [
41
- list(status_colors.keys()).index(status) for status in status_list
42
- ]
43
-
44
- index_to_names = {i: name for i, name in enumerate(status_dicts.keys())}
45
- return matrix, index_to_names
46
-
47
- def visualize(self, num_periods=10):
48
- """Visualize the status matrix with outlined squares."""
49
- import matplotlib.pyplot as plt
50
- from matplotlib.colors import ListedColormap
51
- import numpy as np
52
- from matplotlib.patches import Rectangle
53
-
54
- # Define your custom colormap
55
- custom_cmap = ListedColormap(list(status_colors.values()))
56
-
57
- # Generate the matrix
58
- matrix, index_to_names = self.numerical_matrix(num_periods)
59
-
60
- # Create the figure and axes
61
- plt.figure(figsize=(10, 5))
62
- ax = plt.gca()
63
-
64
- # Display the matrix and keep a reference to the imshow object
65
- im = ax.imshow(matrix, aspect="auto", cmap=custom_cmap)
66
-
67
- # Adding color bar, now correctly associating it with 'im'
68
- cbar = plt.colorbar(im, ticks=range(len(status_colors)), label="Task Status")
69
-
70
- cbar_labels = [status.name for status in status_colors.keys()]
71
- # breakpoint()
72
- cbar.set_ticklabels(cbar_labels) # Setting the custom labels for the colorbar
73
-
74
- im.set_clim(
75
- -0.5, len(status_colors) - 0.5
76
- ) # Setting color limits directly on the imshow object
77
-
78
- # Outline each cell by drawing rectangles
79
- for (j, i), val in np.ndenumerate(matrix):
80
- ax.add_patch(
81
- Rectangle(
82
- (i - 0.5, j - 0.5), 1, 1, fill=False, edgecolor="black", lw=0.5
83
- )
84
- )
85
-
86
- # Set custom y-axis ticks and labels
87
- yticks = list(index_to_names.keys())
88
- yticklabels = list(index_to_names.values())
89
- plt.yticks(ticks=yticks, labels=yticklabels)
90
-
91
- # Show the plot
92
- plt.show()
1
+ from collections import UserDict
2
+
3
+ from edsl.jobs.tasks.task_status_enum import TaskStatus, status_colors
4
+
5
+
6
+ class InterviewStatusLog(UserDict):
7
+ """A dictionary of TaskStatusLog objects.
8
+
9
+ The key is the name of the task.
10
+ """
11
+
12
+ @property
13
+ def min_time(self):
14
+ return min([log.min_time for log in self.values()])
15
+
16
+ @property
17
+ def max_time(self):
18
+ return max([log.max_time for log in self.values()])
19
+
20
+ def status_matrix(self, num_periods):
21
+ """Return a matrix of status values."""
22
+ start_time = self.min_time
23
+ end_time = self.max_time
24
+ time_increment = (end_time - start_time) / num_periods
25
+ status_matrix = {}
26
+ time_periods = [start_time + i * time_increment for i in range(num_periods)]
27
+ for task_name, log in self.items():
28
+ status_matrix[task_name] = [log.status_at_time(t) for t in time_periods]
29
+ return status_matrix
30
+
31
+ def numerical_matrix(self, num_periods):
32
+ """Return a numerical matrix of status values."""
33
+ status_dicts = self.status_matrix(num_periods)
34
+
35
+ num_cols = num_periods
36
+ num_rows = len(status_dicts)
37
+ matrix = [[0 for _ in range(num_cols)] for _ in range(num_rows)]
38
+
39
+ for row_index, (task_name, status_list) in enumerate(status_dicts.items()):
40
+ matrix[row_index] = [
41
+ list(status_colors.keys()).index(status) for status in status_list
42
+ ]
43
+
44
+ index_to_names = {i: name for i, name in enumerate(status_dicts.keys())}
45
+ return matrix, index_to_names
46
+
47
+ def visualize(self, num_periods=10):
48
+ """Visualize the status matrix with outlined squares."""
49
+ import matplotlib.pyplot as plt
50
+ from matplotlib.colors import ListedColormap
51
+ import numpy as np
52
+ from matplotlib.patches import Rectangle
53
+
54
+ # Define your custom colormap
55
+ custom_cmap = ListedColormap(list(status_colors.values()))
56
+
57
+ # Generate the matrix
58
+ matrix, index_to_names = self.numerical_matrix(num_periods)
59
+
60
+ # Create the figure and axes
61
+ plt.figure(figsize=(10, 5))
62
+ ax = plt.gca()
63
+
64
+ # Display the matrix and keep a reference to the imshow object
65
+ im = ax.imshow(matrix, aspect="auto", cmap=custom_cmap)
66
+
67
+ # Adding color bar, now correctly associating it with 'im'
68
+ cbar = plt.colorbar(im, ticks=range(len(status_colors)), label="Task Status")
69
+
70
+ cbar_labels = [status.name for status in status_colors.keys()]
71
+ # breakpoint()
72
+ cbar.set_ticklabels(cbar_labels) # Setting the custom labels for the colorbar
73
+
74
+ im.set_clim(
75
+ -0.5, len(status_colors) - 0.5
76
+ ) # Setting color limits directly on the imshow object
77
+
78
+ # Outline each cell by drawing rectangles
79
+ for (j, i), val in np.ndenumerate(matrix):
80
+ ax.add_patch(
81
+ Rectangle(
82
+ (i - 0.5, j - 0.5), 1, 1, fill=False, edgecolor="black", lw=0.5
83
+ )
84
+ )
85
+
86
+ # Set custom y-axis ticks and labels
87
+ yticks = list(index_to_names.keys())
88
+ yticklabels = list(index_to_names.values())
89
+ plt.yticks(ticks=yticks, labels=yticklabels)
90
+
91
+ # Show the plot
92
+ plt.show()
@@ -1,66 +1,66 @@
1
- import json
2
- import requests
3
- import threading
4
- from edsl.coop import Coop
5
-
6
-
7
class ReportErrors:
    """Bundle a task history with an optional contact email for an error report.

    ``task_history`` must expose ``to_dict()`` (read by :attr:`data`).
    ``email`` starts as ``None`` and is set directly or via :meth:`get_email`.
    """

    def __init__(self, task_history):
        self.task_history = task_history
        self.email = None

    @property
    def data(self):
        """Return the report payload: the task history dict and the email."""
        return {
            "text": self.task_history.to_dict(),
            "email": self.email,
        }

    def get_email(self, timeout=10):
        """Helper method to get user input with a timeout.

        The prompt runs in a helper thread so the wait can be bounded with
        ``join(timeout=...)``. If an answer arrives in time it is stored in
        ``self.email``; otherwise a notice is printed and ``self.email`` is
        left unchanged.

        :param timeout: seconds to wait for the user before giving up.
        """
        answers = []

        def input_thread_method():
            try:
                email_input = input(
                    "Please enter your email address (if you want us to get in touch): "
                )
            except EOFError:
                # stdin is closed or non-interactive: treat as "no answer"
                # instead of letting the exception escape the thread.
                return
            answers.append(email_input)

        # daemon=True: a prompt that is never answered must not keep the
        # interpreter alive once the timeout has expired.
        input_thread = threading.Thread(target=input_thread_method, daemon=True)
        input_thread.start()
        input_thread.join(timeout=timeout)

        if answers:
            self.email = answers[0]
        else:
            print("No input received within the timeout period.")

    def upload(self):
        """Do nothing; retained so existing callers keep working."""
        # The previous implementation was removed because it relied on the old Coop ErrorModel
        pass
41
-
42
-
43
def main():
    """Exercise ``ReportErrors.upload`` once without and once with an email."""
    from edsl.jobs.interviews.ReportErrors import ReportErrors

    class TaskHistory:
        """Minimal stand-in exposing the ``to_dict`` method the reporter reads."""

        def __init__(self, data):
            self.data = data

        def to_dict(self):
            """Converts the internal data of the task history to a dictionary format."""
            return self.data

    sample_history = TaskHistory(
        {
            "task": "Example Task",
            "status": "Completed",
            "details": "This is an example of a task history.",
        }
    )
    error_reporter = ReportErrors(sample_history)

    # First upload: email is still None.
    error_reporter.upload()

    # Second upload: email populated.
    error_reporter.email = "fake@gmail.com"
    error_reporter.upload()
1
+ import json
2
+ import requests
3
+ import threading
4
+ from edsl.coop import Coop
5
+
6
+
7
class ReportErrors:
    """Bundle a task history with an optional contact email for an error report.

    ``task_history`` must expose ``to_dict()`` (read by :attr:`data`).
    ``email`` starts as ``None`` and is set directly or via :meth:`get_email`.
    """

    def __init__(self, task_history):
        self.task_history = task_history
        self.email = None

    @property
    def data(self):
        """Return the report payload: the task history dict and the email."""
        return {
            "text": self.task_history.to_dict(),
            "email": self.email,
        }

    def get_email(self, timeout=10):
        """Helper method to get user input with a timeout.

        The prompt runs in a helper thread so the wait can be bounded with
        ``join(timeout=...)``. If an answer arrives in time it is stored in
        ``self.email``; otherwise a notice is printed and ``self.email`` is
        left unchanged.

        :param timeout: seconds to wait for the user before giving up.
        """
        answers = []

        def input_thread_method():
            try:
                email_input = input(
                    "Please enter your email address (if you want us to get in touch): "
                )
            except EOFError:
                # stdin is closed or non-interactive: treat as "no answer"
                # instead of letting the exception escape the thread.
                return
            answers.append(email_input)

        # daemon=True: a prompt that is never answered must not keep the
        # interpreter alive once the timeout has expired.
        input_thread = threading.Thread(target=input_thread_method, daemon=True)
        input_thread.start()
        input_thread.join(timeout=timeout)

        if answers:
            self.email = answers[0]
        else:
            print("No input received within the timeout period.")

    def upload(self):
        """Do nothing; retained so existing callers keep working."""
        # The previous implementation was removed because it relied on the old Coop ErrorModel
        pass
41
+
42
+
43
def main():
    """Exercise ``ReportErrors.upload`` once without and once with an email."""
    from edsl.jobs.interviews.ReportErrors import ReportErrors

    class TaskHistory:
        """Minimal stand-in exposing the ``to_dict`` method the reporter reads."""

        def __init__(self, data):
            self.data = data

        def to_dict(self):
            """Converts the internal data of the task history to a dictionary format."""
            return self.data

    sample_history = TaskHistory(
        {
            "task": "Example Task",
            "status": "Completed",
            "details": "This is an example of a task history.",
        }
    )
    error_reporter = ReportErrors(sample_history)

    # First upload: email is still None.
    error_reporter.upload()

    # Second upload: email populated.
    error_reporter.email = "fake@gmail.com"
    error_reporter.upload()
@@ -1,9 +1,9 @@
1
- import enum
2
-
3
-
4
class InterviewStatus(enum.Enum):
    """Enumerate the states an interview can be in."""

    # Explicit values are the ones enum.auto() assigns in declaration order.
    NOT_STARTED = 1
    SUCCESS = 2
    WAITING_FOR_RESOURCES = 3
    FAILED = 4
1
+ import enum
2
+
3
+
4
class InterviewStatus(enum.Enum):
    """Enumerate the states an interview can be in."""

    # Explicit values are the ones enum.auto() assigns in declaration order.
    NOT_STARTED = 1
    SUCCESS = 2
    WAITING_FOR_RESOURCES = 3
    FAILED = 4