edsl 0.1.47__py3-none-any.whl → 0.1.49__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (314) hide show
  1. edsl/__init__.py +44 -39
  2. edsl/__version__.py +1 -1
  3. edsl/agents/__init__.py +4 -2
  4. edsl/agents/{Agent.py → agent.py} +442 -152
  5. edsl/agents/{AgentList.py → agent_list.py} +220 -162
  6. edsl/agents/descriptors.py +46 -7
  7. edsl/{exceptions/agents.py → agents/exceptions.py} +3 -12
  8. edsl/base/__init__.py +75 -0
  9. edsl/base/base_class.py +1303 -0
  10. edsl/base/data_transfer_models.py +114 -0
  11. edsl/base/enums.py +215 -0
  12. edsl/base.py +8 -0
  13. edsl/buckets/__init__.py +25 -0
  14. edsl/buckets/bucket_collection.py +324 -0
  15. edsl/buckets/model_buckets.py +206 -0
  16. edsl/buckets/token_bucket.py +502 -0
  17. edsl/{jobs/buckets/TokenBucketAPI.py → buckets/token_bucket_api.py} +1 -1
  18. edsl/buckets/token_bucket_client.py +509 -0
  19. edsl/caching/__init__.py +20 -0
  20. edsl/caching/cache.py +814 -0
  21. edsl/caching/cache_entry.py +427 -0
  22. edsl/{data/CacheHandler.py → caching/cache_handler.py} +14 -15
  23. edsl/caching/exceptions.py +24 -0
  24. edsl/caching/orm.py +30 -0
  25. edsl/{data/RemoteCacheSync.py → caching/remote_cache_sync.py} +3 -3
  26. edsl/caching/sql_dict.py +441 -0
  27. edsl/config/__init__.py +8 -0
  28. edsl/config/config_class.py +177 -0
  29. edsl/config.py +4 -176
  30. edsl/conversation/Conversation.py +7 -7
  31. edsl/conversation/car_buying.py +4 -4
  32. edsl/conversation/chips.py +6 -6
  33. edsl/coop/__init__.py +25 -2
  34. edsl/coop/coop.py +311 -75
  35. edsl/coop/{ExpectedParrotKeyHandler.py → ep_key_handling.py} +86 -10
  36. edsl/coop/exceptions.py +62 -0
  37. edsl/coop/price_fetcher.py +126 -0
  38. edsl/coop/utils.py +89 -24
  39. edsl/data_transfer_models.py +5 -72
  40. edsl/dataset/__init__.py +10 -0
  41. edsl/{results/Dataset.py → dataset/dataset.py} +116 -36
  42. edsl/{results/DatasetExportMixin.py → dataset/dataset_operations_mixin.py} +606 -122
  43. edsl/{results/DatasetTree.py → dataset/dataset_tree.py} +156 -75
  44. edsl/{results/TableDisplay.py → dataset/display/table_display.py} +18 -7
  45. edsl/{results → dataset/display}/table_renderers.py +58 -2
  46. edsl/{results → dataset}/file_exports.py +4 -5
  47. edsl/{results → dataset}/smart_objects.py +2 -2
  48. edsl/enums.py +5 -205
  49. edsl/inference_services/__init__.py +5 -0
  50. edsl/inference_services/{AvailableModelCacheHandler.py → available_model_cache_handler.py} +2 -3
  51. edsl/inference_services/{AvailableModelFetcher.py → available_model_fetcher.py} +8 -14
  52. edsl/inference_services/data_structures.py +3 -2
  53. edsl/{exceptions/inference_services.py → inference_services/exceptions.py} +1 -1
  54. edsl/inference_services/{InferenceServiceABC.py → inference_service_abc.py} +1 -1
  55. edsl/inference_services/{InferenceServicesCollection.py → inference_services_collection.py} +8 -7
  56. edsl/inference_services/registry.py +4 -41
  57. edsl/inference_services/{ServiceAvailability.py → service_availability.py} +5 -25
  58. edsl/inference_services/services/__init__.py +31 -0
  59. edsl/inference_services/{AnthropicService.py → services/anthropic_service.py} +3 -3
  60. edsl/inference_services/{AwsBedrock.py → services/aws_bedrock.py} +2 -2
  61. edsl/inference_services/{AzureAI.py → services/azure_ai.py} +2 -2
  62. edsl/inference_services/{DeepInfraService.py → services/deep_infra_service.py} +1 -3
  63. edsl/inference_services/{DeepSeekService.py → services/deep_seek_service.py} +2 -4
  64. edsl/inference_services/{GoogleService.py → services/google_service.py} +5 -4
  65. edsl/inference_services/{GroqService.py → services/groq_service.py} +1 -1
  66. edsl/inference_services/{MistralAIService.py → services/mistral_ai_service.py} +3 -3
  67. edsl/inference_services/{OllamaService.py → services/ollama_service.py} +1 -7
  68. edsl/inference_services/{OpenAIService.py → services/open_ai_service.py} +5 -6
  69. edsl/inference_services/{PerplexityService.py → services/perplexity_service.py} +3 -7
  70. edsl/inference_services/{TestService.py → services/test_service.py} +7 -6
  71. edsl/inference_services/{TogetherAIService.py → services/together_ai_service.py} +2 -6
  72. edsl/inference_services/{XAIService.py → services/xai_service.py} +1 -1
  73. edsl/inference_services/write_available.py +1 -2
  74. edsl/instructions/__init__.py +6 -0
  75. edsl/{surveys/instructions/Instruction.py → instructions/instruction.py} +11 -6
  76. edsl/{surveys/instructions/InstructionCollection.py → instructions/instruction_collection.py} +10 -5
  77. edsl/{surveys/InstructionHandler.py → instructions/instruction_handler.py} +3 -3
  78. edsl/{jobs/interviews → interviews}/ReportErrors.py +2 -2
  79. edsl/interviews/__init__.py +4 -0
  80. edsl/{jobs/AnswerQuestionFunctionConstructor.py → interviews/answering_function.py} +45 -18
  81. edsl/{jobs/interviews/InterviewExceptionEntry.py → interviews/exception_tracking.py} +107 -22
  82. edsl/interviews/interview.py +638 -0
  83. edsl/{jobs/interviews/InterviewStatusDictionary.py → interviews/interview_status_dictionary.py} +21 -12
  84. edsl/{jobs/interviews/InterviewStatusLog.py → interviews/interview_status_log.py} +16 -7
  85. edsl/{jobs/InterviewTaskManager.py → interviews/interview_task_manager.py} +12 -7
  86. edsl/{jobs/RequestTokenEstimator.py → interviews/request_token_estimator.py} +8 -3
  87. edsl/{jobs/interviews/InterviewStatistic.py → interviews/statistics.py} +36 -10
  88. edsl/invigilators/__init__.py +38 -0
  89. edsl/invigilators/invigilator_base.py +477 -0
  90. edsl/{agents/Invigilator.py → invigilators/invigilators.py} +263 -10
  91. edsl/invigilators/prompt_constructor.py +476 -0
  92. edsl/{agents → invigilators}/prompt_helpers.py +2 -1
  93. edsl/{agents/QuestionInstructionPromptBuilder.py → invigilators/question_instructions_prompt_builder.py} +18 -13
  94. edsl/{agents → invigilators}/question_option_processor.py +96 -21
  95. edsl/{agents/QuestionTemplateReplacementsBuilder.py → invigilators/question_template_replacements_builder.py} +64 -12
  96. edsl/jobs/__init__.py +7 -1
  97. edsl/jobs/async_interview_runner.py +99 -35
  98. edsl/jobs/check_survey_scenario_compatibility.py +7 -5
  99. edsl/jobs/data_structures.py +153 -22
  100. edsl/{exceptions/jobs.py → jobs/exceptions.py} +2 -1
  101. edsl/jobs/{FetchInvigilator.py → fetch_invigilator.py} +4 -4
  102. edsl/jobs/{loggers/HTMLTableJobLogger.py → html_table_job_logger.py} +6 -2
  103. edsl/jobs/{Jobs.py → jobs.py} +313 -167
  104. edsl/jobs/{JobsChecks.py → jobs_checks.py} +15 -7
  105. edsl/jobs/{JobsComponentConstructor.py → jobs_component_constructor.py} +19 -17
  106. edsl/jobs/{InterviewsConstructor.py → jobs_interview_constructor.py} +10 -5
  107. edsl/jobs/jobs_pricing_estimation.py +347 -0
  108. edsl/jobs/{JobsRemoteInferenceLogger.py → jobs_remote_inference_logger.py} +4 -3
  109. edsl/jobs/jobs_runner_asyncio.py +282 -0
  110. edsl/jobs/{JobsRemoteInferenceHandler.py → remote_inference.py} +19 -22
  111. edsl/jobs/results_exceptions_handler.py +2 -2
  112. edsl/key_management/__init__.py +28 -0
  113. edsl/key_management/key_lookup.py +161 -0
  114. edsl/{language_models/key_management/KeyLookupBuilder.py → key_management/key_lookup_builder.py} +118 -47
  115. edsl/key_management/key_lookup_collection.py +82 -0
  116. edsl/key_management/models.py +218 -0
  117. edsl/language_models/__init__.py +7 -2
  118. edsl/language_models/{ComputeCost.py → compute_cost.py} +18 -3
  119. edsl/{exceptions/language_models.py → language_models/exceptions.py} +2 -1
  120. edsl/language_models/language_model.py +1080 -0
  121. edsl/language_models/model.py +10 -25
  122. edsl/language_models/{ModelList.py → model_list.py} +9 -14
  123. edsl/language_models/{RawResponseHandler.py → raw_response_handler.py} +1 -1
  124. edsl/language_models/{RegisterLanguageModelsMeta.py → registry.py} +1 -1
  125. edsl/language_models/repair.py +4 -4
  126. edsl/language_models/utilities.py +4 -4
  127. edsl/notebooks/__init__.py +3 -1
  128. edsl/notebooks/{Notebook.py → notebook.py} +7 -8
  129. edsl/prompts/__init__.py +1 -1
  130. edsl/{exceptions/prompts.py → prompts/exceptions.py} +3 -1
  131. edsl/prompts/{Prompt.py → prompt.py} +101 -95
  132. edsl/questions/HTMLQuestion.py +1 -1
  133. edsl/questions/__init__.py +154 -25
  134. edsl/questions/answer_validator_mixin.py +1 -1
  135. edsl/questions/compose_questions.py +4 -3
  136. edsl/questions/derived/question_likert_five.py +166 -0
  137. edsl/questions/derived/{QuestionLinearScale.py → question_linear_scale.py} +4 -4
  138. edsl/questions/derived/{QuestionTopK.py → question_top_k.py} +4 -4
  139. edsl/questions/derived/{QuestionYesNo.py → question_yes_no.py} +4 -5
  140. edsl/questions/descriptors.py +24 -30
  141. edsl/questions/loop_processor.py +65 -19
  142. edsl/questions/question_base.py +881 -0
  143. edsl/questions/question_base_gen_mixin.py +15 -16
  144. edsl/questions/{QuestionBasePromptsMixin.py → question_base_prompts_mixin.py} +2 -2
  145. edsl/questions/{QuestionBudget.py → question_budget.py} +3 -4
  146. edsl/questions/{QuestionCheckBox.py → question_check_box.py} +16 -16
  147. edsl/questions/{QuestionDict.py → question_dict.py} +39 -5
  148. edsl/questions/{QuestionExtract.py → question_extract.py} +9 -9
  149. edsl/questions/question_free_text.py +282 -0
  150. edsl/questions/{QuestionFunctional.py → question_functional.py} +6 -5
  151. edsl/questions/{QuestionList.py → question_list.py} +6 -7
  152. edsl/questions/{QuestionMatrix.py → question_matrix.py} +6 -5
  153. edsl/questions/{QuestionMultipleChoice.py → question_multiple_choice.py} +126 -21
  154. edsl/questions/{QuestionNumerical.py → question_numerical.py} +5 -5
  155. edsl/questions/{QuestionRank.py → question_rank.py} +6 -6
  156. edsl/questions/question_registry.py +4 -9
  157. edsl/questions/register_questions_meta.py +8 -4
  158. edsl/questions/response_validator_abc.py +17 -16
  159. edsl/results/__init__.py +4 -1
  160. edsl/{exceptions/results.py → results/exceptions.py} +1 -1
  161. edsl/results/report.py +197 -0
  162. edsl/results/{Result.py → result.py} +131 -45
  163. edsl/results/{Results.py → results.py} +365 -220
  164. edsl/results/results_selector.py +344 -25
  165. edsl/scenarios/__init__.py +30 -3
  166. edsl/scenarios/{ConstructDownloadLink.py → construct_download_link.py} +7 -0
  167. edsl/scenarios/directory_scanner.py +156 -13
  168. edsl/scenarios/document_chunker.py +186 -0
  169. edsl/scenarios/exceptions.py +101 -0
  170. edsl/scenarios/file_methods.py +2 -3
  171. edsl/scenarios/{FileStore.py → file_store.py} +275 -189
  172. edsl/scenarios/handlers/__init__.py +14 -14
  173. edsl/scenarios/handlers/{csv.py → csv_file_store.py} +1 -2
  174. edsl/scenarios/handlers/{docx.py → docx_file_store.py} +8 -7
  175. edsl/scenarios/handlers/{html.py → html_file_store.py} +1 -2
  176. edsl/scenarios/handlers/{jpeg.py → jpeg_file_store.py} +1 -1
  177. edsl/scenarios/handlers/{json.py → json_file_store.py} +1 -1
  178. edsl/scenarios/handlers/latex_file_store.py +5 -0
  179. edsl/scenarios/handlers/{md.py → md_file_store.py} +1 -1
  180. edsl/scenarios/handlers/{pdf.py → pdf_file_store.py} +2 -2
  181. edsl/scenarios/handlers/{png.py → png_file_store.py} +1 -1
  182. edsl/scenarios/handlers/{pptx.py → pptx_file_store.py} +8 -7
  183. edsl/scenarios/handlers/{py.py → py_file_store.py} +1 -3
  184. edsl/scenarios/handlers/{sql.py → sql_file_store.py} +2 -1
  185. edsl/scenarios/handlers/{sqlite.py → sqlite_file_store.py} +2 -3
  186. edsl/scenarios/handlers/{txt.py → txt_file_store.py} +1 -1
  187. edsl/scenarios/scenario.py +928 -0
  188. edsl/scenarios/scenario_join.py +18 -5
  189. edsl/scenarios/{ScenarioList.py → scenario_list.py} +294 -106
  190. edsl/scenarios/{ScenarioListPdfMixin.py → scenario_list_pdf_tools.py} +16 -15
  191. edsl/scenarios/scenario_selector.py +5 -1
  192. edsl/study/ObjectEntry.py +2 -2
  193. edsl/study/SnapShot.py +5 -5
  194. edsl/study/Study.py +18 -19
  195. edsl/study/__init__.py +6 -4
  196. edsl/surveys/__init__.py +7 -4
  197. edsl/surveys/dag/__init__.py +2 -0
  198. edsl/surveys/{ConstructDAG.py → dag/construct_dag.py} +3 -3
  199. edsl/surveys/{DAG.py → dag/dag.py} +13 -10
  200. edsl/surveys/descriptors.py +1 -1
  201. edsl/surveys/{EditSurvey.py → edit_survey.py} +9 -9
  202. edsl/{exceptions/surveys.py → surveys/exceptions.py} +1 -2
  203. edsl/surveys/memory/__init__.py +3 -0
  204. edsl/surveys/{MemoryPlan.py → memory/memory_plan.py} +10 -9
  205. edsl/surveys/rules/__init__.py +3 -0
  206. edsl/surveys/{Rule.py → rules/rule.py} +103 -43
  207. edsl/surveys/{RuleCollection.py → rules/rule_collection.py} +21 -30
  208. edsl/surveys/{RuleManager.py → rules/rule_manager.py} +19 -13
  209. edsl/surveys/survey.py +1743 -0
  210. edsl/surveys/{SurveyExportMixin.py → survey_export.py} +22 -27
  211. edsl/surveys/{SurveyFlowVisualization.py → survey_flow_visualization.py} +11 -2
  212. edsl/surveys/{Simulator.py → survey_simulator.py} +10 -3
  213. edsl/tasks/__init__.py +32 -0
  214. edsl/{jobs/tasks/QuestionTaskCreator.py → tasks/question_task_creator.py} +115 -57
  215. edsl/tasks/task_creators.py +135 -0
  216. edsl/{jobs/tasks/TaskHistory.py → tasks/task_history.py} +86 -47
  217. edsl/{jobs/tasks → tasks}/task_status_enum.py +91 -7
  218. edsl/tasks/task_status_log.py +85 -0
  219. edsl/tokens/__init__.py +2 -0
  220. edsl/tokens/interview_token_usage.py +53 -0
  221. edsl/utilities/PrettyList.py +1 -1
  222. edsl/utilities/SystemInfo.py +25 -22
  223. edsl/utilities/__init__.py +29 -21
  224. edsl/utilities/gcp_bucket/__init__.py +2 -0
  225. edsl/utilities/gcp_bucket/cloud_storage.py +99 -96
  226. edsl/utilities/interface.py +44 -536
  227. edsl/{results/MarkdownToPDF.py → utilities/markdown_to_pdf.py} +13 -5
  228. edsl/utilities/repair_functions.py +1 -1
  229. {edsl-0.1.47.dist-info → edsl-0.1.49.dist-info}/METADATA +1 -1
  230. edsl-0.1.49.dist-info/RECORD +347 -0
  231. edsl/Base.py +0 -493
  232. edsl/BaseDiff.py +0 -260
  233. edsl/agents/InvigilatorBase.py +0 -260
  234. edsl/agents/PromptConstructor.py +0 -318
  235. edsl/coop/PriceFetcher.py +0 -54
  236. edsl/data/Cache.py +0 -582
  237. edsl/data/CacheEntry.py +0 -238
  238. edsl/data/SQLiteDict.py +0 -292
  239. edsl/data/__init__.py +0 -5
  240. edsl/data/orm.py +0 -10
  241. edsl/exceptions/cache.py +0 -5
  242. edsl/exceptions/coop.py +0 -14
  243. edsl/exceptions/data.py +0 -14
  244. edsl/exceptions/scenarios.py +0 -29
  245. edsl/jobs/Answers.py +0 -43
  246. edsl/jobs/JobsPrompts.py +0 -354
  247. edsl/jobs/buckets/BucketCollection.py +0 -134
  248. edsl/jobs/buckets/ModelBuckets.py +0 -65
  249. edsl/jobs/buckets/TokenBucket.py +0 -283
  250. edsl/jobs/buckets/TokenBucketClient.py +0 -191
  251. edsl/jobs/interviews/Interview.py +0 -395
  252. edsl/jobs/interviews/InterviewExceptionCollection.py +0 -99
  253. edsl/jobs/interviews/InterviewStatisticsCollection.py +0 -25
  254. edsl/jobs/runners/JobsRunnerAsyncio.py +0 -163
  255. edsl/jobs/runners/JobsRunnerStatusData.py +0 -0
  256. edsl/jobs/tasks/TaskCreators.py +0 -64
  257. edsl/jobs/tasks/TaskStatusLog.py +0 -23
  258. edsl/jobs/tokens/InterviewTokenUsage.py +0 -27
  259. edsl/language_models/LanguageModel.py +0 -635
  260. edsl/language_models/ServiceDataSources.py +0 -0
  261. edsl/language_models/key_management/KeyLookup.py +0 -63
  262. edsl/language_models/key_management/KeyLookupCollection.py +0 -38
  263. edsl/language_models/key_management/models.py +0 -137
  264. edsl/questions/QuestionBase.py +0 -544
  265. edsl/questions/QuestionFreeText.py +0 -130
  266. edsl/questions/derived/QuestionLikertFive.py +0 -76
  267. edsl/results/ResultsExportMixin.py +0 -45
  268. edsl/results/TextEditor.py +0 -50
  269. edsl/results/results_fetch_mixin.py +0 -33
  270. edsl/results/results_tools_mixin.py +0 -98
  271. edsl/scenarios/DocumentChunker.py +0 -104
  272. edsl/scenarios/Scenario.py +0 -548
  273. edsl/scenarios/ScenarioHtmlMixin.py +0 -65
  274. edsl/scenarios/ScenarioListExportMixin.py +0 -45
  275. edsl/scenarios/handlers/latex.py +0 -5
  276. edsl/shared.py +0 -1
  277. edsl/surveys/Survey.py +0 -1301
  278. edsl/surveys/SurveyQualtricsImport.py +0 -284
  279. edsl/surveys/SurveyToApp.py +0 -141
  280. edsl/surveys/instructions/__init__.py +0 -0
  281. edsl/tools/__init__.py +0 -1
  282. edsl/tools/clusters.py +0 -192
  283. edsl/tools/embeddings.py +0 -27
  284. edsl/tools/embeddings_plotting.py +0 -118
  285. edsl/tools/plotting.py +0 -112
  286. edsl/tools/summarize.py +0 -18
  287. edsl/utilities/data/Registry.py +0 -6
  288. edsl/utilities/data/__init__.py +0 -1
  289. edsl/utilities/data/scooter_results.json +0 -1
  290. edsl-0.1.47.dist-info/RECORD +0 -354
  291. /edsl/coop/{CoopFunctionsMixin.py → coop_functions.py} +0 -0
  292. /edsl/{results → dataset/display}/CSSParameterizer.py +0 -0
  293. /edsl/{language_models/key_management → dataset/display}/__init__.py +0 -0
  294. /edsl/{results → dataset/display}/table_data_class.py +0 -0
  295. /edsl/{results → dataset/display}/table_display.css +0 -0
  296. /edsl/{results/ResultsGGMixin.py → dataset/r/ggplot.py} +0 -0
  297. /edsl/{results → dataset}/tree_explore.py +0 -0
  298. /edsl/{surveys/instructions/ChangeInstruction.py → instructions/change_instruction.py} +0 -0
  299. /edsl/{jobs/interviews → interviews}/interview_status_enum.py +0 -0
  300. /edsl/jobs/{runners/JobsRunnerStatus.py → jobs_runner_status.py} +0 -0
  301. /edsl/language_models/{PriceManager.py → price_manager.py} +0 -0
  302. /edsl/language_models/{fake_openai_call.py → unused/fake_openai_call.py} +0 -0
  303. /edsl/language_models/{fake_openai_service.py → unused/fake_openai_service.py} +0 -0
  304. /edsl/notebooks/{NotebookToLaTeX.py → notebook_to_latex.py} +0 -0
  305. /edsl/{exceptions/questions.py → questions/exceptions.py} +0 -0
  306. /edsl/questions/{SimpleAskMixin.py → simple_ask_mixin.py} +0 -0
  307. /edsl/surveys/{Memory.py → memory/memory.py} +0 -0
  308. /edsl/surveys/{MemoryManagement.py → memory/memory_management.py} +0 -0
  309. /edsl/surveys/{SurveyCSS.py → survey_css.py} +0 -0
  310. /edsl/{jobs/tokens/TokenUsage.py → tokens/token_usage.py} +0 -0
  311. /edsl/{results/MarkdownToDocx.py → utilities/markdown_to_docx.py} +0 -0
  312. /edsl/{TemplateLoader.py → utilities/template_loader.py} +0 -0
  313. {edsl-0.1.47.dist-info → edsl-0.1.49.dist-info}/LICENSE +0 -0
  314. {edsl-0.1.47.dist-info → edsl-0.1.49.dist-info}/WHEEL +0 -0
@@ -1,395 +0,0 @@
1
- """This module contains the Interview class, which is responsible for conducting an interview asynchronously."""
2
-
3
- from __future__ import annotations
4
- import asyncio
5
- from typing import Any, Type, List, Generator, Optional, Union, TYPE_CHECKING
6
- import copy
7
- from dataclasses import dataclass
8
-
9
- # from edsl.jobs.Answers import Answers
10
- from edsl.jobs.data_structures import Answers
11
- from edsl.jobs.interviews.InterviewStatusLog import InterviewStatusLog
12
- from edsl.jobs.interviews.InterviewStatusDictionary import InterviewStatusDictionary
13
- from edsl.jobs.interviews.InterviewExceptionCollection import (
14
- InterviewExceptionCollection,
15
- )
16
- from edsl.jobs.interviews.InterviewExceptionEntry import InterviewExceptionEntry
17
- from edsl.jobs.buckets.ModelBuckets import ModelBuckets
18
- from edsl.jobs.AnswerQuestionFunctionConstructor import (
19
- AnswerQuestionFunctionConstructor,
20
- )
21
- from edsl.jobs.InterviewTaskManager import InterviewTaskManager
22
- from edsl.jobs.FetchInvigilator import FetchInvigilator
23
- from edsl.jobs.RequestTokenEstimator import RequestTokenEstimator
24
-
25
-
26
- if TYPE_CHECKING:
27
- from edsl.agents.Agent import Agent
28
- from edsl.surveys.Survey import Survey
29
- from edsl.scenarios.Scenario import Scenario
30
- from edsl.data.Cache import Cache
31
- from edsl.language_models.LanguageModel import LanguageModel
32
- from edsl.jobs.tokens.InterviewTokenUsage import InterviewTokenUsage
33
- from edsl.agents.InvigilatorBase import InvigilatorBase
34
- from edsl.language_models.key_management.KeyLookup import KeyLookup
35
-
36
-
37
@dataclass
class InterviewRunningConfig:
    """Bundle of the per-interview run settings.

    The defaults are plain scalars. (They were previously written with a
    trailing comma, e.g. ``(False,)``, which made each default a one-element
    tuple; a tuple such as ``(False,)`` is truthy, so an omitted
    ``stop_on_exception`` evaluated as "on".)
    """

    # Cache object handed to the interview; None when no cache was supplied.
    cache: Optional["Cache"] = None
    # COULD BE SET WITH CONFIG
    skip_retry: bool = False
    raise_validation_errors: bool = True
    stop_on_exception: bool = False
43
-
44
-
45
class Interview:
    """
    An 'interview' is one agent answering one survey, with one language model, for a given scenario.

    The main method is `async_conduct_interview`, which conducts the interview asynchronously.
    Most of the class is dedicated to creating the tasks for each question in the survey, and then running them.
    """

    def __init__(
        self,
        agent: "Agent",
        survey: "Survey",
        scenario: "Scenario",
        model: Type["LanguageModel"],
        iteration: int = 0,
        indices: Optional[dict] = None,
        cache: Optional["Cache"] = None,
        skip_retry: bool = False,  # COULD BE SET WITH CONFIG
        raise_validation_errors: bool = True,
    ):
        """Initialize the Interview instance.

        :param agent: the agent being interviewed.
        :param survey: the survey being administered to the agent (deep-copied on entry).
        :param scenario: the scenario that populates the survey questions.
        :param model: the language model used to answer the questions.
        :param iteration: the iteration number of the interview.
        :param indices: opaque mapping stored on the instance and included in `to_dict`;
            its meaning is defined by the caller.
        :param cache: the cache used to store the answers.
        :param skip_retry: stored on the instance and in `running_config`.
        :param raise_validation_errors: stored on the instance and in `running_config`.

        >>> i = Interview.example()
        >>> i.task_manager.task_creators
        {}

        >>> i.exceptions
        {}

        >>> _ = asyncio.run(i.async_conduct_interview())
        >>> i.task_status_logs['q0']
        [{'log_time': ..., 'value': <TaskStatus.NOT_STARTED: 1>}, {'log_time': ..., 'value': <TaskStatus.WAITING_FOR_DEPENDENCIES: 2>}, {'log_time': ..., 'value': <TaskStatus.API_CALL_IN_PROGRESS: 7>}, {'log_time': ..., 'value': <TaskStatus.SUCCESS: 8>}]

        >>> i.to_index
        {'q0': 0, 'q1': 1, 'q2': 2}

        """
        self.agent = agent
        self.survey = copy.deepcopy(survey)  # why do we need to deepcopy the survey?
        self.scenario = scenario
        self.model = model
        self.iteration = iteration

        self.answers = Answers()  # will get filled in as interview progresses

        self.task_manager = InterviewTaskManager(
            survey=self.survey,
            iteration=iteration,
        )

        self.exceptions = InterviewExceptionCollection()

        self.running_config = InterviewRunningConfig(
            cache=cache,
            skip_retry=skip_retry,
            raise_validation_errors=raise_validation_errors,
        )

        # The same settings are also kept as plain attributes alongside running_config.
        self.cache = cache
        self.skip_retry = skip_retry
        self.raise_validation_errors = raise_validation_errors

        # dictionary mapping question names to their index in the survey.
        self.to_index = {
            question_name: index
            for index, question_name in enumerate(self.survey.question_names)
        }

        self.failed_questions = []

        self.indices = indices
        # Hash taken at construction time, after every hashed field has been set.
        self.initial_hash = hash(self)

    @property
    def has_exceptions(self) -> bool:
        """Return True if there are exceptions."""
        return len(self.exceptions) > 0

    @property
    def task_status_logs(self) -> "InterviewStatusLog":
        """Return the task status logs for the interview.

        The keys are the question names; the values are the lists of status log changes for each task.
        """
        return self.task_manager.task_status_logs

    @property
    def token_usage(self) -> "InterviewTokenUsage":
        """Determine how many tokens were used for the interview."""
        return self.task_manager.token_usage

    @property
    def interview_status(self) -> "InterviewStatusDictionary":
        """Return a dictionary mapping task status codes to counts."""
        return self.task_manager.interview_status

    def to_dict(self, include_exceptions=True, add_edsl_version=True) -> dict[str, Any]:
        """Return a dictionary representation of the Interview instance.
        This is just for hashing purposes.

        :param include_exceptions: when True, the "exceptions" entry holds the
            serialized exception collection; otherwise it is an empty dict.
        :param add_edsl_version: forwarded to the `to_dict` of the agent, survey,
            scenario and model.

        >>> i = Interview.example()
        >>> hash(i)
        767745459362662063
        """
        d = {
            "agent": self.agent.to_dict(add_edsl_version=add_edsl_version),
            "survey": self.survey.to_dict(add_edsl_version=add_edsl_version),
            "scenario": self.scenario.to_dict(add_edsl_version=add_edsl_version),
            "model": self.model.to_dict(add_edsl_version=add_edsl_version),
            "iteration": self.iteration,
            "exceptions": {},
        }
        if include_exceptions:
            d["exceptions"] = self.exceptions.to_dict()
        if hasattr(self, "indices"):
            d["indices"] = self.indices
        return d

    @classmethod
    def from_dict(cls, d: dict[str, Any]) -> "Interview":
        """Return an Interview instance from a dictionary.

        Reads the "agent", "survey", "scenario", "model" and "iteration" keys;
        "indices" and "exceptions" are restored only when present.
        """

        from edsl.agents.Agent import Agent
        from edsl.surveys.Survey import Survey
        from edsl.scenarios.Scenario import Scenario
        from edsl.language_models.LanguageModel import LanguageModel

        params = {
            "agent": Agent.from_dict(d["agent"]),
            "survey": Survey.from_dict(d["survey"]),
            "scenario": Scenario.from_dict(d["scenario"]),
            "model": LanguageModel.from_dict(d["model"]),
            "iteration": d["iteration"],
        }
        if "indices" in d:
            params["indices"] = d["indices"]
        interview = cls(**params)
        if "exceptions" in d:
            interview.exceptions = InterviewExceptionCollection.from_dict(
                d["exceptions"]
            )
        return interview

    def __hash__(self) -> int:
        """Hash the dictionary form, leaving out exceptions and the edsl version."""
        from edsl.utilities.utilities import dict_hash

        return dict_hash(self.to_dict(include_exceptions=False, add_edsl_version=False))

    def __eq__(self, other: object) -> bool:
        """Two interviews are equal when their hashes match.

        >>> from edsl.jobs.interviews.Interview import Interview; i = Interview.example(); d = i.to_dict(); i2 = Interview.from_dict(d); i == i2
        True
        """
        # Hashing an arbitrary operand can raise (e.g. a list) or compare
        # unrelated objects by hash; defer to Python's default handling instead.
        if not isinstance(other, Interview):
            return NotImplemented
        return hash(self) == hash(other)

    async def async_conduct_interview(
        self,
        run_config: Optional["RunConfig"] = None,
    ) -> tuple["Answers", List[dict[str, Any]]]:
        """
        Conduct an Interview asynchronously.
        It returns a tuple with the answers and a list of valid results.

        :param run_config: run parameters and environment. When None, a default
            ``RunConfig(parameters=RunParameters(), environment=RunEnvironment())``
            is built. This method reads ``parameters.stop_on_exception``,
            ``environment.bucket_collection`` and ``environment.key_lookup`` from it.

        Example usage:

        >>> i = Interview.example()
        >>> result, _ = asyncio.run(i.async_conduct_interview())
        >>> result['q0']
        'yes'

        >>> i = Interview.example(throw_exception = True)
        >>> result, _ = asyncio.run(i.async_conduct_interview())
        >>> i.exceptions
        {'q0': ...
        >>> i = Interview.example()
        >>> from edsl.jobs.Jobs import RunConfig, RunParameters, RunEnvironment
        >>> run_config = RunConfig(parameters = RunParameters(), environment = RunEnvironment())
        >>> run_config.parameters.stop_on_exception = True
        >>> result, _ = asyncio.run(i.async_conduct_interview(run_config))
        """
        from edsl.jobs.Jobs import RunConfig, RunParameters, RunEnvironment

        if run_config is None:
            run_config = RunConfig(
                parameters=RunParameters(),
                environment=RunEnvironment(),
            )
        self.stop_on_exception = run_config.parameters.stop_on_exception

        # if no model bucket is passed, create an 'infinity' bucket with no rate limits
        bucket_collection = run_config.environment.bucket_collection

        if bucket_collection:
            model_buckets = bucket_collection.get(self.model)
        else:
            model_buckets = None

        # Agents exposing `answer_question_directly` also get the infinity bucket.
        if model_buckets is None or hasattr(self.agent, "answer_question_directly"):
            model_buckets = ModelBuckets.infinity_bucket()

        self.skip_flags = {q.question_name: False for q in self.survey.questions}

        ## This is the key part---it creates a task for each question,
        ## with dependencies on the questions that must be answered before this one can be answered.
        self.tasks = self.task_manager.build_question_tasks(
            answer_func=AnswerQuestionFunctionConstructor(
                self, key_lookup=run_config.environment.key_lookup
            )(),
            token_estimator=RequestTokenEstimator(self),
            model_buckets=model_buckets,
        )

        ## 'Invigilators' are used to administer the survey.
        fetcher = FetchInvigilator(
            interview=self,
            current_answers=self.answers,
            key_lookup=run_config.environment.key_lookup,
        )
        self.invigilators = [fetcher(question) for question in self.survey.questions]
        # With stop_on_exception the first task failure propagates out of gather;
        # otherwise failures stay on the tasks and are collected below.
        await asyncio.gather(
            *self.tasks, return_exceptions=not run_config.parameters.stop_on_exception
        )
        self.answers.replace_missing_answers_with_none(self.survey)
        valid_results = list(
            self._extract_valid_results(self.tasks, self.invigilators, self.exceptions)
        )
        return self.answers, valid_results

    @staticmethod
    def _extract_valid_results(
        tasks: List["asyncio.Task"],
        invigilators: List["InvigilatorBase"],
        exceptions: "InterviewExceptionCollection",
    ) -> Generator["Answers", None, None]:
        """Extract the valid results from the list of results.

        It iterates through the tasks and invigilators, and yields the results of the tasks that are done.
        If a task is not done, it raises a ValueError.
        If an exception is raised in the task, it records the exception in `exceptions`, except if the
        task was cancelled, which is expected behavior.

        :param tasks: the tasks to harvest; must be the same length as `invigilators`.
        :param invigilators: the invigilator paired with each task, in the same order.
        :param exceptions: collection that receives an entry for each failed task.

        >>> i = Interview.example()
        >>> result, _ = asyncio.run(i.async_conduct_interview())
        """
        assert len(tasks) == len(invigilators)

        def handle_task(task, invigilator):
            try:
                result: Answers = task.result()
                if result == "skipped":
                    result = invigilator.get_failed_task_result(
                        failure_reason="Task was skipped."
                    )
            except asyncio.CancelledError:  # task was cancelled
                result = invigilator.get_failed_task_result(
                    failure_reason="Task was cancelled."
                )
            except Exception as e:  # any other kind of exception in the task
                result = invigilator.get_failed_task_result(
                    failure_reason=f"Task failed with exception: {str(e)}."
                )
                exception_entry = InterviewExceptionEntry(
                    exception=e,
                    invigilator=invigilator,
                )
                exceptions.add(task.get_name(), exception_entry)
            return result

        for task, invigilator in zip(tasks, invigilators):
            if not task.done():
                raise ValueError(f"Task {task.get_name()} is not done.")

            yield handle_task(task, invigilator)

    def __repr__(self) -> str:
        """Return a string representation of the Interview instance."""
        return f"Interview(agent = {repr(self.agent)}, survey = {repr(self.survey)}, scenario = {repr(self.scenario)}, model = {repr(self.model)})"

    def duplicate(
        self, iteration: int, cache: "Cache", randomize_survey: Optional[bool] = True
    ) -> "Interview":
        """Duplicate the interview with a new iteration number.

        :param iteration: iteration number for the copy.
        :param cache: accepted for interface compatibility; the copy currently
            receives ``self.running_config.cache`` rather than this argument.
        :param randomize_survey: when truthy the copy uses ``self.survey.draw()``,
            otherwise it reuses ``self.survey``.

        >>> i = Interview.example()
        >>> i2 = i.duplicate(1, None)
        >>> i.iteration + 1 == i2.iteration
        True

        """
        if randomize_survey:
            new_survey = self.survey.draw()
        else:
            new_survey = self.survey

        # NOTE(review): `cache` is ignored and `raise_validation_errors` is not
        # carried over (the copy gets the constructor default) -- confirm both
        # are intended before changing them.
        return Interview(
            agent=self.agent,
            survey=new_survey,
            scenario=self.scenario,
            model=self.model,
            iteration=iteration,
            cache=self.running_config.cache,
            skip_retry=self.running_config.skip_retry,
            indices=self.indices,
        )

    @classmethod
    def example(cls, throw_exception: bool = False) -> "Interview":
        """Return an example Interview instance.

        :param throw_exception: when True, the example uses
            ``LanguageModel.example(test_model=True, throw_exception=True)`` and an
            agent without the direct-answer method; otherwise the agent answers
            every question with "yes" directly.
        """
        from edsl.agents import Agent
        from edsl.surveys import Survey
        from edsl.scenarios import Scenario
        from edsl.language_models import LanguageModel

        def f(self, question, scenario):
            return "yes"

        agent = Agent.example()
        if throw_exception:
            model = LanguageModel.example(test_model=True, throw_exception=True)
        else:
            agent.add_direct_question_answering_method(f)
            model = LanguageModel.example()

        return cls(
            agent=agent,
            survey=Survey.example(),
            scenario=Scenario.example(),
            model=model,
        )
389
-
390
-
391
if __name__ == "__main__":
    # Run this module's doctests when executed as a script.
    from doctest import ELLIPSIS, testmod

    # ELLIPSIS lets expected output use "..." as a wildcard.
    testmod(optionflags=ELLIPSIS)
@@ -1,99 +0,0 @@
1
- from collections import UserDict
2
-
3
- from edsl.jobs.interviews.InterviewExceptionEntry import InterviewExceptionEntry
4
-
5
-
6
class InterviewExceptionCollection(UserDict):
    """A collection of exceptions that occurred during the interview.

    The mapping goes from question name to the list of exception entries
    recorded for that question.  ``fixed`` holds the names of questions that
    have been marked as fixed via :meth:`record_fixed_question`.
    """

    def __init__(self):
        super().__init__()
        self.fixed = set()

    def unfixed_exceptions(self) -> dict:
        """Return ``{question_name: entries}`` for questions not marked as fixed."""
        return {k: v for k, v in self.data.items() if k not in self.fixed}

    def num_unfixed(self) -> int:
        """Return the number of questions with exceptions not marked as fixed."""
        return sum(1 for k in self.data if k not in self.fixed)

    def record_fixed_question(self, question_name: str) -> None:
        """Record that a question has been fixed."""
        self.fixed.add(question_name)

    def add(self, question_name: str, entry: "InterviewExceptionEntry") -> None:
        """Append an exception entry to the list kept for ``question_name``."""
        self.data.setdefault(question_name, []).append(entry)

    def to_dict(self, include_traceback=True) -> dict:
        """Return the collection of exceptions as a dictionary.

        Every entry is serialized with its own ``to_dict()``.  The
        ``include_traceback`` argument is accepted for interface
        compatibility but is not forwarded to the entries.
        """
        return {k: [e.to_dict() for e in v] for k, v in self.data.items()}

    @classmethod
    def from_dict(cls, data: dict) -> "InterviewExceptionCollection":
        """Create an InterviewExceptionCollection from a dictionary.

        ``data`` maps question names to lists of serialized entries, each of
        which is rebuilt with ``InterviewExceptionEntry.from_dict``.
        """
        collection = cls()
        for question_name, entries in data.items():
            for entry in entries:
                collection.add(question_name, InterviewExceptionEntry.from_dict(entry))
        return collection

    def _repr_html_(self) -> str:
        """Return an HTML rendering of :meth:`to_dict` for notebook display."""
        from edsl.utilities.utilities import data_to_html

        return data_to_html(self.to_dict(include_traceback=True))

    def ascii_table(self, traceback: bool = False) -> None:
        """Print the exceptions as a grid table.

        One row is printed per exception entry; the traceback column (and
        its header) is included only when ``traceback`` is true.
        """
        from tabulate import tabulate

        columns = ["exception", "time"]
        headers = ["Question name", "Exception", "Time"]
        if traceback:
            # Keep headers and row width in step.
            columns.append("traceback")
            headers.append("Traceback")

        data = [
            [question] + [exception[column] for column in columns]
            for question, exceptions in self.data.items()
            for exception in exceptions
        ]

        print(tabulate(data, headers=headers, tablefmt="grid"))

    def print(self, traceback=False):
        """Print the collection of exceptions.

        The traceback column is always present; it is left empty unless
        ``traceback`` is true.
        """
        # NOTE(review): ``Console`` and ``Table`` are not imported anywhere in
        # the visible module, so this method raises NameError as written.
        # They look like rich's ``rich.console.Console`` / ``rich.table.Table``
        # -- confirm and add the import at module level.
        console = Console()
        table = Table(show_header=True, header_style="bold magenta")
        table.add_column("Question name", style="dim", width=12)
        table.add_column("Exception", width=32)
        table.add_column("Time", justify="right")
        table.add_column("Traceback", min_width=20)

        for question_name, exceptions in self.data.items():
            for exception in exceptions:
                if traceback:
                    # Extra newlines between traceback lines for readability.
                    traceback_string = exception["traceback"].replace("\n", "\n\n")
                else:
                    traceback_string = ""
                table.add_row(
                    question_name,
                    exception["exception"],
                    str(exception["time"]),
                    traceback_string,
                )

        console.print(table)
94
-
95
-
96
if __name__ == "__main__":
    # Executed only when the module is run as a script: run its doctests,
    # with "..." in expected output allowed to match arbitrary text.
    from doctest import ELLIPSIS, testmod

    testmod(optionflags=ELLIPSIS)
@@ -1,25 +0,0 @@
1
- from collections import UserDict
2
- from edsl.jobs.interviews.InterviewStatistic import InterviewStatistic
3
-
4
-
5
class InterviewStatisticsCollection(UserDict):
    """Dictionary-like container that accumulates interview statistics.

    Besides the mapping itself, the ``raw`` attribute gathers the ``raw``
    mapping of every statistic that has been added.
    """

    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)
        self.raw: dict = {}

    def add_stat(self, statistic: "InterviewStatistic"):
        """Merge one statistic into the collection.

        The statistic's own key-value content is merged into this mapping,
        and its ``raw`` mapping is merged into ``self.raw``.

        Example usage:

        >>> isc = InterviewStatisticsCollection()
        >>> isc.add_stat(InterviewStatistic("elapsed_time", value=100, digits=1, units="sec."))
        >>> isc.raw
        {'elapsed_time': 100}
        """
        self.update(statistic)
        raw_values = statistic.raw
        self.raw.update(raw_values)
@@ -1,163 +0,0 @@
1
- from __future__ import annotations
2
- import time
3
- import asyncio
4
- import threading
5
- import warnings
6
- from typing import TYPE_CHECKING
7
-
8
- from edsl.results.Results import Results
9
- from edsl.jobs.runners.JobsRunnerStatus import JobsRunnerStatus
10
- from edsl.jobs.tasks.TaskHistory import TaskHistory
11
- from edsl.utilities.decorators import jupyter_nb_handler
12
- from edsl.jobs.async_interview_runner import AsyncInterviewRunner
13
- from edsl.jobs.data_structures import RunEnvironment, RunParameters, RunConfig
14
-
15
- if TYPE_CHECKING:
16
- from edsl.jobs.Jobs import Jobs
17
-
18
-
19
class JobsRunnerAsyncio:
    """A class for running a collection of interviews asynchronously.

    It gets instantiated from a Jobs object.
    The Jobs object is a collection of interviews that are to be run.
    """

    def __init__(self, jobs: "Jobs", environment: RunEnvironment):
        self.jobs = jobs
        self.environment = environment

    def __len__(self):
        """Return the length of the underlying Jobs object."""
        return len(self.jobs)

    async def run_async(self, parameters: RunParameters) -> Results:
        """Used for some other modules that have a non-standard way of running interviews.

        Installs a fresh ``JobsRunnerStatus`` on the environment, runs every
        interview through ``AsyncInterviewRunner`` and returns a ``Results``
        whose cache is the relevant subset of ``self.environment.cache``.
        No progress bar is started and exceptions are not intercepted here.
        """
        self.environment.jobs_runner_status = JobsRunnerStatus(self, n=parameters.n)
        data = []
        task_history = TaskHistory(include_traceback=False)

        run_config = RunConfig(parameters=parameters, environment=self.environment)
        result_generator = AsyncInterviewRunner(self.jobs, run_config)

        async for result, interview in result_generator.run():
            data.append(result)
            task_history.add_interview(interview)

        # A cache-less Results is built first so the relevant cache can be
        # derived from it; the returned object is then built with that cache.
        results = Results(survey=self.jobs.survey, task_history=task_history, data=data)
        relevant_cache = results.relevant_cache(self.environment.cache)

        return Results(
            survey=self.jobs.survey,
            task_history=task_history,
            data=data,
            cache=relevant_cache,
        )

    def simple_run(self, parameters: RunParameters | None = None) -> Results:
        """Run the interviews synchronously and return the ``Results``.

        Drives :meth:`run_async` with ``asyncio.run``.  ``parameters`` is
        optional so that existing zero-argument calls keep working.
        """
        if parameters is None:
            # NOTE(review): assumes RunParameters() can be constructed with
            # no arguments -- confirm against its definition.
            parameters = RunParameters()
        return asyncio.run(self.run_async(parameters))

    def _start_progress_thread(self, progress_bar, jobs_runner_status, stop_event):
        """Start the progress-bar thread when requested; return it or ``None``."""
        if not progress_bar:
            return None
        if not jobs_runner_status.has_ep_api_key():
            warnings.warn(
                "You need an Expected Parrot API key to view job progress bars."
            )
            return None

        jobs_runner_status.setup()
        progress_thread = threading.Thread(
            target=jobs_runner_status.update_progress, args=(stop_event,)
        )
        progress_thread.start()
        return progress_thread

    @jupyter_nb_handler
    async def run(self, parameters: RunParameters) -> Results:
        """Runs a collection of interviews, handling both async and sync contexts.

        Interview results are appended to a ``Results`` object as they are
        produced.  A ``KeyboardInterrupt`` stops the run and the results
        gathered so far are returned.  Any other exception is re-raised
        only when ``parameters.stop_on_exception`` is set; otherwise the run
        ends and the partial results are returned.  The progress thread, if
        one was started, is always signalled and joined.
        """
        run_config = RunConfig(parameters=parameters, environment=self.environment)

        self.start_time = time.monotonic()
        self.completed = False

        from edsl.coop import Coop

        endpoint_url = Coop().get_progress_bar_url()

        # The environment may supply its own status factory; fall back to
        # JobsRunnerStatus when it does not.
        status_factory = self.environment.jobs_runner_status
        if status_factory is None:
            status_factory = JobsRunnerStatus
        run_config.environment.jobs_runner_status = status_factory(
            self,
            n=parameters.n,
            endpoint_url=endpoint_url,
            job_uuid=parameters.job_uuid,
        )

        results = Results(
            survey=self.jobs.survey,
            data=[],
            task_history=TaskHistory(),
        )

        stop_event = threading.Event()
        progress_thread = self._start_progress_thread(
            parameters.progress_bar,
            run_config.environment.jobs_runner_status,
            stop_event,
        )

        try:
            result_generator = AsyncInterviewRunner(self.jobs, run_config)
            async for result, interview in result_generator.run():
                results.append(result)
                results.task_history.add_interview(interview)
            self.completed = True
        except KeyboardInterrupt:
            print("Keyboard interrupt received. Stopping gracefully...")
        except Exception:
            # Deliberately best-effort: failures only propagate when the
            # caller asked for it; the ``finally`` clause still runs first.
            if parameters.stop_on_exception:
                raise
        finally:
            stop_event.set()
            if progress_thread is not None:
                progress_thread.join()

        results.cache = results.relevant_cache(self.environment.cache)
        results.bucket_collection = self.environment.bucket_collection

        from edsl.jobs.results_exceptions_handler import ResultsExceptionsHandler

        ResultsExceptionsHandler(results, parameters).handle_exceptions()
        return results
File without changes