edsl 0.1.38.dev4__py3-none-any.whl → 0.1.39__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (212) hide show
  1. edsl/Base.py +197 -116
  2. edsl/__init__.py +15 -7
  3. edsl/__version__.py +1 -1
  4. edsl/agents/Agent.py +351 -147
  5. edsl/agents/AgentList.py +211 -73
  6. edsl/agents/Invigilator.py +101 -50
  7. edsl/agents/InvigilatorBase.py +62 -70
  8. edsl/agents/PromptConstructor.py +143 -225
  9. edsl/agents/QuestionInstructionPromptBuilder.py +128 -0
  10. edsl/agents/QuestionTemplateReplacementsBuilder.py +137 -0
  11. edsl/agents/__init__.py +0 -1
  12. edsl/agents/prompt_helpers.py +3 -3
  13. edsl/agents/question_option_processor.py +172 -0
  14. edsl/auto/AutoStudy.py +18 -5
  15. edsl/auto/StageBase.py +53 -40
  16. edsl/auto/StageQuestions.py +2 -1
  17. edsl/auto/utilities.py +0 -6
  18. edsl/config.py +22 -2
  19. edsl/conversation/car_buying.py +2 -1
  20. edsl/coop/CoopFunctionsMixin.py +15 -0
  21. edsl/coop/ExpectedParrotKeyHandler.py +125 -0
  22. edsl/coop/PriceFetcher.py +1 -1
  23. edsl/coop/coop.py +125 -47
  24. edsl/coop/utils.py +14 -14
  25. edsl/data/Cache.py +45 -27
  26. edsl/data/CacheEntry.py +12 -15
  27. edsl/data/CacheHandler.py +31 -12
  28. edsl/data/RemoteCacheSync.py +154 -46
  29. edsl/data/__init__.py +4 -3
  30. edsl/data_transfer_models.py +2 -1
  31. edsl/enums.py +27 -0
  32. edsl/exceptions/__init__.py +50 -50
  33. edsl/exceptions/agents.py +12 -0
  34. edsl/exceptions/inference_services.py +5 -0
  35. edsl/exceptions/questions.py +24 -6
  36. edsl/exceptions/scenarios.py +7 -0
  37. edsl/inference_services/AnthropicService.py +38 -19
  38. edsl/inference_services/AvailableModelCacheHandler.py +184 -0
  39. edsl/inference_services/AvailableModelFetcher.py +215 -0
  40. edsl/inference_services/AwsBedrock.py +0 -2
  41. edsl/inference_services/AzureAI.py +0 -2
  42. edsl/inference_services/GoogleService.py +7 -12
  43. edsl/inference_services/InferenceServiceABC.py +18 -85
  44. edsl/inference_services/InferenceServicesCollection.py +120 -79
  45. edsl/inference_services/MistralAIService.py +0 -3
  46. edsl/inference_services/OpenAIService.py +47 -35
  47. edsl/inference_services/PerplexityService.py +0 -3
  48. edsl/inference_services/ServiceAvailability.py +135 -0
  49. edsl/inference_services/TestService.py +11 -10
  50. edsl/inference_services/TogetherAIService.py +5 -3
  51. edsl/inference_services/data_structures.py +134 -0
  52. edsl/jobs/AnswerQuestionFunctionConstructor.py +223 -0
  53. edsl/jobs/Answers.py +1 -14
  54. edsl/jobs/FetchInvigilator.py +47 -0
  55. edsl/jobs/InterviewTaskManager.py +98 -0
  56. edsl/jobs/InterviewsConstructor.py +50 -0
  57. edsl/jobs/Jobs.py +356 -431
  58. edsl/jobs/JobsChecks.py +35 -10
  59. edsl/jobs/JobsComponentConstructor.py +189 -0
  60. edsl/jobs/JobsPrompts.py +6 -4
  61. edsl/jobs/JobsRemoteInferenceHandler.py +205 -133
  62. edsl/jobs/JobsRemoteInferenceLogger.py +239 -0
  63. edsl/jobs/RequestTokenEstimator.py +30 -0
  64. edsl/jobs/async_interview_runner.py +138 -0
  65. edsl/jobs/buckets/BucketCollection.py +44 -3
  66. edsl/jobs/buckets/TokenBucket.py +53 -21
  67. edsl/jobs/buckets/TokenBucketAPI.py +211 -0
  68. edsl/jobs/buckets/TokenBucketClient.py +191 -0
  69. edsl/jobs/check_survey_scenario_compatibility.py +85 -0
  70. edsl/jobs/data_structures.py +120 -0
  71. edsl/jobs/decorators.py +35 -0
  72. edsl/jobs/interviews/Interview.py +143 -408
  73. edsl/jobs/jobs_status_enums.py +9 -0
  74. edsl/jobs/loggers/HTMLTableJobLogger.py +304 -0
  75. edsl/jobs/results_exceptions_handler.py +98 -0
  76. edsl/jobs/runners/JobsRunnerAsyncio.py +88 -403
  77. edsl/jobs/runners/JobsRunnerStatus.py +133 -165
  78. edsl/jobs/tasks/QuestionTaskCreator.py +21 -19
  79. edsl/jobs/tasks/TaskHistory.py +38 -18
  80. edsl/jobs/tasks/task_status_enum.py +0 -2
  81. edsl/language_models/ComputeCost.py +63 -0
  82. edsl/language_models/LanguageModel.py +194 -236
  83. edsl/language_models/ModelList.py +28 -19
  84. edsl/language_models/PriceManager.py +127 -0
  85. edsl/language_models/RawResponseHandler.py +106 -0
  86. edsl/language_models/ServiceDataSources.py +0 -0
  87. edsl/language_models/__init__.py +1 -2
  88. edsl/language_models/key_management/KeyLookup.py +63 -0
  89. edsl/language_models/key_management/KeyLookupBuilder.py +273 -0
  90. edsl/language_models/key_management/KeyLookupCollection.py +38 -0
  91. edsl/language_models/key_management/__init__.py +0 -0
  92. edsl/language_models/key_management/models.py +131 -0
  93. edsl/language_models/model.py +256 -0
  94. edsl/language_models/repair.py +2 -2
  95. edsl/language_models/utilities.py +5 -4
  96. edsl/notebooks/Notebook.py +19 -14
  97. edsl/notebooks/NotebookToLaTeX.py +142 -0
  98. edsl/prompts/Prompt.py +29 -39
  99. edsl/questions/ExceptionExplainer.py +77 -0
  100. edsl/questions/HTMLQuestion.py +103 -0
  101. edsl/questions/QuestionBase.py +68 -214
  102. edsl/questions/QuestionBasePromptsMixin.py +7 -3
  103. edsl/questions/QuestionBudget.py +1 -1
  104. edsl/questions/QuestionCheckBox.py +3 -3
  105. edsl/questions/QuestionExtract.py +5 -7
  106. edsl/questions/QuestionFreeText.py +2 -3
  107. edsl/questions/QuestionList.py +10 -18
  108. edsl/questions/QuestionMatrix.py +265 -0
  109. edsl/questions/QuestionMultipleChoice.py +67 -23
  110. edsl/questions/QuestionNumerical.py +2 -4
  111. edsl/questions/QuestionRank.py +7 -17
  112. edsl/questions/SimpleAskMixin.py +4 -3
  113. edsl/questions/__init__.py +2 -1
  114. edsl/questions/{AnswerValidatorMixin.py → answer_validator_mixin.py} +47 -2
  115. edsl/questions/data_structures.py +20 -0
  116. edsl/questions/derived/QuestionLinearScale.py +6 -3
  117. edsl/questions/derived/QuestionTopK.py +1 -1
  118. edsl/questions/descriptors.py +17 -3
  119. edsl/questions/loop_processor.py +149 -0
  120. edsl/questions/{QuestionBaseGenMixin.py → question_base_gen_mixin.py} +57 -50
  121. edsl/questions/question_registry.py +1 -1
  122. edsl/questions/{ResponseValidatorABC.py → response_validator_abc.py} +40 -26
  123. edsl/questions/response_validator_factory.py +34 -0
  124. edsl/questions/templates/matrix/__init__.py +1 -0
  125. edsl/questions/templates/matrix/answering_instructions.jinja +5 -0
  126. edsl/questions/templates/matrix/question_presentation.jinja +20 -0
  127. edsl/results/CSSParameterizer.py +1 -1
  128. edsl/results/Dataset.py +170 -7
  129. edsl/results/DatasetExportMixin.py +168 -305
  130. edsl/results/DatasetTree.py +28 -8
  131. edsl/results/MarkdownToDocx.py +122 -0
  132. edsl/results/MarkdownToPDF.py +111 -0
  133. edsl/results/Result.py +298 -206
  134. edsl/results/Results.py +149 -131
  135. edsl/results/ResultsExportMixin.py +2 -0
  136. edsl/results/TableDisplay.py +98 -171
  137. edsl/results/TextEditor.py +50 -0
  138. edsl/results/__init__.py +1 -1
  139. edsl/results/file_exports.py +252 -0
  140. edsl/results/{Selector.py → results_selector.py} +23 -13
  141. edsl/results/smart_objects.py +96 -0
  142. edsl/results/table_data_class.py +12 -0
  143. edsl/results/table_renderers.py +118 -0
  144. edsl/scenarios/ConstructDownloadLink.py +109 -0
  145. edsl/scenarios/DocumentChunker.py +102 -0
  146. edsl/scenarios/DocxScenario.py +16 -0
  147. edsl/scenarios/FileStore.py +150 -239
  148. edsl/scenarios/PdfExtractor.py +40 -0
  149. edsl/scenarios/Scenario.py +90 -193
  150. edsl/scenarios/ScenarioHtmlMixin.py +4 -3
  151. edsl/scenarios/ScenarioList.py +415 -244
  152. edsl/scenarios/ScenarioListExportMixin.py +0 -7
  153. edsl/scenarios/ScenarioListPdfMixin.py +15 -37
  154. edsl/scenarios/__init__.py +1 -2
  155. edsl/scenarios/directory_scanner.py +96 -0
  156. edsl/scenarios/file_methods.py +85 -0
  157. edsl/scenarios/handlers/__init__.py +13 -0
  158. edsl/scenarios/handlers/csv.py +49 -0
  159. edsl/scenarios/handlers/docx.py +76 -0
  160. edsl/scenarios/handlers/html.py +37 -0
  161. edsl/scenarios/handlers/json.py +111 -0
  162. edsl/scenarios/handlers/latex.py +5 -0
  163. edsl/scenarios/handlers/md.py +51 -0
  164. edsl/scenarios/handlers/pdf.py +68 -0
  165. edsl/scenarios/handlers/png.py +39 -0
  166. edsl/scenarios/handlers/pptx.py +105 -0
  167. edsl/scenarios/handlers/py.py +294 -0
  168. edsl/scenarios/handlers/sql.py +313 -0
  169. edsl/scenarios/handlers/sqlite.py +149 -0
  170. edsl/scenarios/handlers/txt.py +33 -0
  171. edsl/scenarios/{ScenarioJoin.py → scenario_join.py} +10 -6
  172. edsl/scenarios/scenario_selector.py +156 -0
  173. edsl/study/ObjectEntry.py +1 -1
  174. edsl/study/SnapShot.py +1 -1
  175. edsl/study/Study.py +5 -12
  176. edsl/surveys/ConstructDAG.py +92 -0
  177. edsl/surveys/EditSurvey.py +221 -0
  178. edsl/surveys/InstructionHandler.py +100 -0
  179. edsl/surveys/MemoryManagement.py +72 -0
  180. edsl/surveys/Rule.py +5 -4
  181. edsl/surveys/RuleCollection.py +25 -27
  182. edsl/surveys/RuleManager.py +172 -0
  183. edsl/surveys/Simulator.py +75 -0
  184. edsl/surveys/Survey.py +270 -791
  185. edsl/surveys/SurveyCSS.py +20 -8
  186. edsl/surveys/{SurveyFlowVisualizationMixin.py → SurveyFlowVisualization.py} +11 -9
  187. edsl/surveys/SurveyToApp.py +141 -0
  188. edsl/surveys/__init__.py +4 -2
  189. edsl/surveys/descriptors.py +6 -2
  190. edsl/surveys/instructions/ChangeInstruction.py +1 -2
  191. edsl/surveys/instructions/Instruction.py +4 -13
  192. edsl/surveys/instructions/InstructionCollection.py +11 -6
  193. edsl/templates/error_reporting/interview_details.html +1 -1
  194. edsl/templates/error_reporting/report.html +1 -1
  195. edsl/tools/plotting.py +1 -1
  196. edsl/utilities/PrettyList.py +56 -0
  197. edsl/utilities/is_notebook.py +18 -0
  198. edsl/utilities/is_valid_variable_name.py +11 -0
  199. edsl/utilities/remove_edsl_version.py +24 -0
  200. edsl/utilities/utilities.py +35 -23
  201. {edsl-0.1.38.dev4.dist-info → edsl-0.1.39.dist-info}/METADATA +12 -10
  202. edsl-0.1.39.dist-info/RECORD +358 -0
  203. {edsl-0.1.38.dev4.dist-info → edsl-0.1.39.dist-info}/WHEEL +1 -1
  204. edsl/language_models/KeyLookup.py +0 -30
  205. edsl/language_models/registry.py +0 -190
  206. edsl/language_models/unused/ReplicateBase.py +0 -83
  207. edsl/results/ResultsDBMixin.py +0 -238
  208. edsl-0.1.38.dev4.dist-info/RECORD +0 -277
  209. /edsl/questions/{RegisterQuestionsMeta.py → register_questions_meta.py} +0 -0
  210. /edsl/results/{ResultsFetchMixin.py → results_fetch_mixin.py} +0 -0
  211. /edsl/results/{ResultsToolsMixin.py → results_tools_mixin.py} +0 -0
  212. {edsl-0.1.38.dev4.dist-info → edsl-0.1.39.dist-info}/LICENSE +0 -0
@@ -2,7 +2,7 @@ from typing import Any, List, Optional
2
2
  import os
3
3
  import asyncio
4
4
  from edsl.inference_services.InferenceServiceABC import InferenceServiceABC
5
- from edsl.language_models import LanguageModel
5
+ from edsl.language_models.LanguageModel import LanguageModel
6
6
  from edsl.inference_services.rate_limits_cache import rate_limits
7
7
  from edsl.utilities.utilities import fix_partial_correct_response
8
8
 
@@ -51,6 +51,7 @@ class TestService(InferenceServiceABC):
51
51
  @property
52
52
  def _canned_response(self):
53
53
  if hasattr(self, "canned_response"):
54
+
54
55
  return self.canned_response
55
56
  else:
56
57
  return "Hello, world"
@@ -63,15 +64,6 @@ class TestService(InferenceServiceABC):
63
64
  files_list: Optional[List["File"]] = None,
64
65
  ) -> dict[str, Any]:
65
66
  await asyncio.sleep(0.1)
66
- # return {"message": """{"answer": "Hello, world"}"""}
67
-
68
- if hasattr(self, "func"):
69
- return {
70
- "message": [
71
- {"text": self.func(user_prompt, system_prompt, files_list)}
72
- ],
73
- "usage": {"prompt_tokens": 1, "completion_tokens": 1},
74
- }
75
67
 
76
68
  if hasattr(self, "throw_exception") and self.throw_exception:
77
69
  if hasattr(self, "exception_probability"):
@@ -81,6 +73,15 @@ class TestService(InferenceServiceABC):
81
73
 
82
74
  if random.random() < p:
83
75
  raise Exception("This is a test error")
76
+
77
+ if hasattr(self, "func"):
78
+ return {
79
+ "message": [
80
+ {"text": self.func(user_prompt, system_prompt, files_list)}
81
+ ],
82
+ "usage": {"prompt_tokens": 1, "completion_tokens": 1},
83
+ }
84
+
84
85
  return {
85
86
  "message": [{"text": f"{self._canned_response}"}],
86
87
  "usage": {"prompt_tokens": 1, "completion_tokens": 1},
@@ -143,15 +143,17 @@ class TogetherAIService(OpenAIService):
143
143
  _async_client_ = openai.AsyncOpenAI
144
144
 
145
145
  @classmethod
146
- def get_model_list(cls):
146
+ def get_model_list(cls, api_token=None):
147
147
  # Togheter.ai has a different response in model list then openai
148
148
  # and the OpenAI class returns an error when calling .models.list()
149
149
  import requests
150
150
  import os
151
151
 
152
152
  url = "https://api.together.xyz/v1/models?filter=serverless"
153
- token = os.getenv(cls._env_key_name_)
154
- headers = {"accept": "application/json", "authorization": f"Bearer {token}"}
153
+ if api_token is None:
154
+ api_token = os.getenv(cls._env_key_name_)
155
+
156
+ headers = {"accept": "application/json", "authorization": f"Bearer {api_token}"}
155
157
 
156
158
  response = requests.get(url, headers=headers)
157
159
  return response.json()
@@ -0,0 +1,134 @@
1
+ from collections import UserDict, defaultdict, UserList
2
+ from typing import Union, Optional, List
3
+ from edsl.enums import InferenceServiceLiteral
4
+ from dataclasses import dataclass
5
+
6
+
7
@dataclass
class LanguageModelInfo:
    """Pair a language model's name with the inference service that serves it.

    Instances can be unpacked like a two-item ``(model_name, service_name)``
    tuple because ``__iter__`` yields the two fields in that order.

    >>> LanguageModelInfo("gpt-4-1106-preview", "openai")
    LanguageModelInfo(model_name='gpt-4-1106-preview', service_name='openai')

    >>> model_name, service = LanguageModelInfo.example()
    >>> model_name
    'gpt-4-1106-preview'

    >>> LanguageModelInfo.example().service_name
    'openai'

    """

    model_name: str
    service_name: str

    def __iter__(self):
        """Yield ``model_name`` and then ``service_name``."""
        yield self.model_name
        yield self.service_name

    def __getitem__(self, key: int) -> str:
        """Return a field by position (deprecated).

        :param key: 0 for ``model_name``, 1 for ``service_name``.
        :raises IndexError: for any other key.

        Every call emits a ``DeprecationWarning``; attribute access is the
        supported way to read the fields.
        """
        import warnings

        # The message names only attributes that actually exist on the class
        # (the previous text also pointed at a non-existent ``.index``).
        warnings.warn(
            "Accessing LanguageModelInfo via index is deprecated. "
            "Please use the .model_name or .service_name attributes instead.",
            DeprecationWarning,
            stacklevel=2,  # attribute the warning to the caller's line
        )

        if key == 0:
            return self.model_name
        if key == 1:
            return self.service_name
        raise IndexError("Index out of range")

    @classmethod
    def example(cls) -> "LanguageModelInfo":
        """Return a sample instance (used by the doctests above)."""
        return cls("gpt-4-1106-preview", "openai")
51
+
52
+
53
class ModelNamesList(UserList):
    """A ``UserList`` subclass used to hold model names; adds no behaviour of its own."""
55
+
56
+
57
class AvailableModels(UserList):
    """A list of model entries with name-based membership, search and export helpers.

    Entries are read through their ``model_name`` and ``service_name``
    attributes (the constructor is annotated as taking ``LanguageModelInfo``
    objects).
    """

    def __init__(self, data: List["LanguageModelInfo"]) -> None:
        super().__init__(data)

    def __contains__(self, model_name: Union[str, "LanguageModelInfo"]) -> bool:
        """Return True if the list holds the given model.

        :param model_name: a model name (matched against each entry's
            ``model_name``) or an entry object (matched by ordinary list
            membership).
        """
        if isinstance(model_name, str):
            return any(entry.model_name == model_name for entry in self.data)
        # Non-string operands fall back to normal list semantics, so that
        # ``entry in models`` is True for an entry that is actually stored.
        return model_name in self.data

    def print(self):
        """Print the models via the dataset returned by :meth:`to_dataset`."""
        return self.to_dataset().print()

    def to_dataset(self):
        """Convert to a dataset with a "model" and a "service" column."""
        from edsl.scenarios.ScenarioList import ScenarioList

        # Built independently (rather than with ``zip(*pairs)``) so that an
        # empty list yields two empty tuples instead of an unpacking error.
        models = tuple(entry.model_name for entry in self.data)
        services = tuple(entry.service_name for entry in self.data)
        return (
            ScenarioList.from_list("model", models)
            .add_list("service", services)
            .to_dataset()
        )

    def to_model_list(self):
        """Convert to a ``ModelList`` via ``ModelList.from_available_models``."""
        from edsl.language_models.ModelList import ModelList

        return ModelList.from_available_models(self)

    def search(
        self, pattern: str, service_name: Optional[str] = None, regex: bool = False
    ) -> "AvailableModels":
        """Return the entries whose model name matches ``pattern``.

        :param pattern: a wildcard pattern where ``*`` matches any run of
            characters, or a regular expression when ``regex`` is True.
            Matching uses ``re.search``, so the pattern may match anywhere
            in the name.
        :param service_name: if given, keep only entries of this service.
        :param regex: treat ``pattern`` as a regular expression verbatim.
        :raises ValueError: if the pattern is not a valid regular expression
            or if nothing matches.
        """
        import re

        if not regex:
            # Escape special regex characters except *
            pattern = re.escape(pattern).replace(r"\*", ".*")

        try:
            compiled = re.compile(pattern)
        except re.error as e:
            raise ValueError(f"Invalid regular expression pattern: {e}") from e

        matches = AvailableModels(
            [
                entry
                for entry in self.data
                if compiled.search(entry.model_name)
                and (service_name is None or entry.service_name == service_name)
            ]
        )
        if not matches:
            raise ValueError(
                "No models found matching the search pattern: " + pattern
            )
        return matches
115
+
116
+
117
class ServiceToModelsMapping(UserDict):
    """Mapping from a service name to the collection of model names it offers."""

    def __init__(self, data: dict) -> None:
        super().__init__(data)

    @property
    def service_names(self) -> list[str]:
        """The service names (the mapping's keys), in insertion order."""
        return list(self.data.keys())

    def _validate_service_names(self):
        """Raise ``ValueError`` for any key that is not a known service name."""
        from typing import get_args

        # NOTE(review): InferenceServiceLiteral is defined in edsl.enums, which
        # is not visible here. If it is a ``typing.Literal`` alias, a direct
        # ``in`` test against it raises TypeError, so its allowed values are
        # extracted with get_args(); for any other kind of object get_args()
        # returns () and the original membership test is used unchanged.
        valid_names = get_args(InferenceServiceLiteral) or InferenceServiceLiteral
        for service in self.service_names:
            if service not in valid_names:
                raise ValueError(f"Invalid service name: {service}")

    def model_to_services(self) -> dict:
        """Invert the mapping: model name -> list of services offering it.

        The result is also stored on ``self._model_to_service``. Services are
        listed in the order in which they appear in this mapping.
        """
        self._model_to_service = defaultdict(list)
        for service, models in self.data.items():
            for model in models:
                self._model_to_service[model].append(service)
        # Previously nothing was returned despite the ``-> dict`` annotation.
        return self._model_to_service
@@ -0,0 +1,223 @@
1
+ import copy
2
+ import asyncio
3
+
4
+ from typing import Union, Type, Callable, TYPE_CHECKING
5
+
6
+ if TYPE_CHECKING:
7
+ from edsl.questions.QuestionBase import QuestionBase
8
+ from edsl.jobs.interviews.Interview import Interview
9
+ from edsl.language_models.key_management.KeyLookup import KeyLookup
10
+
11
+ from edsl.surveys.base import EndOfSurvey
12
+ from edsl.jobs.tasks.task_status_enum import TaskStatus
13
+
14
+ from edsl.jobs.FetchInvigilator import FetchInvigilator
15
+ from edsl.exceptions.language_models import LanguageModelNoResponseError
16
+ from edsl.exceptions.questions import QuestionAnswerValidationError
17
+ from edsl.data_transfer_models import AgentResponseDict, EDSLResultObjectInput
18
+
19
+ from edsl.jobs.Answers import Answers
20
+
21
+
22
class RetryConfig:
    """Retry/backoff settings read from the EDSL configuration at class-definition time.

    The three values are looked up once, when this class body executes, and
    converted to numbers. The import lives in the class body, so ``CONFIG``
    is also reachable as ``RetryConfig.CONFIG``.
    """

    from edsl.config import CONFIG

    # Passed as the ``multiplier`` of the exponential wait between attempts.
    EDSL_BACKOFF_START_SEC = float(CONFIG.get("EDSL_BACKOFF_START_SEC"))
    # Passed as the ``max`` of the exponential wait between attempts.
    EDSL_BACKOFF_MAX_SEC = float(CONFIG.get("EDSL_BACKOFF_MAX_SEC"))
    # Passed to ``stop_after_attempt``.
    EDSL_MAX_ATTEMPTS = int(CONFIG.get("EDSL_MAX_ATTEMPTS"))
28
+
29
+
30
class SkipHandler:
    """Applies an interview's survey rules to skip questions and cancel their tasks."""

    def __init__(self, interview: "Interview"):
        self.interview = interview
        self.question_index = self.interview.to_index

        self.skip_function: Callable = (
            self.interview.survey.rule_collection.skip_question_before_running
        )

    def _known_values(self):
        """Merge the interview's answers, scenario and agent traits (in that order)."""
        return (
            self.interview.answers
            | self.interview.scenario
            | self.interview.agent["traits"]
        )

    def should_skip(self, current_question: "QuestionBase") -> bool:
        """Determine if the current question should be skipped."""
        position = self.question_index[current_question.question_name]
        return self.skip_function(position, self._known_values())

    def cancel_skipped_questions(self, current_question: "QuestionBase") -> None:
        """Cancel the tasks of the questions that the survey rules jump over.

        The rule collection is asked which question follows the current one.
        Tasks strictly between the current question and that target are
        cancelled; when the target is the end of the survey, every later
        task is cancelled.
        """
        here: int = self.interview.to_index[current_question.question_name]
        known = self._known_values()

        # The result's ``next_q`` is either a question index or EndOfSurvey.
        following = self.interview.survey.rule_collection.next_question(
            q_now=here,
            answers=known,
        )
        target = following.next_q

        if target == EndOfSurvey:
            stop = len(self.interview.survey.questions)
        elif target > (here + 1):
            stop = target
        else:
            # The next question is the immediate successor: nothing to cancel.
            return

        for skipped in range(here + 1, stop):
            self.interview.tasks[skipped].cancel()
82
+
83
+
84
class AnswerQuestionFunctionConstructor:
    """Constructs a function that answers a question and records the answer."""

    def __init__(self, interview: "Interview", key_lookup: "KeyLookup"):
        self.interview = interview
        self.key_lookup = key_lookup

        # Set to True once any question handled by this object hit a
        # "language model gave no response" error.
        self.had_language_model_no_response_error: bool = False
        self.question_index = self.interview.to_index

        self.skip_function: Callable = (
            self.interview.survey.rule_collection.skip_question_before_running
        )

        self.invigilator_fetcher = FetchInvigilator(
            self.interview, key_lookup=self.key_lookup
        )
        self.skip_handler = SkipHandler(self.interview)

    def _handle_exception(
        self, e: Exception, invigilator: "InvigilatorBase", task=None
    ):
        """Handle an exception that occurred while answering a question.

        Records the exception on the interview (keyed by question name), marks
        ``task`` as failed when one is given, and re-raises ``e`` when it is a
        validation error and the interview asks for those to be raised, or
        when the interview has a truthy ``stop_on_exception`` attribute.
        """

        from edsl.jobs.interviews.InterviewExceptionEntry import InterviewExceptionEntry

        answers = copy.copy(
            self.interview.answers
        )  # copy to freeze the answers here for logging
        exception_entry = InterviewExceptionEntry(
            exception=e,
            invigilator=invigilator,
            answers=answers,
        )
        if task:
            task.task_status = TaskStatus.FAILED

        self.interview.exceptions.add(
            invigilator.question.question_name, exception_entry
        )

        if self.interview.raise_validation_errors and isinstance(
            e, QuestionAnswerValidationError
        ):
            raise e

        stop_on_exception = getattr(self.interview, "stop_on_exception", False)
        if stop_on_exception:
            raise e

    def __call__(self):
        """Return the coroutine function that answers one question."""
        return self.answer_question_and_record_task

    async def answer_question_and_record_task(
        self,
        *,
        question: "QuestionBase",
        task=None,
    ) -> "AgentResponseDict":
        """Answer ``question``, retrying when the language model gives no response.

        :param question: the question to answer.
        :param task: optional task object; its ``task_status`` is set to
            FAILED when an exception is recorded.
        :returns: the invigilator's response, or its "failed task" result when
            the question is skipped or its answer fails validation.
        :raises LanguageModelNoResponseError: when every attempt timed out or
            produced no response.
        """

        from tenacity import (
            retry,
            stop_after_attempt,
            wait_exponential,
            retry_if_exception_type,
            RetryError,
        )

        # Per-call flag shared with the retried closure below. It must live in
        # this scope: assigning it only inside ``attempt_answer`` made it a
        # local of that function, so reading it on the success path raised
        # UnboundLocalError exactly when a retried question finally succeeded.
        had_language_model_no_response_error = False

        @retry(
            stop=stop_after_attempt(RetryConfig.EDSL_MAX_ATTEMPTS),
            wait=wait_exponential(
                multiplier=RetryConfig.EDSL_BACKOFF_START_SEC,
                max=RetryConfig.EDSL_BACKOFF_MAX_SEC,
            ),
            retry=retry_if_exception_type(LanguageModelNoResponseError),
            reraise=True,
        )
        async def attempt_answer():
            nonlocal had_language_model_no_response_error

            invigilator = self.invigilator_fetcher(question)

            if self.skip_handler.should_skip(question):
                return invigilator.get_failed_task_result(
                    failure_reason="Question skipped."
                )

            received_response = False
            try:
                response: EDSLResultObjectInput = (
                    await invigilator.async_answer_question()
                )
                received_response = True
                if response.validated:
                    self.interview.answers.add_answer(
                        response=response, question=question
                    )

                    self.skip_handler.cancel_skipped_questions(question)
                else:
                    if (
                        hasattr(response, "exception_occurred")
                        and response.exception_occurred
                    ):
                        raise response.exception_occurred

            except QuestionAnswerValidationError as e:
                self._handle_exception(e, invigilator, task)
                return invigilator.get_failed_task_result(
                    failure_reason="Question answer validation failed."
                )

            except asyncio.TimeoutError as e:
                self._handle_exception(e, invigilator, task)
                had_language_model_no_response_error = True
                self.had_language_model_no_response_error = True
                raise LanguageModelNoResponseError(
                    f"Language model timed out for question '{question.question_name}.'"
                ) from e

            except Exception as e:
                # Recorded (and possibly re-raised) by the handler; otherwise
                # execution continues below.
                self._handle_exception(e, invigilator, task)

            if not received_response:
                # The model call itself failed: signal the retry decorator.
                had_language_model_no_response_error = True
                self.had_language_model_no_response_error = True
                raise LanguageModelNoResponseError(
                    f"Language model did not return a response for question '{question.question_name}.'"
                )

            if (
                question.question_name in self.interview.exceptions
                and had_language_model_no_response_error
            ):
                # An earlier attempt failed with no response but this one
                # succeeded: mark the question's recorded exceptions as fixed.
                self.interview.exceptions.record_fixed_question(question.question_name)

            return response

        try:
            return await attempt_answer()
        except RetryError as retry_error:
            # NOTE(review): with ``reraise=True`` tenacity re-raises the last
            # exception itself rather than RetryError, so this branch is kept
            # only as a safeguard.
            original_error = retry_error.last_attempt.exception()
            self._handle_exception(
                original_error, self.invigilator_fetcher(question), task
            )
            raise original_error
edsl/jobs/Answers.py CHANGED
@@ -1,7 +1,6 @@
1
1
  """This module contains the Answers class, which is a helper class to hold the answers to a survey."""
2
2
 
3
3
  from collections import UserDict
4
- from rich.table import Table
5
4
  from edsl.data_transfer_models import EDSLResultObjectInput
6
5
 
7
6
 
@@ -22,7 +21,7 @@ class Answers(UserDict):
22
21
  if comment:
23
22
  self[question.question_name + "_comment"] = comment
24
23
 
25
- def replace_missing_answers_with_none(self, survey) -> None:
24
+ def replace_missing_answers_with_none(self, survey: "Survey") -> None:
26
25
  """Replace missing answers with None. Answers can be missing if the agent skips a question."""
27
26
  for question_name in survey.question_names:
28
27
  if question_name not in self:
@@ -37,18 +36,6 @@ class Answers(UserDict):
37
36
  """Return an Answers object from a dictionary."""
38
37
  return cls(d)
39
38
 
40
- def rich_print(self):
41
- """Display an object as a table."""
42
- table = Table(title="Answers")
43
- table.add_column("Attribute", style="bold")
44
- table.add_column("Value")
45
-
46
- to_display = self
47
- for attr_name, attr_value in to_display.items():
48
- table.add_row(attr_name, repr(attr_value))
49
-
50
- return table
51
-
52
39
 
53
40
  if __name__ == "__main__":
54
41
  import doctest
@@ -0,0 +1,47 @@
1
+ from typing import List, Dict, Any, Optional, TYPE_CHECKING
2
+
3
+ if TYPE_CHECKING:
4
+ from edsl.questions.QuestionBase import QuestionBase
5
+ from edsl.agents.InvigilatorBase import InvigilatorBase
6
+ from edsl.language_models.key_management.KeyLookup import KeyLookup
7
+ from edsl.jobs.interviews.Interview import Interview
8
+
9
+
10
class FetchInvigilator:
    """Creates invigilators for the questions of a single interview.

    Calling an instance with a question is shorthand for
    :meth:`get_invigilator`.
    """

    def __init__(
        self,
        interview: "Interview",
        current_answers: Optional[Dict[str, Any]] = None,
        key_lookup: Optional["KeyLookup"] = None,
    ):
        self.interview = interview
        # Only ``None`` selects the interview's own answers; an explicitly
        # passed empty mapping is kept as given.
        self.current_answers = (
            self.interview.answers if current_answers is None else current_answers
        )
        self.key_lookup = key_lookup

    def get_invigilator(self, question: "QuestionBase") -> "InvigilatorBase":
        """Return an invigilator for the given question.

        The invigilator is created by the interview's agent from the
        interview's scenario, model, survey (and its memory plan), iteration,
        cache and validation setting, together with this object's
        ``current_answers`` and ``key_lookup``.

        :param question: the question to be answered
        """
        interview = self.interview
        return interview.agent.create_invigilator(
            question=question,
            scenario=interview.scenario,
            model=interview.model,
            survey=interview.survey,
            memory_plan=interview.survey.memory_plan,
            current_answers=self.current_answers,
            iteration=interview.iteration,
            cache=interview.cache,
            raise_validation_errors=interview.raise_validation_errors,
            key_lookup=self.key_lookup,
        )

    def __call__(self, question):
        return self.get_invigilator(question)
@@ -0,0 +1,98 @@
1
+ from __future__ import annotations
2
+ import asyncio
3
+ from typing import Any, Type, List, Generator, Optional, Union, TYPE_CHECKING
4
+
5
+ if TYPE_CHECKING:
6
+ from edsl.questions import QuestionBase
7
+ from edsl.jobs.tokens.InterviewTokenUsage import InterviewTokenUsage
8
+ from edsl.jobs.interviews.InterviewStatusDictionary import InterviewStatusDictionary
9
+ from edsl.jobs.interviews.InterviewStatusLog import InterviewStatusLog
10
+
11
+
12
class InterviewTaskManager:
    """Handles creation and management of interview tasks."""

    def __init__(self, survey, iteration=0):
        from edsl.jobs.tasks.TaskCreators import TaskCreators
        from edsl.jobs.interviews.InterviewStatusLog import InterviewStatusLog

        self.survey = survey
        self.iteration = iteration
        self.task_creators = TaskCreators()
        # question name -> position of the question in the survey
        self.to_index = {
            question_name: index
            for index, question_name in enumerate(self.survey.question_names)
        }
        self._task_status_log_dict = InterviewStatusLog()

    def build_question_tasks(
        self, answer_func, token_estimator, model_buckets
    ) -> tuple[asyncio.Task, ...]:
        """Create tasks for all questions with proper dependencies.

        Questions are processed in survey order, so the tasks a question
        depends on already exist when it is reached.

        :returns: a tuple with one task per survey question, in survey order.
        """
        # The survey does not change while tasks are being created, so the
        # dependency graph is built once instead of once per question.
        dag = self.survey.dag(textify=True)

        tasks = []
        for question in self.survey.questions:
            dependencies = self._get_task_dependencies(tasks, question, dag=dag)
            task = self._create_single_task(
                question=question,
                dependencies=dependencies,
                answer_func=answer_func,
                token_estimator=token_estimator,
                model_buckets=model_buckets,
            )
            tasks.append(task)
        return tuple(tasks)

    def _get_task_dependencies(
        self,
        existing_tasks: list[asyncio.Task],
        question: "QuestionBase",
        dag: Optional[dict] = None,
    ) -> list[asyncio.Task]:
        """Get tasks that must be completed before the given question.

        :param existing_tasks: tasks created so far, indexed by question position.
        :param question: the question whose parent tasks are wanted.
        :param dag: mapping of question name -> parent question names; when
            omitted it is obtained from ``self.survey.dag(textify=True)``.
        """
        if dag is None:
            dag = self.survey.dag(textify=True)
        parents = dag.get(question.question_name, [])
        return [existing_tasks[self.to_index[parent_name]] for parent_name in parents]

    def _create_single_task(
        self,
        question: "QuestionBase",
        dependencies: list[asyncio.Task],
        answer_func,
        token_estimator,
        model_buckets,
    ) -> asyncio.Task:
        """Create a single question task with its dependencies.

        The task creator is also stored in ``self.task_creators`` under the
        question's name.
        """
        from edsl.jobs.tasks.QuestionTaskCreator import QuestionTaskCreator

        task_creator = QuestionTaskCreator(
            question=question,
            answer_question_func=answer_func,
            token_estimator=token_estimator,
            model_buckets=model_buckets,
            iteration=self.iteration,
        )

        for dependency in dependencies:
            task_creator.add_dependency(dependency)

        self.task_creators[question.question_name] = task_creator
        return task_creator.generate_task()

    @property
    def task_status_logs(self) -> "InterviewStatusLog":
        """Return the task status logs for the interview.

        The keys are the question names; the values are the lists of status log changes for each task.
        """
        for task_creator in self.task_creators.values():
            self._task_status_log_dict[
                task_creator.question.question_name
            ] = task_creator.status_log
        return self._task_status_log_dict

    @property
    def token_usage(self) -> "InterviewTokenUsage":
        """Determine how many tokens were used for the interview."""
        return self.task_creators.token_usage

    @property
    def interview_status(self) -> "InterviewStatusDictionary":
        """Return a dictionary mapping task status codes to counts."""
        return self.task_creators.interview_status
@@ -0,0 +1,50 @@
1
+ from typing import Generator, TYPE_CHECKING
2
+ from itertools import product
3
+
4
+ if TYPE_CHECKING:
5
+ from edsl.jobs.interviews.Interview import Interview
6
+
7
+
8
class InterviewsConstructor:
    """Builds the interviews for a job: one per agent/scenario/model combination."""

    def __init__(self, jobs: "Jobs", cache: "Cache"):
        self.jobs = jobs
        self.cache = cache

    def create_interviews(self) -> Generator["Interview", None, None]:
        """
        Generate interviews.

        Lazily yields one ``Interview`` for every combination of the job's
        agents, scenarios and models (agents vary slowest, models fastest).
        Each interview receives a fresh ``survey.draw()``, the shared cache,
        the job's run parameters, and the positions of its agent, model and
        scenario within the job's collections.

        NOTE(review): an earlier version of this docstring said the method
        fills in default agents, models and scenarios as a side effect;
        nothing in this method assigns them, so that presumably happens
        elsewhere -- confirm.
        """
        from edsl.jobs.interviews.Interview import Interview

        def positions_by_hash(items) -> dict:
            # Keyed by hash: items that hash alike share the position of the
            # last such item.
            return {hash(item): position for position, item in enumerate(items)}

        agent_index = positions_by_hash(self.jobs.agents)
        model_index = positions_by_hash(self.jobs.models)
        scenario_index = positions_by_hash(self.jobs.scenarios)

        combinations = product(
            self.jobs.agents, self.jobs.scenarios, self.jobs.models
        )
        for agent, scenario, model in combinations:
            yield Interview(
                survey=self.jobs.survey.draw(),
                agent=agent,
                scenario=scenario,
                model=model,
                cache=self.cache,
                skip_retry=self.jobs.run_config.parameters.skip_retry,
                raise_validation_errors=self.jobs.run_config.parameters.raise_validation_errors,
                indices={
                    "agent": agent_index[hash(agent)],
                    "model": model_index[hash(model)],
                    "scenario": scenario_index[hash(scenario)],
                },
            )