PyPI - edsl - Versions diffs - 0.1.39__py3-none-any.whl → 0.1.39.dev2__py3-none-any.whl - Mend

edsl 0.1.39__py3-none-any.whl → 0.1.39.dev2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (85) hide show

edsl/Base.py +0 -28
edsl/__init__.py +1 -1
edsl/__version__.py +1 -1
edsl/agents/Agent.py +17 -9
edsl/agents/Invigilator.py +14 -13
edsl/agents/InvigilatorBase.py +1 -4
edsl/agents/PromptConstructor.py +22 -42
edsl/agents/QuestionInstructionPromptBuilder.py +1 -1
edsl/auto/AutoStudy.py +5 -18
edsl/auto/StageBase.py +40 -53
edsl/auto/StageQuestions.py +1 -2
edsl/auto/utilities.py +6 -0
edsl/coop/coop.py +5 -21
edsl/data/Cache.py +18 -29
edsl/data/CacheHandler.py +2 -0
edsl/data/RemoteCacheSync.py +46 -154
edsl/enums.py +0 -7
edsl/inference_services/AnthropicService.py +16 -38
edsl/inference_services/AvailableModelFetcher.py +1 -7
edsl/inference_services/GoogleService.py +1 -5
edsl/inference_services/InferenceServicesCollection.py +2 -18
edsl/inference_services/OpenAIService.py +31 -46
edsl/inference_services/TestService.py +3 -1
edsl/inference_services/TogetherAIService.py +3 -5
edsl/inference_services/data_structures.py +2 -74
edsl/jobs/AnswerQuestionFunctionConstructor.py +113 -148
edsl/jobs/FetchInvigilator.py +3 -10
edsl/jobs/InterviewsConstructor.py +4 -6
edsl/jobs/Jobs.py +233 -299
edsl/jobs/JobsChecks.py +2 -2
edsl/jobs/JobsPrompts.py +1 -1
edsl/jobs/JobsRemoteInferenceHandler.py +136 -160
edsl/jobs/interviews/Interview.py +42 -80
edsl/jobs/runners/JobsRunnerAsyncio.py +358 -88
edsl/jobs/runners/JobsRunnerStatus.py +165 -133
edsl/jobs/tasks/TaskHistory.py +3 -24
edsl/language_models/LanguageModel.py +4 -59
edsl/language_models/ModelList.py +8 -19
edsl/language_models/__init__.py +1 -1
edsl/language_models/registry.py +180 -0
edsl/language_models/repair.py +1 -1
edsl/questions/QuestionBase.py +26 -35
edsl/questions/{question_base_gen_mixin.py → QuestionBaseGenMixin.py} +49 -52
edsl/questions/QuestionBasePromptsMixin.py +1 -1
edsl/questions/QuestionBudget.py +1 -1
edsl/questions/QuestionCheckBox.py +2 -2
edsl/questions/QuestionExtract.py +7 -5
edsl/questions/QuestionFreeText.py +1 -1
edsl/questions/QuestionList.py +15 -9
edsl/questions/QuestionMatrix.py +1 -1
edsl/questions/QuestionMultipleChoice.py +1 -1
edsl/questions/QuestionNumerical.py +1 -1
edsl/questions/QuestionRank.py +1 -1
edsl/questions/{response_validator_abc.py → ResponseValidatorABC.py} +18 -6
edsl/questions/{response_validator_factory.py → ResponseValidatorFactory.py} +1 -7
edsl/questions/SimpleAskMixin.py +1 -1
edsl/questions/__init__.py +1 -1
edsl/results/DatasetExportMixin.py +119 -60
edsl/results/Result.py +3 -109
edsl/results/Results.py +39 -50
edsl/scenarios/FileStore.py +0 -32
edsl/scenarios/ScenarioList.py +7 -35
edsl/scenarios/handlers/csv.py +0 -11
edsl/surveys/Survey.py +20 -71
{edsl-0.1.39.dist-info → edsl-0.1.39.dev2.dist-info}/METADATA +1 -1
{edsl-0.1.39.dist-info → edsl-0.1.39.dev2.dist-info}/RECORD +78 -84
{edsl-0.1.39.dist-info → edsl-0.1.39.dev2.dist-info}/WHEEL +1 -1
edsl/jobs/async_interview_runner.py +0 -138
edsl/jobs/check_survey_scenario_compatibility.py +0 -85
edsl/jobs/data_structures.py +0 -120
edsl/jobs/results_exceptions_handler.py +0 -98
edsl/language_models/model.py +0 -256
edsl/questions/data_structures.py +0 -20
edsl/results/file_exports.py +0 -252
/edsl/agents/{question_option_processor.py → QuestionOptionProcessor.py} +0 -0
/edsl/questions/{answer_validator_mixin.py → AnswerValidatorMixin.py} +0 -0
/edsl/questions/{loop_processor.py → LoopProcessor.py} +0 -0
/edsl/questions/{register_questions_meta.py → RegisterQuestionsMeta.py} +0 -0
/edsl/results/{results_fetch_mixin.py → ResultsFetchMixin.py} +0 -0
/edsl/results/{results_tools_mixin.py → ResultsToolsMixin.py} +0 -0
/edsl/results/{results_selector.py → Selector.py} +0 -0
/edsl/scenarios/{directory_scanner.py → DirectoryScanner.py} +0 -0
/edsl/scenarios/{scenario_join.py → ScenarioJoin.py} +0 -0
/edsl/scenarios/{scenario_selector.py → ScenarioSelector.py} +0 -0
{edsl-0.1.39.dist-info → edsl-0.1.39.dev2.dist-info}/LICENSE +0 -0

edsl/jobs/interviews/Interview.py CHANGED Viewed

@@ -4,10 +4,10 @@ from __future__ import annotations
 import asyncio
 from typing import Any, Type, List, Generator, Optional, Union, TYPE_CHECKING
 import copy
-from dataclasses import dataclass
-# from edsl.jobs.Answers import Answers
-from edsl.jobs.data_structures import Answers
+# from edsl.config import CONFIG
+from edsl.jobs.Answers import Answers
 from edsl.jobs.interviews.InterviewStatusLog import InterviewStatusLog
 from edsl.jobs.interviews.InterviewStatusDictionary import InterviewStatusDictionary
 from edsl.jobs.interviews.InterviewExceptionCollection import (
@@ -22,7 +22,6 @@ from edsl.jobs.InterviewTaskManager import InterviewTaskManager
 from edsl.jobs.FetchInvigilator import FetchInvigilator
 from edsl.jobs.RequestTokenEstimator import RequestTokenEstimator
 if TYPE_CHECKING:
     from edsl.agents.Agent import Agent
     from edsl.surveys.Survey import Survey
@@ -30,16 +29,6 @@ if TYPE_CHECKING:
     from edsl.data.Cache import Cache
     from edsl.language_models.LanguageModel import LanguageModel
     from edsl.jobs.tokens.InterviewTokenUsage import InterviewTokenUsage
-    from edsl.agents.InvigilatorBase import InvigilatorBase
-    from edsl.language_models.key_management.KeyLookup import KeyLookup
-@dataclass
-class InterviewRunningConfig:
-    cache: Optional["Cache"] = (None,)
-    skip_retry: bool = (False,)  # COULD BE SET WITH CONFIG
-    raise_validation_errors: bool = (True,)
-    stop_on_exception: bool = (False,)
 class Interview:
@@ -56,11 +45,13 @@ class Interview:
         survey: Survey,
         scenario: Scenario,
         model: Type["LanguageModel"],
+        debug: Optional[bool] = False,  # DEPRECATE
         iteration: int = 0,
-        indices: dict = None,  # explain?
         cache: Optional["Cache"] = None,
+        sidecar_model: Optional["LanguageModel"] = None,  # DEPRECATE
         skip_retry: bool = False,  # COULD BE SET WITH CONFIG
         raise_validation_errors: bool = True,
+        indices: dict = None,  # explain?
     ):
         """Initialize the Interview instance.
@@ -68,9 +59,10 @@ class Interview:
         :param survey: the survey being administered to the agent.
         :param scenario: the scenario that populates the survey questions.
         :param model: the language model used to answer the questions.
-        # :param debug: if True, run without calls to the language model.
+        :param debug: if True, run without calls to the language model.
         :param iteration: the iteration number of the interview.
         :param cache: the cache used to store the answers.
+        :param sidecar_model: a sidecar model used to answer questions.
         >>> i = Interview.example()
         >>> i.task_manager.task_creators
@@ -91,9 +83,12 @@ class Interview:
         self.survey = copy.deepcopy(survey)  # why do we need to deepcopy the survey?
         self.scenario = scenario
         self.model = model
+        self.debug = debug
         self.iteration = iteration
+        self.cache = cache
         self.answers = Answers()  # will get filled in as interview progresses
+        self.sidecar_model = sidecar_model
         self.task_manager = InterviewTaskManager(
             survey=self.survey,
@@ -102,13 +97,6 @@ class Interview:
         self.exceptions = InterviewExceptionCollection()
-        self.running_config = InterviewRunningConfig(
-            cache=cache,
-            skip_retry=skip_retry,
-            raise_validation_errors=raise_validation_errors,
-        )
-        self.cache = cache
         self.skip_retry = skip_retry
         self.raise_validation_errors = raise_validation_errors
@@ -121,7 +109,6 @@ class Interview:
         self.failed_questions = []
         self.indices = indices
-        self.initial_hash = hash(self)
     @property
     def has_exceptions(self) -> bool:
@@ -147,6 +134,7 @@ class Interview:
         # return self.task_creators.interview_status
         return self.task_manager.interview_status
+    # region: Serialization
     def to_dict(self, include_exceptions=True, add_edsl_version=True) -> dict[str, Any]:
         """Return a dictionary representation of the Interview instance.
         This is just for hashing purposes.
@@ -210,13 +198,13 @@ class Interview:
         """
         return hash(self) == hash(other)
+    # region: Conducting the interview
     async def async_conduct_interview(
         self,
-        run_config: Optional["RunConfig"] = None,
-        #     model_buckets: Optional[ModelBuckets] = None,
-        #     stop_on_exception: bool = False,
-        #     raise_validation_errors: bool = True,
-        #     key_lookup: Optional[KeyLookup] = None,
+        model_buckets: Optional[ModelBuckets] = None,
+        stop_on_exception: bool = False,
+        sidecar_model: Optional["LanguageModel"] = None,
+        raise_validation_errors: bool = True,
     ) -> tuple["Answers", List[dict[str, Any]]]:
         """
         Conduct an Interview asynchronously.
@@ -225,6 +213,7 @@ class Interview:
         :param model_buckets: a dictionary of token buckets for the model.
         :param debug: run without calls to LLM.
         :param stop_on_exception: if True, stops the interview if an exception is raised.
+        :param sidecar_model: a sidecar model used to answer questions.
         Example usage:
@@ -238,39 +227,21 @@ class Interview:
         >>> i.exceptions
         {'q0': ...
         >>> i = Interview.example()
-        >>> from edsl.jobs.Jobs import RunConfig, RunParameters, RunEnvironment
-        >>> run_config = RunConfig(parameters = RunParameters(), environment = RunEnvironment())
-        >>> run_config.parameters.stop_on_exception = True
-        >>> result, _ = asyncio.run(i.async_conduct_interview(run_config))
+        >>> result, _ = asyncio.run(i.async_conduct_interview(stop_on_exception = True))
         Traceback (most recent call last):
         ...
         asyncio.exceptions.CancelledError
         """
-        from edsl.jobs.Jobs import RunConfig, RunParameters, RunEnvironment
-        if run_config is None:
-            run_config = RunConfig(
-                parameters=RunParameters(),
-                environment=RunEnvironment(),
-            )
-        self.stop_on_exception = run_config.parameters.stop_on_exception
+        self.sidecar_model = sidecar_model
+        self.stop_on_exception = stop_on_exception
         # if no model bucket is passed, create an 'infinity' bucket with no rate limits
-        bucket_collection = run_config.environment.bucket_collection
-        if bucket_collection:
-            model_buckets = bucket_collection.get(self.model)
-        else:
-            model_buckets = None
         if model_buckets is None or hasattr(self.agent, "answer_question_directly"):
             model_buckets = ModelBuckets.infinity_bucket()
         # was "self.tasks" - is that necessary?
         self.tasks = self.task_manager.build_question_tasks(
-            answer_func=AnswerQuestionFunctionConstructor(
-                self, key_lookup=run_config.environment.key_lookup
-            )(),
+            answer_func=AnswerQuestionFunctionConstructor(self)(),
             token_estimator=RequestTokenEstimator(self),
             model_buckets=model_buckets,
         )
@@ -279,26 +250,23 @@ class Interview:
         ## with dependencies on the questions that must be answered before this one can be answered.
         ## 'Invigilators' are used to administer the survey.
-        fetcher = FetchInvigilator(
-            interview=self,
-            current_answers=self.answers,
-            key_lookup=run_config.environment.key_lookup,
-        )
-        self.invigilators = [fetcher(question) for question in self.survey.questions]
-        await asyncio.gather(
-            *self.tasks, return_exceptions=not run_config.parameters.stop_on_exception
-        )
+        self.invigilators = [
+            FetchInvigilator(interview=self, current_answers=self.answers)(question)
+            for question in self.survey.questions
+        ]
+        await asyncio.gather(*self.tasks, return_exceptions=not stop_on_exception)
         self.answers.replace_missing_answers_with_none(self.survey)
         valid_results = list(
             self._extract_valid_results(self.tasks, self.invigilators, self.exceptions)
         )
         return self.answers, valid_results
+    # endregion
+    # region: Extracting results and recording errors
     @staticmethod
     def _extract_valid_results(
-        tasks: List["asyncio.Task"],
-        invigilators: List["InvigilatorBase"],
-        exceptions: InterviewExceptionCollection,
+        tasks, invigilators: List["InvigilatorABC"], exceptions
     ) -> Generator["Answers", None, None]:
         """Extract the valid results from the list of results.
@@ -311,7 +279,10 @@ class Interview:
         """
         assert len(tasks) == len(invigilators)
-        def handle_task(task, invigilator):
+        for task, invigilator in zip(tasks, invigilators):
+            if not task.done():
+                raise ValueError(f"Task {task.get_name()} is not done.")
             try:
                 result = task.result()
             except asyncio.CancelledError as e:  # task was cancelled
@@ -327,21 +298,17 @@ class Interview:
                     invigilator=invigilator,
                 )
                 exceptions.add(task.get_name(), exception_entry)
-            return result
-        for task, invigilator in zip(tasks, invigilators):
-            if not task.done():
-                raise ValueError(f"Task {task.get_name()} is not done.")
+            yield result
-            yield handle_task(task, invigilator)
+    # endregion
+    # region: Magic methods
     def __repr__(self) -> str:
         """Return a string representation of the Interview instance."""
         return f"Interview(agent = {repr(self.agent)}, survey = {repr(self.survey)}, scenario = {repr(self.scenario)}, model = {repr(self.model)})"
-    def duplicate(
-        self, iteration: int, cache: "Cache", randomize_survey: Optional[bool] = True
-    ) -> Interview:
+    def duplicate(self, iteration: int, cache: "Cache") -> Interview:
         """Duplicate the interview, but with a new iteration number and cache.
         >>> i = Interview.example()
@@ -350,19 +317,14 @@ class Interview:
         True
         """
-        if randomize_survey:
-            new_survey = self.survey.draw()
-        else:
-            new_survey = self.survey
         return Interview(
             agent=self.agent,
-            survey=new_survey,
+            survey=self.survey,
             scenario=self.scenario,
             model=self.model,
             iteration=iteration,
-            cache=self.running_config.cache,
-            skip_retry=self.running_config.skip_retry,
+            cache=cache,
+            skip_retry=self.skip_retry,
             indices=self.indices,
         )

edsl 0.1.39__py3-none-any.whl → 0.1.39.dev2__py3-none-any.whl

edsl 0.1.39__py3-none-any.whl → 0.1.39.dev2__py3-none-any.whl