edsl 0.1.39__py3-none-any.whl → 0.1.39.dev1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- edsl/Base.py +116 -197
- edsl/__init__.py +7 -15
- edsl/__version__.py +1 -1
- edsl/agents/Agent.py +147 -351
- edsl/agents/AgentList.py +73 -211
- edsl/agents/Invigilator.py +50 -101
- edsl/agents/InvigilatorBase.py +70 -62
- edsl/agents/PromptConstructor.py +225 -143
- edsl/agents/__init__.py +1 -0
- edsl/agents/prompt_helpers.py +3 -3
- edsl/auto/AutoStudy.py +5 -18
- edsl/auto/StageBase.py +40 -53
- edsl/auto/StageQuestions.py +1 -2
- edsl/auto/utilities.py +6 -0
- edsl/config.py +2 -22
- edsl/conversation/car_buying.py +1 -2
- edsl/coop/PriceFetcher.py +1 -1
- edsl/coop/coop.py +47 -125
- edsl/coop/utils.py +14 -14
- edsl/data/Cache.py +27 -45
- edsl/data/CacheEntry.py +15 -12
- edsl/data/CacheHandler.py +12 -31
- edsl/data/RemoteCacheSync.py +46 -154
- edsl/data/__init__.py +3 -4
- edsl/data_transfer_models.py +1 -2
- edsl/enums.py +0 -27
- edsl/exceptions/__init__.py +50 -50
- edsl/exceptions/agents.py +0 -12
- edsl/exceptions/questions.py +6 -24
- edsl/exceptions/scenarios.py +0 -7
- edsl/inference_services/AnthropicService.py +19 -38
- edsl/inference_services/AwsBedrock.py +2 -0
- edsl/inference_services/AzureAI.py +2 -0
- edsl/inference_services/GoogleService.py +12 -7
- edsl/inference_services/InferenceServiceABC.py +85 -18
- edsl/inference_services/InferenceServicesCollection.py +79 -120
- edsl/inference_services/MistralAIService.py +3 -0
- edsl/inference_services/OpenAIService.py +35 -47
- edsl/inference_services/PerplexityService.py +3 -0
- edsl/inference_services/TestService.py +10 -11
- edsl/inference_services/TogetherAIService.py +3 -5
- edsl/jobs/Answers.py +14 -1
- edsl/jobs/Jobs.py +431 -356
- edsl/jobs/JobsChecks.py +10 -35
- edsl/jobs/JobsPrompts.py +4 -6
- edsl/jobs/JobsRemoteInferenceHandler.py +133 -205
- edsl/jobs/buckets/BucketCollection.py +3 -44
- edsl/jobs/buckets/TokenBucket.py +21 -53
- edsl/jobs/interviews/Interview.py +408 -143
- edsl/jobs/runners/JobsRunnerAsyncio.py +403 -88
- edsl/jobs/runners/JobsRunnerStatus.py +165 -133
- edsl/jobs/tasks/QuestionTaskCreator.py +19 -21
- edsl/jobs/tasks/TaskHistory.py +18 -38
- edsl/jobs/tasks/task_status_enum.py +2 -0
- edsl/language_models/KeyLookup.py +30 -0
- edsl/language_models/LanguageModel.py +236 -194
- edsl/language_models/ModelList.py +19 -28
- edsl/language_models/__init__.py +2 -1
- edsl/language_models/registry.py +190 -0
- edsl/language_models/repair.py +2 -2
- edsl/language_models/unused/ReplicateBase.py +83 -0
- edsl/language_models/utilities.py +4 -5
- edsl/notebooks/Notebook.py +14 -19
- edsl/prompts/Prompt.py +39 -29
- edsl/questions/{answer_validator_mixin.py → AnswerValidatorMixin.py} +2 -47
- edsl/questions/QuestionBase.py +214 -68
- edsl/questions/{question_base_gen_mixin.py → QuestionBaseGenMixin.py} +50 -57
- edsl/questions/QuestionBasePromptsMixin.py +3 -7
- edsl/questions/QuestionBudget.py +1 -1
- edsl/questions/QuestionCheckBox.py +3 -3
- edsl/questions/QuestionExtract.py +7 -5
- edsl/questions/QuestionFreeText.py +3 -2
- edsl/questions/QuestionList.py +18 -10
- edsl/questions/QuestionMultipleChoice.py +23 -67
- edsl/questions/QuestionNumerical.py +4 -2
- edsl/questions/QuestionRank.py +17 -7
- edsl/questions/{response_validator_abc.py → ResponseValidatorABC.py} +26 -40
- edsl/questions/SimpleAskMixin.py +3 -4
- edsl/questions/__init__.py +1 -2
- edsl/questions/derived/QuestionLinearScale.py +3 -6
- edsl/questions/derived/QuestionTopK.py +1 -1
- edsl/questions/descriptors.py +3 -17
- edsl/questions/question_registry.py +1 -1
- edsl/results/CSSParameterizer.py +1 -1
- edsl/results/Dataset.py +7 -170
- edsl/results/DatasetExportMixin.py +305 -168
- edsl/results/DatasetTree.py +8 -28
- edsl/results/Result.py +206 -298
- edsl/results/Results.py +131 -149
- edsl/results/ResultsDBMixin.py +238 -0
- edsl/results/ResultsExportMixin.py +0 -2
- edsl/results/{results_selector.py → Selector.py} +13 -23
- edsl/results/TableDisplay.py +171 -98
- edsl/results/__init__.py +1 -1
- edsl/scenarios/FileStore.py +239 -150
- edsl/scenarios/Scenario.py +193 -90
- edsl/scenarios/ScenarioHtmlMixin.py +3 -4
- edsl/scenarios/{scenario_join.py → ScenarioJoin.py} +6 -10
- edsl/scenarios/ScenarioList.py +244 -415
- edsl/scenarios/ScenarioListExportMixin.py +7 -0
- edsl/scenarios/ScenarioListPdfMixin.py +37 -15
- edsl/scenarios/__init__.py +2 -1
- edsl/study/ObjectEntry.py +1 -1
- edsl/study/SnapShot.py +1 -1
- edsl/study/Study.py +12 -5
- edsl/surveys/Rule.py +4 -5
- edsl/surveys/RuleCollection.py +27 -25
- edsl/surveys/Survey.py +791 -270
- edsl/surveys/SurveyCSS.py +8 -20
- edsl/surveys/{SurveyFlowVisualization.py → SurveyFlowVisualizationMixin.py} +9 -11
- edsl/surveys/__init__.py +2 -4
- edsl/surveys/descriptors.py +2 -6
- edsl/surveys/instructions/ChangeInstruction.py +2 -1
- edsl/surveys/instructions/Instruction.py +13 -4
- edsl/surveys/instructions/InstructionCollection.py +6 -11
- edsl/templates/error_reporting/interview_details.html +1 -1
- edsl/templates/error_reporting/report.html +1 -1
- edsl/tools/plotting.py +1 -1
- edsl/utilities/utilities.py +23 -35
- {edsl-0.1.39.dist-info → edsl-0.1.39.dev1.dist-info}/METADATA +10 -12
- edsl-0.1.39.dev1.dist-info/RECORD +277 -0
- {edsl-0.1.39.dist-info → edsl-0.1.39.dev1.dist-info}/WHEEL +1 -1
- edsl/agents/QuestionInstructionPromptBuilder.py +0 -128
- edsl/agents/QuestionTemplateReplacementsBuilder.py +0 -137
- edsl/agents/question_option_processor.py +0 -172
- edsl/coop/CoopFunctionsMixin.py +0 -15
- edsl/coop/ExpectedParrotKeyHandler.py +0 -125
- edsl/exceptions/inference_services.py +0 -5
- edsl/inference_services/AvailableModelCacheHandler.py +0 -184
- edsl/inference_services/AvailableModelFetcher.py +0 -215
- edsl/inference_services/ServiceAvailability.py +0 -135
- edsl/inference_services/data_structures.py +0 -134
- edsl/jobs/AnswerQuestionFunctionConstructor.py +0 -223
- edsl/jobs/FetchInvigilator.py +0 -47
- edsl/jobs/InterviewTaskManager.py +0 -98
- edsl/jobs/InterviewsConstructor.py +0 -50
- edsl/jobs/JobsComponentConstructor.py +0 -189
- edsl/jobs/JobsRemoteInferenceLogger.py +0 -239
- edsl/jobs/RequestTokenEstimator.py +0 -30
- edsl/jobs/async_interview_runner.py +0 -138
- edsl/jobs/buckets/TokenBucketAPI.py +0 -211
- edsl/jobs/buckets/TokenBucketClient.py +0 -191
- edsl/jobs/check_survey_scenario_compatibility.py +0 -85
- edsl/jobs/data_structures.py +0 -120
- edsl/jobs/decorators.py +0 -35
- edsl/jobs/jobs_status_enums.py +0 -9
- edsl/jobs/loggers/HTMLTableJobLogger.py +0 -304
- edsl/jobs/results_exceptions_handler.py +0 -98
- edsl/language_models/ComputeCost.py +0 -63
- edsl/language_models/PriceManager.py +0 -127
- edsl/language_models/RawResponseHandler.py +0 -106
- edsl/language_models/ServiceDataSources.py +0 -0
- edsl/language_models/key_management/KeyLookup.py +0 -63
- edsl/language_models/key_management/KeyLookupBuilder.py +0 -273
- edsl/language_models/key_management/KeyLookupCollection.py +0 -38
- edsl/language_models/key_management/__init__.py +0 -0
- edsl/language_models/key_management/models.py +0 -131
- edsl/language_models/model.py +0 -256
- edsl/notebooks/NotebookToLaTeX.py +0 -142
- edsl/questions/ExceptionExplainer.py +0 -77
- edsl/questions/HTMLQuestion.py +0 -103
- edsl/questions/QuestionMatrix.py +0 -265
- edsl/questions/data_structures.py +0 -20
- edsl/questions/loop_processor.py +0 -149
- edsl/questions/response_validator_factory.py +0 -34
- edsl/questions/templates/matrix/__init__.py +0 -1
- edsl/questions/templates/matrix/answering_instructions.jinja +0 -5
- edsl/questions/templates/matrix/question_presentation.jinja +0 -20
- edsl/results/MarkdownToDocx.py +0 -122
- edsl/results/MarkdownToPDF.py +0 -111
- edsl/results/TextEditor.py +0 -50
- edsl/results/file_exports.py +0 -252
- edsl/results/smart_objects.py +0 -96
- edsl/results/table_data_class.py +0 -12
- edsl/results/table_renderers.py +0 -118
- edsl/scenarios/ConstructDownloadLink.py +0 -109
- edsl/scenarios/DocumentChunker.py +0 -102
- edsl/scenarios/DocxScenario.py +0 -16
- edsl/scenarios/PdfExtractor.py +0 -40
- edsl/scenarios/directory_scanner.py +0 -96
- edsl/scenarios/file_methods.py +0 -85
- edsl/scenarios/handlers/__init__.py +0 -13
- edsl/scenarios/handlers/csv.py +0 -49
- edsl/scenarios/handlers/docx.py +0 -76
- edsl/scenarios/handlers/html.py +0 -37
- edsl/scenarios/handlers/json.py +0 -111
- edsl/scenarios/handlers/latex.py +0 -5
- edsl/scenarios/handlers/md.py +0 -51
- edsl/scenarios/handlers/pdf.py +0 -68
- edsl/scenarios/handlers/png.py +0 -39
- edsl/scenarios/handlers/pptx.py +0 -105
- edsl/scenarios/handlers/py.py +0 -294
- edsl/scenarios/handlers/sql.py +0 -313
- edsl/scenarios/handlers/sqlite.py +0 -149
- edsl/scenarios/handlers/txt.py +0 -33
- edsl/scenarios/scenario_selector.py +0 -156
- edsl/surveys/ConstructDAG.py +0 -92
- edsl/surveys/EditSurvey.py +0 -221
- edsl/surveys/InstructionHandler.py +0 -100
- edsl/surveys/MemoryManagement.py +0 -72
- edsl/surveys/RuleManager.py +0 -172
- edsl/surveys/Simulator.py +0 -75
- edsl/surveys/SurveyToApp.py +0 -141
- edsl/utilities/PrettyList.py +0 -56
- edsl/utilities/is_notebook.py +0 -18
- edsl/utilities/is_valid_variable_name.py +0 -11
- edsl/utilities/remove_edsl_version.py +0 -24
- edsl-0.1.39.dist-info/RECORD +0 -358
- /edsl/questions/{register_questions_meta.py → RegisterQuestionsMeta.py} +0 -0
- /edsl/results/{results_fetch_mixin.py → ResultsFetchMixin.py} +0 -0
- /edsl/results/{results_tools_mixin.py → ResultsToolsMixin.py} +0 -0
- {edsl-0.1.39.dist-info → edsl-0.1.39.dev1.dist-info}/LICENSE +0 -0
edsl/jobs/runners/JobsRunnerStatus.py
CHANGED
@@ -3,12 +3,21 @@ from __future__ import annotations
 import os
 import time
 import requests
+import warnings
 from abc import ABC, abstractmethod
 from dataclasses import dataclass
+
+from typing import Any, List, DefaultDict, Optional, Dict
 from collections import defaultdict
-from typing import Any, Dict, Optional
 from uuid import UUID

+from edsl.jobs.tokens.InterviewTokenUsage import InterviewTokenUsage
+
+InterviewTokenUsageMapping = DefaultDict[str, InterviewTokenUsage]
+
+from edsl.jobs.interviews.InterviewStatistic import InterviewStatistic
+from edsl.jobs.tokens.InterviewTokenUsage import InterviewTokenUsage
+

 @dataclass
 class ModelInfo:
@@ -19,44 +28,11 @@ class ModelInfo:
     token_usage_info: dict


-
-
-
-
-
-        self.completed_by_model = defaultdict(int)
-        self.distinct_models = distinct_models
-        self.total_exceptions = 0
-        self.unfixed_exceptions = 0
-
-    def add_completed_interview(
-        self, model: str, num_exceptions: int = 0, num_unfixed: int = 0
-    ):
-        self.completed_count += 1
-        self.completed_by_model[model] += 1
-        self.total_exceptions += num_exceptions
-        self.unfixed_exceptions += num_unfixed
-
-    def get_elapsed_time(self) -> float:
-        return time.time() - self.start_time
-
-    def get_average_time_per_interview(self) -> float:
-        return (
-            self.get_elapsed_time() / self.completed_count
-            if self.completed_count > 0
-            else 0
-        )
-
-    def get_throughput(self) -> float:
-        elapsed = self.get_elapsed_time()
-        return self.completed_count / elapsed if elapsed > 0 else 0
-
-    def get_estimated_time_remaining(self) -> float:
-        if self.completed_count == 0:
-            return 0
-        avg_time = self.get_average_time_per_interview()
-        remaining = self.total_interviews - self.completed_count
-        return avg_time * remaining
+@dataclass
+class ModelTokenUsageStats:
+    token_usage_type: str
+    details: List[dict]
+    cost: str


 class JobsRunnerStatusBase(ABC):
@@ -70,39 +46,48 @@ class JobsRunnerStatusBase(ABC):
         api_key: str = None,
     ):
         self.jobs_runner = jobs_runner
+
+        # The uuid of the job on Coop
         self.job_uuid = job_uuid
+
         self.base_url = f"{endpoint_url}"
+
+        self.start_time = time.time()
+        self.completed_interviews = []
         self.refresh_rate = refresh_rate
         self.statistics = [
             "elapsed_time",
             "total_interviews_requested",
             "completed_interviews",
+            # "percent_complete",
             "average_time_per_interview",
+            # "task_remaining",
             "estimated_time_remaining",
             "exceptions",
             "unfixed_exceptions",
             "throughput",
         ]
-        self.num_total_interviews = n * len(self.jobs_runner)
+        self.num_total_interviews = n * len(self.jobs_runner.interviews)

         self.distinct_models = list(
-            set(model.model for
+            set(i.model.model for i in self.jobs_runner.interviews)
         )

-        self.
-            total_interviews=self.num_total_interviews,
-            distinct_models=self.distinct_models,
-        )
+        self.completed_interview_by_model = defaultdict(list)

         self.api_key = api_key or os.getenv("EXPECTED_PARROT_API_KEY")

     @abstractmethod
     def has_ep_api_key(self):
-        """
+        """
+        Checks if the user has an Expected Parrot API key.
+        """
         pass

     def get_status_dict(self) -> Dict[str, Any]:
-        """
+        """
+        Converts current status into a JSON-serializable dictionary.
+        """
         # Get all statistics
         stats = {}
         for stat_name in self.statistics:
@@ -110,46 +95,42 @@ class JobsRunnerStatusBase(ABC):
             name, value = list(stat.items())[0]
             stats[name] = value

+        # Calculate overall progress
+        total_interviews = len(self.jobs_runner.total_interviews)
+        completed = len(self.completed_interviews)
+
         # Get model-specific progress
         model_progress = {}
-        target_per_model = int(self.num_total_interviews / len(self.distinct_models))
-
         for model in self.distinct_models:
-
+            completed_for_model = len(self.completed_interview_by_model[model])
+            target_for_model = int(
+                self.num_total_interviews / len(self.distinct_models)
+            )
             model_progress[model] = {
-                "completed":
-                "total":
+                "completed": completed_for_model,
+                "total": target_for_model,
                 "percent": (
-                    (
+                    (completed_for_model / target_for_model * 100)
+                    if target_for_model > 0
+                    else 0
                 ),
             }

         status_dict = {
             "overall_progress": {
-                "completed":
-                "total":
+                "completed": completed,
+                "total": total_interviews,
                 "percent": (
-                    (
-                        self.stats_tracker.completed_count
-                        / self.num_total_interviews
-                        * 100
-                    )
-                    if self.num_total_interviews > 0
-                    else 0
+                    (completed / total_interviews * 100) if total_interviews > 0 else 0
                 ),
             },
             "language_model_progress": model_progress,
             "statistics": stats,
-            "status":
-                "completed"
-                if self.stats_tracker.completed_count >= self.num_total_interviews
-                else "running"
-            ),
+            "status": "completed" if completed >= total_interviews else "running",
         }

         model_queues = {}
-
-        for model, bucket in self.jobs_runner.environment.bucket_collection.items():
+        for model, bucket in self.jobs_runner.bucket_collection.items():
             model_name = model.model
             model_queues[model_name] = {
                 "language_model_name": model_name,
@@ -171,67 +152,98 @@ class JobsRunnerStatusBase(ABC):
         status_dict["language_model_queues"] = model_queues
         return status_dict

-
-
-
-
-            num_exceptions=(
-                len(result.exceptions) if hasattr(result, "exceptions") else 0
-            ),
-            num_unfixed=(
-                result.exceptions.num_unfixed() if hasattr(result, "exceptions") else 0
-            ),
-        )
-
-    def _compute_statistic(self, stat_name: str):
-        """Computes individual statistics based on the stats tracker."""
-        if stat_name == "elapsed_time":
-            value = self.stats_tracker.get_elapsed_time()
-            return {"elapsed_time": (value, 1, "sec.")}
-
-        elif stat_name == "total_interviews_requested":
-            return {"total_interviews_requested": (self.num_total_interviews, None, "")}
+    @abstractmethod
+    def setup(self):
+        """
+        Conducts any setup that needs to happen prior to sending status updates.

-
-
-
-        }
+        Ex. For a local job, creates a job in the Coop database.
+        """
+        pass

-
-
-
+    @abstractmethod
+    def send_status_update(self):
+        """
+        Updates the current status of the job.
+        """
+        pass

-
-
-            return {"estimated_time_remaining": (value, 1, "sec.")}
+    def add_completed_interview(self, result):
+        self.completed_interviews.append(result.interview_hash)

-
-
+        relevant_model = result.model.model
+        self.completed_interview_by_model[relevant_model].append(result.interview_hash)

-
-
-
-
+    def _compute_statistic(self, stat_name: str):
+        completed_tasks = self.completed_interviews
+        elapsed_time = time.time() - self.start_time
+        interviews = self.jobs_runner.total_interviews

-
-
-
+        stat_definitions = {
+            "elapsed_time": lambda: InterviewStatistic(
+                "elapsed_time", value=elapsed_time, digits=1, units="sec."
+            ),
+            "total_interviews_requested": lambda: InterviewStatistic(
+                "total_interviews_requested", value=len(interviews), units=""
+            ),
+            "completed_interviews": lambda: InterviewStatistic(
+                "completed_interviews", value=len(completed_tasks), units=""
+            ),
+            "percent_complete": lambda: InterviewStatistic(
+                "percent_complete",
+                value=(
+                    len(completed_tasks) / len(interviews) * 100
+                    if len(interviews) > 0
+                    else 0
+                ),
+                digits=1,
+                units="%",
+            ),
+            "average_time_per_interview": lambda: InterviewStatistic(
+                "average_time_per_interview",
+                value=elapsed_time / len(completed_tasks) if completed_tasks else 0,
+                digits=2,
+                units="sec.",
+            ),
+            "task_remaining": lambda: InterviewStatistic(
+                "task_remaining", value=len(interviews) - len(completed_tasks), units=""
+            ),
+            "estimated_time_remaining": lambda: InterviewStatistic(
+                "estimated_time_remaining",
+                value=(
+                    (len(interviews) - len(completed_tasks))
+                    * (elapsed_time / len(completed_tasks))
+                    if len(completed_tasks) > 0
+                    else 0
+                ),
+                digits=1,
+                units="sec.",
+            ),
+            "exceptions": lambda: InterviewStatistic(
+                "exceptions",
+                value=sum(len(i.exceptions) for i in interviews),
+                units="",
+            ),
+            "unfixed_exceptions": lambda: InterviewStatistic(
+                "unfixed_exceptions",
+                value=sum(i.exceptions.num_unfixed() for i in interviews),
+                units="",
+            ),
+            "throughput": lambda: InterviewStatistic(
+                "throughput",
+                value=len(completed_tasks) / elapsed_time if elapsed_time > 0 else 0,
+                digits=2,
+                units="interviews/sec.",
+            ),
+        }
+        return stat_definitions[stat_name]()

     def update_progress(self, stop_event):
         while not stop_event.is_set():
             self.send_status_update()
             time.sleep(self.refresh_rate)
-        self.send_status_update()

-
-    def setup(self):
-        """Conducts any setup needed prior to sending status updates."""
-        pass
-
-    @abstractmethod
-    def send_status_update(self):
-        """Updates the current status of the job."""
-        pass
+        self.send_status_update()


 class JobsRunnerStatus(JobsRunnerStatusBase):
@@ -248,35 +260,49 @@ class JobsRunnerStatus(JobsRunnerStatusBase):
         return f"{self.base_url}/api/v0/local-job/{str(self.job_uuid)}"

     def setup(self) -> None:
-        """
-
-
-
-        }
+        """
+        Creates a local job on Coop if one does not already exist.
+        """
+
+        headers = {"Content-Type": "application/json"}
+
+        if self.api_key:
+            headers["Authorization"] = f"Bearer {self.api_key}"
+        else:
+            headers["Authorization"] = f"Bearer None"

         if self.job_uuid is None:
+            # Create a new local job
             response = requests.post(
                 self.create_url,
                 headers=headers,
                 timeout=1,
             )
-
-
-
+            response.raise_for_status()
+            data = response.json()
+            self.job_uuid = data.get("job_uuid")

         print(f"Running with progress bar. View progress at {self.viewing_url}")

     def send_status_update(self) -> None:
-        """
+        """
+        Sends current status to the web endpoint using the instance's job_uuid.
+        """
         try:
+            # Get the status dictionary and add the job_id
             status_dict = self.get_status_dict()
+
+            # Make the UUID JSON serializable
             status_dict["job_id"] = str(self.job_uuid)

-            headers = {
-
-
-
+            headers = {"Content-Type": "application/json"}
+
+            if self.api_key:
+                headers["Authorization"] = f"Bearer {self.api_key}"
+            else:
+                headers["Authorization"] = f"Bearer None"

+            # Send the update
             response = requests.patch(
                 self.update_url,
                 json=status_dict,
@@ -288,8 +314,14 @@ class JobsRunnerStatus(JobsRunnerStatusBase):
             print(f"Failed to send status update for job {self.job_uuid}: {e}")

     def has_ep_api_key(self) -> bool:
-        """
-
+        """
+        Returns True if the user has an Expected Parrot API key. Otherwise, returns False.
+        """
+
+        if self.api_key is not None:
+            return True
+        else:
+            return False


 if __name__ == "__main__":
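The hunks above show `get_status_dict` assembling a JSON-serializable payload keyed by `overall_progress`, `language_model_progress`, `statistics`, and `status`, which `send_status_update` then PATCHes to Coop with a Bearer header. The sketch below is illustrative only and is not part of edsl: `print_progress` is a hypothetical helper showing how a consumer of that payload shape might read it, with made-up example values.

```python
# Hypothetical consumer of the status payload shape visible in the diff above.
from typing import Any, Dict


def print_progress(status_dict: Dict[str, Any]) -> None:
    # Read the overall counters and per-model counters built by get_status_dict().
    overall = status_dict["overall_progress"]
    print(
        f"{overall['completed']}/{overall['total']} interviews "
        f"({overall['percent']:.1f}%), status: {status_dict['status']}"
    )
    for model, progress in status_dict.get("language_model_progress", {}).items():
        print(f"  {model}: {progress['completed']}/{progress['total']}")


# Example payload mirroring the keys in the diff; the numbers are invented.
example = {
    "overall_progress": {"completed": 3, "total": 10, "percent": 30.0},
    "language_model_progress": {"gpt-4o": {"completed": 3, "total": 10, "percent": 30.0}},
    "statistics": {"elapsed_time": "12.3 sec."},
    "status": "running",
}
print_progress(example)
```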
edsl/jobs/tasks/QuestionTaskCreator.py
CHANGED
@@ -1,17 +1,17 @@
 import asyncio
-from typing import Callable, Union, List
+from typing import Callable, Union, List
 from collections import UserList, UserDict

-from edsl.
+from edsl.jobs.buckets import ModelBuckets
+from edsl.exceptions import InterviewErrorPriorTaskCanceled

+from edsl.jobs.interviews.InterviewStatusDictionary import InterviewStatusDictionary
 from edsl.jobs.tasks.task_status_enum import TaskStatus, TaskStatusDescriptor
 from edsl.jobs.tasks.TaskStatusLog import TaskStatusLog
+from edsl.jobs.tokens.InterviewTokenUsage import InterviewTokenUsage
 from edsl.jobs.tokens.TokenUsage import TokenUsage
 from edsl.jobs.Answers import Answers
-
-if TYPE_CHECKING:
-    from edsl.questions.QuestionBase import QuestionBase
-    from edsl.jobs.buckets import ModelBuckets
+from edsl.questions.QuestionBase import QuestionBase


 class TokensUsed(UserDict):
@@ -24,6 +24,7 @@ class TokensUsed(UserDict):

 class QuestionTaskCreator(UserList):
     """Class to create and manage a single question and its dependencies.
+    The class is an instance of a UserList of tasks that must be completed before the focal task can be run.

     It is a UserList with all the tasks that must be completed before the focal task can be run.
     The focal task is the question that we are interested in answering.
@@ -34,9 +35,9 @@ class QuestionTaskCreator(UserList):
     def __init__(
         self,
         *,
-        question:
+        question: QuestionBase,
         answer_question_func: Callable,
-        model_buckets:
+        model_buckets: ModelBuckets,
         token_estimator: Union[Callable, None] = None,
         iteration: int = 0,
     ):
@@ -50,15 +51,14 @@

         """
         super().__init__([])
+        # answer_question_func is the 'interview.answer_question_and_record_task" method
         self.answer_question_func = answer_question_func
         self.question = question
         self.iteration = iteration

         self.model_buckets = model_buckets
-
         self.requests_bucket = self.model_buckets.requests_bucket
         self.tokens_bucket = self.model_buckets.tokens_bucket
-
         self.status_log = TaskStatusLog()

     def fake_token_estimator(question):
@@ -125,13 +125,11 @@

         await self.tokens_bucket.get_tokens(requested_tokens)

-        if (estimated_wait_time := self.
+        if (estimated_wait_time := self.requests_bucket.wait_time(1)) > 0:
             self.waiting = True  # do we need this?
             self.task_status = TaskStatus.WAITING_FOR_REQUEST_CAPACITY

-        await self.
-            1, cheat_bucket_capacity=True
-        )
+        await self.requests_bucket.get_tokens(1, cheat_bucket_capacity=True)

         self.task_status = TaskStatus.API_CALL_IN_PROGRESS
         try:
@@ -144,22 +142,22 @@
             raise e

         if results.cache_used:
-            self.
-            self.
+            self.tokens_bucket.add_tokens(requested_tokens)
+            self.requests_bucket.add_tokens(1)
             self.from_cache = True
             # Turbo mode means that we don't wait for tokens or requests.
-            self.
-            self.
+            self.tokens_bucket.turbo_mode_on()
+            self.requests_bucket.turbo_mode_on()
         else:
-            self.
-            self.
+            self.tokens_bucket.turbo_mode_off()
+            self.requests_bucket.turbo_mode_off()

         return results

     @classmethod
     def example(cls):
         """Return an example instance of the class."""
-        from edsl
+        from edsl import QuestionFreeText
         from edsl.jobs.buckets.ModelBuckets import ModelBuckets

         m = ModelBuckets.infinity_bucket()
edsl/jobs/tasks/TaskHistory.py
CHANGED
@@ -1,17 +1,18 @@
 from typing import List, Optional
 from io import BytesIO
+import webbrowser
+import os
 import base64
+from importlib import resources
 from edsl.jobs.tasks.task_status_enum import TaskStatus
-from edsl.Base import RepresentationMixin


-class TaskHistory
+class TaskHistory:
     def __init__(
         self,
-        interviews: List["Interview"]
+        interviews: List["Interview"],
         include_traceback: bool = False,
         max_interviews: int = 10,
-        interviews_with_exceptions_only: bool = False,
     ):
         """
         The structure of a TaskHistory exception
@@ -21,33 +22,13 @@ class TaskHistory(RepresentationMixin):
         >>> _ = TaskHistory.example()
         ...
         """
-        self.interviews_with_exceptions_only = interviews_with_exceptions_only
-        self._interviews = {}
-        self.total_interviews = []
-        if interviews is not None:
-            for interview in interviews:
-                self.add_interview(interview)

-        self.
-        self._interviews = {
-            index: interview for index, interview in enumerate(self.total_interviews)
-        }
-        self.max_interviews = max_interviews
-
-        # self.total_interviews = interviews
+        self.total_interviews = interviews
         self.include_traceback = include_traceback

-
+        self._interviews = {index: i for index, i in enumerate(self.total_interviews)}
         self.max_interviews = max_interviews

-    def add_interview(self, interview: "Interview"):
-        """Add a single interview to the history"""
-        if self.interviews_with_exceptions_only and interview.exceptions == {}:
-            return
-
-        self.total_interviews.append(interview)
-        self._interviews[len(self._interviews)] = interview
-
     @classmethod
     def example(cls):
         """ """
@@ -140,6 +121,14 @@ class TaskHistory(RepresentationMixin):
         """Return True if there are any exceptions."""
         return len(self.unfixed_exceptions) > 0

+    def _repr_html_(self):
+        """Return an HTML representation of the TaskHistory."""
+        d = self.to_dict(add_edsl_version=False)
+        data = [[k, v] for k, v in d.items()]
+        from tabulate import tabulate
+
+        return tabulate(data, headers=["keys", "values"], tablefmt="html")
+
     def show_exceptions(self, tracebacks=False):
         """Print the exceptions."""
         for index in self.indices:
@@ -251,15 +240,11 @@
         plt.show()

     def css(self):
-        from importlib import resources
-
         env = resources.files("edsl").joinpath("templates/error_reporting")
         css = env.joinpath("report.css").read_text()
         return css

     def javascript(self):
-        from importlib import resources
-
         env = resources.files("edsl").joinpath("templates/error_reporting")
         js = env.joinpath("report.js").read_text()
         return js
@@ -296,7 +281,7 @@
         exceptions_by_question_name = {}
         for interview in self.total_interviews:
             for question_name, exceptions in interview.exceptions.items():
-                question_type = interview.survey.
+                question_type = interview.survey.get_question(
                     question_name
                 ).question_type
                 if (question_name, question_type) not in exceptions_by_question_name:
@@ -345,11 +330,8 @@
         }
         return sorted_exceptions_by_model

-    def generate_html_report(self, css: Optional[str]
-
-            performance_plot_html = self.plot(num_periods=100, get_embedded_html=True)
-        else:
-            performance_plot_html = ""
+    def generate_html_report(self, css: Optional[str]):
+        performance_plot_html = self.plot(num_periods=100, get_embedded_html=True)

         if css is None:
             css = self.css()
@@ -427,8 +409,6 @@
         print(f"Exception report saved to {filename}")

         if open_in_browser:
-            import webbrowser
-
             webbrowser.open(f"file://{os.path.abspath(filename)}")

         if return_link: