edsl 0.1.53__py3-none-any.whl → 0.1.55__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- edsl/__init__.py +8 -1
- edsl/__init__original.py +134 -0
- edsl/__version__.py +1 -1
- edsl/agents/agent.py +29 -0
- edsl/agents/agent_list.py +36 -1
- edsl/base/base_class.py +281 -151
- edsl/buckets/__init__.py +8 -3
- edsl/buckets/bucket_collection.py +9 -3
- edsl/buckets/model_buckets.py +4 -2
- edsl/buckets/token_bucket.py +2 -2
- edsl/buckets/token_bucket_client.py +5 -3
- edsl/caching/cache.py +131 -62
- edsl/caching/cache_entry.py +70 -58
- edsl/caching/sql_dict.py +17 -0
- edsl/cli.py +99 -0
- edsl/config/config_class.py +16 -0
- edsl/conversation/__init__.py +31 -0
- edsl/coop/coop.py +276 -242
- edsl/coop/coop_jobs_objects.py +59 -0
- edsl/coop/coop_objects.py +29 -0
- edsl/coop/coop_regular_objects.py +26 -0
- edsl/coop/utils.py +24 -19
- edsl/dataset/dataset.py +338 -101
- edsl/db_list/sqlite_list.py +349 -0
- edsl/inference_services/__init__.py +40 -5
- edsl/inference_services/exceptions.py +11 -0
- edsl/inference_services/services/anthropic_service.py +5 -2
- edsl/inference_services/services/aws_bedrock.py +6 -2
- edsl/inference_services/services/azure_ai.py +6 -2
- edsl/inference_services/services/google_service.py +3 -2
- edsl/inference_services/services/mistral_ai_service.py +6 -2
- edsl/inference_services/services/open_ai_service.py +6 -2
- edsl/inference_services/services/perplexity_service.py +6 -2
- edsl/inference_services/services/test_service.py +105 -7
- edsl/interviews/answering_function.py +167 -59
- edsl/interviews/interview.py +124 -72
- edsl/interviews/interview_task_manager.py +10 -0
- edsl/invigilators/invigilators.py +10 -1
- edsl/jobs/async_interview_runner.py +146 -104
- edsl/jobs/data_structures.py +6 -4
- edsl/jobs/decorators.py +61 -0
- edsl/jobs/fetch_invigilator.py +61 -18
- edsl/jobs/html_table_job_logger.py +14 -2
- edsl/jobs/jobs.py +180 -104
- edsl/jobs/jobs_component_constructor.py +2 -2
- edsl/jobs/jobs_interview_constructor.py +2 -0
- edsl/jobs/jobs_pricing_estimation.py +127 -46
- edsl/jobs/jobs_remote_inference_logger.py +4 -0
- edsl/jobs/jobs_runner_status.py +30 -25
- edsl/jobs/progress_bar_manager.py +79 -0
- edsl/jobs/remote_inference.py +35 -1
- edsl/key_management/key_lookup_builder.py +6 -1
- edsl/language_models/language_model.py +102 -12
- edsl/language_models/model.py +10 -3
- edsl/language_models/price_manager.py +45 -75
- edsl/language_models/registry.py +5 -0
- edsl/language_models/utilities.py +2 -1
- edsl/notebooks/notebook.py +77 -10
- edsl/questions/VALIDATION_README.md +134 -0
- edsl/questions/__init__.py +24 -1
- edsl/questions/exceptions.py +21 -0
- edsl/questions/question_check_box.py +171 -149
- edsl/questions/question_dict.py +243 -51
- edsl/questions/question_multiple_choice_with_other.py +624 -0
- edsl/questions/question_registry.py +2 -1
- edsl/questions/templates/multiple_choice_with_other/__init__.py +0 -0
- edsl/questions/templates/multiple_choice_with_other/answering_instructions.jinja +15 -0
- edsl/questions/templates/multiple_choice_with_other/question_presentation.jinja +17 -0
- edsl/questions/validation_analysis.py +185 -0
- edsl/questions/validation_cli.py +131 -0
- edsl/questions/validation_html_report.py +404 -0
- edsl/questions/validation_logger.py +136 -0
- edsl/results/result.py +63 -16
- edsl/results/results.py +702 -171
- edsl/scenarios/construct_download_link.py +16 -3
- edsl/scenarios/directory_scanner.py +226 -226
- edsl/scenarios/file_methods.py +5 -0
- edsl/scenarios/file_store.py +117 -6
- edsl/scenarios/handlers/__init__.py +5 -1
- edsl/scenarios/handlers/mp4_file_store.py +104 -0
- edsl/scenarios/handlers/webm_file_store.py +104 -0
- edsl/scenarios/scenario.py +120 -101
- edsl/scenarios/scenario_list.py +800 -727
- edsl/scenarios/scenario_list_gc_test.py +146 -0
- edsl/scenarios/scenario_list_memory_test.py +214 -0
- edsl/scenarios/scenario_list_source_refactor.md +35 -0
- edsl/scenarios/scenario_selector.py +5 -4
- edsl/scenarios/scenario_source.py +1990 -0
- edsl/scenarios/tests/test_scenario_list_sources.py +52 -0
- edsl/surveys/survey.py +22 -0
- edsl/tasks/__init__.py +4 -2
- edsl/tasks/task_history.py +198 -36
- edsl/tests/scenarios/test_ScenarioSource.py +51 -0
- edsl/tests/scenarios/test_scenario_list_sources.py +51 -0
- edsl/utilities/__init__.py +2 -1
- edsl/utilities/decorators.py +121 -0
- edsl/utilities/memory_debugger.py +1010 -0
- {edsl-0.1.53.dist-info → edsl-0.1.55.dist-info}/METADATA +52 -76
- {edsl-0.1.53.dist-info → edsl-0.1.55.dist-info}/RECORD +102 -78
- edsl/jobs/jobs_runner_asyncio.py +0 -281
- edsl/language_models/unused/fake_openai_service.py +0 -60
- {edsl-0.1.53.dist-info → edsl-0.1.55.dist-info}/LICENSE +0 -0
- {edsl-0.1.53.dist-info → edsl-0.1.55.dist-info}/WHEEL +0 -0
- {edsl-0.1.53.dist-info → edsl-0.1.55.dist-info}/entry_points.txt +0 -0
edsl/jobs/jobs_pricing_estimation.py
CHANGED

@@ -1,7 +1,7 @@
 import logging
 import math
 
-from typing import List, TYPE_CHECKING
+from typing import List, TYPE_CHECKING, Union, Literal
 
 if TYPE_CHECKING:
     from .jobs import Jobs
@@ -26,53 +26,104 @@ class PromptCostEstimator:
     OUTPUT_TOKENS_PER_INPUT_TOKEN = 0.75
     PIPING_MULTIPLIER = 2
 
-    def __init__(
+    def __init__(
+        self,
         system_prompt: str,
         user_prompt: str,
         price_lookup: dict,
         inference_service: str,
-        model: str
+        model: str,
+    ):
         self.system_prompt = system_prompt
         self.user_prompt = user_prompt
         self.price_lookup = price_lookup
         self.inference_service = inference_service
         self.model = model
 
-    @staticmethod
+    @staticmethod
     def get_piping_multiplier(prompt: str):
         """Returns 2 if a prompt includes Jinja braces, and 1 otherwise."""
 
         if "{{" in prompt and "}}" in prompt:
             return PromptCostEstimator.PIPING_MULTIPLIER
         return 1
-
+
     @property
     def key(self):
         return (self.inference_service, self.model)
-
+
     @property
     def relevant_prices(self):
         try:
             return self.price_lookup[self.key]
         except KeyError:
             return {}
-
-    def
+
+    def _get_highest_price_for_service(self, price_type: str) -> Union[float, None]:
+        """Returns the highest price per token for a given service and price type (input/output).
+
+        Args:
+            price_type: Either "input" or "output"
+
+        Returns:
+            float | None: The highest price per token for the service, or None if not found
+        """
+        prices_for_service = [
+            prices[price_type]["service_stated_token_price"]
+            / prices[price_type]["service_stated_token_qty"]
+            for (service, _), prices in self.price_lookup.items()
+            if service == self.inference_service and price_type in prices
+        ]
+        return max(prices_for_service) if prices_for_service else None
+
+    def input_price_per_token(
+        self,
+    ) -> tuple[float, Literal["price_lookup", "highest_price_for_service", "default"]]:
         try:
-            return
+            return (
+                self.relevant_prices["input"]["service_stated_token_price"]
+                / self.relevant_prices["input"]["service_stated_token_qty"]
+            ), "price_lookup"
         except KeyError:
+            highest_price = self._get_highest_price_for_service("input")
+            if highest_price is not None:
+                import warnings
+
+                warnings.warn(
+                    f"Price data not found for {self.key}. Using highest available input price for {self.inference_service}: ${highest_price:.6f} per token"
+                )
+                return highest_price, "highest_price_for_service"
             import warnings
+
             warnings.warn(
-                "Price data
+                f"Price data not found for {self.inference_service}. Using default estimate for input token price: $1.00 / 1M tokens"
             )
-            return self.DEFAULT_INPUT_PRICE_PER_TOKEN
+            return self.DEFAULT_INPUT_PRICE_PER_TOKEN, "default"
 
-    def output_price_per_token(
+    def output_price_per_token(
+        self,
+    ) -> tuple[float, Literal["price_lookup", "highest_price_for_service", "default"]]:
         try:
-            return
+            return (
+                self.relevant_prices["output"]["service_stated_token_price"]
+                / self.relevant_prices["output"]["service_stated_token_qty"]
+            ), "price_lookup"
         except KeyError:
-
-
+            highest_price = self._get_highest_price_for_service("output")
+            if highest_price is not None:
+                import warnings
+
+                warnings.warn(
+                    f"Price data not found for {self.key}. Using highest available output price for {self.inference_service}: ${highest_price:.6f} per token"
+                )
+                return highest_price, "highest_price_for_service"
+            import warnings
+
+            warnings.warn(
+                f"Price data not found for {self.inference_service}. Using default estimate for output token price: $1.00 / 1M tokens"
+            )
+            return self.DEFAULT_OUTPUT_PRICE_PER_TOKEN, "default"
+
     def __call__(self):
         user_prompt_chars = len(str(self.user_prompt)) * self.get_piping_multiplier(
             str(self.user_prompt)
@@ -84,20 +135,37 @@ class PromptCostEstimator:
         input_tokens = (user_prompt_chars + system_prompt_chars) // self.CHARS_PER_TOKEN
         output_tokens = math.ceil(self.OUTPUT_TOKENS_PER_INPUT_TOKEN * input_tokens)
 
+        input_price_per_token, input_price_source = self.input_price_per_token()
+        output_price_per_token, output_price_source = self.output_price_per_token()
+
         cost = (
-            input_tokens *
-            + output_tokens *
+            input_tokens * input_price_per_token
+            + output_tokens * output_price_per_token
         )
         return {
+            "input_price_source": input_price_source,
+            "input_price_per_token": input_price_per_token,
             "input_tokens": input_tokens,
+            "output_price_source": output_price_source,
             "output_tokens": output_tokens,
+            "output_price_per_token": output_price_per_token,
             "cost_usd": cost,
         }
 
 
 class JobsPrompts:
 
-    relevant_keys = [
+    relevant_keys = [
+        "user_prompt",
+        "system_prompt",
+        "interview_index",
+        "question_name",
+        "scenario_index",
+        "agent_index",
+        "model",
+        "estimated_cost",
+        "cache_keys",
+    ]
 
     """This generates the prompts for a job for price estimation purposes.
 
@@ -105,7 +173,6 @@ class JobsPrompts:
     So assumptions are made about expansion of Jinja braces, etc.
     """
 
-
    @classmethod
     def from_jobs(cls, jobs: "Jobs"):
         """Construct a JobsPrompts object from a Jobs object."""
@@ -114,13 +181,16 @@ class JobsPrompts:
         scenarios = jobs.scenarios
         survey = jobs.survey
         return cls(
-            interviews=interviews,
-            agents=agents,
-            scenarios=scenarios,
-            survey=survey
+            interviews=interviews, agents=agents, scenarios=scenarios, survey=survey
         )
-
-    def __init__(
+
+    def __init__(
+        self,
+        interviews: List["Interview"],
+        agents: "AgentList",
+        scenarios: "ScenarioList",
+        survey: "Survey",
+    ):
         """Initialize with extracted components rather than a Jobs object."""
         self.interviews = interviews
         self.agents = agents
@@ -143,17 +213,19 @@ class JobsPrompts:
         self._price_lookup = c.fetch_prices()
         return self._price_lookup
 
-    def _process_one_invigilator(
+    def _process_one_invigilator(
+        self, invigilator: "Invigilator", interview_index: int, iterations: int = 1
+    ) -> dict:
         """Process a single invigilator and return a dictionary with all needed data fields."""
         prompts = invigilator.get_prompts()
         user_prompt = prompts["user_prompt"]
         system_prompt = prompts["system_prompt"]
-
+
         agent_index = self._agent_lookup[invigilator.agent]
         scenario_index = self._scenario_lookup[invigilator.scenario]
         model = invigilator.model.model
         question_name = invigilator.question.question_name
-
+
         # Calculate prompt cost
         prompt_cost = self.estimate_prompt_cost(
             system_prompt=system_prompt,
@@ -163,7 +235,7 @@ class JobsPrompts:
             model=model,
         )
         cost = prompt_cost["cost_usd"]
-
+
         # Generate cache keys for each iteration
         cache_keys = []
         for iteration in range(iterations):
@@ -175,7 +247,7 @@ class JobsPrompts:
                 iteration=iteration,
             )
             cache_keys.append(cache_key)
-
+
         d = {
             "user_prompt": user_prompt,
             "system_prompt": system_prompt,
@@ -200,7 +272,7 @@ class JobsPrompts:
         dataset_of_prompts = {k: [] for k in self.relevant_keys}
 
         interviews = self.interviews
-
+
         # Process each interview and invigilator
         for interview_index, interview in enumerate(interviews):
             invigilators = [
@@ -210,11 +282,13 @@ class JobsPrompts:
 
             for invigilator in invigilators:
                 # Process the invigilator and get all data as a dictionary
-                data = self._process_one_invigilator(
+                data = self._process_one_invigilator(
+                    invigilator, interview_index, iterations
+                )
                 for k in self.relevant_keys:
                     dataset_of_prompts[k].append(data[k])
-
-        return Dataset([{k:dataset_of_prompts[k]} for k in self.relevant_keys])
+
+        return Dataset([{k: dataset_of_prompts[k]} for k in self.relevant_keys])
 
     @staticmethod
     def estimate_prompt_cost(
@@ -230,13 +304,13 @@ class JobsPrompts:
             user_prompt=user_prompt,
             price_lookup=price_lookup,
             inference_service=inference_service,
-            model=model
+            model=model,
        )()
-
+
     @staticmethod
     def _extract_prompt_details(invigilator: FetchInvigilator) -> dict:
         """Extracts the prompt details from the invigilator.
-
+
         >>> from edsl.invigilators import InvigilatorAI
         >>> invigilator = InvigilatorAI.example()
         >>> JobsPrompts._extract_prompt_details(invigilator)
@@ -276,11 +350,13 @@ class JobsPrompts:
         ]
         for invigilator in invigilators:
             prompt_details = self._extract_prompt_details(invigilator)
-            prompt_cost = self.estimate_prompt_cost(
+            prompt_cost = self.estimate_prompt_cost(
+                **prompt_details, price_lookup=price_lookup
+            )
             price_estimates = {
-
-
-
+                "estimated_input_tokens": prompt_cost["input_tokens"],
+                "estimated_output_tokens": prompt_cost["output_tokens"],
+                "estimated_cost_usd": prompt_cost["cost_usd"],
             }
             data.append({**price_estimates, **prompt_details})
 
@@ -293,14 +369,18 @@ class JobsPrompts:
                     "model": item["model"],
                     "estimated_cost_usd": 0,
                     "estimated_input_tokens": 0,
-                    "estimated_output_tokens": 0
+                    "estimated_output_tokens": 0,
                 }
-
+
             # Accumulate values
             model_groups[key]["estimated_cost_usd"] += item["estimated_cost_usd"]
-            model_groups[key]["estimated_input_tokens"] += item[
-
-
+            model_groups[key]["estimated_input_tokens"] += item[
+                "estimated_input_tokens"
+            ]
+            model_groups[key]["estimated_output_tokens"] += item[
+                "estimated_output_tokens"
+            ]
+
         # Apply iterations and convert to list
         estimated_costs_by_model = []
         for group_data in model_groups.values():
@@ -345,4 +425,5 @@ class JobsPrompts:
 
 if __name__ == "__main__":
     import doctest
+
     doctest.testmod(optionflags=doctest.ELLIPSIS)
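The practical effect of the `PromptCostEstimator` changes is a three-tier price resolution: an exact `(service, model)` lookup, then the highest price listed for the same service, then a hard default. A minimal standalone sketch of that chain (the `price_lookup` shape follows the diff above; the services, models, and prices here are invented for illustration, and real data comes from Coop's `fetch_prices()`):

```python
from typing import Literal

DEFAULT_PRICE_PER_TOKEN = 1.0 / 1_000_000  # $1.00 / 1M tokens, matching the warning text

# Invented entries for illustration only
price_lookup = {
    ("openai", "gpt-4o"): {
        "input": {"service_stated_token_price": 2.50, "service_stated_token_qty": 1_000_000}
    },
    ("openai", "gpt-4o-mini"): {
        "input": {"service_stated_token_price": 0.15, "service_stated_token_qty": 1_000_000}
    },
}

def resolve_input_price(
    service: str, model: str
) -> tuple[float, Literal["price_lookup", "highest_price_for_service", "default"]]:
    # Tier 1: exact (service, model) match
    try:
        p = price_lookup[(service, model)]["input"]
        return p["service_stated_token_price"] / p["service_stated_token_qty"], "price_lookup"
    except KeyError:
        pass
    # Tier 2: highest known price for the same service (a conservative overestimate)
    candidates = [
        p["input"]["service_stated_token_price"] / p["input"]["service_stated_token_qty"]
        for (svc, _), p in price_lookup.items()
        if svc == service and "input" in p
    ]
    if candidates:
        return max(candidates), "highest_price_for_service"
    # Tier 3: hard default
    return DEFAULT_PRICE_PER_TOKEN, "default"

print(resolve_input_price("openai", "gpt-4o"))          # exact hit -> "price_lookup"
print(resolve_input_price("openai", "some-new-model"))  # -> "highest_price_for_service"
print(resolve_input_price("anthropic", "claude"))       # unknown service -> "default"
```

The source tag from the second tuple element is what `__call__` now surfaces as `input_price_source` and `output_price_source`, so downstream consumers can tell an exact price from an estimate.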
edsl/jobs/jobs_remote_inference_logger.py
CHANGED

@@ -30,6 +30,8 @@ class JobsInfo:
     error_report_url: str = None
     results_uuid: str = None
     results_url: str = None
+    completed_interviews: int = None
+    failed_interviews: int = None
 
     pretty_names = {
         "job_uuid": "Job UUID",
@@ -53,6 +55,8 @@ class JobLogger(ABC):
             "error_report_url",
             "results_uuid",
             "results_url",
+            "completed_interviews",
+            "failed_interviews",
         ],
         value: str,
     ):
edsl/jobs/jobs_runner_status.py
CHANGED

@@ -10,7 +10,7 @@ from typing import Any, Dict, Optional, TYPE_CHECKING
 from uuid import UUID
 
 if TYPE_CHECKING:
-    from .
+    from .jobs import Jobs
 
 
 @dataclass
@@ -65,14 +65,14 @@ class StatisticsTracker:
 class JobsRunnerStatusBase(ABC):
     def __init__(
         self,
-
+        jobs: "Jobs",
         n: int,
         refresh_rate: float = 1,
         endpoint_url: Optional[str] = "http://localhost:8000",
         job_uuid: Optional[UUID] = None,
         api_key: str = None,
     ):
-        self.
+        self.jobs = jobs
         self.job_uuid = job_uuid
         self.base_url = f"{endpoint_url}"
         self.refresh_rate = refresh_rate
@@ -86,10 +86,10 @@ class JobsRunnerStatusBase(ABC):
             "unfixed_exceptions",
             "throughput",
         ]
-        self.num_total_interviews = n * len(self.
+        self.num_total_interviews = n * len(self.jobs)
 
         self.distinct_models = list(
-            set(model.model for model in self.
+            set(model.model for model in self.jobs.models)
         )
 
         self.stats_tracker = StatisticsTracker(
@@ -151,26 +151,31 @@ class JobsRunnerStatusBase(ABC):
         }
 
         model_queues = {}
-        #
-
-
-
-
-
-
-
-
-        "
-        "
-
-
-
-
-
-
-        "
-
-
+        # Check if bucket collection exists and is not empty
+        if (hasattr(self.jobs, 'run_config') and
+            hasattr(self.jobs.run_config, 'environment') and
+            hasattr(self.jobs.run_config.environment, 'bucket_collection') and
+            self.jobs.run_config.environment.bucket_collection):
+
+            for model, bucket in self.jobs.run_config.environment.bucket_collection.items():
+                model_name = model.model
+                model_queues[model_name] = {
+                    "language_model_name": model_name,
+                    "requests_bucket": {
+                        "completed": bucket.requests_bucket.num_released,
+                        "requested": bucket.requests_bucket.num_requests,
+                        "tokens_returned": bucket.requests_bucket.tokens_returned,
+                        "target_rate": round(bucket.requests_bucket.target_rate, 1),
+                        "current_rate": round(bucket.requests_bucket.get_throughput(), 1),
+                    },
+                    "tokens_bucket": {
+                        "completed": bucket.tokens_bucket.num_released,
+                        "requested": bucket.tokens_bucket.num_requests,
+                        "tokens_returned": bucket.tokens_bucket.tokens_returned,
+                        "target_rate": round(bucket.tokens_bucket.target_rate, 1),
+                        "current_rate": round(bucket.tokens_bucket.get_throughput(), 1),
+                    },
+                }
         status_dict["language_model_queues"] = model_queues
         return status_dict
 
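The new `model_queues` block guards a deep attribute chain with `hasattr` before touching `bucket_collection`. A compact equivalent of that guard, shown only to illustrate the pattern (the attribute names follow the diff; this helper is hypothetical, not part of edsl):

```python
def bucket_collection_of(jobs):
    # Walk jobs.run_config.environment.bucket_collection, tolerating any
    # missing link in the chain, and fall back to an empty mapping.
    run_config = getattr(jobs, "run_config", None)
    environment = getattr(run_config, "environment", None)
    return getattr(environment, "bucket_collection", None) or {}
```

Each bucket then contributes the same five per-queue fields shown above (completed, requested, tokens_returned, target_rate, current_rate) for both its request and token buckets.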
edsl/jobs/progress_bar_manager.py
ADDED

@@ -0,0 +1,79 @@
+"""
+Progress bar management for asynchronous job execution.
+
+This module provides a context manager for handling progress bar setup and thread
+management during job execution. It coordinates the display and updating of progress
+bars, particularly for remote tracking via the Expected Parrot API.
+"""
+
+import threading
+import warnings
+
+from ..coop import Coop
+from .jobs_runner_status import JobsRunnerStatus
+
+
+class ProgressBarManager:
+    """Context manager for handling progress bar setup and thread management.
+
+    This class manages the progress bar display and updating during job execution,
+    particularly for remote tracking via the Expected Parrot API.
+
+    It handles:
+    1. Setting up a status tracking object
+    2. Creating and managing a background thread for progress updates
+    3. Properly cleaning up resources when execution completes
+    """
+
+    def __init__(self, jobs, run_config, parameters):
+        self.parameters = parameters
+        self.jobs = jobs
+
+        # Set up progress tracking
+        coop = Coop()
+        endpoint_url = coop.get_progress_bar_url()
+
+        # Set up jobs status object
+        params = {
+            "jobs": jobs,
+            "n": parameters.n,
+            "endpoint_url": endpoint_url,
+            "job_uuid": parameters.job_uuid,
+        }
+
+        # If the jobs_runner_status is already set, use it directly
+        if run_config.environment.jobs_runner_status is not None:
+            self.jobs_runner_status = run_config.environment.jobs_runner_status
+        else:
+            # Otherwise create a new one
+            self.jobs_runner_status = JobsRunnerStatus(**params)
+
+        # Store on run_config for use by other components
+        run_config.environment.jobs_runner_status = self.jobs_runner_status
+
+        self.progress_thread = None
+        self.stop_event = threading.Event()
+
+    def __enter__(self):
+        if self.parameters.progress_bar and self.jobs_runner_status.has_ep_api_key():
+            self.jobs_runner_status.setup()
+            self.progress_thread = threading.Thread(
+                target=self._run_progress_bar,
+                args=(self.stop_event, self.jobs_runner_status)
+            )
+            self.progress_thread.start()
+        elif self.parameters.progress_bar:
+            warnings.warn(
+                "You need an Expected Parrot API key to view job progress bars."
+            )
+        return self.stop_event
+
+    def __exit__(self, exc_type, exc_val, exc_tb):
+        self.stop_event.set()
+        if self.progress_thread is not None:
+            self.progress_thread.join()
+
+    @staticmethod
+    def _run_progress_bar(stop_event, jobs_runner_status):
+        """Runs the progress bar in a separate thread."""
+        jobs_runner_status.update_progress(stop_event)
edsl/jobs/remote_inference.py
CHANGED

@@ -1,3 +1,4 @@
+import re
 from typing import Optional, Union, Literal, TYPE_CHECKING, NewType, Callable, Any
 from dataclasses import dataclass
 from ..coop import CoopServerResponseError
@@ -112,13 +113,18 @@ class JobsRemoteInferenceHandler:
         )
         logger.add_info("job_uuid", job_uuid)
 
+        remote_inference_url = self.remote_inference_url
+        if "localhost" in remote_inference_url:
+            remote_inference_url = remote_inference_url.replace("8000", "1234")
         logger.update(
-            f"Job details are available at your Coop account. [Go to Remote Inference page]({
+            f"Job details are available at your Coop account. [Go to Remote Inference page]({remote_inference_url})",
             status=JobsStatus.RUNNING,
         )
         progress_bar_url = (
             f"{self.expected_parrot_url}/home/remote-job-progress/{job_uuid}"
         )
+        if "localhost" in progress_bar_url:
+            progress_bar_url = progress_bar_url.replace("8000", "1234")
         logger.add_info("progress_bar_url", progress_bar_url)
         logger.update(
             f"View job progress [here]({progress_bar_url})", status=JobsStatus.RUNNING
@@ -200,10 +206,35 @@ class JobsRemoteInferenceHandler:
             status=JobsStatus.FAILED,
         )
 
+    def _handle_partially_failed_job_interview_details(
+        self, job_info: RemoteJobInfo, remote_job_data: RemoteInferenceResponse
+    ) -> None:
+        "Extracts the interview details from the remote job data."
+        try:
+            # Job details is a string of the form "64 out of 1,758 interviews failed"
+            job_details = remote_job_data.get("latest_failure_description")
+
+            text_without_commas = job_details.replace(",", "")
+
+            # Find all numbers in the text
+            numbers = [int(num) for num in re.findall(r"\d+", text_without_commas)]
+
+            failed = numbers[0]
+            total = numbers[1]
+            completed = total - failed
+
+            job_info.logger.add_info("completed_interviews", completed)
+            job_info.logger.add_info("failed_interviews", failed)
+        # This is mainly helpful metadata, and any errors here should not stop the code
+        except:
+            pass
+
     def _handle_partially_failed_job(
         self, job_info: RemoteJobInfo, remote_job_data: RemoteInferenceResponse
     ) -> None:
         "Handles a partially failed job by logging the error and updating the job status."
+        self._handle_partially_failed_job_interview_details(job_info, remote_job_data)
+
         latest_error_report_url = remote_job_data.get("latest_error_report_url")
 
         if latest_error_report_url:
@@ -244,6 +275,8 @@ class JobsRemoteInferenceHandler:
         job_info.logger.add_info("results_uuid", results_uuid)
         results = object_fetcher(results_uuid, expected_object_type="results")
         results_url = remote_job_data.get("results_url")
+        if "localhost" in results_url:
+            results_url = results_url.replace("8000", "1234")
         job_info.logger.add_info("results_url", results_url)
 
         if job_status == "completed":
@@ -256,6 +289,7 @@ class JobsRemoteInferenceHandler:
             f"View partial results [here]({results_url})",
             status=JobsStatus.PARTIALLY_FAILED,
         )
+
         results.job_uuid = job_info.job_uuid
         results.results_uuid = results_uuid
         return results
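The new `_handle_partially_failed_job_interview_details` helper leans on the server's failure description being a fixed-format sentence. Rendering the same extraction standalone (the sample string is the format quoted in the diff's own comment):

```python
import re

description = "64 out of 1,758 interviews failed"

# Strip thousands separators, then pull every integer out in order.
numbers = [int(n) for n in re.findall(r"\d+", description.replace(",", ""))]
failed, total = numbers[0], numbers[1]
completed = total - failed

print(failed, total, completed)  # 64 1758 1694
```

The counts feed the two new `JobsInfo` fields above, and per the inline comment the broad `except: pass` is deliberate: the numbers are advisory metadata, so a format change on the server should never abort result fetching.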
edsl/key_management/key_lookup_builder.py
CHANGED

@@ -2,6 +2,7 @@ from typing import Optional, TYPE_CHECKING
 import os
 from functools import lru_cache
 import textwrap
+import requests
 
 if TYPE_CHECKING:
     from ..coop import Coop
@@ -255,7 +256,11 @@ class KeyLookupBuilder:
         return dict(list(os.environ.items()))
 
     def _coop_key_value_pairs(self):
-
+        try:
+            return dict(list(self.coop.fetch_rate_limit_config_vars().items()))
+        except requests.ConnectionError:
+            # If connection fails, return empty dict instead of raising error
+            return {}
 
     def _config_key_value_pairs(self):
         from ..config import CONFIG