edsl 0.1.54__py3-none-any.whl → 0.1.56__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- edsl/__init__.py +8 -1
- edsl/__init__original.py +134 -0
- edsl/__version__.py +1 -1
- edsl/agents/agent.py +29 -0
- edsl/agents/agent_list.py +36 -1
- edsl/base/base_class.py +281 -151
- edsl/base/data_transfer_models.py +15 -4
- edsl/buckets/__init__.py +8 -3
- edsl/buckets/bucket_collection.py +9 -3
- edsl/buckets/model_buckets.py +4 -2
- edsl/buckets/token_bucket.py +2 -2
- edsl/buckets/token_bucket_client.py +5 -3
- edsl/caching/cache.py +131 -62
- edsl/caching/cache_entry.py +70 -58
- edsl/caching/sql_dict.py +17 -0
- edsl/cli.py +99 -0
- edsl/config/config_class.py +16 -0
- edsl/conversation/__init__.py +31 -0
- edsl/coop/coop.py +276 -242
- edsl/coop/coop_jobs_objects.py +59 -0
- edsl/coop/coop_objects.py +29 -0
- edsl/coop/coop_regular_objects.py +26 -0
- edsl/coop/utils.py +24 -19
- edsl/dataset/dataset.py +338 -101
- edsl/dataset/dataset_operations_mixin.py +216 -180
- edsl/db_list/sqlite_list.py +349 -0
- edsl/inference_services/__init__.py +40 -5
- edsl/inference_services/exceptions.py +11 -0
- edsl/inference_services/services/anthropic_service.py +5 -2
- edsl/inference_services/services/aws_bedrock.py +6 -2
- edsl/inference_services/services/azure_ai.py +6 -2
- edsl/inference_services/services/google_service.py +7 -3
- edsl/inference_services/services/mistral_ai_service.py +6 -2
- edsl/inference_services/services/open_ai_service.py +6 -2
- edsl/inference_services/services/perplexity_service.py +6 -2
- edsl/inference_services/services/test_service.py +94 -5
- edsl/interviews/answering_function.py +167 -59
- edsl/interviews/interview.py +124 -72
- edsl/interviews/interview_task_manager.py +10 -0
- edsl/interviews/request_token_estimator.py +8 -0
- edsl/invigilators/invigilators.py +35 -13
- edsl/jobs/async_interview_runner.py +146 -104
- edsl/jobs/data_structures.py +6 -4
- edsl/jobs/decorators.py +61 -0
- edsl/jobs/fetch_invigilator.py +61 -18
- edsl/jobs/html_table_job_logger.py +14 -2
- edsl/jobs/jobs.py +180 -104
- edsl/jobs/jobs_component_constructor.py +2 -2
- edsl/jobs/jobs_interview_constructor.py +2 -0
- edsl/jobs/jobs_pricing_estimation.py +154 -113
- edsl/jobs/jobs_remote_inference_logger.py +4 -0
- edsl/jobs/jobs_runner_status.py +30 -25
- edsl/jobs/progress_bar_manager.py +79 -0
- edsl/jobs/remote_inference.py +35 -1
- edsl/key_management/key_lookup_builder.py +6 -1
- edsl/language_models/language_model.py +110 -12
- edsl/language_models/model.py +10 -3
- edsl/language_models/price_manager.py +176 -71
- edsl/language_models/registry.py +5 -0
- edsl/notebooks/notebook.py +77 -10
- edsl/questions/VALIDATION_README.md +134 -0
- edsl/questions/__init__.py +24 -1
- edsl/questions/exceptions.py +21 -0
- edsl/questions/question_dict.py +201 -16
- edsl/questions/question_multiple_choice_with_other.py +624 -0
- edsl/questions/question_registry.py +2 -1
- edsl/questions/templates/multiple_choice_with_other/__init__.py +0 -0
- edsl/questions/templates/multiple_choice_with_other/answering_instructions.jinja +15 -0
- edsl/questions/templates/multiple_choice_with_other/question_presentation.jinja +17 -0
- edsl/questions/validation_analysis.py +185 -0
- edsl/questions/validation_cli.py +131 -0
- edsl/questions/validation_html_report.py +404 -0
- edsl/questions/validation_logger.py +136 -0
- edsl/results/result.py +115 -46
- edsl/results/results.py +702 -171
- edsl/scenarios/construct_download_link.py +16 -3
- edsl/scenarios/directory_scanner.py +226 -226
- edsl/scenarios/file_methods.py +5 -0
- edsl/scenarios/file_store.py +150 -9
- edsl/scenarios/handlers/__init__.py +5 -1
- edsl/scenarios/handlers/mp4_file_store.py +104 -0
- edsl/scenarios/handlers/webm_file_store.py +104 -0
- edsl/scenarios/scenario.py +120 -101
- edsl/scenarios/scenario_list.py +800 -727
- edsl/scenarios/scenario_list_gc_test.py +146 -0
- edsl/scenarios/scenario_list_memory_test.py +214 -0
- edsl/scenarios/scenario_list_source_refactor.md +35 -0
- edsl/scenarios/scenario_selector.py +5 -4
- edsl/scenarios/scenario_source.py +1990 -0
- edsl/scenarios/tests/test_scenario_list_sources.py +52 -0
- edsl/surveys/survey.py +22 -0
- edsl/tasks/__init__.py +4 -2
- edsl/tasks/task_history.py +198 -36
- edsl/tests/scenarios/test_ScenarioSource.py +51 -0
- edsl/tests/scenarios/test_scenario_list_sources.py +51 -0
- edsl/utilities/__init__.py +2 -1
- edsl/utilities/decorators.py +121 -0
- edsl/utilities/memory_debugger.py +1010 -0
- {edsl-0.1.54.dist-info → edsl-0.1.56.dist-info}/METADATA +51 -76
- {edsl-0.1.54.dist-info → edsl-0.1.56.dist-info}/RECORD +103 -79
- edsl/jobs/jobs_runner_asyncio.py +0 -281
- edsl/language_models/unused/fake_openai_service.py +0 -60
- {edsl-0.1.54.dist-info → edsl-0.1.56.dist-info}/LICENSE +0 -0
- {edsl-0.1.54.dist-info → edsl-0.1.56.dist-info}/WHEEL +0 -0
- {edsl-0.1.54.dist-info → edsl-0.1.56.dist-info}/entry_points.txt +0 -0
edsl/jobs/jobs_pricing_estimation.py CHANGED

```diff
@@ -1,7 +1,8 @@
 import logging
 import math
 
-from typing import List, TYPE_CHECKING, Union, Literal
+from typing import List, TYPE_CHECKING, Union, Literal, Dict
+from collections import namedtuple
 
 if TYPE_CHECKING:
     from .jobs import Jobs
```
```diff
@@ -20,8 +21,8 @@ logger = logging.getLogger(__name__)
 
 class PromptCostEstimator:
 
-
-
+    DEFAULT_INPUT_PRICE_PER_MILLION_TOKENS = 1.0
+    DEFAULT_OUTPUT_PRICE_PER_MILLION_TOKENS = 1.0
     CHARS_PER_TOKEN = 4
     OUTPUT_TOKENS_PER_INPUT_TOKEN = 0.75
     PIPING_MULTIPLIER = 2
```
```diff
@@ -48,81 +49,90 @@ class PromptCostEstimator:
         return PromptCostEstimator.PIPING_MULTIPLIER
         return 1
 
-
-
-
-
-
-    def relevant_prices(self):
-        try:
-            return self.price_lookup[self.key]
-        except KeyError:
-            return {}
-
-    def _get_highest_price_for_service(self, price_type: str) -> Union[float, None]:
-        """Returns the highest price per token for a given service and price type (input/output).
+    def _get_fallback_price(self, inference_service: str) -> Dict:
+        """
+        Get fallback prices for a service.
+        - First fallback: The highest input and output prices for that service from the price lookup.
+        - Second fallback: $1.00 per million tokens (for both input and output).
 
         Args:
-
+            inference_service (str): The inference service name
 
         Returns:
-
+            Dict: Price information
         """
-
-
-
+        PriceEntry = namedtuple("PriceEntry", ["tokens_per_usd", "price_info"])
+
+        service_prices = [
+            prices
             for (service, _), prices in self.price_lookup.items()
-            if service ==
+            if service == inference_service
         ]
-        return max(prices_for_service) if prices_for_service else None
 
-
-
-
-
-
-
-
-
-
-
-        if highest_price is not None:
-            import warnings
-
-            warnings.warn(
-                f"Price data not found for {self.key}. Using highest available input price for {self.inference_service}: ${highest_price:.6f} per token"
-            )
-            return highest_price, "highest_price_for_service"
-        import warnings
+        default_input_price_info = {
+            "one_usd_buys": 1_000_000,
+            "service_stated_token_qty": 1_000_000,
+            "service_stated_token_price": self.DEFAULT_INPUT_PRICE_PER_MILLION_TOKENS,
+        }
+        default_output_price_info = {
+            "one_usd_buys": 1_000_000,
+            "service_stated_token_qty": 1_000_000,
+            "service_stated_token_price": self.DEFAULT_OUTPUT_PRICE_PER_MILLION_TOKENS,
+        }
 
-
-
-
-        return self.DEFAULT_INPUT_PRICE_PER_TOKEN, "default"
+        # Find the most expensive price entries (lowest tokens per USD)
+        input_price_info = default_input_price_info
+        output_price_info = default_output_price_info
 
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
+        input_prices = [
+            PriceEntry(float(p["input"]["one_usd_buys"]), p["input"])
+            for p in service_prices
+            if "input" in p
+        ]
+        if input_prices:
+            input_price_info = min(
+                input_prices, key=lambda price: price.tokens_per_usd
+            ).price_info
+
+        output_prices = [
+            PriceEntry(float(p["output"]["one_usd_buys"]), p["output"])
+            for p in service_prices
+            if "output" in p
+        ]
+        if output_prices:
+            output_price_info = min(
+                output_prices, key=lambda price: price.tokens_per_usd
+            ).price_info
 
-
-
-
-
+        return {
+            "input": input_price_info,
+            "output": output_price_info,
+        }
+
+    def get_price(self, inference_service: str, model: str) -> Dict:
+        """Get the price information for a specific service and model."""
+        key = (inference_service, model)
+        return self.price_lookup.get(key) or self._get_fallback_price(inference_service)
+
+    def get_price_per_million_tokens(
+        self,
+        relevant_prices: Dict,
+        token_type: Literal["input", "output"],
+    ) -> Dict:
+        """
+        Get the price per million tokens for a specific service, model, and token type.
+        """
+        service_price = relevant_prices[token_type]["service_stated_token_price"]
+        service_qty = relevant_prices[token_type]["service_stated_token_qty"]
+
+        if service_qty == 1_000_000:
+            price_per_million_tokens = service_price
+        elif service_qty == 1_000:
+            price_per_million_tokens = service_price * 1_000
+        else:
+            price_per_token = service_price / service_qty
+            price_per_million_tokens = round(price_per_token * 1_000_000, 10)
+        return price_per_million_tokens
 
     def __call__(self):
         user_prompt_chars = len(str(self.user_prompt)) * self.get_piping_multiplier(
```
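For readers skimming the diff, the unit normalization in `get_price_per_million_tokens` is worth restating: the lookup states a price per some token quantity, and the method rescales it to a per-million figure. A minimal standalone sketch of the same arithmetic, with hypothetical prices:

```python
# Standalone restatement of the normalization in get_price_per_million_tokens.
# The function name and the sample prices below are hypothetical.
def price_per_million(service_stated_token_price: float, service_stated_token_qty: int) -> float:
    if service_stated_token_qty == 1_000_000:
        return service_stated_token_price          # already stated per million
    elif service_stated_token_qty == 1_000:
        return service_stated_token_price * 1_000  # per-thousand -> per-million
    # General case: derive the per-token price, then scale up.
    return round(service_stated_token_price / service_stated_token_qty * 1_000_000, 10)

assert price_per_million(0.25, 1_000_000) == 0.25  # $0.25 per 1M tokens stays as-is
assert price_per_million(0.5, 1_000) == 500.0      # $0.50 per 1K tokens -> $500 per 1M
assert price_per_million(0.01, 2_000) == 5.0       # odd quantity falls through to the general case
```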
```diff
@@ -135,20 +145,28 @@ class PromptCostEstimator:
         input_tokens = (user_prompt_chars + system_prompt_chars) // self.CHARS_PER_TOKEN
         output_tokens = math.ceil(self.OUTPUT_TOKENS_PER_INPUT_TOKEN * input_tokens)
 
-
-        output_price_per_token, output_price_source = self.output_price_per_token()
+        relevant_prices = self.get_price(self.inference_service, self.model)
 
-
-
-            + output_tokens * output_price_per_token
+        input_price_per_million_tokens = self.get_price_per_million_tokens(
+            relevant_prices, "input"
         )
+        output_price_per_million_tokens = self.get_price_per_million_tokens(
+            relevant_prices, "output"
+        )
+
+        input_price_per_token = input_price_per_million_tokens / 1_000_000
+        output_price_per_token = output_price_per_million_tokens / 1_000_000
+
+        input_cost = input_tokens * input_price_per_token
+        output_cost = output_tokens * output_price_per_token
+        cost = input_cost + output_cost
         return {
-            "
-            "
+            "input_price_per_million_tokens": input_price_per_million_tokens,
+            "output_price_per_million_tokens": output_price_per_million_tokens,
             "input_tokens": input_tokens,
-            "output_price_source": output_price_source,
             "output_tokens": output_tokens,
-            "
+            "input_cost_usd": input_cost,
+            "output_cost_usd": output_cost,
             "cost_usd": cost,
         }
 
```
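As a sanity check on the rewritten `__call__`, the heuristic can be traced by hand. A worked example with made-up prompt sizes (no piping, so the multiplier is 1) under the $1.00-per-million fallback price:

```python
import math

# Hypothetical prompt sizes; the constants 4 and 0.75 are CHARS_PER_TOKEN and
# OUTPUT_TOKENS_PER_INPUT_TOKEN from the class above.
user_prompt_chars = 400
system_prompt_chars = 100

input_tokens = (user_prompt_chars + system_prompt_chars) // 4   # 125
output_tokens = math.ceil(0.75 * input_tokens)                  # ceil(93.75) = 94

# With the fallback price of $1.00 per million tokens on both sides:
input_cost = input_tokens * (1.0 / 1_000_000)
output_cost = output_tokens * (1.0 / 1_000_000)
print(input_tokens, output_tokens, round(input_cost + output_cost, 9))  # 125 94 0.000219
```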
```diff
@@ -328,6 +346,26 @@ class JobsPrompts:
             "model": model,
         }
 
+    def process_token_type(self, item: dict, token_type: str) -> tuple:
+        """
+        Helper function to process a single token type (input or output) for price estimation.
+        """
+        price = item[f"estimated_{token_type}_price_per_million_tokens"]
+        tokens = item[f"estimated_{token_type}_tokens"]
+        cost = item[f"estimated_{token_type}_cost_usd"]
+
+        return (
+            (item["inference_service"], item["model"], token_type, price),
+            {
+                "inference_service": item["inference_service"],
+                "model": item["model"],
+                "token_type": token_type,
+                "price_per_million_tokens": price,
+                "tokens": tokens,
+                "cost_usd": cost,
+            },
+        )
+
     def estimate_job_cost_from_external_prices(
         self, price_lookup: dict, iterations: int = 1
     ) -> dict:
```
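The new `process_token_type` helper turns one prompt row into a grouping key plus a summable record, so rows that agree on service, model, token type, and per-million price collapse into one line of the cost report. A sketch of the key it builds, with hypothetical sample values:

```python
# Hypothetical prompt row; field names follow the price_estimates dict in the diff.
item = {
    "inference_service": "openai",
    "model": "gpt-4o",
    "estimated_input_price_per_million_tokens": 2.5,
    "estimated_input_tokens": 120,
    "estimated_input_cost_usd": 0.0003,  # 120 tokens at $2.50 per million
}

# The grouping key for the "input" side of this row:
key = (item["inference_service"], item["model"], "input",
       item["estimated_input_price_per_million_tokens"])
print(key)  # ('openai', 'gpt-4o', 'input', 2.5)
```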
```diff
@@ -341,9 +379,9 @@ class JobsPrompts:
         - 1 token = 4 characters.
         - For each prompt, output tokens = input tokens * 0.75, rounded up to the nearest integer.
         """
-
+        # Collect all prompt data
         data = []
-        for interview in interviews:
+        for interview in self.interviews:
             invigilators = [
                 FetchInvigilator(interview)(question)
                 for question in self.survey.questions
```
```diff
@@ -354,59 +392,62 @@ class JobsPrompts:
                     **prompt_details, price_lookup=price_lookup
                 )
                 price_estimates = {
+                    "estimated_input_price_per_million_tokens": prompt_cost[
+                        "input_price_per_million_tokens"
+                    ],
+                    "estimated_output_price_per_million_tokens": prompt_cost[
+                        "output_price_per_million_tokens"
+                    ],
                     "estimated_input_tokens": prompt_cost["input_tokens"],
                     "estimated_output_tokens": prompt_cost["output_tokens"],
+                    "estimated_input_cost_usd": prompt_cost["input_cost_usd"],
+                    "estimated_output_cost_usd": prompt_cost["output_cost_usd"],
                     "estimated_cost_usd": prompt_cost["cost_usd"],
                 }
-                data.append(
+                data.append(
+                    {
+                        **prompt_details,
+                        **price_estimates,
+                    }
+                )
 
-
+        # Group by service, model, token type, and price
+        detailed_groups = {}
         for item in data:
-
-
-
-
-
-                "
-                "
-
-
-
-
-
-
-
-                ]
-                model_groups[key]["estimated_output_tokens"] += item[
-                    "estimated_output_tokens"
-                ]
-
-        # Apply iterations and convert to list
-        estimated_costs_by_model = []
-        for group_data in model_groups.values():
-            group_data["estimated_cost_usd"] *= iterations
-            group_data["estimated_input_tokens"] *= iterations
-            group_data["estimated_output_tokens"] *= iterations
-            estimated_costs_by_model.append(group_data)
+            for token_type in ["input", "output"]:
+                key, group_data = self.process_token_type(item, token_type)
+                if key not in detailed_groups:
+                    detailed_groups[key] = group_data
+                else:
+                    detailed_groups[key]["tokens"] += group_data["tokens"]
+                    detailed_groups[key]["cost_usd"] += group_data["cost_usd"]
+
+        # Apply iterations and prepare final output
+        detailed_costs = []
+        for group in detailed_groups.values():
+            group["tokens"] *= iterations
+            group["cost_usd"] *= iterations
+            detailed_costs.append(group)
 
         # Calculate totals
-        estimated_total_cost = sum(
-            model["estimated_cost_usd"] for model in estimated_costs_by_model
-        )
+        estimated_total_cost = sum(group["cost_usd"] for group in detailed_costs)
         estimated_total_input_tokens = sum(
-
+            group["tokens"]
+            for group in detailed_costs
+            if group["token_type"] == "input"
         )
         estimated_total_output_tokens = sum(
-
+            group["tokens"]
+            for group in detailed_costs
+            if group["token_type"] == "output"
         )
 
         output = {
             "estimated_total_cost_usd": estimated_total_cost,
             "estimated_total_input_tokens": estimated_total_input_tokens,
             "estimated_total_output_tokens": estimated_total_output_tokens,
-            "
+            "detailed_costs": detailed_costs,
         }
-
         return output
 
     def estimate_job_cost(self, iterations: int = 1) -> dict:
```
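The grouping loop above merges records that share a key by summing their token and cost fields. A self-contained sketch of that merge with two hypothetical rows for the same service, model, and price:

```python
# Two (key, group_data) pairs as process_token_type would produce them;
# the service, model, and price values are made up.
rows = [
    (("openai", "gpt-4o", "input", 2.5),
     {"token_type": "input", "tokens": 100, "cost_usd": 0.00025}),
    (("openai", "gpt-4o", "input", 2.5),
     {"token_type": "input", "tokens": 50, "cost_usd": 0.000125}),
]

detailed_groups = {}
for key, group_data in rows:
    if key not in detailed_groups:
        detailed_groups[key] = dict(group_data)
    else:
        detailed_groups[key]["tokens"] += group_data["tokens"]
        detailed_groups[key]["cost_usd"] += group_data["cost_usd"]

total = sum(group["cost_usd"] for group in detailed_groups.values())
print(len(detailed_groups), round(total, 9))  # 1 0.000375 — one merged group, not two rows
```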
edsl/jobs/jobs_remote_inference_logger.py CHANGED

```diff
@@ -30,6 +30,8 @@ class JobsInfo:
     error_report_url: str = None
     results_uuid: str = None
     results_url: str = None
+    completed_interviews: int = None
+    failed_interviews: int = None
 
     pretty_names = {
         "job_uuid": "Job UUID",
```
```diff
@@ -53,6 +55,8 @@ class JobLogger(ABC):
             "error_report_url",
             "results_uuid",
             "results_url",
+            "completed_interviews",
+            "failed_interviews",
         ],
         value: str,
     ):
```
edsl/jobs/jobs_runner_status.py CHANGED
```diff
@@ -10,7 +10,7 @@ from typing import Any, Dict, Optional, TYPE_CHECKING
 from uuid import UUID
 
 if TYPE_CHECKING:
-    from .
+    from .jobs import Jobs
 
 
 @dataclass
```
```diff
@@ -65,14 +65,14 @@ class StatisticsTracker:
 class JobsRunnerStatusBase(ABC):
     def __init__(
         self,
-
+        jobs: "Jobs",
         n: int,
         refresh_rate: float = 1,
         endpoint_url: Optional[str] = "http://localhost:8000",
         job_uuid: Optional[UUID] = None,
         api_key: str = None,
     ):
-        self.
+        self.jobs = jobs
         self.job_uuid = job_uuid
         self.base_url = f"{endpoint_url}"
         self.refresh_rate = refresh_rate
```
```diff
@@ -86,10 +86,10 @@ class JobsRunnerStatusBase(ABC):
             "unfixed_exceptions",
             "throughput",
         ]
-        self.num_total_interviews = n * len(self.
+        self.num_total_interviews = n * len(self.jobs)
 
         self.distinct_models = list(
-            set(model.model for model in self.
+            set(model.model for model in self.jobs.models)
         )
 
         self.stats_tracker = StatisticsTracker(
```
```diff
@@ -151,26 +151,31 @@ class JobsRunnerStatusBase(ABC):
         }
 
         model_queues = {}
-        #
-
-
-
-
-
-
-
-
-                "
-                "
-
-
-
-
-
-
-                "
-
-
+        # Check if bucket collection exists and is not empty
+        if (hasattr(self.jobs, 'run_config') and
+            hasattr(self.jobs.run_config, 'environment') and
+            hasattr(self.jobs.run_config.environment, 'bucket_collection') and
+            self.jobs.run_config.environment.bucket_collection):
+
+            for model, bucket in self.jobs.run_config.environment.bucket_collection.items():
+                model_name = model.model
+                model_queues[model_name] = {
+                    "language_model_name": model_name,
+                    "requests_bucket": {
+                        "completed": bucket.requests_bucket.num_released,
+                        "requested": bucket.requests_bucket.num_requests,
+                        "tokens_returned": bucket.requests_bucket.tokens_returned,
+                        "target_rate": round(bucket.requests_bucket.target_rate, 1),
+                        "current_rate": round(bucket.requests_bucket.get_throughput(), 1),
+                    },
+                    "tokens_bucket": {
+                        "completed": bucket.tokens_bucket.num_released,
+                        "requested": bucket.tokens_bucket.num_requests,
+                        "tokens_returned": bucket.tokens_bucket.tokens_returned,
+                        "target_rate": round(bucket.tokens_bucket.target_rate, 1),
+                        "current_rate": round(bucket.tokens_bucket.get_throughput(), 1),
+                    },
+                }
         status_dict["language_model_queues"] = model_queues
         return status_dict
 
```
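The chained `hasattr` guard above is a null-safe traversal of `jobs.run_config.environment.bucket_collection`. An equivalent `getattr`-based sketch, using a stand-in object graph rather than real edsl objects:

```python
from types import SimpleNamespace

# Stand-in for the jobs object; the real attribute chain is the one named in the diff.
jobs = SimpleNamespace(
    run_config=SimpleNamespace(environment=SimpleNamespace(bucket_collection={}))
)

# getattr with a None default tolerates any missing link in the chain.
bucket_collection = getattr(
    getattr(getattr(jobs, "run_config", None), "environment", None),
    "bucket_collection",
    None,
)
if bucket_collection:
    print("report per-model queues")
else:
    print("no buckets to report")  # an empty dict is falsy, matching the guard above
```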
edsl/jobs/progress_bar_manager.py ADDED

```diff
@@ -0,0 +1,79 @@
+"""
+Progress bar management for asynchronous job execution.
+
+This module provides a context manager for handling progress bar setup and thread
+management during job execution. It coordinates the display and updating of progress
+bars, particularly for remote tracking via the Expected Parrot API.
+"""
+
+import threading
+import warnings
+
+from ..coop import Coop
+from .jobs_runner_status import JobsRunnerStatus
+
+
+class ProgressBarManager:
+    """Context manager for handling progress bar setup and thread management.
+
+    This class manages the progress bar display and updating during job execution,
+    particularly for remote tracking via the Expected Parrot API.
+
+    It handles:
+    1. Setting up a status tracking object
+    2. Creating and managing a background thread for progress updates
+    3. Properly cleaning up resources when execution completes
+    """
+
+    def __init__(self, jobs, run_config, parameters):
+        self.parameters = parameters
+        self.jobs = jobs
+
+        # Set up progress tracking
+        coop = Coop()
+        endpoint_url = coop.get_progress_bar_url()
+
+        # Set up jobs status object
+        params = {
+            "jobs": jobs,
+            "n": parameters.n,
+            "endpoint_url": endpoint_url,
+            "job_uuid": parameters.job_uuid,
+        }
+
+        # If the jobs_runner_status is already set, use it directly
+        if run_config.environment.jobs_runner_status is not None:
+            self.jobs_runner_status = run_config.environment.jobs_runner_status
+        else:
+            # Otherwise create a new one
+            self.jobs_runner_status = JobsRunnerStatus(**params)
+
+        # Store on run_config for use by other components
+        run_config.environment.jobs_runner_status = self.jobs_runner_status
+
+        self.progress_thread = None
+        self.stop_event = threading.Event()
+
+    def __enter__(self):
+        if self.parameters.progress_bar and self.jobs_runner_status.has_ep_api_key():
+            self.jobs_runner_status.setup()
+            self.progress_thread = threading.Thread(
+                target=self._run_progress_bar,
+                args=(self.stop_event, self.jobs_runner_status)
+            )
+            self.progress_thread.start()
+        elif self.parameters.progress_bar:
+            warnings.warn(
+                "You need an Expected Parrot API key to view job progress bars."
+            )
+        return self.stop_event
+
+    def __exit__(self, exc_type, exc_val, exc_tb):
+        self.stop_event.set()
+        if self.progress_thread is not None:
+            self.progress_thread.join()
+
+    @staticmethod
+    def _run_progress_bar(stop_event, jobs_runner_status):
+        """Runs the progress bar in a separate thread."""
+        jobs_runner_status.update_progress(stop_event)
```
edsl/jobs/remote_inference.py CHANGED
```diff
@@ -1,3 +1,4 @@
+import re
 from typing import Optional, Union, Literal, TYPE_CHECKING, NewType, Callable, Any
 from dataclasses import dataclass
 from ..coop import CoopServerResponseError
```
```diff
@@ -112,13 +113,18 @@ class JobsRemoteInferenceHandler:
         )
         logger.add_info("job_uuid", job_uuid)
 
+        remote_inference_url = self.remote_inference_url
+        if "localhost" in remote_inference_url:
+            remote_inference_url = remote_inference_url.replace("8000", "1234")
         logger.update(
-            f"Job details are available at your Coop account. [Go to Remote Inference page]({
+            f"Job details are available at your Coop account. [Go to Remote Inference page]({remote_inference_url})",
             status=JobsStatus.RUNNING,
         )
         progress_bar_url = (
             f"{self.expected_parrot_url}/home/remote-job-progress/{job_uuid}"
         )
+        if "localhost" in progress_bar_url:
+            progress_bar_url = progress_bar_url.replace("8000", "1234")
         logger.add_info("progress_bar_url", progress_bar_url)
         logger.update(
             f"View job progress [here]({progress_bar_url})", status=JobsStatus.RUNNING
```
```diff
@@ -200,10 +206,35 @@ class JobsRemoteInferenceHandler:
             status=JobsStatus.FAILED,
         )
 
+    def _handle_partially_failed_job_interview_details(
+        self, job_info: RemoteJobInfo, remote_job_data: RemoteInferenceResponse
+    ) -> None:
+        "Extracts the interview details from the remote job data."
+        try:
+            # Job details is a string of the form "64 out of 1,758 interviews failed"
+            job_details = remote_job_data.get("latest_failure_description")
+
+            text_without_commas = job_details.replace(",", "")
+
+            # Find all numbers in the text
+            numbers = [int(num) for num in re.findall(r"\d+", text_without_commas)]
+
+            failed = numbers[0]
+            total = numbers[1]
+            completed = total - failed
+
+            job_info.logger.add_info("completed_interviews", completed)
+            job_info.logger.add_info("failed_interviews", failed)
+        # This is mainly helpful metadata, and any errors here should not stop the code
+        except:
+            pass
+
     def _handle_partially_failed_job(
         self, job_info: RemoteJobInfo, remote_job_data: RemoteInferenceResponse
    ) -> None:
         "Handles a partially failed job by logging the error and updating the job status."
+        self._handle_partially_failed_job_interview_details(job_info, remote_job_data)
+
         latest_error_report_url = remote_job_data.get("latest_error_report_url")
 
         if latest_error_report_url:
```
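The parsing in `_handle_partially_failed_job_interview_details` depends on the fixed wording of the failure description. A worked example using the sample string quoted in the code's own comment:

```python
import re

job_details = "64 out of 1,758 interviews failed"   # sample format from the code comment
text_without_commas = job_details.replace(",", "")  # "64 out of 1758 interviews failed"

# re.findall pulls the two integers in order: failed count, then total.
numbers = [int(num) for num in re.findall(r"\d+", text_without_commas)]
failed, total = numbers[0], numbers[1]
print(failed, total - failed)  # 64 1694
```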
```diff
@@ -244,6 +275,8 @@ class JobsRemoteInferenceHandler:
         job_info.logger.add_info("results_uuid", results_uuid)
         results = object_fetcher(results_uuid, expected_object_type="results")
         results_url = remote_job_data.get("results_url")
+        if "localhost" in results_url:
+            results_url = results_url.replace("8000", "1234")
         job_info.logger.add_info("results_url", results_url)
 
         if job_status == "completed":
```
```diff
@@ -256,6 +289,7 @@ class JobsRemoteInferenceHandler:
             f"View partial results [here]({results_url})",
             status=JobsStatus.PARTIALLY_FAILED,
         )
+
         results.job_uuid = job_info.job_uuid
         results.results_uuid = results_uuid
         return results
```
edsl/key_management/key_lookup_builder.py CHANGED

```diff
@@ -2,6 +2,7 @@ from typing import Optional, TYPE_CHECKING
 import os
 from functools import lru_cache
 import textwrap
+import requests
 
 if TYPE_CHECKING:
     from ..coop import Coop
```
```diff
@@ -255,7 +256,11 @@ class KeyLookupBuilder:
         return dict(list(os.environ.items()))
 
     def _coop_key_value_pairs(self):
-
+        try:
+            return dict(list(self.coop.fetch_rate_limit_config_vars().items()))
+        except requests.ConnectionError:
+            # If connection fails, return empty dict instead of raising error
+            return {}
 
     def _config_key_value_pairs(self):
         from ..config import CONFIG
```