PyPI - edsl - Versions diffs - 0.1.37.dev6__py3-none-any.whl → 0.1.38__py3-none-any.whl - Mend

edsl: 0.1.37.dev6-py3-none-any.whl → 0.1.38-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (271) hide show

edsl/Base.py +332 -303
edsl/BaseDiff.py +260 -260
edsl/TemplateLoader.py +24 -24
edsl/__init__.py +49 -48
edsl/__version__.py +1 -1
edsl/agents/Agent.py +867 -855
edsl/agents/AgentList.py +413 -350
edsl/agents/Invigilator.py +233 -222
edsl/agents/InvigilatorBase.py +265 -284
edsl/agents/PromptConstructor.py +354 -353
edsl/agents/__init__.py +3 -3
edsl/agents/descriptors.py +99 -99
edsl/agents/prompt_helpers.py +129 -129
edsl/auto/AutoStudy.py +117 -117
edsl/auto/StageBase.py +230 -230
edsl/auto/StageGenerateSurvey.py +178 -178
edsl/auto/StageLabelQuestions.py +125 -125
edsl/auto/StagePersona.py +61 -61
edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
edsl/auto/StagePersonaDimensionValues.py +74 -74
edsl/auto/StagePersonaDimensions.py +69 -69
edsl/auto/StageQuestions.py +73 -73
edsl/auto/SurveyCreatorPipeline.py +21 -21
edsl/auto/utilities.py +224 -224
edsl/base/Base.py +279 -289
edsl/config.py +157 -149
edsl/conversation/Conversation.py +290 -290
edsl/conversation/car_buying.py +58 -58
edsl/conversation/chips.py +95 -95
edsl/conversation/mug_negotiation.py +81 -81
edsl/conversation/next_speaker_utilities.py +93 -93
edsl/coop/PriceFetcher.py +54 -54
edsl/coop/__init__.py +2 -2
edsl/coop/coop.py +1028 -958
edsl/coop/utils.py +131 -131
edsl/data/Cache.py +555 -527
edsl/data/CacheEntry.py +233 -228
edsl/data/CacheHandler.py +149 -149
edsl/data/RemoteCacheSync.py +78 -97
edsl/data/SQLiteDict.py +292 -292
edsl/data/__init__.py +4 -4
edsl/data/orm.py +10 -10
edsl/data_transfer_models.py +73 -73
edsl/enums.py +175 -173
edsl/exceptions/BaseException.py +21 -21
edsl/exceptions/__init__.py +54 -54
edsl/exceptions/agents.py +42 -38
edsl/exceptions/cache.py +5 -0
edsl/exceptions/configuration.py +16 -16
edsl/exceptions/coop.py +10 -10
edsl/exceptions/data.py +14 -14
edsl/exceptions/general.py +34 -34
edsl/exceptions/jobs.py +33 -33
edsl/exceptions/language_models.py +63 -63
edsl/exceptions/prompts.py +15 -15
edsl/exceptions/questions.py +91 -91
edsl/exceptions/results.py +29 -29
edsl/exceptions/scenarios.py +22 -22
edsl/exceptions/surveys.py +37 -37
edsl/inference_services/AnthropicService.py +87 -87
edsl/inference_services/AwsBedrock.py +120 -120
edsl/inference_services/AzureAI.py +217 -217
edsl/inference_services/DeepInfraService.py +18 -18
edsl/inference_services/GoogleService.py +148 -156
edsl/inference_services/GroqService.py +20 -20
edsl/inference_services/InferenceServiceABC.py +147 -147
edsl/inference_services/InferenceServicesCollection.py +97 -97
edsl/inference_services/MistralAIService.py +123 -123
edsl/inference_services/OllamaService.py +18 -18
edsl/inference_services/OpenAIService.py +224 -224
edsl/inference_services/PerplexityService.py +163 -0
edsl/inference_services/TestService.py +89 -89
edsl/inference_services/TogetherAIService.py +170 -170
edsl/inference_services/models_available_cache.py +118 -118
edsl/inference_services/rate_limits_cache.py +25 -25
edsl/inference_services/registry.py +41 -39
edsl/inference_services/write_available.py +10 -10
edsl/jobs/Answers.py +56 -56
edsl/jobs/Jobs.py +898 -1347
edsl/jobs/JobsChecks.py +147 -0
edsl/jobs/JobsPrompts.py +268 -0
edsl/jobs/JobsRemoteInferenceHandler.py +239 -0
edsl/jobs/__init__.py +1 -1
edsl/jobs/buckets/BucketCollection.py +63 -63
edsl/jobs/buckets/ModelBuckets.py +65 -65
edsl/jobs/buckets/TokenBucket.py +251 -248
edsl/jobs/interviews/Interview.py +661 -661
edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
edsl/jobs/interviews/InterviewExceptionEntry.py +186 -186
edsl/jobs/interviews/InterviewStatistic.py +63 -63
edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
edsl/jobs/interviews/InterviewStatusLog.py +92 -92
edsl/jobs/interviews/ReportErrors.py +66 -66
edsl/jobs/interviews/interview_status_enum.py +9 -9
edsl/jobs/runners/JobsRunnerAsyncio.py +466 -338
edsl/jobs/runners/JobsRunnerStatus.py +330 -332
edsl/jobs/tasks/QuestionTaskCreator.py +242 -242
edsl/jobs/tasks/TaskCreators.py +64 -64
edsl/jobs/tasks/TaskHistory.py +450 -442
edsl/jobs/tasks/TaskStatusLog.py +23 -23
edsl/jobs/tasks/task_status_enum.py +163 -163
edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
edsl/jobs/tokens/TokenUsage.py +34 -34
edsl/language_models/KeyLookup.py +30 -30
edsl/language_models/LanguageModel.py +668 -706
edsl/language_models/ModelList.py +155 -102
edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
edsl/language_models/__init__.py +3 -3
edsl/language_models/fake_openai_call.py +15 -15
edsl/language_models/fake_openai_service.py +61 -61
edsl/language_models/registry.py +190 -137
edsl/language_models/repair.py +156 -156
edsl/language_models/unused/ReplicateBase.py +83 -83
edsl/language_models/utilities.py +64 -64
edsl/notebooks/Notebook.py +258 -259
edsl/notebooks/__init__.py +1 -1
edsl/prompts/Prompt.py +362 -357
edsl/prompts/__init__.py +2 -2
edsl/questions/AnswerValidatorMixin.py +289 -289
edsl/questions/QuestionBase.py +664 -656
edsl/questions/QuestionBaseGenMixin.py +161 -161
edsl/questions/QuestionBasePromptsMixin.py +217 -234
edsl/questions/QuestionBudget.py +227 -227
edsl/questions/QuestionCheckBox.py +359 -359
edsl/questions/QuestionExtract.py +182 -183
edsl/questions/QuestionFreeText.py +114 -114
edsl/questions/QuestionFunctional.py +166 -159
edsl/questions/QuestionList.py +231 -231
edsl/questions/QuestionMultipleChoice.py +286 -286
edsl/questions/QuestionNumerical.py +153 -153
edsl/questions/QuestionRank.py +324 -324
edsl/questions/Quick.py +41 -41
edsl/questions/RegisterQuestionsMeta.py +71 -71
edsl/questions/ResponseValidatorABC.py +174 -174
edsl/questions/SimpleAskMixin.py +73 -73
edsl/questions/__init__.py +26 -26
edsl/questions/compose_questions.py +98 -98
edsl/questions/decorators.py +21 -21
edsl/questions/derived/QuestionLikertFive.py +76 -76
edsl/questions/derived/QuestionLinearScale.py +87 -87
edsl/questions/derived/QuestionTopK.py +93 -91
edsl/questions/derived/QuestionYesNo.py +82 -82
edsl/questions/descriptors.py +413 -413
edsl/questions/prompt_templates/question_budget.jinja +13 -13
edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
edsl/questions/prompt_templates/question_extract.jinja +11 -11
edsl/questions/prompt_templates/question_free_text.jinja +3 -3
edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
edsl/questions/prompt_templates/question_list.jinja +17 -17
edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
edsl/questions/prompt_templates/question_numerical.jinja +36 -36
edsl/questions/question_registry.py +177 -147
edsl/questions/settings.py +12 -12
edsl/questions/templates/budget/answering_instructions.jinja +7 -7
edsl/questions/templates/budget/question_presentation.jinja +7 -7
edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
edsl/questions/templates/extract/answering_instructions.jinja +7 -7
edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
edsl/questions/templates/list/answering_instructions.jinja +3 -3
edsl/questions/templates/list/question_presentation.jinja +5 -5
edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
edsl/questions/templates/numerical/question_presentation.jinja +6 -6
edsl/questions/templates/rank/answering_instructions.jinja +11 -11
edsl/questions/templates/rank/question_presentation.jinja +15 -15
edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
edsl/questions/templates/top_k/question_presentation.jinja +22 -22
edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
edsl/results/CSSParameterizer.py +108 -0
edsl/results/Dataset.py +424 -293
edsl/results/DatasetExportMixin.py +731 -717
edsl/results/DatasetTree.py +275 -145
edsl/results/Result.py +465 -450
edsl/results/Results.py +1165 -1071
edsl/results/ResultsDBMixin.py +238 -238
edsl/results/ResultsExportMixin.py +43 -43
edsl/results/ResultsFetchMixin.py +33 -33
edsl/results/ResultsGGMixin.py +121 -121
edsl/results/ResultsToolsMixin.py +98 -98
edsl/results/Selector.py +135 -135
edsl/results/TableDisplay.py +198 -0
edsl/results/__init__.py +2 -2
edsl/results/table_display.css +78 -0
edsl/results/tree_explore.py +115 -115
edsl/scenarios/FileStore.py +632 -458
edsl/scenarios/Scenario.py +601 -546
edsl/scenarios/ScenarioHtmlMixin.py +64 -64
edsl/scenarios/ScenarioJoin.py +127 -0
edsl/scenarios/ScenarioList.py +1287 -1112
edsl/scenarios/ScenarioListExportMixin.py +52 -52
edsl/scenarios/ScenarioListPdfMixin.py +261 -261
edsl/scenarios/__init__.py +4 -4
edsl/shared.py +1 -1
edsl/study/ObjectEntry.py +173 -173
edsl/study/ProofOfWork.py +113 -113
edsl/study/SnapShot.py +80 -80
edsl/study/Study.py +528 -528
edsl/study/__init__.py +4 -4
edsl/surveys/DAG.py +148 -148
edsl/surveys/Memory.py +31 -31
edsl/surveys/MemoryPlan.py +244 -244
edsl/surveys/Rule.py +326 -330
edsl/surveys/RuleCollection.py +387 -387
edsl/surveys/Survey.py +1801 -1795
edsl/surveys/SurveyCSS.py +261 -261
edsl/surveys/SurveyExportMixin.py +259 -259
edsl/surveys/SurveyFlowVisualizationMixin.py +179 -121
edsl/surveys/SurveyQualtricsImport.py +284 -284
edsl/surveys/__init__.py +3 -3
edsl/surveys/base.py +53 -53
edsl/surveys/descriptors.py +56 -56
edsl/surveys/instructions/ChangeInstruction.py +49 -47
edsl/surveys/instructions/Instruction.py +65 -51
edsl/surveys/instructions/InstructionCollection.py +77 -77
edsl/templates/error_reporting/base.html +23 -23
edsl/templates/error_reporting/exceptions_by_model.html +34 -34
edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
edsl/templates/error_reporting/exceptions_by_type.html +16 -16
edsl/templates/error_reporting/interview_details.html +115 -115
edsl/templates/error_reporting/interviews.html +19 -10
edsl/templates/error_reporting/overview.html +4 -4
edsl/templates/error_reporting/performance_plot.html +1 -1
edsl/templates/error_reporting/report.css +73 -73
edsl/templates/error_reporting/report.html +117 -117
edsl/templates/error_reporting/report.js +25 -25
edsl/tools/__init__.py +1 -1
edsl/tools/clusters.py +192 -192
edsl/tools/embeddings.py +27 -27
edsl/tools/embeddings_plotting.py +118 -118
edsl/tools/plotting.py +112 -112
edsl/tools/summarize.py +18 -18
edsl/utilities/SystemInfo.py +28 -28
edsl/utilities/__init__.py +22 -22
edsl/utilities/ast_utilities.py +25 -25
edsl/utilities/data/Registry.py +6 -6
edsl/utilities/data/__init__.py +1 -1
edsl/utilities/data/scooter_results.json +1 -1
edsl/utilities/decorators.py +77 -77
edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
edsl/utilities/interface.py +627 -627
edsl/{conjure → utilities}/naming_utilities.py +263 -263
edsl/utilities/repair_functions.py +28 -28
edsl/utilities/restricted_python.py +70 -70
edsl/utilities/utilities.py +424 -409
{edsl-0.1.37.dev6.dist-info → edsl-0.1.38.dist-info}/LICENSE +21 -21
{edsl-0.1.37.dev6.dist-info → edsl-0.1.38.dist-info}/METADATA +2 -1
edsl-0.1.38.dist-info/RECORD +277 -0
edsl/conjure/AgentConstructionMixin.py +0 -160
edsl/conjure/Conjure.py +0 -62
edsl/conjure/InputData.py +0 -659
edsl/conjure/InputDataCSV.py +0 -48
edsl/conjure/InputDataMixinQuestionStats.py +0 -182
edsl/conjure/InputDataPyRead.py +0 -91
edsl/conjure/InputDataSPSS.py +0 -8
edsl/conjure/InputDataStata.py +0 -8
edsl/conjure/QuestionOptionMixin.py +0 -76
edsl/conjure/QuestionTypeMixin.py +0 -23
edsl/conjure/RawQuestion.py +0 -65
edsl/conjure/SurveyResponses.py +0 -7
edsl/conjure/__init__.py +0 -9
edsl/conjure/examples/placeholder.txt +0 -0
edsl/conjure/utilities.py +0 -201
edsl-0.1.37.dev6.dist-info/RECORD +0 -283
{edsl-0.1.37.dev6.dist-info → edsl-0.1.38.dist-info}/WHEEL +0 -0

edsl/jobs/JobsChecks.py ADDED Viewed

@@ -0,0 +1,147 @@
+import os
+from edsl.exceptions import MissingAPIKeyError
+class JobsChecks:
+    """Checks run against a job before execution: API keys and LLM requirements."""
+    def __init__(self, jobs):
+        """Keep a reference to the job whose models, agents and survey are inspected."""
+        self.jobs = jobs
+    def _models_to_check(self):
+        """Return the job's models followed by one default-constructed ``Model()``."""
+        from edsl import Model
+        return self.jobs.models + [Model()]
+    def check_api_keys(self) -> None:
+        """Raise ``MissingAPIKeyError`` for the first model lacking a valid API key.
+        Models are visited in the order given by ``_models_to_check``; nothing
+        is returned when every model reports a valid key.
+        """
+        for model in self._models_to_check():
+            if not model.has_valid_api_key():
+                raise MissingAPIKeyError(
+                    model_name=str(model.model),
+                    inference_service=model._inference_service_,
+                )
+    def get_missing_api_keys(self) -> set:
+        """Return the set of API key names the user still needs to run this job.
+        A key name is collected for every model whose ``has_valid_api_key()`` is
+        false. Services that have no entry in ``service_to_api_keyname`` are
+        reported as ``"NOT FOUND"``.
+        """
+        from edsl.enums import service_to_api_keyname
+        return {
+            service_to_api_keyname.get(model._inference_service_, "NOT FOUND")
+            for model in self._models_to_check()
+            if not model.has_valid_api_key()
+        }
+    def user_has_ep_api_key(self) -> bool:
+        """Return True if EXPECTED_PARROT_API_KEY is set in the environment."""
+        return os.getenv("EXPECTED_PARROT_API_KEY") is not None
+    def user_has_all_model_keys(self) -> bool:
+        """Return True if ``check_api_keys`` passes, False if a key is missing.
+        Only ``MissingAPIKeyError`` is translated into False; any other
+        exception propagates to the caller unchanged.
+        """
+        try:
+            self.check_api_keys()
+        except MissingAPIKeyError:
+            return False
+        return True
+    def needs_external_llms(self) -> bool:
+        """Return True if the job needs external LLMs to run, False otherwise."""
+        # These cases are necessary to skip the API key check during doctests
+        # Accounts for Results.example()
+        all_agents_answer_questions_directly = len(self.jobs.agents) > 0 and all(
+            hasattr(agent, "answer_question_directly") for agent in self.jobs.agents
+        )
+        # Accounts for InterviewExceptionEntry.example()
+        only_model_is_test = {m.model for m in self.jobs.models} == {"test"}
+        # Accounts for Survey.__call__
+        all_questions_are_functional = {
+            q.question_type for q in self.jobs.survey.questions
+        } == {"functional"}
+        return not (
+            all_agents_answer_questions_directly
+            or only_model_is_test
+            or all_questions_are_functional
+        )
+    def needs_key_process(self) -> bool:
+        """Return True when the interactive key retrieval should be offered.
+        That is the case when a model key is missing, no Expected Parrot key is
+        set, and the job needs external LLMs.
+        """
+        return (
+            not self.user_has_all_model_keys()
+            and not self.user_has_ep_api_key()
+            and self.needs_external_llms()
+        )
+    def key_process(self) -> None:
+        """Guide the user through obtaining an Expected Parrot API key.
+        Prints the missing key names and a login URL, then polls Coop for an
+        API key tied to a freshly generated auth token. If polling returns
+        ``None`` a timeout message is printed and the method returns. Otherwise
+        the key is passed to ``write_api_key_to_env`` and ``load_dotenv`` is
+        called so the running process can pick it up.
+        """
+        import secrets
+        from dotenv import load_dotenv
+        from edsl.coop.coop import Coop
+        from edsl.utilities.utilities import write_api_key_to_env
+        missing_api_keys = self.get_missing_api_keys()
+        edsl_auth_token = secrets.token_urlsafe(16)
+        print("You're missing some of the API keys needed to run this job:")
+        for api_key in missing_api_keys:
+            print(f"     🔑 {api_key}")
+        print(
+            "\nYou can either add the missing keys to your .env file, or use remote inference."
+        )
+        print("Remote inference allows you to run jobs on our server.")
+        print("\n🚀 To use remote inference, sign up at the following link:")
+        coop = Coop()
+        coop._display_login_url(edsl_auth_token=edsl_auth_token)
+        print(
+            "\nOnce you log in, we will automatically retrieve your Expected Parrot API key and continue your job remotely."
+        )
+        api_key = coop._poll_for_api_key(edsl_auth_token)
+        if api_key is None:
+            print("\nTimed out waiting for login. Please try again.")
+            return
+        write_api_key_to_env(api_key)
+        print("✨ API key retrieved and written to .env file.\n")
+        # Retrieve API key so we can continue running the job
+        load_dotenv()
+if __name__ == "__main__":  # only when this file is executed directly, not on import
+    import doctest
+    doctest.testmod()  # run the doctests found in this module's docstrings

edsl/jobs/JobsPrompts.py ADDED Viewed

@@ -0,0 +1,268 @@
+from typing import List, TYPE_CHECKING
+from edsl.results.Dataset import Dataset
+if TYPE_CHECKING:
+    from edsl.jobs import Jobs
+    # from edsl.jobs.interviews.Interview import Interview
+    # from edsl.results.Dataset import Dataset
+    # from edsl.agents.AgentList import AgentList
+    # from edsl.scenarios.ScenarioList import ScenarioList
+    # from edsl.surveys.Survey import Survey
+class JobsPrompts:
+    """Build the prompts a job will use and estimate what they will cost."""
+    def __init__(self, jobs: "Jobs"):
+        """Capture the job's interviews, agents, scenarios and survey.
+        ``jobs.interviews()`` is called once here; the price table is fetched
+        lazily on first access of ``price_lookup``.
+        """
+        self.interviews = jobs.interviews()
+        self.agents = jobs.agents
+        self.scenarios = jobs.scenarios
+        self.survey = jobs.survey
+        self._price_lookup = None
+    @property
+    def price_lookup(self):
+        """Return the price table from ``Coop().fetch_prices()``, cached after the first call."""
+        if self._price_lookup is None:
+            from edsl import Coop
+            c = Coop()
+            self._price_lookup = c.fetch_prices()
+        return self._price_lookup
+    def _iter_invigilators(self):
+        """Yield ``(interview_index, invigilator)`` for each interview/question pair.
+        All invigilators of one interview are created before any is yielded.
+        """
+        for interview_index, interview in enumerate(self.interviews):
+            invigilators = [
+                interview._get_invigilator(question)
+                for question in self.survey.questions
+            ]
+            for invigilator in invigilators:
+                yield interview_index, invigilator
+    def prompts(self) -> "Dataset":
+        """Return a Dataset of prompts that will be used.
+        The Dataset has one entry per interview/question pair with the user and
+        system prompts, the interview, scenario and agent indices, the question
+        name, the model name and an estimated cost in USD.
+        >>> from edsl.jobs import Jobs
+        >>> Jobs.example().prompts()
+        Dataset(...)
+        """
+        interview_indices = []
+        question_names = []
+        user_prompts = []
+        system_prompts = []
+        scenario_indices = []
+        agent_indices = []
+        models = []
+        costs = []
+        for interview_index, invigilator in self._iter_invigilators():
+            prompts = invigilator.get_prompts()
+            user_prompt = prompts["user_prompt"]
+            system_prompt = prompts["system_prompt"]
+            user_prompts.append(user_prompt)
+            system_prompts.append(system_prompt)
+            agent_indices.append(self.agents.index(invigilator.agent))
+            interview_indices.append(interview_index)
+            scenario_indices.append(self.scenarios.index(invigilator.scenario))
+            models.append(invigilator.model.model)
+            question_names.append(invigilator.question.question_name)
+            prompt_cost = self.estimate_prompt_cost(
+                system_prompt=system_prompt,
+                user_prompt=user_prompt,
+                price_lookup=self.price_lookup,
+                inference_service=invigilator.model._inference_service_,
+                model=invigilator.model.model,
+            )
+            costs.append(prompt_cost["cost_usd"])
+        return Dataset(
+            [
+                {"user_prompt": user_prompts},
+                {"system_prompt": system_prompts},
+                {"interview_index": interview_indices},
+                {"question_name": question_names},
+                {"scenario_index": scenario_indices},
+                {"agent_index": agent_indices},
+                {"model": models},
+                {"estimated_cost": costs},
+            ]
+        )
+    @staticmethod
+    def _piping_multiplier(prompt: str) -> int:
+        """Return 2 if a prompt includes Jinja braces, and 1 otherwise."""
+        return 2 if "{{" in prompt and "}}" in prompt else 1
+    @staticmethod
+    def _price_per_token(prices: dict) -> float:
+        """Return stated token price divided by stated token quantity for one direction."""
+        return float(prices["service_stated_token_price"]) / float(
+            prices["service_stated_token_qty"]
+        )
+    @staticmethod
+    def estimate_prompt_cost(
+        system_prompt: str,
+        user_prompt: str,
+        price_lookup: dict,
+        inference_service: str,
+        model: str,
+    ) -> dict:
+        """Estimates the cost of a prompt. Takes piping into account.
+        Prices are looked up under the key ``(inference_service, model)``. If
+        that lookup raises ``KeyError`` a warning is issued and default prices
+        are used instead. Returns a dict with the keys ``input_tokens``,
+        ``output_tokens`` and ``cost_usd``.
+        """
+        import math
+        # Look up prices per token
+        try:
+            relevant_prices = price_lookup[(inference_service, model)]
+            input_price_per_token = JobsPrompts._price_per_token(
+                relevant_prices["input"]
+            )
+            output_price_per_token = JobsPrompts._price_per_token(
+                relevant_prices["output"]
+            )
+        except KeyError:
+            # A KeyError is likely to occur if we cannot retrieve prices (the price_lookup dict is empty)
+            # Use a sensible default
+            import warnings
+            warnings.warn(
+                "Price data could not be retrieved. Using default estimates for input and output token prices. Input: $0.15 / 1M tokens; Output: $0.60 / 1M tokens"
+            )
+            input_price_per_token = 0.00000015  # $0.15 / 1M tokens
+            output_price_per_token = 0.00000060  # $0.60 / 1M tokens
+        # Compute the number of characters (double if the question involves piping)
+        user_text = str(user_prompt)
+        system_text = str(system_prompt)
+        user_prompt_chars = len(user_text) * JobsPrompts._piping_multiplier(user_text)
+        system_prompt_chars = len(system_text) * JobsPrompts._piping_multiplier(
+            system_text
+        )
+        # Convert into tokens (1 token approx. equals 4 characters)
+        input_tokens = (user_prompt_chars + system_prompt_chars) // 4
+        output_tokens = math.ceil(0.75 * input_tokens)
+        cost = (
+            input_tokens * input_price_per_token
+            + output_tokens * output_price_per_token
+        )
+        return {
+            "input_tokens": input_tokens,
+            "output_tokens": output_tokens,
+            "cost_usd": cost,
+        }
+    def estimate_job_cost_from_external_prices(
+        self, price_lookup: dict, iterations: int = 1
+    ) -> dict:
+        """
+        Estimates the cost of a job according to the following assumptions:
+        - 1 token = 4 characters.
+        - For each prompt, output tokens = input tokens * 0.75, rounded up to the nearest integer.
+        price_lookup is an external pricing dictionary.
+        Per-prompt estimates are summed per (inference_service, model) pair and
+        multiplied by ``iterations``. Returns a dict with the overall totals
+        plus the per-model records under ``model_costs``. A job that yields no
+        prompts returns zero totals and an empty ``model_costs`` list.
+        """
+        data = []
+        for _, invigilator in self._iter_invigilators():
+            prompts = invigilator.get_prompts()
+            # By this point, agent and scenario data has already been added to the prompts
+            user_prompt = prompts["user_prompt"]
+            system_prompt = prompts["system_prompt"]
+            inference_service = invigilator.model._inference_service_
+            model = invigilator.model.model
+            prompt_cost = self.estimate_prompt_cost(
+                system_prompt=system_prompt,
+                user_prompt=user_prompt,
+                price_lookup=price_lookup,
+                inference_service=inference_service,
+                model=model,
+            )
+            data.append(
+                {
+                    "user_prompt": user_prompt,
+                    "system_prompt": system_prompt,
+                    "estimated_input_tokens": prompt_cost["input_tokens"],
+                    "estimated_output_tokens": prompt_cost["output_tokens"],
+                    "estimated_cost_usd": prompt_cost["cost_usd"],
+                    "inference_service": inference_service,
+                    "model": model,
+                }
+            )
+        if not data:
+            # An empty record list produces a DataFrame without columns, and
+            # grouping by the missing columns below would raise KeyError.
+            return {
+                "estimated_total_cost_usd": 0,
+                "estimated_total_input_tokens": 0,
+                "estimated_total_output_tokens": 0,
+                "model_costs": [],
+            }
+        import pandas as pd
+        df = pd.DataFrame.from_records(data)
+        df = (
+            df.groupby(["inference_service", "model"])
+            .agg(
+                {
+                    "estimated_cost_usd": "sum",
+                    "estimated_input_tokens": "sum",
+                    "estimated_output_tokens": "sum",
+                }
+            )
+            .reset_index()
+        )
+        df["estimated_cost_usd"] = df["estimated_cost_usd"] * iterations
+        df["estimated_input_tokens"] = df["estimated_input_tokens"] * iterations
+        df["estimated_output_tokens"] = df["estimated_output_tokens"] * iterations
+        estimated_costs_by_model = df.to_dict("records")
+        estimated_total_cost = sum(
+            model["estimated_cost_usd"] for model in estimated_costs_by_model
+        )
+        estimated_total_input_tokens = sum(
+            model["estimated_input_tokens"] for model in estimated_costs_by_model
+        )
+        estimated_total_output_tokens = sum(
+            model["estimated_output_tokens"] for model in estimated_costs_by_model
+        )
+        return {
+            "estimated_total_cost_usd": estimated_total_cost,
+            "estimated_total_input_tokens": estimated_total_input_tokens,
+            "estimated_total_output_tokens": estimated_total_output_tokens,
+            "model_costs": estimated_costs_by_model,
+        }
+    def estimate_job_cost(self, iterations: int = 1) -> dict:
+        """
+        Estimates the cost of a job according to the following assumptions:
+        - 1 token = 4 characters.
+        - For each prompt, output tokens = input tokens * 0.75, rounded up to the nearest integer.
+        Fetches prices from Coop.
+        """
+        return self.estimate_job_cost_from_external_prices(
+            price_lookup=self.price_lookup, iterations=iterations
+        )

edsl/jobs/JobsRemoteInferenceHandler.py ADDED Viewed

@@ -0,0 +1,239 @@
+from typing import Optional, Union, Literal
+import requests
+import sys
+from edsl.exceptions.coop import CoopServerResponseError
+# from edsl.enums import VisibilityType
+from edsl.results import Results
+class JobsRemoteInferenceHandler:
+    def __init__(self, jobs, verbose=False, poll_interval=3):
+        """
+        >>> from edsl.jobs import Jobs
+        >>> jh = JobsRemoteInferenceHandler(Jobs.example(), verbose=True)
+        >>> jh.use_remote_inference(True)
+        False
+        >>> jh._poll_remote_inference_job({'uuid':1234}, testing_simulated_response={"status": "failed"}) # doctest: +NORMALIZE_WHITESPACE
+        Job failed.
+        ...
+        >>> jh._poll_remote_inference_job({'uuid':1234}, testing_simulated_response={"status": "completed"}) # doctest: +NORMALIZE_WHITESPACE
+        Job completed and Results stored on Coop: None.
+        Results(...)
+        """
+        self.jobs = jobs
+        self.verbose = verbose
+        self.poll_interval = poll_interval
+        self._remote_job_creation_data = None
+        self._job_uuid = None
+    @property
+    def remote_job_creation_data(self):
+        return self._remote_job_creation_data
+    @property
+    def job_uuid(self):
+        return self._job_uuid
+    def use_remote_inference(self, disable_remote_inference: bool) -> bool:
+        if disable_remote_inference:
+            return False
+        if not disable_remote_inference:
+            try:
+                from edsl import Coop
+                user_edsl_settings = Coop().edsl_settings
+                return user_edsl_settings.get("remote_inference", False)
+            except requests.ConnectionError:
+                pass
+            except CoopServerResponseError as e:
+                pass
+        return False
+    def create_remote_inference_job(
+        self,
+        iterations: int = 1,
+        remote_inference_description: Optional[str] = None,
+        remote_inference_results_visibility: Optional["VisibilityType"] = "unlisted",
+        verbose=False,
+    ):
+        """ """
+        from edsl.config import CONFIG
+        from edsl.coop.coop import Coop
+        from rich import print as rich_print
+        coop = Coop()
+        print("Remote inference activated. Sending job to server...")
+        remote_job_creation_data = coop.remote_inference_create(
+            self.jobs,
+            description=remote_inference_description,
+            status="queued",
+            iterations=iterations,
+            initial_results_visibility=remote_inference_results_visibility,
+        )
+        job_uuid = remote_job_creation_data.get("uuid")
+        print(f"Job sent to server. (Job uuid={job_uuid}).")
+        expected_parrot_url = CONFIG.get("EXPECTED_PARROT_URL")
+        progress_bar_url = f"{expected_parrot_url}/home/remote-job-progress/{job_uuid}"
+        rich_print(
+            f"View job progress here: [#38bdf8][link={progress_bar_url}]{progress_bar_url}[/link][/#38bdf8]"
+        )
+        self._remote_job_creation_data = remote_job_creation_data
+        self._job_uuid = job_uuid
+        # return remote_job_creation_data
+    @staticmethod
+    def check_status(job_uuid):
+        from edsl.coop.coop import Coop
+        coop = Coop()
+        return coop.remote_inference_get(job_uuid)
+    def poll_remote_inference_job(self):
+        return self._poll_remote_inference_job(
+            self.remote_job_creation_data, verbose=self.verbose
+        )
+    def _poll_remote_inference_job(
+        self,
+        remote_job_creation_data: dict,
+        verbose=False,
+        poll_interval: Optional[float] = None,
+        testing_simulated_response: Optional[dict] = None,
+    ) -> Union[Results, None]:
+        import time
+        from datetime import datetime
+        from edsl.config import CONFIG
+        from edsl.coop.coop import Coop
+        if poll_interval is None:
+            poll_interval = self.poll_interval
+        expected_parrot_url = CONFIG.get("EXPECTED_PARROT_URL")
+        job_uuid = remote_job_creation_data.get("uuid")
+        coop = Coop()
+        if testing_simulated_response is not None:
+            remote_job_data_fetcher = lambda job_uuid: testing_simulated_response
+            object_fetcher = (
+                lambda results_uuid, expected_object_type: Results.example()
+            )
+        else:
+            remote_job_data_fetcher = coop.remote_inference_get
+            object_fetcher = coop.get
+        job_in_queue = True
+        while job_in_queue:
+            remote_job_data = remote_job_data_fetcher(job_uuid)
+            status = remote_job_data.get("status")
+            if status == "cancelled":
+                print("\r" + " " * 80 + "\r", end="")
+                print("Job cancelled by the user.")
+                print(
+                    f"See {expected_parrot_url}/home/remote-inference for more details."
+                )
+                return None
+            elif status == "failed":
+                print("\r" + " " * 80 + "\r", end="")
+                # write to stderr
+                latest_error_report_url = remote_job_data.get("latest_error_report_url")
+                if latest_error_report_url:
+                    print("Job failed.")
+                    print(
+                        f"Your job generated exceptions. Details on these exceptions can be found in the following report: {latest_error_report_url}"
+                    )
+                    print(
+                        f"Need support? Post a message at the Expected Parrot Discord channel (https://discord.com/invite/mxAYkjfy9m) or send an email to info@expectedparrot.com."
+                    )
+                else:
+                    print("Job failed.")
+                    print(
+                        f"See {expected_parrot_url}/home/remote-inference for more details."
+                    )
+                return None
+            elif status == "completed":
+                results_uuid = remote_job_data.get("results_uuid")
+                results_url = remote_job_data.get("results_url")
+                results = object_fetcher(results_uuid, expected_object_type="results")
+                print("\r" + " " * 80 + "\r", end="")
+                print(f"Job completed and Results stored on Coop: {results_url}.")
+                return results
+            else:
+                duration = poll_interval
+                time_checked = datetime.now().strftime("%Y-%m-%d %I:%M:%S %p")
+                frames = ["⠋", "⠙", "⠹", "⠸", "⠼", "⠴", "⠦", "⠧", "⠇", "⠏"]
+                start_time = time.time()
+                i = 0
+                while time.time() - start_time < duration:
+                    print(
+                        f"\r{frames[i % len(frames)]} Job status: {status} - last update: {time_checked}",
+                        end="",
+                        flush=True,
+                    )
+                    time.sleep(0.1)
+                    i += 1
+    def use_remote_inference(self, disable_remote_inference: bool) -> bool:
+        if disable_remote_inference:
+            return False
+        if not disable_remote_inference:
+            try:
+                from edsl import Coop
+                user_edsl_settings = Coop().edsl_settings
+                return user_edsl_settings.get("remote_inference", False)
+            except requests.ConnectionError:
+                pass
+            except CoopServerResponseError as e:
+                pass
+        return False
+    async def create_and_poll_remote_job(
+        self,
+        iterations: int = 1,
+        remote_inference_description: Optional[str] = None,
+        remote_inference_results_visibility: Optional[
+            Literal["private", "public", "unlisted"]
+        ] = "unlisted",
+    ) -> Union[Results, None]:
+        """
+        Creates and polls a remote inference job asynchronously.
+        Reuses existing synchronous methods but runs them in an async context.
+        :param iterations: Number of times to run each interview
+        :param remote_inference_description: Optional description for the remote job
+        :param remote_inference_results_visibility: Visibility setting for results
+        :return: Results object if successful, None if job fails or is cancelled
+        """
+        import asyncio
+        from functools import partial
+        # Create job using existing method
+        loop = asyncio.get_event_loop()
+        remote_job_creation_data = await loop.run_in_executor(
+            None,
+            partial(
+                self.create_remote_inference_job,
+                iterations=iterations,
+                remote_inference_description=remote_inference_description,
+                remote_inference_results_visibility=remote_inference_results_visibility,
+            ),
+        )
+        # Poll using existing method but with async sleep
+        return await loop.run_in_executor(
+            None, partial(self.poll_remote_inference_job, remote_job_creation_data)
+        )
+if __name__ == "__main__":
+    import doctest
+    doctest.testmod(optionflags=doctest.ELLIPSIS)

edsl/jobs/__init__.py CHANGED Viewed

	@@ -1 +1 @@
1	- from edsl.jobs.Jobs import Jobs
1	+ from edsl.jobs.Jobs import Jobs

edsl 0.1.37.dev6__py3-none-any.whl → 0.1.38__py3-none-any.whl

edsl 0.1.37.dev6__py3-none-any.whl → 0.1.38__py3-none-any.whl