edsl 0.1.46__py3-none-any.whl → 0.1.48__py3-none-any.whl
This diff compares the contents of two publicly released package versions as they appear in their respective public registries. It is provided for informational purposes only.
- edsl/__init__.py +44 -39
- edsl/__version__.py +1 -1
- edsl/agents/__init__.py +4 -2
- edsl/agents/{Agent.py → agent.py} +442 -152
- edsl/agents/{AgentList.py → agent_list.py} +220 -162
- edsl/agents/descriptors.py +46 -7
- edsl/{exceptions/agents.py → agents/exceptions.py} +3 -12
- edsl/base/__init__.py +75 -0
- edsl/base/base_class.py +1303 -0
- edsl/base/data_transfer_models.py +114 -0
- edsl/base/enums.py +215 -0
- edsl/base.py +8 -0
- edsl/buckets/__init__.py +25 -0
- edsl/buckets/bucket_collection.py +324 -0
- edsl/buckets/model_buckets.py +206 -0
- edsl/buckets/token_bucket.py +502 -0
- edsl/{jobs/buckets/TokenBucketAPI.py → buckets/token_bucket_api.py} +1 -1
- edsl/buckets/token_bucket_client.py +509 -0
- edsl/caching/__init__.py +20 -0
- edsl/caching/cache.py +814 -0
- edsl/caching/cache_entry.py +427 -0
- edsl/{data/CacheHandler.py → caching/cache_handler.py} +14 -15
- edsl/caching/exceptions.py +24 -0
- edsl/caching/orm.py +30 -0
- edsl/{data/RemoteCacheSync.py → caching/remote_cache_sync.py} +3 -3
- edsl/caching/sql_dict.py +441 -0
- edsl/config/__init__.py +8 -0
- edsl/config/config_class.py +177 -0
- edsl/config.py +4 -176
- edsl/conversation/Conversation.py +7 -7
- edsl/conversation/car_buying.py +4 -4
- edsl/conversation/chips.py +6 -6
- edsl/coop/__init__.py +25 -2
- edsl/coop/coop.py +430 -113
- edsl/coop/{ExpectedParrotKeyHandler.py → ep_key_handling.py} +86 -10
- edsl/coop/exceptions.py +62 -0
- edsl/coop/price_fetcher.py +126 -0
- edsl/coop/utils.py +89 -24
- edsl/data_transfer_models.py +5 -72
- edsl/dataset/__init__.py +10 -0
- edsl/{results/Dataset.py → dataset/dataset.py} +116 -36
- edsl/dataset/dataset_operations_mixin.py +1492 -0
- edsl/{results/DatasetTree.py → dataset/dataset_tree.py} +156 -75
- edsl/{results/TableDisplay.py → dataset/display/table_display.py} +18 -7
- edsl/{results → dataset/display}/table_renderers.py +58 -2
- edsl/{results → dataset}/file_exports.py +4 -5
- edsl/{results → dataset}/smart_objects.py +2 -2
- edsl/enums.py +5 -205
- edsl/inference_services/__init__.py +5 -0
- edsl/inference_services/{AvailableModelCacheHandler.py → available_model_cache_handler.py} +2 -3
- edsl/inference_services/{AvailableModelFetcher.py → available_model_fetcher.py} +8 -14
- edsl/inference_services/data_structures.py +3 -2
- edsl/{exceptions/inference_services.py → inference_services/exceptions.py} +1 -1
- edsl/inference_services/{InferenceServiceABC.py → inference_service_abc.py} +1 -1
- edsl/inference_services/{InferenceServicesCollection.py → inference_services_collection.py} +8 -7
- edsl/inference_services/registry.py +4 -41
- edsl/inference_services/{ServiceAvailability.py → service_availability.py} +5 -25
- edsl/inference_services/services/__init__.py +31 -0
- edsl/inference_services/{AnthropicService.py → services/anthropic_service.py} +3 -3
- edsl/inference_services/{AwsBedrock.py → services/aws_bedrock.py} +2 -2
- edsl/inference_services/{AzureAI.py → services/azure_ai.py} +2 -2
- edsl/inference_services/{DeepInfraService.py → services/deep_infra_service.py} +1 -3
- edsl/inference_services/{DeepSeekService.py → services/deep_seek_service.py} +2 -4
- edsl/inference_services/{GoogleService.py → services/google_service.py} +5 -4
- edsl/inference_services/{GroqService.py → services/groq_service.py} +1 -1
- edsl/inference_services/{MistralAIService.py → services/mistral_ai_service.py} +3 -3
- edsl/inference_services/{OllamaService.py → services/ollama_service.py} +1 -7
- edsl/inference_services/{OpenAIService.py → services/open_ai_service.py} +5 -6
- edsl/inference_services/{PerplexityService.py → services/perplexity_service.py} +12 -12
- edsl/inference_services/{TestService.py → services/test_service.py} +7 -6
- edsl/inference_services/{TogetherAIService.py → services/together_ai_service.py} +2 -6
- edsl/inference_services/{XAIService.py → services/xai_service.py} +1 -1
- edsl/inference_services/write_available.py +1 -2
- edsl/instructions/__init__.py +6 -0
- edsl/{surveys/instructions/Instruction.py → instructions/instruction.py} +11 -6
- edsl/{surveys/instructions/InstructionCollection.py → instructions/instruction_collection.py} +10 -5
- edsl/{surveys/InstructionHandler.py → instructions/instruction_handler.py} +3 -3
- edsl/{jobs/interviews → interviews}/ReportErrors.py +2 -2
- edsl/interviews/__init__.py +4 -0
- edsl/{jobs/AnswerQuestionFunctionConstructor.py → interviews/answering_function.py} +45 -18
- edsl/{jobs/interviews/InterviewExceptionEntry.py → interviews/exception_tracking.py} +107 -22
- edsl/interviews/interview.py +638 -0
- edsl/{jobs/interviews/InterviewStatusDictionary.py → interviews/interview_status_dictionary.py} +21 -12
- edsl/{jobs/interviews/InterviewStatusLog.py → interviews/interview_status_log.py} +16 -7
- edsl/{jobs/InterviewTaskManager.py → interviews/interview_task_manager.py} +12 -7
- edsl/{jobs/RequestTokenEstimator.py → interviews/request_token_estimator.py} +8 -3
- edsl/{jobs/interviews/InterviewStatistic.py → interviews/statistics.py} +36 -10
- edsl/invigilators/__init__.py +38 -0
- edsl/invigilators/invigilator_base.py +477 -0
- edsl/{agents/Invigilator.py → invigilators/invigilators.py} +263 -10
- edsl/invigilators/prompt_constructor.py +476 -0
- edsl/{agents → invigilators}/prompt_helpers.py +2 -1
- edsl/{agents/QuestionInstructionPromptBuilder.py → invigilators/question_instructions_prompt_builder.py} +18 -13
- edsl/{agents → invigilators}/question_option_processor.py +96 -21
- edsl/{agents/QuestionTemplateReplacementsBuilder.py → invigilators/question_template_replacements_builder.py} +64 -12
- edsl/jobs/__init__.py +7 -1
- edsl/jobs/async_interview_runner.py +99 -35
- edsl/jobs/check_survey_scenario_compatibility.py +7 -5
- edsl/jobs/data_structures.py +153 -22
- edsl/{exceptions/jobs.py → jobs/exceptions.py} +2 -1
- edsl/jobs/{FetchInvigilator.py → fetch_invigilator.py} +4 -4
- edsl/jobs/{loggers/HTMLTableJobLogger.py → html_table_job_logger.py} +6 -2
- edsl/jobs/{Jobs.py → jobs.py} +321 -155
- edsl/jobs/{JobsChecks.py → jobs_checks.py} +15 -7
- edsl/jobs/{JobsComponentConstructor.py → jobs_component_constructor.py} +20 -17
- edsl/jobs/{InterviewsConstructor.py → jobs_interview_constructor.py} +10 -5
- edsl/jobs/jobs_pricing_estimation.py +347 -0
- edsl/jobs/{JobsRemoteInferenceLogger.py → jobs_remote_inference_logger.py} +4 -3
- edsl/jobs/jobs_runner_asyncio.py +282 -0
- edsl/jobs/{JobsRemoteInferenceHandler.py → remote_inference.py} +19 -22
- edsl/jobs/results_exceptions_handler.py +2 -2
- edsl/key_management/__init__.py +28 -0
- edsl/key_management/key_lookup.py +161 -0
- edsl/{language_models/key_management/KeyLookupBuilder.py → key_management/key_lookup_builder.py} +118 -47
- edsl/key_management/key_lookup_collection.py +82 -0
- edsl/key_management/models.py +218 -0
- edsl/language_models/__init__.py +7 -2
- edsl/language_models/{ComputeCost.py → compute_cost.py} +18 -3
- edsl/{exceptions/language_models.py → language_models/exceptions.py} +2 -1
- edsl/language_models/language_model.py +1080 -0
- edsl/language_models/model.py +10 -25
- edsl/language_models/{ModelList.py → model_list.py} +9 -14
- edsl/language_models/{RawResponseHandler.py → raw_response_handler.py} +1 -1
- edsl/language_models/{RegisterLanguageModelsMeta.py → registry.py} +1 -1
- edsl/language_models/repair.py +4 -4
- edsl/language_models/utilities.py +4 -4
- edsl/notebooks/__init__.py +3 -1
- edsl/notebooks/{Notebook.py → notebook.py} +7 -8
- edsl/prompts/__init__.py +1 -1
- edsl/{exceptions/prompts.py → prompts/exceptions.py} +3 -1
- edsl/prompts/{Prompt.py → prompt.py} +101 -95
- edsl/questions/HTMLQuestion.py +1 -1
- edsl/questions/__init__.py +154 -25
- edsl/questions/answer_validator_mixin.py +1 -1
- edsl/questions/compose_questions.py +4 -3
- edsl/questions/derived/question_likert_five.py +166 -0
- edsl/questions/derived/{QuestionLinearScale.py → question_linear_scale.py} +4 -4
- edsl/questions/derived/{QuestionTopK.py → question_top_k.py} +4 -4
- edsl/questions/derived/{QuestionYesNo.py → question_yes_no.py} +4 -5
- edsl/questions/descriptors.py +24 -30
- edsl/questions/loop_processor.py +65 -19
- edsl/questions/question_base.py +881 -0
- edsl/questions/question_base_gen_mixin.py +15 -16
- edsl/questions/{QuestionBasePromptsMixin.py → question_base_prompts_mixin.py} +2 -2
- edsl/questions/{QuestionBudget.py → question_budget.py} +3 -4
- edsl/questions/{QuestionCheckBox.py → question_check_box.py} +16 -16
- edsl/questions/{QuestionDict.py → question_dict.py} +39 -5
- edsl/questions/{QuestionExtract.py → question_extract.py} +9 -9
- edsl/questions/question_free_text.py +282 -0
- edsl/questions/{QuestionFunctional.py → question_functional.py} +6 -5
- edsl/questions/{QuestionList.py → question_list.py} +6 -7
- edsl/questions/{QuestionMatrix.py → question_matrix.py} +6 -5
- edsl/questions/{QuestionMultipleChoice.py → question_multiple_choice.py} +126 -21
- edsl/questions/{QuestionNumerical.py → question_numerical.py} +5 -5
- edsl/questions/{QuestionRank.py → question_rank.py} +6 -6
- edsl/questions/question_registry.py +10 -16
- edsl/questions/register_questions_meta.py +8 -4
- edsl/questions/response_validator_abc.py +17 -16
- edsl/results/__init__.py +4 -1
- edsl/{exceptions/results.py → results/exceptions.py} +1 -1
- edsl/results/report.py +197 -0
- edsl/results/{Result.py → result.py} +131 -45
- edsl/results/{Results.py → results.py} +420 -216
- edsl/results/results_selector.py +344 -25
- edsl/scenarios/__init__.py +30 -3
- edsl/scenarios/{ConstructDownloadLink.py → construct_download_link.py} +7 -0
- edsl/scenarios/directory_scanner.py +156 -13
- edsl/scenarios/document_chunker.py +186 -0
- edsl/scenarios/exceptions.py +101 -0
- edsl/scenarios/file_methods.py +2 -3
- edsl/scenarios/file_store.py +755 -0
- edsl/scenarios/handlers/__init__.py +14 -14
- edsl/scenarios/handlers/{csv.py → csv_file_store.py} +1 -2
- edsl/scenarios/handlers/{docx.py → docx_file_store.py} +8 -7
- edsl/scenarios/handlers/{html.py → html_file_store.py} +1 -2
- edsl/scenarios/handlers/{jpeg.py → jpeg_file_store.py} +1 -1
- edsl/scenarios/handlers/{json.py → json_file_store.py} +1 -1
- edsl/scenarios/handlers/latex_file_store.py +5 -0
- edsl/scenarios/handlers/{md.py → md_file_store.py} +1 -1
- edsl/scenarios/handlers/{pdf.py → pdf_file_store.py} +2 -2
- edsl/scenarios/handlers/{png.py → png_file_store.py} +1 -1
- edsl/scenarios/handlers/{pptx.py → pptx_file_store.py} +8 -7
- edsl/scenarios/handlers/{py.py → py_file_store.py} +1 -3
- edsl/scenarios/handlers/{sql.py → sql_file_store.py} +2 -1
- edsl/scenarios/handlers/{sqlite.py → sqlite_file_store.py} +2 -3
- edsl/scenarios/handlers/{txt.py → txt_file_store.py} +1 -1
- edsl/scenarios/scenario.py +928 -0
- edsl/scenarios/scenario_join.py +18 -5
- edsl/scenarios/{ScenarioList.py → scenario_list.py} +424 -106
- edsl/scenarios/{ScenarioListPdfMixin.py → scenario_list_pdf_tools.py} +16 -15
- edsl/scenarios/scenario_selector.py +5 -1
- edsl/study/ObjectEntry.py +2 -2
- edsl/study/SnapShot.py +5 -5
- edsl/study/Study.py +20 -21
- edsl/study/__init__.py +6 -4
- edsl/surveys/__init__.py +7 -4
- edsl/surveys/dag/__init__.py +2 -0
- edsl/surveys/{ConstructDAG.py → dag/construct_dag.py} +3 -3
- edsl/surveys/{DAG.py → dag/dag.py} +13 -10
- edsl/surveys/descriptors.py +1 -1
- edsl/surveys/{EditSurvey.py → edit_survey.py} +9 -9
- edsl/{exceptions/surveys.py → surveys/exceptions.py} +1 -2
- edsl/surveys/memory/__init__.py +3 -0
- edsl/surveys/{MemoryPlan.py → memory/memory_plan.py} +10 -9
- edsl/surveys/rules/__init__.py +3 -0
- edsl/surveys/{Rule.py → rules/rule.py} +103 -43
- edsl/surveys/{RuleCollection.py → rules/rule_collection.py} +21 -30
- edsl/surveys/{RuleManager.py → rules/rule_manager.py} +19 -13
- edsl/surveys/survey.py +1743 -0
- edsl/surveys/{SurveyExportMixin.py → survey_export.py} +22 -27
- edsl/surveys/{SurveyFlowVisualization.py → survey_flow_visualization.py} +11 -2
- edsl/surveys/{Simulator.py → survey_simulator.py} +10 -3
- edsl/tasks/__init__.py +32 -0
- edsl/{jobs/tasks/QuestionTaskCreator.py → tasks/question_task_creator.py} +115 -57
- edsl/tasks/task_creators.py +135 -0
- edsl/{jobs/tasks/TaskHistory.py → tasks/task_history.py} +86 -47
- edsl/{jobs/tasks → tasks}/task_status_enum.py +91 -7
- edsl/tasks/task_status_log.py +85 -0
- edsl/tokens/__init__.py +2 -0
- edsl/tokens/interview_token_usage.py +53 -0
- edsl/utilities/PrettyList.py +1 -1
- edsl/utilities/SystemInfo.py +25 -22
- edsl/utilities/__init__.py +29 -21
- edsl/utilities/gcp_bucket/__init__.py +2 -0
- edsl/utilities/gcp_bucket/cloud_storage.py +99 -96
- edsl/utilities/interface.py +44 -536
- edsl/{results/MarkdownToPDF.py → utilities/markdown_to_pdf.py} +13 -5
- edsl/utilities/repair_functions.py +1 -1
- {edsl-0.1.46.dist-info → edsl-0.1.48.dist-info}/METADATA +3 -2
- edsl-0.1.48.dist-info/RECORD +347 -0
- edsl/Base.py +0 -426
- edsl/BaseDiff.py +0 -260
- edsl/agents/InvigilatorBase.py +0 -260
- edsl/agents/PromptConstructor.py +0 -318
- edsl/auto/AutoStudy.py +0 -130
- edsl/auto/StageBase.py +0 -243
- edsl/auto/StageGenerateSurvey.py +0 -178
- edsl/auto/StageLabelQuestions.py +0 -125
- edsl/auto/StagePersona.py +0 -61
- edsl/auto/StagePersonaDimensionValueRanges.py +0 -88
- edsl/auto/StagePersonaDimensionValues.py +0 -74
- edsl/auto/StagePersonaDimensions.py +0 -69
- edsl/auto/StageQuestions.py +0 -74
- edsl/auto/SurveyCreatorPipeline.py +0 -21
- edsl/auto/utilities.py +0 -218
- edsl/base/Base.py +0 -279
- edsl/coop/PriceFetcher.py +0 -54
- edsl/data/Cache.py +0 -580
- edsl/data/CacheEntry.py +0 -230
- edsl/data/SQLiteDict.py +0 -292
- edsl/data/__init__.py +0 -5
- edsl/data/orm.py +0 -10
- edsl/exceptions/cache.py +0 -5
- edsl/exceptions/coop.py +0 -14
- edsl/exceptions/data.py +0 -14
- edsl/exceptions/scenarios.py +0 -29
- edsl/jobs/Answers.py +0 -43
- edsl/jobs/JobsPrompts.py +0 -354
- edsl/jobs/buckets/BucketCollection.py +0 -134
- edsl/jobs/buckets/ModelBuckets.py +0 -65
- edsl/jobs/buckets/TokenBucket.py +0 -283
- edsl/jobs/buckets/TokenBucketClient.py +0 -191
- edsl/jobs/interviews/Interview.py +0 -395
- edsl/jobs/interviews/InterviewExceptionCollection.py +0 -99
- edsl/jobs/interviews/InterviewStatisticsCollection.py +0 -25
- edsl/jobs/runners/JobsRunnerAsyncio.py +0 -163
- edsl/jobs/runners/JobsRunnerStatusData.py +0 -0
- edsl/jobs/tasks/TaskCreators.py +0 -64
- edsl/jobs/tasks/TaskStatusLog.py +0 -23
- edsl/jobs/tokens/InterviewTokenUsage.py +0 -27
- edsl/language_models/LanguageModel.py +0 -635
- edsl/language_models/ServiceDataSources.py +0 -0
- edsl/language_models/key_management/KeyLookup.py +0 -63
- edsl/language_models/key_management/KeyLookupCollection.py +0 -38
- edsl/language_models/key_management/models.py +0 -137
- edsl/questions/QuestionBase.py +0 -539
- edsl/questions/QuestionFreeText.py +0 -130
- edsl/questions/derived/QuestionLikertFive.py +0 -76
- edsl/results/DatasetExportMixin.py +0 -911
- edsl/results/ResultsExportMixin.py +0 -45
- edsl/results/TextEditor.py +0 -50
- edsl/results/results_fetch_mixin.py +0 -33
- edsl/results/results_tools_mixin.py +0 -98
- edsl/scenarios/DocumentChunker.py +0 -104
- edsl/scenarios/FileStore.py +0 -564
- edsl/scenarios/Scenario.py +0 -548
- edsl/scenarios/ScenarioHtmlMixin.py +0 -65
- edsl/scenarios/ScenarioListExportMixin.py +0 -45
- edsl/scenarios/handlers/latex.py +0 -5
- edsl/shared.py +0 -1
- edsl/surveys/Survey.py +0 -1306
- edsl/surveys/SurveyQualtricsImport.py +0 -284
- edsl/surveys/SurveyToApp.py +0 -141
- edsl/surveys/instructions/__init__.py +0 -0
- edsl/tools/__init__.py +0 -1
- edsl/tools/clusters.py +0 -192
- edsl/tools/embeddings.py +0 -27
- edsl/tools/embeddings_plotting.py +0 -118
- edsl/tools/plotting.py +0 -112
- edsl/tools/summarize.py +0 -18
- edsl/utilities/data/Registry.py +0 -6
- edsl/utilities/data/__init__.py +0 -1
- edsl/utilities/data/scooter_results.json +0 -1
- edsl-0.1.46.dist-info/RECORD +0 -366
- /edsl/coop/{CoopFunctionsMixin.py → coop_functions.py} +0 -0
- /edsl/{results → dataset/display}/CSSParameterizer.py +0 -0
- /edsl/{language_models/key_management → dataset/display}/__init__.py +0 -0
- /edsl/{results → dataset/display}/table_data_class.py +0 -0
- /edsl/{results → dataset/display}/table_display.css +0 -0
- /edsl/{results/ResultsGGMixin.py → dataset/r/ggplot.py} +0 -0
- /edsl/{results → dataset}/tree_explore.py +0 -0
- /edsl/{surveys/instructions/ChangeInstruction.py → instructions/change_instruction.py} +0 -0
- /edsl/{jobs/interviews → interviews}/interview_status_enum.py +0 -0
- /edsl/jobs/{runners/JobsRunnerStatus.py → jobs_runner_status.py} +0 -0
- /edsl/language_models/{PriceManager.py → price_manager.py} +0 -0
- /edsl/language_models/{fake_openai_call.py → unused/fake_openai_call.py} +0 -0
- /edsl/language_models/{fake_openai_service.py → unused/fake_openai_service.py} +0 -0
- /edsl/notebooks/{NotebookToLaTeX.py → notebook_to_latex.py} +0 -0
- /edsl/{exceptions/questions.py → questions/exceptions.py} +0 -0
- /edsl/questions/{SimpleAskMixin.py → simple_ask_mixin.py} +0 -0
- /edsl/surveys/{Memory.py → memory/memory.py} +0 -0
- /edsl/surveys/{MemoryManagement.py → memory/memory_management.py} +0 -0
- /edsl/surveys/{SurveyCSS.py → survey_css.py} +0 -0
- /edsl/{jobs/tokens/TokenUsage.py → tokens/token_usage.py} +0 -0
- /edsl/{results/MarkdownToDocx.py → utilities/markdown_to_docx.py} +0 -0
- /edsl/{TemplateLoader.py → utilities/template_loader.py} +0 -0
- {edsl-0.1.46.dist-info → edsl-0.1.48.dist-info}/LICENSE +0 -0
- {edsl-0.1.46.dist-info → edsl-0.1.48.dist-info}/WHEEL +0 -0
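Most of this release is a repackaging: CamelCase module files (Jobs.py, ScenarioList.py, LanguageModel.py, ...) become snake_case modules grouped into new subpackages such as `base`, `buckets`, `caching`, `interviews`, `invigilators`, `key_management`, `tasks`, and `tokens`. The hunks below show the corresponding import and docstring changes in the `edsl/jobs` package. As a rough orientation, here is a minimal sketch that uses only import paths and calls appearing verbatim in the doctests further down; it is illustrative and not verified against the released wheel:

```python
# Import paths taken from the doctests in the diff below (0.1.48 layout).
from edsl.jobs import Jobs
from edsl.surveys import Survey

# Both constructions appear in the doctests shown further down.
job = Jobs(survey=Survey.example())
example_job = Jobs.example()

# prompts() returns a Dataset of prompts with per-question cost estimates.
print(example_job.prompts())
```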
edsl/jobs/{JobsChecks.py → jobs_checks.py}
@@ -1,8 +1,16 @@
+"""
+Checks a Jobs object for missing API keys and other requirements.
+"""
+
 import os
 from edsl.exceptions.general import MissingAPIKeyError


 class JobsChecks:
+    """
+    Checks a Jobs object for missing API keys and other requirements.
+    """
+
     def __init__(self, jobs):
         """Checks a Jobs object for missing API keys and other requirements."""
         self.jobs = jobs
@@ -42,9 +50,7 @@ class JobsChecks:

     def user_has_ep_api_key(self) -> bool:
         """
-
-
-        Otherwise, returns False.
+        Does the user have an EXPECTED_PARROT_API_KEY in their env?
         """

         coop_api_key = os.getenv("EXPECTED_PARROT_API_KEY")
@@ -54,9 +60,9 @@ class JobsChecks:
         else:
             return False

-    def user_has_all_model_keys(self):
+    def user_has_all_model_keys(self) -> bool:
         """
-
+        Does the user have all the model keys required to run their job?

         Otherwise, returns False.
         """
@@ -71,7 +77,7 @@ class JobsChecks:

     def needs_external_llms(self) -> bool:
         """
-
+        Does the job need external LLMs to run?

         Otherwise, returns False.
         """
@@ -99,8 +105,10 @@ class JobsChecks:
         else:
             return True

-    def needs_key_process(self):
+    def needs_key_process(self) -> bool:
         """
+        Determines if the user needs to go through the key process.
+
         A User needs the key process when:
         1. They don't have all the model keys
         2. They don't have the EP API
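The hunks above mainly add docstrings and `-> bool` annotations to the `JobsChecks` predicates. A minimal usage sketch, assuming `JobsChecks` is importable from the renamed module and reusing `Jobs.example()` from the doctests elsewhere in this diff (the import path is inferred from the rename, not verified):

```python
from edsl.jobs import Jobs
from edsl.jobs.jobs_checks import JobsChecks  # path assumed from the rename above

checks = JobsChecks(Jobs.example())

# Each predicate now advertises a bool return, per the added type hints.
print(checks.user_has_ep_api_key())      # EXPECTED_PARROT_API_KEY set in the env?
print(checks.user_has_all_model_keys())  # keys for every model the job uses?
print(checks.needs_external_llms())      # does the job need external LLMs at all?
print(checks.needs_key_process())        # missing model keys and no EP key?
```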
edsl/jobs/{JobsComponentConstructor.py → jobs_component_constructor.py}
@@ -1,11 +1,11 @@
 from typing import Union, Sequence, TYPE_CHECKING

 if TYPE_CHECKING:
-    from
-    from
-    from
-    from
-
+    from ..agents import Agent
+    from ..language_models import LanguageModel
+    from ..scenarios import Scenario
+    from .jobs import Jobs
+    from ..invigilators import InvigilatorBase

 class JobsComponentConstructor:
     "Handles the creation of Agents, Scenarios, and LanguageModels in a job."
@@ -50,7 +50,8 @@ class JobsComponentConstructor:
         - scenarios: traits of new scenarios are combined with traits of old existing. New scenarios will overwrite overlapping traits, and do not increase the number of scenarios in the instance
         - models: new models overwrite old models.
         """
-
+
+        from ..dataset.dataset import Dataset

         if isinstance(
             args[0], Dataset
@@ -107,9 +108,10 @@ class JobsComponentConstructor:
     def _get_current_objects_of_this_type(
         self, object: Union["Agent", "Scenario", "LanguageModel"]
     ) -> tuple[list, str]:
-
-        from
-        from
+
+        from ..agents import Agent
+        from ..scenarios import Scenario
+        from ..language_models import LanguageModel

         """Return the current objects of the same type as the first argument.

@@ -138,8 +140,8 @@ class JobsComponentConstructor:

     @staticmethod
     def _get_empty_container_object(object):
-        from edsl.agents
-        from edsl.scenarios
+        from edsl.agents import AgentList
+        from edsl.scenarios import ScenarioList

         return {"Agent": AgentList([]), "Scenario": ScenarioList([])}.get(
             object.__class__.__name__, []
@@ -153,7 +155,8 @@ class JobsComponentConstructor:
         For example, if the user passes in 3 agents,
         and there are 2 existing agents, this will create 6 new agents
         >>> from edsl.jobs import Jobs
-        >>>
+        >>> from edsl.surveys import Survey
+        >>> JobsComponentConstructor(Jobs(survey = Survey.example()))._merge_objects([1,2,3], [4,5,6])
         [5, 6, 7, 6, 7, 8, 7, 8, 9]
         """
         new_objects = JobsComponentConstructor._get_empty_container_object(
@@ -166,11 +169,11 @@ class JobsComponentConstructor:

     @staticmethod
     def _get_container_class(object):
-        from
-        from
-        from
-        from
-        from
+        from ..agents import AgentList
+        from ..agents import Agent
+        from ..scenarios import Scenario
+        from ..scenarios import ScenarioList
+        from ..language_models import ModelList

         if isinstance(object, Agent):
             return AgentList
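The restored doctest above pins down what `_merge_objects` does: each passed object is combined with each existing object, so 3 incoming agents against 2 existing agents yield 6, and for the integer example the combination is plain addition over the Cartesian product. A standalone sketch of that combination rule (not the edsl implementation, just the arithmetic the doctest implies):

```python
from itertools import product

def merge_objects(passed, existing):
    # Combine every passed object with every existing one; for the integer
    # doctest the "combination" reduces to addition.
    return [a + b for a, b in product(passed, existing)]

print(merge_objects([1, 2, 3], [4, 5, 6]))
# [5, 6, 7, 6, 7, 8, 7, 8, 9]  (matches the doctest output above)
```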
edsl/jobs/{InterviewsConstructor.py → jobs_interview_constructor.py}
@@ -2,8 +2,9 @@ from typing import Generator, TYPE_CHECKING
 from itertools import product

 if TYPE_CHECKING:
-    from
-
+    from ..interviews import Interview
+    from .jobs import Jobs
+    from ..caching import Cache

 class InterviewsConstructor:
     def __init__(self, jobs: "Jobs", cache: "Cache"):
@@ -12,14 +13,14 @@ class InterviewsConstructor:

     def create_interviews(self) -> Generator["Interview", None, None]:
         """
-
+        Generates interviews.

         Note that this sets the agents, model and scenarios if they have not been set. This is a side effect of the method.
         This is useful because a user can create a job without setting the agents, models, or scenarios, and the job will still run,
         with us filling in defaults.

         """
-        from
+        from ..interviews import Interview

         agent_index = {
             hash(agent): index for index, agent in enumerate(self.jobs.agents)
@@ -35,7 +36,7 @@ class InterviewsConstructor:
             self.jobs.agents, self.jobs.scenarios, self.jobs.models
         ):
             yield Interview(
-                survey=self.jobs.survey.draw(),
+                survey=self.jobs.survey.draw(),  # this draw is to support shuffling of question options
                 agent=agent,
                 scenario=scenario,
                 model=model,
@@ -48,3 +49,7 @@
                     "scenario": scenario_index[hash(scenario)],
                 },
             )
+
+if __name__ == "__main__":
+    import doctest
+    doctest.testmod()
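`create_interviews` above walks `product(self.jobs.agents, self.jobs.scenarios, self.jobs.models)` and yields one `Interview` per combination, recording the index of the agent and scenario via hash lookups. A minimal sketch of that fan-out pattern using plain dictionaries instead of `Interview` objects (illustrative only; the real constructor also takes the survey, cache, and more):

```python
from itertools import product

agents = ["agent_a", "agent_b"]
scenarios = ["scenario_1", "scenario_2", "scenario_3"]
models = ["model_x"]

# Hash-based index lookups, mirroring the constructor above.
agent_index = {hash(a): i for i, a in enumerate(agents)}
scenario_index = {hash(s): i for i, s in enumerate(scenarios)}

interviews = [
    {
        "agent": agent,
        "scenario": scenario,
        "model": model,
        "indices": {
            "agent": agent_index[hash(agent)],
            "scenario": scenario_index[hash(scenario)],
        },
    }
    for agent, scenario, model in product(agents, scenarios, models)
]
print(len(interviews))  # 2 agents x 3 scenarios x 1 model = 6 combinations
```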
edsl/jobs/jobs_pricing_estimation.py (new file)
@@ -0,0 +1,347 @@
+import logging
+import math
+
+from typing import List, TYPE_CHECKING
+
+if TYPE_CHECKING:
+    from .jobs import Jobs
+    from ..agents import AgentList
+    from ..scenarios import ScenarioList
+    from ..surveys import Survey
+    from .interviews.Interview import Interview
+
+from .fetch_invigilator import FetchInvigilator
+from ..caching import CacheEntry
+from ..dataset import Dataset
+
+logger = logging.getLogger(__name__)
+
+
+class PromptCostEstimator:
+
+    DEFAULT_INPUT_PRICE_PER_TOKEN = 0.000001
+    DEFAULT_OUTPUT_PRICE_PER_TOKEN = 0.000001
+    CHARS_PER_TOKEN = 4
+    OUTPUT_TOKENS_PER_INPUT_TOKEN = 0.75
+    PIPING_MULTIPLIER = 2
+
+    def __init__(self,
+                 system_prompt: str,
+                 user_prompt: str,
+                 price_lookup: dict,
+                 inference_service: str,
+                 model: str):
+        self.system_prompt = system_prompt
+        self.user_prompt = user_prompt
+        self.price_lookup = price_lookup
+        self.inference_service = inference_service
+        self.model = model
+
+    @staticmethod
+    def get_piping_multiplier(prompt: str):
+        """Returns 2 if a prompt includes Jinja braces, and 1 otherwise."""
+
+        if "{{" in prompt and "}}" in prompt:
+            return PromptCostEstimator.PIPING_MULTIPLIER
+        return 1
+
+    @property
+    def key(self):
+        return (self.inference_service, self.model)
+
+    @property
+    def relevant_prices(self):
+        try:
+            return self.price_lookup[self.key]
+        except KeyError:
+            return {}
+
+    def input_price_per_token(self):
+        try:
+            return self.relevant_prices["input"]["service_stated_token_price"] / self.relevant_prices["input"]["service_stated_token_qty"]
+        except KeyError:
+            import warnings
+            warnings.warn(
+                "Price data could not be retrieved. Using default estimates for input and output token prices. Input: $1.00 / 1M tokens; Output: $1.00 / 1M tokens"
+            )
+            return self.DEFAULT_INPUT_PRICE_PER_TOKEN
+
+    def output_price_per_token(self):
+        try:
+            return self.relevant_prices["output"]["service_stated_token_price"] / self.relevant_prices["output"]["service_stated_token_qty"]
+        except KeyError:
+            return self.DEFAULT_OUTPUT_PRICE_PER_TOKEN
+
+    def __call__(self):
+        user_prompt_chars = len(str(self.user_prompt)) * self.get_piping_multiplier(
+            str(self.user_prompt)
+        )
+        system_prompt_chars = len(str(self.system_prompt)) * self.get_piping_multiplier(
+            str(self.system_prompt)
+        )
+        # Convert into tokens (1 token approx. equals 4 characters)
+        input_tokens = (user_prompt_chars + system_prompt_chars) // self.CHARS_PER_TOKEN
+        output_tokens = math.ceil(self.OUTPUT_TOKENS_PER_INPUT_TOKEN * input_tokens)
+
+        cost = (
+            input_tokens * self.input_price_per_token()
+            + output_tokens * self.output_price_per_token()
+        )
+        return {
+            "input_tokens": input_tokens,
+            "output_tokens": output_tokens,
+            "cost_usd": cost,
+        }
+
+
+class JobsPrompts:
+
+    relevant_keys = ["user_prompt", "system_prompt", "interview_index", "question_name", "scenario_index", "agent_index", "model", "estimated_cost", "cache_keys"]
+
+    """This generates the prompts for a job for price estimation purposes.
+
+    It does *not* do the full job execution---that requires an LLM.
+    So assumptions are made about expansion of Jinja braces, etc.
+    """
+
+
+    @classmethod
+    def from_jobs(cls, jobs: "Jobs"):
+        """Construct a JobsPrompts object from a Jobs object."""
+        interviews = jobs.interviews()
+        agents = jobs.agents
+        scenarios = jobs.scenarios
+        survey = jobs.survey
+        return cls(
+            interviews=interviews,
+            agents=agents,
+            scenarios=scenarios,
+            survey=survey
+        )
+
+    def __init__(self, interviews: List['Interview'], agents: 'AgentList', scenarios: 'ScenarioList', survey: 'Survey'):
+        """Initialize with extracted components rather than a Jobs object."""
+        self.interviews = interviews
+        self.agents = agents
+        self.scenarios = scenarios
+        self.survey = survey
+        self._price_lookup = None
+
+        self._agent_lookup = {agent: idx for idx, agent in enumerate(self.agents)}
+        self._scenario_lookup = {
+            scenario: idx for idx, scenario in enumerate(self.scenarios)
+        }
+
+    @property
+    def price_lookup(self) -> dict:
+        """Fetches the price lookup from Coop if it is not already cached."""
+        if self._price_lookup is None:
+            from edsl.coop.coop import Coop
+
+            c = Coop()
+            self._price_lookup = c.fetch_prices()
+        return self._price_lookup
+
+    def _process_one_invigilator(self, invigilator: 'Invigilator', interview_index: int, iterations: int = 1) -> dict:
+        """Process a single invigilator and return a dictionary with all needed data fields."""
+        prompts = invigilator.get_prompts()
+        user_prompt = prompts["user_prompt"]
+        system_prompt = prompts["system_prompt"]
+
+        agent_index = self._agent_lookup[invigilator.agent]
+        scenario_index = self._scenario_lookup[invigilator.scenario]
+        model = invigilator.model.model
+        question_name = invigilator.question.question_name
+
+        # Calculate prompt cost
+        prompt_cost = self.estimate_prompt_cost(
+            system_prompt=system_prompt,
+            user_prompt=user_prompt,
+            price_lookup=self.price_lookup,
+            inference_service=invigilator.model._inference_service_,
+            model=model,
+        )
+        cost = prompt_cost["cost_usd"]
+
+        # Generate cache keys for each iteration
+        cache_keys = []
+        for iteration in range(iterations):
+            cache_key = CacheEntry.gen_key(
+                model=model,
+                parameters=invigilator.model.parameters,
+                system_prompt=system_prompt,
+                user_prompt=user_prompt,
+                iteration=iteration,
+            )
+            cache_keys.append(cache_key)
+
+        d = {
+            "user_prompt": user_prompt,
+            "system_prompt": system_prompt,
+            "interview_index": interview_index,
+            "question_name": question_name,
+            "scenario_index": scenario_index,
+            "agent_index": agent_index,
+            "model": model,
+            "estimated_cost": cost,
+            "cache_keys": cache_keys,
+        }
+        assert list(d.keys()) == self.relevant_keys
+        return d
+
+    def prompts(self, iterations=1) -> "Dataset":
+        """Return a Dataset of prompts that will be used.
+
+        >>> from edsl.jobs import Jobs
+        >>> Jobs.example().prompts()
+        Dataset(...)
+        """
+        dataset_of_prompts = {k: [] for k in self.relevant_keys}
+
+        interviews = self.interviews
+
+        # Process each interview and invigilator
+        for interview_index, interview in enumerate(interviews):
+            invigilators = [
+                FetchInvigilator(interview)(question)
+                for question in interview.survey.questions
+            ]
+
+            for invigilator in invigilators:
+                # Process the invigilator and get all data as a dictionary
+                data = self._process_one_invigilator(invigilator, interview_index, iterations)
+                for k in self.relevant_keys:
+                    dataset_of_prompts[k].append(data[k])
+
+        return Dataset([{k: dataset_of_prompts[k]} for k in self.relevant_keys])
+
+    @staticmethod
+    def estimate_prompt_cost(
+        system_prompt: str,
+        user_prompt: str,
+        price_lookup: dict,
+        inference_service: str,
+        model: str,
+    ) -> dict:
+        """Estimates the cost of a prompt, taking piping into account."""
+        return PromptCostEstimator(
+            system_prompt=system_prompt,
+            user_prompt=user_prompt,
+            price_lookup=price_lookup,
+            inference_service=inference_service,
+            model=model
+        )()
+
+    @staticmethod
+    def _extract_prompt_details(invigilator: FetchInvigilator) -> dict:
+        """Extracts the prompt details from the invigilator.
+
+        >>> from edsl.invigilators import InvigilatorAI
+        >>> invigilator = InvigilatorAI.example()
+        >>> JobsPrompts._extract_prompt_details(invigilator)
+        {'user_prompt': ...
+        """
+        prompts = invigilator.get_prompts()
+        user_prompt = prompts["user_prompt"]
+        system_prompt = prompts["system_prompt"]
+        inference_service = invigilator.model._inference_service_
+        model = invigilator.model.model
+        return {
+            "user_prompt": user_prompt,
+            "system_prompt": system_prompt,
+            "inference_service": inference_service,
+            "model": model,
+        }
+
+    def estimate_job_cost_from_external_prices(
+        self, price_lookup: dict, iterations: int = 1
+    ) -> dict:
+        """
+        Estimates the cost of a job.
+
+        :param price_lookup: An external pricing dictionary.
+        :param iterations: The number of times to iterate over the job.
+
+        Key assumptions:
+        - 1 token = 4 characters.
+        - For each prompt, output tokens = input tokens * 0.75, rounded up to the nearest integer.
+        """
+        interviews = self.interviews
+        data = []
+        for interview in interviews:
+            invigilators = [
+                FetchInvigilator(interview)(question)
+                for question in self.survey.questions
+            ]
+            for invigilator in invigilators:
+                prompt_details = self._extract_prompt_details(invigilator)
+                prompt_cost = self.estimate_prompt_cost(**prompt_details, price_lookup=price_lookup)
+                price_estimates = {
+                    'estimated_input_tokens': prompt_cost['input_tokens'],
+                    'estimated_output_tokens': prompt_cost['output_tokens'],
+                    'estimated_cost_usd': prompt_cost['cost_usd']
+                }
+                data.append({**price_estimates, **prompt_details})
+
+        model_groups = {}
+        for item in data:
+            key = (item["inference_service"], item["model"])
+            if key not in model_groups:
+                model_groups[key] = {
+                    "inference_service": item["inference_service"],
+                    "model": item["model"],
+                    "estimated_cost_usd": 0,
+                    "estimated_input_tokens": 0,
+                    "estimated_output_tokens": 0
+                }
+
+            # Accumulate values
+            model_groups[key]["estimated_cost_usd"] += item["estimated_cost_usd"]
+            model_groups[key]["estimated_input_tokens"] += item["estimated_input_tokens"]
+            model_groups[key]["estimated_output_tokens"] += item["estimated_output_tokens"]
+
+        # Apply iterations and convert to list
+        estimated_costs_by_model = []
+        for group_data in model_groups.values():
+            group_data["estimated_cost_usd"] *= iterations
+            group_data["estimated_input_tokens"] *= iterations
+            group_data["estimated_output_tokens"] *= iterations
+            estimated_costs_by_model.append(group_data)
+
+        # Calculate totals
+        estimated_total_cost = sum(
+            model["estimated_cost_usd"] for model in estimated_costs_by_model
+        )
+        estimated_total_input_tokens = sum(
+            model["estimated_input_tokens"] for model in estimated_costs_by_model
+        )
+        estimated_total_output_tokens = sum(
+            model["estimated_output_tokens"] for model in estimated_costs_by_model
+        )
+
+        output = {
+            "estimated_total_cost_usd": estimated_total_cost,
+            "estimated_total_input_tokens": estimated_total_input_tokens,
+            "estimated_total_output_tokens": estimated_total_output_tokens,
+            "model_costs": estimated_costs_by_model,
+        }
+
+        return output
+
+    def estimate_job_cost(self, iterations: int = 1) -> dict:
+        """
+        Estimates the cost of a job according to the following assumptions:
+
+        - 1 token = 4 characters.
+        - For each prompt, output tokens = input tokens * 0.75, rounded up to the nearest integer.
+
+        Fetches prices from Coop.
+        """
+        return self.estimate_job_cost_from_external_prices(
+            price_lookup=self.price_lookup, iterations=iterations
+        )
+
+
+if __name__ == "__main__":
+    import doctest
+    doctest.testmod(optionflags=doctest.ELLIPSIS)
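The new `PromptCostEstimator` boils down to fixed-ratio arithmetic: prompt characters are doubled when Jinja `{{ }}` braces are present (piping), divided by 4 to approximate input tokens, output tokens are estimated as 0.75 times input tokens rounded up, and each side is priced per token, falling back to $1.00 per 1M tokens when no price data is available. A worked example of those numbers, written independently of the class above:

```python
import math

user_prompt = "What is your favorite {{ item }}?"      # contains piping braces
system_prompt = "You are answering survey questions."  # no braces

user_chars = len(user_prompt) * 2      # piping multiplier 2 -> 33 * 2 = 66
system_chars = len(system_prompt) * 1  # 35
input_tokens = (user_chars + system_chars) // 4  # 101 // 4 = 25
output_tokens = math.ceil(0.75 * input_tokens)   # ceil(18.75) = 19

fallback_price = 0.000001  # the default $1.00 / 1M tokens used above
cost_usd = input_tokens * fallback_price + output_tokens * fallback_price
print(input_tokens, output_tokens, cost_usd)  # 25 19 ~4.4e-05
```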
edsl/jobs/{JobsRemoteInferenceLogger.py → jobs_remote_inference_logger.py}
@@ -5,12 +5,13 @@ from abc import ABC, abstractmethod
 from typing import Optional, Union, Literal, TYPE_CHECKING, List, Dict
 from datetime import datetime
 from dataclasses import dataclass
-from edsl.exceptions.coop import CoopServerResponseError

-from
+from ..coop import CoopServerResponseError
+
+from .jobs_status_enums import JobsStatus

 if TYPE_CHECKING:
-    from
+    from ..results import Results


 @dataclass
|