PyPI - edsl - Versions diffs - 0.1.14__py3-none-any.whl → 0.1.40__py3-none-any.whl - Mend

edsl 0.1.14 (py3-none-any.whl) → 0.1.40 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (407) hide show

edsl/Base.py +348 -38
edsl/BaseDiff.py +260 -0
edsl/TemplateLoader.py +24 -0
edsl/__init__.py +46 -10
edsl/__version__.py +1 -0
edsl/agents/Agent.py +842 -144
edsl/agents/AgentList.py +521 -25
edsl/agents/Invigilator.py +250 -374
edsl/agents/InvigilatorBase.py +257 -0
edsl/agents/PromptConstructor.py +272 -0
edsl/agents/QuestionInstructionPromptBuilder.py +128 -0
edsl/agents/QuestionTemplateReplacementsBuilder.py +137 -0
edsl/agents/descriptors.py +43 -13
edsl/agents/prompt_helpers.py +129 -0
edsl/agents/question_option_processor.py +172 -0
edsl/auto/AutoStudy.py +130 -0
edsl/auto/StageBase.py +243 -0
edsl/auto/StageGenerateSurvey.py +178 -0
edsl/auto/StageLabelQuestions.py +125 -0
edsl/auto/StagePersona.py +61 -0
edsl/auto/StagePersonaDimensionValueRanges.py +88 -0
edsl/auto/StagePersonaDimensionValues.py +74 -0
edsl/auto/StagePersonaDimensions.py +69 -0
edsl/auto/StageQuestions.py +74 -0
edsl/auto/SurveyCreatorPipeline.py +21 -0
edsl/auto/utilities.py +218 -0
edsl/base/Base.py +279 -0
edsl/config.py +121 -104
edsl/conversation/Conversation.py +290 -0
edsl/conversation/car_buying.py +59 -0
edsl/conversation/chips.py +95 -0
edsl/conversation/mug_negotiation.py +81 -0
edsl/conversation/next_speaker_utilities.py +93 -0
edsl/coop/CoopFunctionsMixin.py +15 -0
edsl/coop/ExpectedParrotKeyHandler.py +125 -0
edsl/coop/PriceFetcher.py +54 -0
edsl/coop/__init__.py +1 -0
edsl/coop/coop.py +1029 -134
edsl/coop/utils.py +131 -0
edsl/data/Cache.py +560 -89
edsl/data/CacheEntry.py +230 -0
edsl/data/CacheHandler.py +168 -0
edsl/data/RemoteCacheSync.py +186 -0
edsl/data/SQLiteDict.py +292 -0
edsl/data/__init__.py +5 -3
edsl/data/orm.py +6 -33
edsl/data_transfer_models.py +74 -27
edsl/enums.py +165 -8
edsl/exceptions/BaseException.py +21 -0
edsl/exceptions/__init__.py +52 -46
edsl/exceptions/agents.py +33 -15
edsl/exceptions/cache.py +5 -0
edsl/exceptions/coop.py +8 -0
edsl/exceptions/general.py +34 -0
edsl/exceptions/inference_services.py +5 -0
edsl/exceptions/jobs.py +15 -0
edsl/exceptions/language_models.py +46 -1
edsl/exceptions/questions.py +80 -5
edsl/exceptions/results.py +16 -5
edsl/exceptions/scenarios.py +29 -0
edsl/exceptions/surveys.py +13 -10
edsl/inference_services/AnthropicService.py +106 -0
edsl/inference_services/AvailableModelCacheHandler.py +184 -0
edsl/inference_services/AvailableModelFetcher.py +215 -0
edsl/inference_services/AwsBedrock.py +118 -0
edsl/inference_services/AzureAI.py +215 -0
edsl/inference_services/DeepInfraService.py +18 -0
edsl/inference_services/GoogleService.py +143 -0
edsl/inference_services/GroqService.py +20 -0
edsl/inference_services/InferenceServiceABC.py +80 -0
edsl/inference_services/InferenceServicesCollection.py +138 -0
edsl/inference_services/MistralAIService.py +120 -0
edsl/inference_services/OllamaService.py +18 -0
edsl/inference_services/OpenAIService.py +236 -0
edsl/inference_services/PerplexityService.py +160 -0
edsl/inference_services/ServiceAvailability.py +135 -0
edsl/inference_services/TestService.py +90 -0
edsl/inference_services/TogetherAIService.py +172 -0
edsl/inference_services/data_structures.py +134 -0
edsl/inference_services/models_available_cache.py +118 -0
edsl/inference_services/rate_limits_cache.py +25 -0
edsl/inference_services/registry.py +41 -0
edsl/inference_services/write_available.py +10 -0
edsl/jobs/AnswerQuestionFunctionConstructor.py +223 -0
edsl/jobs/Answers.py +21 -20
edsl/jobs/FetchInvigilator.py +47 -0
edsl/jobs/InterviewTaskManager.py +98 -0
edsl/jobs/InterviewsConstructor.py +50 -0
edsl/jobs/Jobs.py +684 -204
edsl/jobs/JobsChecks.py +172 -0
edsl/jobs/JobsComponentConstructor.py +189 -0
edsl/jobs/JobsPrompts.py +270 -0
edsl/jobs/JobsRemoteInferenceHandler.py +311 -0
edsl/jobs/JobsRemoteInferenceLogger.py +239 -0
edsl/jobs/RequestTokenEstimator.py +30 -0
edsl/jobs/async_interview_runner.py +138 -0
edsl/jobs/buckets/BucketCollection.py +104 -0
edsl/jobs/buckets/ModelBuckets.py +65 -0
edsl/jobs/buckets/TokenBucket.py +283 -0
edsl/jobs/buckets/TokenBucketAPI.py +211 -0
edsl/jobs/buckets/TokenBucketClient.py +191 -0
edsl/jobs/check_survey_scenario_compatibility.py +85 -0
edsl/jobs/data_structures.py +120 -0
edsl/jobs/decorators.py +35 -0
edsl/jobs/interviews/Interview.py +392 -0
edsl/jobs/interviews/InterviewExceptionCollection.py +99 -0
edsl/jobs/interviews/InterviewExceptionEntry.py +186 -0
edsl/jobs/interviews/InterviewStatistic.py +63 -0
edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -0
edsl/jobs/interviews/InterviewStatusDictionary.py +78 -0
edsl/jobs/interviews/InterviewStatusLog.py +92 -0
edsl/jobs/interviews/ReportErrors.py +66 -0
edsl/jobs/interviews/interview_status_enum.py +9 -0
edsl/jobs/jobs_status_enums.py +9 -0
edsl/jobs/loggers/HTMLTableJobLogger.py +304 -0
edsl/jobs/results_exceptions_handler.py +98 -0
edsl/jobs/runners/JobsRunnerAsyncio.py +151 -110
edsl/jobs/runners/JobsRunnerStatus.py +298 -0
edsl/jobs/tasks/QuestionTaskCreator.py +244 -0
edsl/jobs/tasks/TaskCreators.py +64 -0
edsl/jobs/tasks/TaskHistory.py +470 -0
edsl/jobs/tasks/TaskStatusLog.py +23 -0
edsl/jobs/tasks/task_status_enum.py +161 -0
edsl/jobs/tokens/InterviewTokenUsage.py +27 -0
edsl/jobs/tokens/TokenUsage.py +34 -0
edsl/language_models/ComputeCost.py +63 -0
edsl/language_models/LanguageModel.py +507 -386
edsl/language_models/ModelList.py +164 -0
edsl/language_models/PriceManager.py +127 -0
edsl/language_models/RawResponseHandler.py +106 -0
edsl/language_models/RegisterLanguageModelsMeta.py +184 -0
edsl/language_models/__init__.py +1 -8
edsl/language_models/fake_openai_call.py +15 -0
edsl/language_models/fake_openai_service.py +61 -0
edsl/language_models/key_management/KeyLookup.py +63 -0
edsl/language_models/key_management/KeyLookupBuilder.py +273 -0
edsl/language_models/key_management/KeyLookupCollection.py +38 -0
edsl/language_models/key_management/__init__.py +0 -0
edsl/language_models/key_management/models.py +131 -0
edsl/language_models/model.py +256 -0
edsl/language_models/repair.py +109 -41
edsl/language_models/utilities.py +65 -0
edsl/notebooks/Notebook.py +263 -0
edsl/notebooks/NotebookToLaTeX.py +142 -0
edsl/notebooks/__init__.py +1 -0
edsl/prompts/Prompt.py +222 -93
edsl/prompts/__init__.py +1 -1
edsl/questions/ExceptionExplainer.py +77 -0
edsl/questions/HTMLQuestion.py +103 -0
edsl/questions/QuestionBase.py +518 -0
edsl/questions/QuestionBasePromptsMixin.py +221 -0
edsl/questions/QuestionBudget.py +164 -67
edsl/questions/QuestionCheckBox.py +281 -62
edsl/questions/QuestionDict.py +343 -0
edsl/questions/QuestionExtract.py +136 -50
edsl/questions/QuestionFreeText.py +79 -55
edsl/questions/QuestionFunctional.py +138 -41
edsl/questions/QuestionList.py +184 -57
edsl/questions/QuestionMatrix.py +265 -0
edsl/questions/QuestionMultipleChoice.py +293 -69
edsl/questions/QuestionNumerical.py +109 -56
edsl/questions/QuestionRank.py +244 -49
edsl/questions/Quick.py +41 -0
edsl/questions/SimpleAskMixin.py +74 -0
edsl/questions/__init__.py +9 -6
edsl/questions/{AnswerValidatorMixin.py → answer_validator_mixin.py} +153 -38
edsl/questions/compose_questions.py +13 -7
edsl/questions/data_structures.py +20 -0
edsl/questions/decorators.py +21 -0
edsl/questions/derived/QuestionLikertFive.py +28 -26
edsl/questions/derived/QuestionLinearScale.py +41 -28
edsl/questions/derived/QuestionTopK.py +34 -26
edsl/questions/derived/QuestionYesNo.py +40 -27
edsl/questions/descriptors.py +228 -74
edsl/questions/loop_processor.py +149 -0
edsl/questions/prompt_templates/question_budget.jinja +13 -0
edsl/questions/prompt_templates/question_checkbox.jinja +32 -0
edsl/questions/prompt_templates/question_extract.jinja +11 -0
edsl/questions/prompt_templates/question_free_text.jinja +3 -0
edsl/questions/prompt_templates/question_linear_scale.jinja +11 -0
edsl/questions/prompt_templates/question_list.jinja +17 -0
edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -0
edsl/questions/prompt_templates/question_numerical.jinja +37 -0
edsl/questions/question_base_gen_mixin.py +168 -0
edsl/questions/question_registry.py +130 -46
edsl/questions/register_questions_meta.py +71 -0
edsl/questions/response_validator_abc.py +188 -0
edsl/questions/response_validator_factory.py +34 -0
edsl/questions/settings.py +5 -2
edsl/questions/templates/__init__.py +0 -0
edsl/questions/templates/budget/__init__.py +0 -0
edsl/questions/templates/budget/answering_instructions.jinja +7 -0
edsl/questions/templates/budget/question_presentation.jinja +7 -0
edsl/questions/templates/checkbox/__init__.py +0 -0
edsl/questions/templates/checkbox/answering_instructions.jinja +10 -0
edsl/questions/templates/checkbox/question_presentation.jinja +22 -0
edsl/questions/templates/dict/__init__.py +0 -0
edsl/questions/templates/dict/answering_instructions.jinja +21 -0
edsl/questions/templates/dict/question_presentation.jinja +1 -0
edsl/questions/templates/extract/__init__.py +0 -0
edsl/questions/templates/extract/answering_instructions.jinja +7 -0
edsl/questions/templates/extract/question_presentation.jinja +1 -0
edsl/questions/templates/free_text/__init__.py +0 -0
edsl/questions/templates/free_text/answering_instructions.jinja +0 -0
edsl/questions/templates/free_text/question_presentation.jinja +1 -0
edsl/questions/templates/likert_five/__init__.py +0 -0
edsl/questions/templates/likert_five/answering_instructions.jinja +10 -0
edsl/questions/templates/likert_five/question_presentation.jinja +12 -0
edsl/questions/templates/linear_scale/__init__.py +0 -0
edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -0
edsl/questions/templates/linear_scale/question_presentation.jinja +5 -0
edsl/questions/templates/list/__init__.py +0 -0
edsl/questions/templates/list/answering_instructions.jinja +4 -0
edsl/questions/templates/list/question_presentation.jinja +5 -0
edsl/questions/templates/matrix/__init__.py +1 -0
edsl/questions/templates/matrix/answering_instructions.jinja +5 -0
edsl/questions/templates/matrix/question_presentation.jinja +20 -0
edsl/questions/templates/multiple_choice/__init__.py +0 -0
edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -0
edsl/questions/templates/multiple_choice/html.jinja +0 -0
edsl/questions/templates/multiple_choice/question_presentation.jinja +12 -0
edsl/questions/templates/numerical/__init__.py +0 -0
edsl/questions/templates/numerical/answering_instructions.jinja +7 -0
edsl/questions/templates/numerical/question_presentation.jinja +7 -0
edsl/questions/templates/rank/__init__.py +0 -0
edsl/questions/templates/rank/answering_instructions.jinja +11 -0
edsl/questions/templates/rank/question_presentation.jinja +15 -0
edsl/questions/templates/top_k/__init__.py +0 -0
edsl/questions/templates/top_k/answering_instructions.jinja +8 -0
edsl/questions/templates/top_k/question_presentation.jinja +22 -0
edsl/questions/templates/yes_no/__init__.py +0 -0
edsl/questions/templates/yes_no/answering_instructions.jinja +6 -0
edsl/questions/templates/yes_no/question_presentation.jinja +12 -0
edsl/results/CSSParameterizer.py +108 -0
edsl/results/Dataset.py +550 -19
edsl/results/DatasetExportMixin.py +594 -0
edsl/results/DatasetTree.py +295 -0
edsl/results/MarkdownToDocx.py +122 -0
edsl/results/MarkdownToPDF.py +111 -0
edsl/results/Result.py +477 -173
edsl/results/Results.py +987 -269
edsl/results/ResultsExportMixin.py +28 -125
edsl/results/ResultsGGMixin.py +83 -15
edsl/results/TableDisplay.py +125 -0
edsl/results/TextEditor.py +50 -0
edsl/results/__init__.py +1 -1
edsl/results/file_exports.py +252 -0
edsl/results/results_fetch_mixin.py +33 -0
edsl/results/results_selector.py +145 -0
edsl/results/results_tools_mixin.py +98 -0
edsl/results/smart_objects.py +96 -0
edsl/results/table_data_class.py +12 -0
edsl/results/table_display.css +78 -0
edsl/results/table_renderers.py +118 -0
edsl/results/tree_explore.py +115 -0
edsl/scenarios/ConstructDownloadLink.py +109 -0
edsl/scenarios/DocumentChunker.py +102 -0
edsl/scenarios/DocxScenario.py +16 -0
edsl/scenarios/FileStore.py +543 -0
edsl/scenarios/PdfExtractor.py +40 -0
edsl/scenarios/Scenario.py +431 -62
edsl/scenarios/ScenarioHtmlMixin.py +65 -0
edsl/scenarios/ScenarioList.py +1415 -45
edsl/scenarios/ScenarioListExportMixin.py +45 -0
edsl/scenarios/ScenarioListPdfMixin.py +239 -0
edsl/scenarios/__init__.py +2 -0
edsl/scenarios/directory_scanner.py +96 -0
edsl/scenarios/file_methods.py +85 -0
edsl/scenarios/handlers/__init__.py +13 -0
edsl/scenarios/handlers/csv.py +49 -0
edsl/scenarios/handlers/docx.py +76 -0
edsl/scenarios/handlers/html.py +37 -0
edsl/scenarios/handlers/json.py +111 -0
edsl/scenarios/handlers/latex.py +5 -0
edsl/scenarios/handlers/md.py +51 -0
edsl/scenarios/handlers/pdf.py +68 -0
edsl/scenarios/handlers/png.py +39 -0
edsl/scenarios/handlers/pptx.py +105 -0
edsl/scenarios/handlers/py.py +294 -0
edsl/scenarios/handlers/sql.py +313 -0
edsl/scenarios/handlers/sqlite.py +149 -0
edsl/scenarios/handlers/txt.py +33 -0
edsl/scenarios/scenario_join.py +131 -0
edsl/scenarios/scenario_selector.py +156 -0
edsl/shared.py +1 -0
edsl/study/ObjectEntry.py +173 -0
edsl/study/ProofOfWork.py +113 -0
edsl/study/SnapShot.py +80 -0
edsl/study/Study.py +521 -0
edsl/study/__init__.py +4 -0
edsl/surveys/ConstructDAG.py +92 -0
edsl/surveys/DAG.py +92 -11
edsl/surveys/EditSurvey.py +221 -0
edsl/surveys/InstructionHandler.py +100 -0
edsl/surveys/Memory.py +9 -4
edsl/surveys/MemoryManagement.py +72 -0
edsl/surveys/MemoryPlan.py +156 -35
edsl/surveys/Rule.py +221 -74
edsl/surveys/RuleCollection.py +241 -61
edsl/surveys/RuleManager.py +172 -0
edsl/surveys/Simulator.py +75 -0
edsl/surveys/Survey.py +1079 -339
edsl/surveys/SurveyCSS.py +273 -0
edsl/surveys/SurveyExportMixin.py +235 -40
edsl/surveys/SurveyFlowVisualization.py +181 -0
edsl/surveys/SurveyQualtricsImport.py +284 -0
edsl/surveys/SurveyToApp.py +141 -0
edsl/surveys/__init__.py +4 -2
edsl/surveys/base.py +19 -3
edsl/surveys/descriptors.py +17 -6
edsl/surveys/instructions/ChangeInstruction.py +48 -0
edsl/surveys/instructions/Instruction.py +56 -0
edsl/surveys/instructions/InstructionCollection.py +82 -0
edsl/surveys/instructions/__init__.py +0 -0
edsl/templates/error_reporting/base.html +24 -0
edsl/templates/error_reporting/exceptions_by_model.html +35 -0
edsl/templates/error_reporting/exceptions_by_question_name.html +17 -0
edsl/templates/error_reporting/exceptions_by_type.html +17 -0
edsl/templates/error_reporting/interview_details.html +116 -0
edsl/templates/error_reporting/interviews.html +19 -0
edsl/templates/error_reporting/overview.html +5 -0
edsl/templates/error_reporting/performance_plot.html +2 -0
edsl/templates/error_reporting/report.css +74 -0
edsl/templates/error_reporting/report.html +118 -0
edsl/templates/error_reporting/report.js +25 -0
edsl/tools/__init__.py +1 -0
edsl/tools/clusters.py +192 -0
edsl/tools/embeddings.py +27 -0
edsl/tools/embeddings_plotting.py +118 -0
edsl/tools/plotting.py +112 -0
edsl/tools/summarize.py +18 -0
edsl/utilities/PrettyList.py +56 -0
edsl/utilities/SystemInfo.py +5 -0
edsl/utilities/__init__.py +21 -20
edsl/utilities/ast_utilities.py +3 -0
edsl/utilities/data/Registry.py +2 -0
edsl/utilities/decorators.py +41 -0
edsl/utilities/gcp_bucket/__init__.py +0 -0
edsl/utilities/gcp_bucket/cloud_storage.py +96 -0
edsl/utilities/interface.py +310 -60
edsl/utilities/is_notebook.py +18 -0
edsl/utilities/is_valid_variable_name.py +11 -0
edsl/utilities/naming_utilities.py +263 -0
edsl/utilities/remove_edsl_version.py +24 -0
edsl/utilities/repair_functions.py +28 -0
edsl/utilities/restricted_python.py +70 -0
edsl/utilities/utilities.py +203 -13
edsl-0.1.40.dist-info/METADATA +111 -0
edsl-0.1.40.dist-info/RECORD +362 -0
{edsl-0.1.14.dist-info → edsl-0.1.40.dist-info}/WHEEL +1 -1
edsl/agents/AgentListExportMixin.py +0 -24
edsl/coop/old.py +0 -31
edsl/data/Database.py +0 -141
edsl/data/crud.py +0 -121
edsl/jobs/Interview.py +0 -417
edsl/jobs/JobsRunner.py +0 -63
edsl/jobs/JobsRunnerStatusMixin.py +0 -115
edsl/jobs/base.py +0 -47
edsl/jobs/buckets.py +0 -166
edsl/jobs/runners/JobsRunnerDryRun.py +0 -19
edsl/jobs/runners/JobsRunnerStreaming.py +0 -54
edsl/jobs/task_management.py +0 -218
edsl/jobs/token_tracking.py +0 -78
edsl/language_models/DeepInfra.py +0 -69
edsl/language_models/OpenAI.py +0 -98
edsl/language_models/model_interfaces/GeminiPro.py +0 -66
edsl/language_models/model_interfaces/LanguageModelOpenAIFour.py +0 -8
edsl/language_models/model_interfaces/LanguageModelOpenAIThreeFiveTurbo.py +0 -8
edsl/language_models/model_interfaces/LlamaTwo13B.py +0 -21
edsl/language_models/model_interfaces/LlamaTwo70B.py +0 -21
edsl/language_models/model_interfaces/Mixtral8x7B.py +0 -24
edsl/language_models/registry.py +0 -81
edsl/language_models/schemas.py +0 -15
edsl/language_models/unused/ReplicateBase.py +0 -83
edsl/prompts/QuestionInstructionsBase.py +0 -6
edsl/prompts/library/agent_instructions.py +0 -29
edsl/prompts/library/agent_persona.py +0 -17
edsl/prompts/library/question_budget.py +0 -26
edsl/prompts/library/question_checkbox.py +0 -32
edsl/prompts/library/question_extract.py +0 -19
edsl/prompts/library/question_freetext.py +0 -14
edsl/prompts/library/question_linear_scale.py +0 -20
edsl/prompts/library/question_list.py +0 -22
edsl/prompts/library/question_multiple_choice.py +0 -44
edsl/prompts/library/question_numerical.py +0 -31
edsl/prompts/library/question_rank.py +0 -21
edsl/prompts/prompt_config.py +0 -33
edsl/prompts/registry.py +0 -185
edsl/questions/Question.py +0 -240
edsl/report/InputOutputDataTypes.py +0 -134
edsl/report/RegressionMixin.py +0 -28
edsl/report/ReportOutputs.py +0 -1228
edsl/report/ResultsFetchMixin.py +0 -106
edsl/report/ResultsOutputMixin.py +0 -14
edsl/report/demo.ipynb +0 -645
edsl/results/ResultsDBMixin.py +0 -184
edsl/surveys/SurveyFlowVisualizationMixin.py +0 -92
edsl/trackers/Tracker.py +0 -91
edsl/trackers/TrackerAPI.py +0 -196
edsl/trackers/TrackerTasks.py +0 -70
edsl/utilities/pastebin.py +0 -141
edsl-0.1.14.dist-info/METADATA +0 -69
edsl-0.1.14.dist-info/RECORD +0 -141
/edsl/{language_models/model_interfaces → inference_services}/__init__.py +0 -0
/edsl/{report/__init__.py → jobs/runners/JobsRunnerStatusData.py} +0 -0
/edsl/{trackers/__init__.py → language_models/ServiceDataSources.py} +0 -0
{edsl-0.1.14.dist-info → edsl-0.1.40.dist-info}/LICENSE +0 -0

edsl/agents/QuestionTemplateReplacementsBuilder.py ADDED Viewed

@@ -0,0 +1,137 @@
+from jinja2 import Environment, meta
+from typing import Any, Set, TYPE_CHECKING
+if TYPE_CHECKING:
+    from edsl.agents.PromptConstructor import PromptConstructor
+    from edsl.scenarios.Scenario import Scenario
+class QuestionTemplateReplacementsBuilder:
+    def __init__(self, prompt_constructor: "PromptConstructor"):
+        self.prompt_constructor = prompt_constructor
+    def question_file_keys(self):
+        question_text = self.prompt_constructor.question.question_text
+        file_keys = self._find_file_keys(self.prompt_constructor.scenario)
+        return self._extract_file_keys_from_question_text(question_text, file_keys)
+    def scenario_file_keys(self):
+        return self._find_file_keys(self.prompt_constructor.scenario)
+    def get_jinja2_variables(template_str: str) -> Set[str]:
+        """
+        Extracts all variable names from a Jinja2 template using Jinja2's built-in parsing.
+        Args:
+        template_str (str): The Jinja2 template string
+        Returns:
+        Set[str]: A set of variable names found in the template
+        """
+        env = Environment()
+        ast = env.parse(template_str)
+        return meta.find_undeclared_variables(ast)
+    @staticmethod
+    def _find_file_keys(scenario: "Scenario") -> list:
+        """We need to find all the keys in the scenario that refer to FileStore objects.
+        These will be used to append to the prompt a list of files that are part of the scenario.
+        >>> from edsl import Scenario
+        >>> from edsl.scenarios.FileStore import FileStore
+        >>> import tempfile
+        >>> with tempfile.NamedTemporaryFile() as f:
+        ...     _ = f.write(b"Hello, world!")
+        ...     _ = f.seek(0)
+        ...     fs = FileStore(f.name)
+        ...     scenario = Scenario({"fs_file": fs, 'a': 1})
+        ...     QuestionTemplateReplacementsBuilder._find_file_keys(scenario)
+        ['fs_file']
+        """
+        from edsl.scenarios.FileStore import FileStore
+        file_entries = []
+        for key, value in scenario.items():
+            if isinstance(value, FileStore):
+                file_entries.append(key)
+        return file_entries
+    @staticmethod
+    def _extract_file_keys_from_question_text(
+        question_text: str, scenario_file_keys: list
+    ) -> list:
+        """
+        Extracts the file keys from a question text.
+        >>> from edsl import Scenario
+        >>> from edsl.scenarios.FileStore import FileStore
+        >>> import tempfile
+        >>> with tempfile.NamedTemporaryFile() as f:
+        ...     _ = f.write(b"Hello, world!")
+        ...     _ = f.seek(0)
+        ...     fs = FileStore(f.name)
+        ...     scenario = Scenario({"fs_file": fs, 'a': 1})
+        ...     QuestionTemplateReplacementsBuilder._extract_file_keys_from_question_text("{{ fs_file }}", ['fs_file'])
+        ['fs_file']
+        """
+        variables = QuestionTemplateReplacementsBuilder.get_jinja2_variables(
+            question_text
+        )
+        question_file_keys = []
+        for var in variables:
+            if var in scenario_file_keys:
+                question_file_keys.append(var)
+        return question_file_keys
+    def _scenario_replacements(self) -> dict[str, Any]:
+        # File references dictionary
+        file_refs = {key: f"<see file {key}>" for key in self.scenario_file_keys()}
+        # Scenario items excluding file keys
+        scenario_items = {
+            k: v
+            for k, v in self.prompt_constructor.scenario.items()
+            if k not in self.scenario_file_keys()
+        }
+        return {**file_refs, **scenario_items}
+    @staticmethod
+    def _question_data_replacements(
+        question: dict, question_data: dict
+    ) -> dict[str, Any]:
+        """Builds a dictionary of replacement values for rendering a prompt by combining multiple data sources.
+        >>> from edsl import QuestionMultipleChoice
+        >>> q = QuestionMultipleChoice(question_text="Do you like school?", question_name = "q0", question_options = ["yes", "no"])
+        >>> QuestionTemplateReplacementsBuilder._question_data_replacements(q, q.data)
+        {'use_code': False, 'include_comment': True, 'question_name': 'q0', 'question_text': 'Do you like school?', 'question_options': ['yes', 'no']}
+        """
+        question_settings = {
+            "use_code": getattr(question, "_use_code", True),
+            "include_comment": getattr(question, "_include_comment", False),
+        }
+        return {**question_settings, **question_data}
+    def build_replacement_dict(self, question_data: dict) -> dict[str, Any]:
+        """Builds a dictionary of replacement values for rendering a prompt by combining multiple data sources."""
+        rpl = {}
+        rpl["scenario"] = self._scenario_replacements()
+        rpl["question"] = self._question_data_replacements(
+            self.prompt_constructor.question, question_data
+        )
+        rpl["prior_answers"] = self.prompt_constructor.prior_answers_dict()
+        rpl["agent"] = {"agent": self.prompt_constructor.agent}
+        # Combine all dictionaries using dict.update() for clarity
+        replacement_dict = {}
+        for r in rpl.values():
+            replacement_dict.update(r)
+        return replacement_dict
+# Script entry point: run the doctests embedded in this module's docstrings.
+if __name__ == "__main__":
+    import doctest
+    doctest.testmod()

edsl/agents/descriptors.py CHANGED Viewed

@@ -1,42 +1,68 @@
+"""This module contains the descriptors used to set the attributes of the Agent class."""
 from typing import Dict
-from edsl.utilities.utilities import is_valid_variable_name
-from edsl.exceptions.agents import AgentNameError
+from edsl.exceptions.agents import AgentNameError, AgentTraitKeyError
+def convert_agent_name(x):
+    # potentially a numpy int64
+    import numpy as np
+    if isinstance(x, np.int64):
+        return int(x)
+    elif x is None:
+        return None
+    elif isinstance(x, int):
+        return x
+    else:
+        return str(x)
 class NameDescriptor:
     """ABC for something."""
     def __get__(self, instance, owner):
-        """"""
+        """Return the value of the attribute."""
         return instance.__dict__[self.name]
     def __set__(self, instance, name: str) -> None:
-        instance.__dict__[self.name] = name
+        """Set the value of the attribute."""
+        instance.__dict__[self.name] = convert_agent_name(name)
     def __set_name__(self, owner, name: str) -> None:
+        """Set the name of the attribute."""
         self.name = "_" + name
 class TraitsDescriptor:
-    """ABC for something."""
+    """Traits descriptor."""
     def __get__(self, instance, owner):
-        """"""
+        """Return the value of the attribute."""
         return instance.__dict__[self.name]
     def __set__(self, instance, traits_dict: Dict[str, str]) -> None:
+        """Set the value of the attribute."""
+        from edsl.utilities.utilities import is_valid_variable_name
         for key, value in traits_dict.items():
-            if not is_valid_variable_name(key):
-                raise AgentNameError("Trait keys must be a valid variable name!")
             if key == "name":
                 raise AgentNameError(
-                    """Trait keys cannot be 'name'!. Instead, use the 'name' attribute directly e.g.,
-                                >>> Agent(name="my_agent", traits={"trait1": "value1", "trait2": "value2"})
-                                """
+                    "Trait keys cannot be 'name'. Instead, use the 'name' attribute directly e.g.,\n"
+                    'Agent(name="my_agent", traits={"trait1": "value1", "trait2": "value2"})'
                 )
+            if not is_valid_variable_name(key):
+                raise AgentTraitKeyError(
+                    f"""Trait keys must be valid Python identifiers (must be alphanumeric, cannot start with a number and must use underscores instead of spaces).
+                    You passed: {key}
+                    """
+                )
         instance.__dict__[self.name] = traits_dict
     def __set_name__(self, owner, name: str) -> None:
+        """Set the name of the attribute."""
         self.name = name
@@ -44,13 +70,15 @@ class CodebookDescriptor:
     """ABC for something."""
     def __get__(self, instance, owner):
-        """"""
+        """Return the value of the attribute."""
         return instance.__dict__[self.name]
     def __set__(self, instance, codebook_dict: Dict[str, str]) -> None:
+        """Set the value of the attribute."""
         instance.__dict__[self.name] = codebook_dict
     def __set_name__(self, owner, name: str) -> None:
+        """Set the name of the attribute."""
         self.name = "_" + name
@@ -58,12 +86,14 @@ class InstructionDescriptor:
     """ABC for something."""
     def __get__(self, instance, owner):
-        """"""
+        """Return the value of the attribute."""
         return instance.__dict__[self.name]
     def __set__(self, instance, instruction) -> None:
+        """Set the value of the attribute."""
         instance.__dict__[self.name] = instruction
         instance.set_instructions = instruction != instance.default_instruction
     def __set_name__(self, owner, name: str) -> None:
+        """Set the name of the attribute."""
         self.name = "_" + name

edsl/agents/prompt_helpers.py ADDED Viewed

@@ -0,0 +1,129 @@
+import enum
+from typing import Dict, Optional
+from collections import UserList
+from edsl.prompts.Prompt import Prompt
+class PromptComponent(enum.Enum):
+    """The four named pieces that a prompt plan arranges into user and system prompts.
+    Each member's value is the string that ``PromptPlan.arrange_components`` expects
+    as a keyword-argument name, and that ``PromptPlan`` accepts in place of the member.
+    """
+    AGENT_INSTRUCTIONS = "agent_instructions"
+    AGENT_PERSONA = "agent_persona"
+    QUESTION_INSTRUCTIONS = "question_instructions"
+    PRIOR_QUESTION_MEMORY = "prior_question_memory"
+class PromptList(UserList):
+    separator = Prompt("")
+    def reduce(self):
+        """Reduce the list of prompts to a single prompt.
+        >>> p = PromptList([Prompt("You are a happy-go lucky agent."), Prompt("You are an agent with the following persona: {'age': 22, 'hair': 'brown', 'height': 5.5}")])
+        >>> p.reduce()
+        Prompt(text=\"""You are a happy-go lucky agent.You are an agent with the following persona: {'age': 22, 'hair': 'brown', 'height': 5.5}\""")
+        """
+        p = self[0]
+        for prompt in self[1:]:
+            if len(prompt) > 0:
+                p = p + self.separator + prompt
+        return p
+class PromptPlan:
+    """A plan for constructing prompts for the LLM call.
+    Every prompt plan has a user prompt order and a system prompt order.
+    It must contain each of the values in the PromptComponent enum.
+    >>> p = PromptPlan(user_prompt_order=(PromptComponent.AGENT_INSTRUCTIONS, PromptComponent.AGENT_PERSONA),system_prompt_order=(PromptComponent.QUESTION_INSTRUCTIONS, PromptComponent.PRIOR_QUESTION_MEMORY))
+    >>> p._is_valid_plan()
+    True
+    >>> p.arrange_components(agent_instructions=1, agent_persona=2, question_instructions=3, prior_question_memory=4)
+    {'user_prompt': ..., 'system_prompt': ...}
+    >>> p = PromptPlan(user_prompt_order=("agent_instructions", ), system_prompt_order=("question_instructions", "prior_question_memory"))
+    Traceback (most recent call last):
+    ...
+    ValueError: Invalid plan: must contain each value of PromptComponent exactly once.
+    """
+    def __init__(
+        self,
+        user_prompt_order: Optional[tuple] = None,
+        system_prompt_order: Optional[tuple] = None,
+    ):
+        """Initialize the PromptPlan."""
+        if user_prompt_order is None:
+            user_prompt_order = (
+                PromptComponent.QUESTION_INSTRUCTIONS,
+                PromptComponent.PRIOR_QUESTION_MEMORY,
+            )
+        if system_prompt_order is None:
+            system_prompt_order = (
+                PromptComponent.AGENT_INSTRUCTIONS,
+                PromptComponent.AGENT_PERSONA,
+            )
+        # very commmon way to screw this up given how python treats single strings as iterables
+        if isinstance(user_prompt_order, str):
+            user_prompt_order = (user_prompt_order,)
+        if isinstance(system_prompt_order, str):
+            system_prompt_order = (system_prompt_order,)
+        if not isinstance(user_prompt_order, tuple):
+            raise TypeError(
+                f"Expected a tuple, but got {type(user_prompt_order).__name__}"
+            )
+        if not isinstance(system_prompt_order, tuple):
+            raise TypeError(
+                f"Expected a tuple, but got {type(system_prompt_order).__name__}"
+            )
+        self.user_prompt_order = self._convert_to_enum(user_prompt_order)
+        self.system_prompt_order = self._convert_to_enum(system_prompt_order)
+        if not self._is_valid_plan():
+            raise ValueError(
+                "Invalid plan: must contain each value of PromptComponent exactly once."
+            )
+    def _convert_to_enum(self, prompt_order: tuple):
+        """Convert string names to PromptComponent enum values."""
+        return tuple(
+            PromptComponent(component) if isinstance(component, str) else component
+            for component in prompt_order
+        )
+    def _is_valid_plan(self):
+        """Check if the plan is valid."""
+        combined = self.user_prompt_order + self.system_prompt_order
+        return set(combined) == set(PromptComponent)
+    def arrange_components(self, **kwargs) -> Dict[PromptComponent, Prompt]:
+        """Arrange the components in the order specified by the plan."""
+        # check is valid components passed
+        component_strings = set([pc.value for pc in PromptComponent])
+        if not set(kwargs.keys()) == component_strings:
+            raise ValueError(
+                f"Invalid components passed: {set(kwargs.keys())} but expected {PromptComponent}"
+            )
+        user_prompt = PromptList(
+            [kwargs[component.value] for component in self.user_prompt_order]
+        )
+        system_prompt = PromptList(
+            [kwargs[component.value] for component in self.system_prompt_order]
+        )
+        return {"user_prompt": user_prompt, "system_prompt": system_prompt}
+    def get_prompts(self, **kwargs) -> Dict[str, Prompt]:
+        """Get both prompts for the LLM call."""
+        prompts = self.arrange_components(**kwargs)
+        return {
+            "user_prompt": prompts["user_prompt"].reduce(),
+            "system_prompt": prompts["system_prompt"].reduce(),
+        }

edsl/agents/question_option_processor.py ADDED Viewed

@@ -0,0 +1,172 @@
+from jinja2 import Environment, meta
+from typing import List, Optional, Union
+class QuestionOptionProcessor:
+    """
+    Class that manages the processing of question options.
+    These can be provided directly, as a template string, or fetched from prior answers or the scenario.
+    """
+    def __init__(self, prompt_constructor):
+        self.prompt_constructor = prompt_constructor
+    @staticmethod
+    def _get_default_options() -> list:
+        """Return default placeholder options."""
+        return [f"<< Option {i} - Placeholder >>" for i in range(1, 4)]
+    @staticmethod
+    def _parse_template_variable(template_str: str) -> str:
+        """
+        Extract the variable name from a template string.
+        Args:
+            template_str (str): Jinja template string
+        Returns:
+            str: Name of the first undefined variable in the template
+        >>> QuestionOptionProcessor._parse_template_variable("Here are some {{ options }}")
+        'options'
+        >>> QuestionOptionProcessor._parse_template_variable("Here are some {{ options }} and {{ other }}")
+        Traceback (most recent call last):
+        ...
+        ValueError: Multiple variables found in template string
+        >>> QuestionOptionProcessor._parse_template_variable("Here are some")
+        Traceback (most recent call last):
+        ...
+        ValueError: No variables found in template string
+        """
+        env = Environment()
+        parsed_content = env.parse(template_str)
+        undeclared_variables = list(meta.find_undeclared_variables(parsed_content))
+        if not undeclared_variables:
+            raise ValueError("No variables found in template string")
+        if len(undeclared_variables) > 1:
+            raise ValueError("Multiple variables found in template string")
+        return undeclared_variables[0]
+    @staticmethod
+    def _get_options_from_scenario(
+        scenario: dict, option_key: str
+    ) -> Union[list, None]:
+        """
+        Try to get options from scenario data.
+        >>> from edsl import Scenario
+        >>> scenario = Scenario({"options": ["Option 1", "Option 2"]})
+        >>> QuestionOptionProcessor._get_options_from_scenario(scenario, "options")
+        ['Option 1', 'Option 2']
+        Returns:
+            list | None: List of options if found in scenario, None otherwise
+        """
+        scenario_options = scenario.get(option_key)
+        return scenario_options if isinstance(scenario_options, list) else None
+    @staticmethod
+    def _get_options_from_prior_answers(
+        prior_answers: dict, option_key: str
+    ) -> Union[list, None]:
+        """
+        Try to get options from prior answers.
+        prior_answers (dict): Dictionary of prior answers
+        option_key (str): Key to look up in prior answers
+        >>> from edsl import QuestionList as Q
+        >>> q = Q.example()
+        >>> q.answer = ["Option 1", "Option 2"]
+        >>> prior_answers = {"options": q}
+        >>> QuestionOptionProcessor._get_options_from_prior_answers(prior_answers, "options")
+        ['Option 1', 'Option 2']
+        >>> QuestionOptionProcessor._get_options_from_prior_answers(prior_answers, "wrong_key") is None
+        True
+        Returns:
+            list | None: List of options if found in prior answers, None otherwise
+        """
+        prior_answer = prior_answers.get(option_key)
+        if prior_answer and hasattr(prior_answer, "answer"):
+            if isinstance(prior_answer.answer, list):
+                return prior_answer.answer
+        return None
+    def get_question_options(self, question_data: dict) -> list:
+        """
+        Extract and process question options from question data.
+        Args:
+            question_data (dict): Dictionary containing question configuration
+        Returns:
+            list: List of question options. Returns default placeholders if no valid options found.
+        >>> class MockPromptConstructor:
+        ...     pass
+        >>> mpc = MockPromptConstructor()
+        >>> from edsl import Scenario
+        >>> mpc.scenario = Scenario({"options": ["Option 1", "Option 2"]})
+        >>> processor = QuestionOptionProcessor(mpc)
+        The basic case where options are directly provided:
+        >>> question_data = {"question_options": ["Option 1", "Option 2"]}
+        >>> processor.get_question_options(question_data)
+        ['Option 1', 'Option 2']
+        The case where options are provided as a template string:
+        >>> question_data = {"question_options": "{{ options }}"}
+        >>> processor.get_question_options(question_data)
+        ['Option 1', 'Option 2']
+        The case where there is a templace string but it's in the prior answers:
+        >>> class MockQuestion:
+        ...     pass
+        >>> q0 = MockQuestion()
+        >>> q0.answer = ["Option 1", "Option 2"]
+        >>> mpc.prior_answers_dict = lambda: {'q0': q0}
+        >>> processor = QuestionOptionProcessor(mpc)
+        >>> question_data = {"question_options": "{{ q0 }}"}
+        >>> processor.get_question_options(question_data)
+        ['Option 1', 'Option 2']
+        The case we're no options are found:
+        >>> processor.get_question_options({"question_options": "{{ poop }}"})
+        ['<< Option 1 - Placeholder >>', '<< Option 2 - Placeholder >>', '<< Option 3 - Placeholder >>']
+        """
+        options_entry = question_data.get("question_options")
+        # If not a template string, return as is or default
+        if not isinstance(options_entry, str):
+            return options_entry if options_entry else self._get_default_options()
+        # Parse template to get variable name
+        option_key = self._parse_template_variable(options_entry)
+        # Try getting options from scenario
+        scenario_options = self._get_options_from_scenario(
+            self.prompt_constructor.scenario, option_key
+        )
+        if scenario_options:
+            return scenario_options
+        # Try getting options from prior answers
+        prior_answer_options = self._get_options_from_prior_answers(
+            self.prompt_constructor.prior_answers_dict(), option_key
+        )
+        if prior_answer_options:
+            return prior_answer_options
+        return self._get_default_options()
+if __name__ == "__main__":
+    import doctest
+    doctest.testmod()

edsl/auto/AutoStudy.py ADDED Viewed

@@ -0,0 +1,130 @@
+from typing import Optional, TYPE_CHECKING
+from edsl import Model
+from edsl.auto.StageQuestions import StageQuestions
+from edsl.auto.StagePersona import StagePersona
+from edsl.auto.StagePersonaDimensions import StagePersonaDimensions
+from edsl.auto.StagePersonaDimensionValues import StagePersonaDimensionValues
+from edsl.auto.StagePersonaDimensionValueRanges import (
+    StagePersonaDimensionValueRanges,
+)
+from edsl.auto.StageLabelQuestions import StageLabelQuestions
+from edsl.auto.StageGenerateSurvey import StageGenerateSurvey
+from edsl.auto.utilities import agent_generator, create_agents, gen_pipeline
+if TYPE_CHECKING:
+    from edsl.surveys.Survey import Survey
+    from edsl.agents.AgentList import AgentList
+class AutoStudy:
+    def __init__(
+        self,
+        overall_question: str,
+        population: str,
+        model: Optional["Model"] = None,
+        survey: Optional["Survey"] = None,
+        agent_list: Optional["AgentList"] = None,
+        default_num_agents: int = 11,
+    ):
+        """AutoStudy class for generating surveys and agents."""
+        self.overall_question = overall_question
+        self.population = population
+        self._survey = survey
+        self._agent_list = agent_list
+        self._agent_list_generator = None
+        self._persona_mapping = None
+        self._results = None
+        self.default_num_agents = default_num_agents
+        self.model = model or Model()
+    def to_dict(self):
+        return {
+            "overall_question": self.overall_question,
+            "population": self.population,
+            "survey": self.survey.to_dict(),
+            "persona_mapping": self.persona_mapping.to_dict(),
+            "results": self.results.to_dict(),
+        }
+    @property
+    def survey(self):
+        if self._survey is None:
+            self._survey = self._create_survey()
+        return self._survey
+    @property
+    def persona_mapping(self):
+        if self._persona_mapping is None:
+            self._persona_mapping = self._create_persona_mapping()
+        return self._persona_mapping
+    @property
+    def agent_list_generator(self):
+        if self._agent_list_generator is None:
+            self._agent_list_generator = self._create_agent_list_generator()
+        return self._agent_list_generator
+    @property
+    def results(self):
+        if self._results is None:
+            self._results = self._create_results()
+        return self._results
+    def _create_survey(self):
+        survey_pipline_stages = [
+            StageQuestions,
+            StageLabelQuestions,
+            StageGenerateSurvey,
+        ]
+        survey_pipeline = gen_pipeline(survey_pipline_stages)
+        return survey_pipeline.process(
+            data=survey_pipeline.input(
+                overall_question=self.overall_question, population=self.population
+            )
+        ).survey
+    def _create_persona_mapping(self):
+        persona_pipeline_stages = [
+            StageQuestions,
+            StagePersona,
+            StagePersonaDimensions,
+            StagePersonaDimensionValues,
+            StagePersonaDimensionValueRanges,
+        ]
+        persona_pipeline = gen_pipeline(persona_pipeline_stages)
+        sample_agent_results = persona_pipeline.process(
+            persona_pipeline.input(
+                overall_question=overall_question, population=self.population
+            )
+        )
+        return sample_agent_results
+    def _create_agent_list_generator(self):
+        return agent_generator(
+            persona=self.persona_mapping.persona,
+            dimension_dict=self.persona_mapping.mapping,
+        )
+    def agent_list(self, num_agents):
+        return create_agents(
+            agent_generator=self.agent_list_generator,
+            survey=self.survey,
+            num_agents=num_agents,
+        )
+    def _create_results(self, num_agents=None):
+        if num_agents is None:
+            num_agents = self.default_num_agents
+        agent_list = self.agent_list(num_agents)
+        return self.survey.by(agent_list).by(self.model).run()
+if __name__ == "__main__":
+    # Demo run: build a study for a sample question and population.
+    overall_question = "I have an open source Python library for working with LLMs. What are some ways we can market this to others?"
+    auto_study = AutoStudy(overall_question, population="US Adults")
+    # Reading the `results` property creates the results on first access.
+    results = auto_study.results

edsl 0.1.14__py3-none-any.whl → 0.1.40__py3-none-any.whl

edsl 0.1.14py3-none-any.whl → 0.1.40py3-none-any.whl