PyPI - edsl - Versions diffs - 0.1.15__py3-none-any.whl → 0.1.40__py3-none-any.whl - Mend

edsl 0.1.15 py3-none-any.whl → 0.1.40 py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (407)

edsl/Base.py +348 -38
edsl/BaseDiff.py +260 -0
edsl/TemplateLoader.py +24 -0
edsl/__init__.py +45 -10
edsl/__version__.py +1 -1
edsl/agents/Agent.py +842 -144
edsl/agents/AgentList.py +521 -25
edsl/agents/Invigilator.py +250 -374
edsl/agents/InvigilatorBase.py +257 -0
edsl/agents/PromptConstructor.py +272 -0
edsl/agents/QuestionInstructionPromptBuilder.py +128 -0
edsl/agents/QuestionTemplateReplacementsBuilder.py +137 -0
edsl/agents/descriptors.py +43 -13
edsl/agents/prompt_helpers.py +129 -0
edsl/agents/question_option_processor.py +172 -0
edsl/auto/AutoStudy.py +130 -0
edsl/auto/StageBase.py +243 -0
edsl/auto/StageGenerateSurvey.py +178 -0
edsl/auto/StageLabelQuestions.py +125 -0
edsl/auto/StagePersona.py +61 -0
edsl/auto/StagePersonaDimensionValueRanges.py +88 -0
edsl/auto/StagePersonaDimensionValues.py +74 -0
edsl/auto/StagePersonaDimensions.py +69 -0
edsl/auto/StageQuestions.py +74 -0
edsl/auto/SurveyCreatorPipeline.py +21 -0
edsl/auto/utilities.py +218 -0
edsl/base/Base.py +279 -0
edsl/config.py +115 -113
edsl/conversation/Conversation.py +290 -0
edsl/conversation/car_buying.py +59 -0
edsl/conversation/chips.py +95 -0
edsl/conversation/mug_negotiation.py +81 -0
edsl/conversation/next_speaker_utilities.py +93 -0
edsl/coop/CoopFunctionsMixin.py +15 -0
edsl/coop/ExpectedParrotKeyHandler.py +125 -0
edsl/coop/PriceFetcher.py +54 -0
edsl/coop/__init__.py +1 -0
edsl/coop/coop.py +1029 -134
edsl/coop/utils.py +131 -0
edsl/data/Cache.py +560 -89
edsl/data/CacheEntry.py +230 -0
edsl/data/CacheHandler.py +168 -0
edsl/data/RemoteCacheSync.py +186 -0
edsl/data/SQLiteDict.py +292 -0
edsl/data/__init__.py +5 -3
edsl/data/orm.py +6 -33
edsl/data_transfer_models.py +74 -27
edsl/enums.py +165 -8
edsl/exceptions/BaseException.py +21 -0
edsl/exceptions/__init__.py +52 -46
edsl/exceptions/agents.py +33 -15
edsl/exceptions/cache.py +5 -0
edsl/exceptions/coop.py +8 -0
edsl/exceptions/general.py +34 -0
edsl/exceptions/inference_services.py +5 -0
edsl/exceptions/jobs.py +15 -0
edsl/exceptions/language_models.py +46 -1
edsl/exceptions/questions.py +80 -5
edsl/exceptions/results.py +16 -5
edsl/exceptions/scenarios.py +29 -0
edsl/exceptions/surveys.py +13 -10
edsl/inference_services/AnthropicService.py +106 -0
edsl/inference_services/AvailableModelCacheHandler.py +184 -0
edsl/inference_services/AvailableModelFetcher.py +215 -0
edsl/inference_services/AwsBedrock.py +118 -0
edsl/inference_services/AzureAI.py +215 -0
edsl/inference_services/DeepInfraService.py +18 -0
edsl/inference_services/GoogleService.py +143 -0
edsl/inference_services/GroqService.py +20 -0
edsl/inference_services/InferenceServiceABC.py +80 -0
edsl/inference_services/InferenceServicesCollection.py +138 -0
edsl/inference_services/MistralAIService.py +120 -0
edsl/inference_services/OllamaService.py +18 -0
edsl/inference_services/OpenAIService.py +236 -0
edsl/inference_services/PerplexityService.py +160 -0
edsl/inference_services/ServiceAvailability.py +135 -0
edsl/inference_services/TestService.py +90 -0
edsl/inference_services/TogetherAIService.py +172 -0
edsl/inference_services/data_structures.py +134 -0
edsl/inference_services/models_available_cache.py +118 -0
edsl/inference_services/rate_limits_cache.py +25 -0
edsl/inference_services/registry.py +41 -0
edsl/inference_services/write_available.py +10 -0
edsl/jobs/AnswerQuestionFunctionConstructor.py +223 -0
edsl/jobs/Answers.py +21 -20
edsl/jobs/FetchInvigilator.py +47 -0
edsl/jobs/InterviewTaskManager.py +98 -0
edsl/jobs/InterviewsConstructor.py +50 -0
edsl/jobs/Jobs.py +684 -206
edsl/jobs/JobsChecks.py +172 -0
edsl/jobs/JobsComponentConstructor.py +189 -0
edsl/jobs/JobsPrompts.py +270 -0
edsl/jobs/JobsRemoteInferenceHandler.py +311 -0
edsl/jobs/JobsRemoteInferenceLogger.py +239 -0
edsl/jobs/RequestTokenEstimator.py +30 -0
edsl/jobs/async_interview_runner.py +138 -0
edsl/jobs/buckets/BucketCollection.py +104 -0
edsl/jobs/buckets/ModelBuckets.py +65 -0
edsl/jobs/buckets/TokenBucket.py +283 -0
edsl/jobs/buckets/TokenBucketAPI.py +211 -0
edsl/jobs/buckets/TokenBucketClient.py +191 -0
edsl/jobs/check_survey_scenario_compatibility.py +85 -0
edsl/jobs/data_structures.py +120 -0
edsl/jobs/decorators.py +35 -0
edsl/jobs/interviews/Interview.py +392 -0
edsl/jobs/interviews/InterviewExceptionCollection.py +99 -0
edsl/jobs/interviews/InterviewExceptionEntry.py +186 -0
edsl/jobs/interviews/InterviewStatistic.py +63 -0
edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -0
edsl/jobs/interviews/InterviewStatusDictionary.py +78 -0
edsl/jobs/interviews/InterviewStatusLog.py +92 -0
edsl/jobs/interviews/ReportErrors.py +66 -0
edsl/jobs/interviews/interview_status_enum.py +9 -0
edsl/jobs/jobs_status_enums.py +9 -0
edsl/jobs/loggers/HTMLTableJobLogger.py +304 -0
edsl/jobs/results_exceptions_handler.py +98 -0
edsl/jobs/runners/JobsRunnerAsyncio.py +151 -110
edsl/jobs/runners/JobsRunnerStatus.py +298 -0
edsl/jobs/tasks/QuestionTaskCreator.py +244 -0
edsl/jobs/tasks/TaskCreators.py +64 -0
edsl/jobs/tasks/TaskHistory.py +470 -0
edsl/jobs/tasks/TaskStatusLog.py +23 -0
edsl/jobs/tasks/task_status_enum.py +161 -0
edsl/jobs/tokens/InterviewTokenUsage.py +27 -0
edsl/jobs/tokens/TokenUsage.py +34 -0
edsl/language_models/ComputeCost.py +63 -0
edsl/language_models/LanguageModel.py +507 -386
edsl/language_models/ModelList.py +164 -0
edsl/language_models/PriceManager.py +127 -0
edsl/language_models/RawResponseHandler.py +106 -0
edsl/language_models/RegisterLanguageModelsMeta.py +184 -0
edsl/language_models/__init__.py +1 -8
edsl/language_models/fake_openai_call.py +15 -0
edsl/language_models/fake_openai_service.py +61 -0
edsl/language_models/key_management/KeyLookup.py +63 -0
edsl/language_models/key_management/KeyLookupBuilder.py +273 -0
edsl/language_models/key_management/KeyLookupCollection.py +38 -0
edsl/language_models/key_management/__init__.py +0 -0
edsl/language_models/key_management/models.py +131 -0
edsl/language_models/model.py +256 -0
edsl/language_models/repair.py +109 -41
edsl/language_models/utilities.py +65 -0
edsl/notebooks/Notebook.py +263 -0
edsl/notebooks/NotebookToLaTeX.py +142 -0
edsl/notebooks/__init__.py +1 -0
edsl/prompts/Prompt.py +222 -93
edsl/prompts/__init__.py +1 -1
edsl/questions/ExceptionExplainer.py +77 -0
edsl/questions/HTMLQuestion.py +103 -0
edsl/questions/QuestionBase.py +518 -0
edsl/questions/QuestionBasePromptsMixin.py +221 -0
edsl/questions/QuestionBudget.py +164 -67
edsl/questions/QuestionCheckBox.py +281 -62
edsl/questions/QuestionDict.py +343 -0
edsl/questions/QuestionExtract.py +136 -50
edsl/questions/QuestionFreeText.py +79 -55
edsl/questions/QuestionFunctional.py +138 -41
edsl/questions/QuestionList.py +184 -57
edsl/questions/QuestionMatrix.py +265 -0
edsl/questions/QuestionMultipleChoice.py +293 -69
edsl/questions/QuestionNumerical.py +109 -56
edsl/questions/QuestionRank.py +244 -49
edsl/questions/Quick.py +41 -0
edsl/questions/SimpleAskMixin.py +74 -0
edsl/questions/__init__.py +9 -6
edsl/questions/{AnswerValidatorMixin.py → answer_validator_mixin.py} +153 -38
edsl/questions/compose_questions.py +13 -7
edsl/questions/data_structures.py +20 -0
edsl/questions/decorators.py +21 -0
edsl/questions/derived/QuestionLikertFive.py +28 -26
edsl/questions/derived/QuestionLinearScale.py +41 -28
edsl/questions/derived/QuestionTopK.py +34 -26
edsl/questions/derived/QuestionYesNo.py +40 -27
edsl/questions/descriptors.py +228 -74
edsl/questions/loop_processor.py +149 -0
edsl/questions/prompt_templates/question_budget.jinja +13 -0
edsl/questions/prompt_templates/question_checkbox.jinja +32 -0
edsl/questions/prompt_templates/question_extract.jinja +11 -0
edsl/questions/prompt_templates/question_free_text.jinja +3 -0
edsl/questions/prompt_templates/question_linear_scale.jinja +11 -0
edsl/questions/prompt_templates/question_list.jinja +17 -0
edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -0
edsl/questions/prompt_templates/question_numerical.jinja +37 -0
edsl/questions/question_base_gen_mixin.py +168 -0
edsl/questions/question_registry.py +130 -46
edsl/questions/register_questions_meta.py +71 -0
edsl/questions/response_validator_abc.py +188 -0
edsl/questions/response_validator_factory.py +34 -0
edsl/questions/settings.py +5 -2
edsl/questions/templates/__init__.py +0 -0
edsl/questions/templates/budget/__init__.py +0 -0
edsl/questions/templates/budget/answering_instructions.jinja +7 -0
edsl/questions/templates/budget/question_presentation.jinja +7 -0
edsl/questions/templates/checkbox/__init__.py +0 -0
edsl/questions/templates/checkbox/answering_instructions.jinja +10 -0
edsl/questions/templates/checkbox/question_presentation.jinja +22 -0
edsl/questions/templates/dict/__init__.py +0 -0
edsl/questions/templates/dict/answering_instructions.jinja +21 -0
edsl/questions/templates/dict/question_presentation.jinja +1 -0
edsl/questions/templates/extract/__init__.py +0 -0
edsl/questions/templates/extract/answering_instructions.jinja +7 -0
edsl/questions/templates/extract/question_presentation.jinja +1 -0
edsl/questions/templates/free_text/__init__.py +0 -0
edsl/questions/templates/free_text/answering_instructions.jinja +0 -0
edsl/questions/templates/free_text/question_presentation.jinja +1 -0
edsl/questions/templates/likert_five/__init__.py +0 -0
edsl/questions/templates/likert_five/answering_instructions.jinja +10 -0
edsl/questions/templates/likert_five/question_presentation.jinja +12 -0
edsl/questions/templates/linear_scale/__init__.py +0 -0
edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -0
edsl/questions/templates/linear_scale/question_presentation.jinja +5 -0
edsl/questions/templates/list/__init__.py +0 -0
edsl/questions/templates/list/answering_instructions.jinja +4 -0
edsl/questions/templates/list/question_presentation.jinja +5 -0
edsl/questions/templates/matrix/__init__.py +1 -0
edsl/questions/templates/matrix/answering_instructions.jinja +5 -0
edsl/questions/templates/matrix/question_presentation.jinja +20 -0
edsl/questions/templates/multiple_choice/__init__.py +0 -0
edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -0
edsl/questions/templates/multiple_choice/html.jinja +0 -0
edsl/questions/templates/multiple_choice/question_presentation.jinja +12 -0
edsl/questions/templates/numerical/__init__.py +0 -0
edsl/questions/templates/numerical/answering_instructions.jinja +7 -0
edsl/questions/templates/numerical/question_presentation.jinja +7 -0
edsl/questions/templates/rank/__init__.py +0 -0
edsl/questions/templates/rank/answering_instructions.jinja +11 -0
edsl/questions/templates/rank/question_presentation.jinja +15 -0
edsl/questions/templates/top_k/__init__.py +0 -0
edsl/questions/templates/top_k/answering_instructions.jinja +8 -0
edsl/questions/templates/top_k/question_presentation.jinja +22 -0
edsl/questions/templates/yes_no/__init__.py +0 -0
edsl/questions/templates/yes_no/answering_instructions.jinja +6 -0
edsl/questions/templates/yes_no/question_presentation.jinja +12 -0
edsl/results/CSSParameterizer.py +108 -0
edsl/results/Dataset.py +550 -19
edsl/results/DatasetExportMixin.py +594 -0
edsl/results/DatasetTree.py +295 -0
edsl/results/MarkdownToDocx.py +122 -0
edsl/results/MarkdownToPDF.py +111 -0
edsl/results/Result.py +477 -173
edsl/results/Results.py +987 -269
edsl/results/ResultsExportMixin.py +28 -125
edsl/results/ResultsGGMixin.py +83 -15
edsl/results/TableDisplay.py +125 -0
edsl/results/TextEditor.py +50 -0
edsl/results/__init__.py +1 -1
edsl/results/file_exports.py +252 -0
edsl/results/results_fetch_mixin.py +33 -0
edsl/results/results_selector.py +145 -0
edsl/results/results_tools_mixin.py +98 -0
edsl/results/smart_objects.py +96 -0
edsl/results/table_data_class.py +12 -0
edsl/results/table_display.css +78 -0
edsl/results/table_renderers.py +118 -0
edsl/results/tree_explore.py +115 -0
edsl/scenarios/ConstructDownloadLink.py +109 -0
edsl/scenarios/DocumentChunker.py +102 -0
edsl/scenarios/DocxScenario.py +16 -0
edsl/scenarios/FileStore.py +543 -0
edsl/scenarios/PdfExtractor.py +40 -0
edsl/scenarios/Scenario.py +431 -62
edsl/scenarios/ScenarioHtmlMixin.py +65 -0
edsl/scenarios/ScenarioList.py +1415 -45
edsl/scenarios/ScenarioListExportMixin.py +45 -0
edsl/scenarios/ScenarioListPdfMixin.py +239 -0
edsl/scenarios/__init__.py +2 -0
edsl/scenarios/directory_scanner.py +96 -0
edsl/scenarios/file_methods.py +85 -0
edsl/scenarios/handlers/__init__.py +13 -0
edsl/scenarios/handlers/csv.py +49 -0
edsl/scenarios/handlers/docx.py +76 -0
edsl/scenarios/handlers/html.py +37 -0
edsl/scenarios/handlers/json.py +111 -0
edsl/scenarios/handlers/latex.py +5 -0
edsl/scenarios/handlers/md.py +51 -0
edsl/scenarios/handlers/pdf.py +68 -0
edsl/scenarios/handlers/png.py +39 -0
edsl/scenarios/handlers/pptx.py +105 -0
edsl/scenarios/handlers/py.py +294 -0
edsl/scenarios/handlers/sql.py +313 -0
edsl/scenarios/handlers/sqlite.py +149 -0
edsl/scenarios/handlers/txt.py +33 -0
edsl/scenarios/scenario_join.py +131 -0
edsl/scenarios/scenario_selector.py +156 -0
edsl/shared.py +1 -0
edsl/study/ObjectEntry.py +173 -0
edsl/study/ProofOfWork.py +113 -0
edsl/study/SnapShot.py +80 -0
edsl/study/Study.py +521 -0
edsl/study/__init__.py +4 -0
edsl/surveys/ConstructDAG.py +92 -0
edsl/surveys/DAG.py +92 -11
edsl/surveys/EditSurvey.py +221 -0
edsl/surveys/InstructionHandler.py +100 -0
edsl/surveys/Memory.py +9 -4
edsl/surveys/MemoryManagement.py +72 -0
edsl/surveys/MemoryPlan.py +156 -35
edsl/surveys/Rule.py +221 -74
edsl/surveys/RuleCollection.py +241 -61
edsl/surveys/RuleManager.py +172 -0
edsl/surveys/Simulator.py +75 -0
edsl/surveys/Survey.py +1079 -339
edsl/surveys/SurveyCSS.py +273 -0
edsl/surveys/SurveyExportMixin.py +235 -40
edsl/surveys/SurveyFlowVisualization.py +181 -0
edsl/surveys/SurveyQualtricsImport.py +284 -0
edsl/surveys/SurveyToApp.py +141 -0
edsl/surveys/__init__.py +4 -2
edsl/surveys/base.py +19 -3
edsl/surveys/descriptors.py +17 -6
edsl/surveys/instructions/ChangeInstruction.py +48 -0
edsl/surveys/instructions/Instruction.py +56 -0
edsl/surveys/instructions/InstructionCollection.py +82 -0
edsl/surveys/instructions/__init__.py +0 -0
edsl/templates/error_reporting/base.html +24 -0
edsl/templates/error_reporting/exceptions_by_model.html +35 -0
edsl/templates/error_reporting/exceptions_by_question_name.html +17 -0
edsl/templates/error_reporting/exceptions_by_type.html +17 -0
edsl/templates/error_reporting/interview_details.html +116 -0
edsl/templates/error_reporting/interviews.html +19 -0
edsl/templates/error_reporting/overview.html +5 -0
edsl/templates/error_reporting/performance_plot.html +2 -0
edsl/templates/error_reporting/report.css +74 -0
edsl/templates/error_reporting/report.html +118 -0
edsl/templates/error_reporting/report.js +25 -0
edsl/tools/__init__.py +1 -0
edsl/tools/clusters.py +192 -0
edsl/tools/embeddings.py +27 -0
edsl/tools/embeddings_plotting.py +118 -0
edsl/tools/plotting.py +112 -0
edsl/tools/summarize.py +18 -0
edsl/utilities/PrettyList.py +56 -0
edsl/utilities/SystemInfo.py +5 -0
edsl/utilities/__init__.py +21 -20
edsl/utilities/ast_utilities.py +3 -0
edsl/utilities/data/Registry.py +2 -0
edsl/utilities/decorators.py +41 -0
edsl/utilities/gcp_bucket/__init__.py +0 -0
edsl/utilities/gcp_bucket/cloud_storage.py +96 -0
edsl/utilities/interface.py +310 -60
edsl/utilities/is_notebook.py +18 -0
edsl/utilities/is_valid_variable_name.py +11 -0
edsl/utilities/naming_utilities.py +263 -0
edsl/utilities/remove_edsl_version.py +24 -0
edsl/utilities/repair_functions.py +28 -0
edsl/utilities/restricted_python.py +70 -0
edsl/utilities/utilities.py +203 -13
edsl-0.1.40.dist-info/METADATA +111 -0
edsl-0.1.40.dist-info/RECORD +362 -0
{edsl-0.1.15.dist-info → edsl-0.1.40.dist-info}/WHEEL +1 -1
edsl/agents/AgentListExportMixin.py +0 -24
edsl/coop/old.py +0 -31
edsl/data/Database.py +0 -141
edsl/data/crud.py +0 -121
edsl/jobs/Interview.py +0 -435
edsl/jobs/JobsRunner.py +0 -63
edsl/jobs/JobsRunnerStatusMixin.py +0 -115
edsl/jobs/base.py +0 -47
edsl/jobs/buckets.py +0 -178
edsl/jobs/runners/JobsRunnerDryRun.py +0 -19
edsl/jobs/runners/JobsRunnerStreaming.py +0 -54
edsl/jobs/task_management.py +0 -215
edsl/jobs/token_tracking.py +0 -78
edsl/language_models/DeepInfra.py +0 -69
edsl/language_models/OpenAI.py +0 -98
edsl/language_models/model_interfaces/GeminiPro.py +0 -66
edsl/language_models/model_interfaces/LanguageModelOpenAIFour.py +0 -8
edsl/language_models/model_interfaces/LanguageModelOpenAIThreeFiveTurbo.py +0 -8
edsl/language_models/model_interfaces/LlamaTwo13B.py +0 -21
edsl/language_models/model_interfaces/LlamaTwo70B.py +0 -21
edsl/language_models/model_interfaces/Mixtral8x7B.py +0 -24
edsl/language_models/registry.py +0 -81
edsl/language_models/schemas.py +0 -15
edsl/language_models/unused/ReplicateBase.py +0 -83
edsl/prompts/QuestionInstructionsBase.py +0 -6
edsl/prompts/library/agent_instructions.py +0 -29
edsl/prompts/library/agent_persona.py +0 -17
edsl/prompts/library/question_budget.py +0 -26
edsl/prompts/library/question_checkbox.py +0 -32
edsl/prompts/library/question_extract.py +0 -19
edsl/prompts/library/question_freetext.py +0 -14
edsl/prompts/library/question_linear_scale.py +0 -20
edsl/prompts/library/question_list.py +0 -22
edsl/prompts/library/question_multiple_choice.py +0 -44
edsl/prompts/library/question_numerical.py +0 -31
edsl/prompts/library/question_rank.py +0 -21
edsl/prompts/prompt_config.py +0 -33
edsl/prompts/registry.py +0 -185
edsl/questions/Question.py +0 -240
edsl/report/InputOutputDataTypes.py +0 -134
edsl/report/RegressionMixin.py +0 -28
edsl/report/ReportOutputs.py +0 -1228
edsl/report/ResultsFetchMixin.py +0 -106
edsl/report/ResultsOutputMixin.py +0 -14
edsl/report/demo.ipynb +0 -645
edsl/results/ResultsDBMixin.py +0 -184
edsl/surveys/SurveyFlowVisualizationMixin.py +0 -92
edsl/trackers/Tracker.py +0 -91
edsl/trackers/TrackerAPI.py +0 -196
edsl/trackers/TrackerTasks.py +0 -70
edsl/utilities/pastebin.py +0 -141
edsl-0.1.15.dist-info/METADATA +0 -69
edsl-0.1.15.dist-info/RECORD +0 -142
/edsl/{language_models/model_interfaces → inference_services}/__init__.py +0 -0
/edsl/{report/__init__.py → jobs/runners/JobsRunnerStatusData.py} +0 -0
/edsl/{trackers/__init__.py → language_models/ServiceDataSources.py} +0 -0
{edsl-0.1.15.dist-info → edsl-0.1.40.dist-info}/LICENSE +0 -0

edsl/data/crud.py DELETED Viewed

@@ -1,121 +0,0 @@
-from sqlalchemy import desc
-from typing import Union
-from edsl.data import Database, database, LLMOutputDataDB
-from edsl.data.orm import ResultDB
-class CRUDOperations:
-    """
-    A class that implementes CRUD operations for the EDSL package.
-    Initalization:
-    - `database`: A Database object.
-    Methods:
-    - `get_LLMOutputData(model, parameters, system_prompt, prompt)`: Retrieves a cached LLM output from the database.
-    - `write_LLMOutputData(model, parameters, system_prompt, prompt, output)`: Writes an LLM output to the database.
-    """
-    def __init__(self, database: Database) -> None:
-        self.database = database
-    def get_LLMOutputData(
-        self, model: str, parameters: str, system_prompt: str, prompt: str
-    ) -> Union[str, None]:
-        """
-        Retrieves a cached LLM output from the database. Arguments: in string format, the model, parameters, system_prompt, and prompt used to generate the output. Returns the output (json string) if it exists, otherwise None.
-        """
-        with self.database.get_db() as db:
-            record = (
-                db.query(LLMOutputDataDB)
-                .filter_by(
-                    prompt=prompt,
-                    system_prompt=system_prompt,
-                    model=model,
-                    parameters=parameters,
-                )
-                .order_by(desc(LLMOutputDataDB.id))
-                .first()
-            )
-        return record.output if record else None
-    def write_LLMOutputData(
-        self, model: str, parameters: str, system_prompt: str, prompt: str, output: str
-    ) -> None:
-        """
-        Writes an LLM output to the database. Arguments: in string format, the model, parameters, system_prompt, prompt, and the generated output.
-        """
-        record = LLMOutputDataDB(
-            model=model,
-            parameters=parameters,
-            system_prompt=system_prompt,
-            prompt=prompt,
-            output=output,
-        )
-        with self.database.get_db() as db:
-            db.add(record)
-            db.commit()
-    def clear_LLMOutputData(self) -> None:
-        """
-        Clears all LLM output data from the database.
-        """
-        with self.database.get_db() as db:
-            db.query(LLMOutputDataDB).delete()
-            db.commit()
-    def get_all_LLMOutputData(self) -> list:
-        """
-        Retrieves all LLM output data from the database and returns them as a list of dictionaries.
-        """
-        with self.database.get_db() as db:
-            records = db.query(LLMOutputDataDB).all()
-            return [
-                {
-                    "id": record.id,
-                    "model": record.model,
-                    "parameters": record.parameters,
-                    "system_prompt": record.system_prompt,
-                    "prompt": record.prompt,
-                    "output": record.output,
-                }
-                for record in records
-            ]
-    def write_result(
-        self,
-        job_uuid: str,
-        result_uuid: str,
-        agent: str,
-        scenario: str,
-        model: str,
-        answer: str,
-    ) -> None:
-        """Writes a Result record to the database."""
-        record = ResultDB(
-            job_uuid=job_uuid,
-            result_uuid=result_uuid,
-            agent=agent,
-            scenario=scenario,
-            model=model,
-            answer=answer,
-        )
-        with self.database.get_db() as db:
-            db.add(record)
-            db.commit()
-    def read_results(self, job_uuid: str) -> list[ResultDB]:
-        """Reads all Result records associated with job_uuid from the database."""
-        with self.database.get_db() as db:
-            records = (
-                db.query(ResultDB)
-                .filter_by(job_uuid=job_uuid)
-                .order_by(desc(ResultDB.id))
-                .all()
-            )
-        return records
-CRUD = CRUDOperations(database)

edsl/jobs/Interview.py DELETED Viewed

@@ -1,435 +0,0 @@
-from __future__ import annotations
-import traceback
-import asyncio
-import logging
-import textwrap
-from collections import UserList
-from typing import Any, Type, List, Generator, Callable, List, Tuple
-from collections import defaultdict
-# from tenacity import retry, wait_exponential, stop_after_attempt, retry_if_exception_type, AsyncRetrying, before_sleep
-from tenacity import (
-    retry,
-    wait_exponential,
-    stop_after_attempt,
-    retry_if_exception_type,
-    before_sleep,
-)
-from edsl import CONFIG
-from edsl.agents import Agent
-from edsl.exceptions import InterviewErrorPriorTaskCanceled, InterviewTimeoutError
-from edsl.language_models import LanguageModel
-from edsl.questions import Question
-from edsl.scenarios import Scenario
-from edsl.surveys import Survey
-from edsl.utilities.decorators import sync_wrapper
-from edsl.data_transfer_models import AgentResponseDict
-from edsl.jobs.Answers import Answers
-from edsl.surveys.base import EndOfSurvey
-from edsl.jobs.buckets import ModelBuckets
-from edsl.jobs.token_tracking import TokenUsage, InterviewTokenUsage
-from edsl.jobs.task_management import (
-    InterviewStatusDictionary,
-    QuestionTaskCreator,
-    TasksList,
-)
-# create logger
-logger = logging.getLogger(__name__)
-logger.setLevel(logging.INFO)
-logger.propagate = False
-# create  file handler
-fh = logging.FileHandler(CONFIG.get("EDSL_LOGGING_PATH"))
-fh.setLevel(logging.INFO)
-# add formatter to the handlers
-formatter = logging.Formatter(
-    "%(asctime)s - %(name)s - %(levelname)s - %(module)s:%(lineno)d - %(funcName)s - %(message)s"
-)
-fh.setFormatter(formatter)
-# add handler to logger
-logger.addHandler(fh)
-# start loggin'
-logger.info("Interview.py loaded")
-TIMEOUT = float(CONFIG.get("EDSL_API_TIMEOUT"))
-EDSL_BACKOFF_START_SEC = float(CONFIG.get("EDSL_BACKOFF_START_SEC"))
-EDSL_MAX_BACKOFF_SEC = float(CONFIG.get("EDSL_MAX_BACKOFF_SEC"))
-EDSL_MAX_ATTEMPTS = int(CONFIG.get("EDSL_MAX_ATTEMPTS"))
-def print_retry(retry_state):
-    "Prints details on tenacity retries"
-    attempt_number = retry_state.attempt_number
-    exception = retry_state.outcome.exception()
-    wait_time = retry_state.next_action.sleep
-    print(
-        f"Attempt {attempt_number} failed with exception: {exception}; "
-        f"now waiting {wait_time:.2f} seconds before retrying."
-    )
-retry_strategy = retry(
-    wait=wait_exponential(
-        multiplier=EDSL_BACKOFF_START_SEC, max=EDSL_MAX_BACKOFF_SEC
-    ),  # Exponential back-off starting at 1s, doubling, maxing out at 60s
-    stop=stop_after_attempt(EDSL_MAX_ATTEMPTS),  # Stop after 5 attempts
-    # retry=retry_if_exception_type(Exception),  # Customize this as per your specific retry-able exception
-    before_sleep=print_retry,  # Use custom print function for retries
-)
-retry_strategy = retry(
-    wait=wait_exponential(
-        multiplier=1, max=60
-    ),  # Exponential back-off starting at 1s, doubling, maxing out at 60s
-    stop=stop_after_attempt(5),  # Stop after 5 attempts
-    # retry=retry_if_exception_type(Exception),  # Customize this as per your specific retry-able exception
-    before_sleep=print_retry,  # Use custom print function for retries
-)
-class Interview:
-    """
-    An 'interview' is one agent answering one survey, with one language model, for a given scenario.
-    """
-    def __init__(
-        self,
-        agent: Agent,
-        survey: Survey,
-        scenario: Scenario,
-        model: Type[LanguageModel],
-        verbose: bool = False,
-        debug: bool = False,
-    ):
-        self.agent = agent
-        self.survey = survey
-        self.scenario = scenario
-        self.model = model
-        self.debug = debug
-        self.verbose = verbose
-        self.answers: dict[str, str] = Answers()  # will get filled in
-        # The DAG, or directed acyclic graph, is a dictionary that maps question names to their dependencies.
-        # It is used to determine the order in which questions should be answered.
-        # This reflects both agent 'memory' considerations and 'skip' logic.
-        self.dag = self.survey.dag(textify=True)
-        self.to_index = {
-            name: index for index, name in enumerate(self.survey.question_names)
-        }
-        logger.info(f"Interview instantiated")
-        # task creators is a dictionary that maps question names to their task creators.
-        # this is used to track the status of each task for real-time reporting on status of a job
-        # being executed.
-        # 1 task = 1 question.
-        self.task_creators = {}
-    @property
-    def token_usage(self) -> InterviewTokenUsage:
-        "Determins how many tokens were used for the interview."
-        cached_tokens = TokenUsage(from_cache=True)
-        new_tokens = TokenUsage(from_cache=False)
-        for task_creator in self.task_creators.values():
-            token_usage = task_creator.token_usage()
-            cached_tokens += token_usage["cached_tokens"]
-            new_tokens += token_usage["new_tokens"]
-        return InterviewTokenUsage(
-            new_token_usage=new_tokens, cached_token_usage=cached_tokens
-        )
-    @property
-    def interview_status(self) -> InterviewStatusDictionary:
-        """Returns a dictionary mapping task status codes to counts"""
-        status_dict = InterviewStatusDictionary()
-        for task_creator in self.task_creators.values():
-            status_dict[task_creator.task_status] += 1
-            status_dict["number_from_cache"] += task_creator.from_cache
-        return status_dict
-    async def async_conduct_interview(
-        self,
-        model_buckets: ModelBuckets = None,
-        debug: bool = False,
-        replace_missing: bool = True,
-    ) -> tuple["Answers", List[dict[str, Any]]]:
-        """
-        Conducts an interview asynchronously.
-        params
-        - `model_buckets`: a dictionary of token buckets for the model
-        - `debug`: prints debug messages
-        - `replace_missing`: if True, replaces missing answers with None
-        """
-        # if no model bucket is passed, create an 'infinity' bucket with no rate limits
-        model_buckets = model_buckets or ModelBuckets.infinity_bucket()
-        # we create both tasks and invigilators lists.
-        # this is because it's easier to extract info
-        # we need from the invigilators list when a task fails.
-        # it's challenging to get info from failed asyncio tasks.
-        self.tasks, self.invigilators = self._build_question_tasks(
-            debug=debug, model_buckets=model_buckets
-        )
-        await asyncio.gather(*self.tasks, return_exceptions=not debug)
-        if replace_missing:
-            self.answers.replace_missing_answers_with_none(self.survey)
-        valid_results = list(self._extract_valid_results())
-        return self.answers, valid_results
-    def _extract_valid_results(
-        self, print_traceback=False
-    ) -> Generator["Answers", None, None]:
-        """Extracts the valid results from the list of results."""
-        # we only need to print the warning once if a task failed.
-        warning_printed = False
-        warning_header = textwrap.dedent(
-            """\
-            WARNING: At least one question in the survey was not answered.
-            """
-        )
-        # there should be one one invigilator for each task
-        assert len(self.tasks) == len(self.invigilators)
-        for task, invigilator in zip(self.tasks, self.invigilators):
-            logger.info(f"Iterating through task: {task}")
-            if task.done():
-                try:
-                    # it worked!
-                    result = task.result()
-                except asyncio.CancelledError:
-                    # task was cancelled
-                    logger.info(f"Task `{task.edsl_name}` was cancelled.")
-                    result = invigilator.get_failed_task_result()
-                except Exception as exception:
-                    # any other kind of exception in the task
-                    if not warning_printed:
-                        warning_printed = True
-                        print(warning_header)
-                    error_message = f"Task `{task.edsl_name}` failed with `{exception.__class__.__name__}`:`{exception}`."
-                    logger.error(error_message)
-                    print(error_message)
-                    if print_traceback:
-                        traceback.print_exc()
-                    result = invigilator.get_failed_task_result()
-                else:
-                    # No exception means the task completed successfully
-                    pass
-                yield result
-    def _build_question_tasks(
-        self, debug: bool, model_buckets: ModelBuckets
-    ) -> Tuple[List[asyncio.Task], List["Invigilators"]]:
-        """Creates a task for each question, with dependencies on the questions that must be answered before this one can be answered."""
-        logger.info("Creating tasks for each question")
-        tasks = []
-        invigilators = []
-        for question in self.survey.questions:
-            # finds dependency tasks for that question
-            tasks_that_must_be_completed_before = (
-                self._get_tasks_that_must_be_completed_before(tasks, question)
-            )
-            # creates the task for that question
-            question_task = self._create_question_task(
-                question=question,
-                tasks_that_must_be_completed_before=tasks_that_must_be_completed_before,
-                model_buckets=model_buckets,
-                debug=debug,
-            )
-            # adds the task to the list of tasks
-            tasks.append(question_task)
-            invigilators.append(self.get_invigilator(question, debug))
-        return TasksList(tasks), invigilators
-    def _get_tasks_that_must_be_completed_before(
-        self, tasks, question
-    ) -> List[asyncio.Task]:
-        """Returns the tasks that must be completed before the given question can be answered.
-        If a question has no dependencies, this will be an empty list, [].
-        """
-        parents_of_focal_question: List[str] = self.dag.get(question.question_name, [])
-        return [
-            tasks[self.to_index[parent_question_name]]
-            for parent_question_name in parents_of_focal_question
-        ]
-    def _create_question_task(
-        self,
-        question: Question,
-        tasks_that_must_be_completed_before: List[asyncio.Task],
-        model_buckets: ModelBuckets,
-        debug,
-    ):
-        """Creates a task that depends on the passed-in dependencies that are awaited before the task is run."""
-        task_creator = QuestionTaskCreator(
-            question=question,
-            answer_question_func=self._answer_question_and_record_task,
-            token_estimator=self._get_estimated_request_tokens,
-            model_buckets=model_buckets,
-        )
-        [task_creator.add_dependency(x) for x in tasks_that_must_be_completed_before]
-        self.task_creators[question.question_name] = task_creator
-        return task_creator.generate_task(debug)
-    def async_timeout_handler(timeout):
-        def decorator(func):
-            async def wrapper(*args, **kwargs):
-                try:
-                    return await asyncio.wait_for(func(*args, **kwargs), timeout)
-                except asyncio.TimeoutError:
-                    raise InterviewTimeoutError(
-                        f"Task timed out after {timeout} seconds."
-                    )
-            return wrapper
-        return decorator
-    def get_invigilator(self, question, debug) -> "Invigilator":
-        invigilator = self.agent.create_invigilator(
-            question=question,
-            scenario=self.scenario,
-            model=self.model,
-            debug=debug,
-            memory_plan=self.survey.memory_plan,
-            current_answers=self.answers,
-        )
-        return invigilator
-    def _get_estimated_request_tokens(self, question) -> float:
-        """Estimates the number of tokens that will be required to run the focal task."""
-        invigilator = self.get_invigilator(question, debug=False)
-        # TODO: There should be a way to get a more accurate estimate.
-        combined_text = ""
-        for prompt in invigilator.get_prompts().values():
-            if hasattr(prompt, "text"):
-                combined_text += prompt.text
-            elif isinstance(prompt, str):
-                combined_text += prompt
-            else:
-                raise ValueError(f"Prompt is of type {type(prompt)}")
-        return len(combined_text) / 4.0
-    @async_timeout_handler(TIMEOUT)
-    async def _answer_question_and_record_task(
-        self,
-        question: Question,
-        debug: bool,
-    ) -> AgentResponseDict:
-        """Answers a question and records the task.
-        This in turn calls the the passed-in agent's async_answer_question method, which returns a response dictionary.
-        """
-        invigilator = self.get_invigilator(question, debug=debug)
-        @retry_strategy
-        async def attempt_to_answer_question():
-            return await invigilator.async_answer_question()
-        response: AgentResponseDict = await attempt_to_answer_question()
-        # TODO: Move this back into actual agent response dict and enforce it.
-        response["question_name"] = question.question_name
-        self.answers.add_answer(response, question)
-        self._cancel_skipped_questions(question)
-        # TODO: This should be forced to be a data-exchange model to cement attributes.
-        return response
-    def _cancel_skipped_questions(self, current_question) -> None:
-        """Cancels the tasks for questions that are skipped."""
-        logger.info(f"Current question is {current_question.question_name}")
-        current_question_index = self.to_index[current_question.question_name]
-        next_question = self.survey.rule_collection.next_question(
-            q_now=current_question_index, answers=self.answers
-        )
-        next_question_index = next_question.next_q
-        def cancel_between(start, end):
-            for i in range(start, end):
-                logger.info(
-                    f"Cancelling task for question {i}; {self.tasks[i].edsl_name}"
-                )
-                self.tasks[i].cancel()
-                skipped_question_name = self.survey.question_names[i]
-                logger.info(f"{skipped_question_name} skipped.")
-        if next_question_index == EndOfSurvey:
-            cancel_between(current_question_index + 1, len(self.survey.questions))
-            return
-        if next_question_index > (current_question_index + 1):
-            cancel_between(current_question_index + 1, next_question_index)
-        self.tasks.status()
-    #######################
-    # Dunder methods
-    #######################
-    def __repr__(self) -> str:
-        """Returns a string representation of the Interview instance."""
-        return f"Interview(agent = {self.agent}, survey = {self.survey}, scenario = {self.scenario}, model = {self.model})"
-if __name__ == "__main__":
-    from edsl.language_models import LanguageModelOpenAIThreeFiveTurbo
-    from edsl.agents import Agent
-    from edsl.surveys import Survey
-    from edsl.scenarios import Scenario
-    from edsl.questions import QuestionMultipleChoice
-    # from edsl.jobs.Interview import Interview
-    #  a survey with skip logic
-    q0 = QuestionMultipleChoice(
-        question_text="Do you like school?",
-        question_options=["yes", "no"],
-        question_name="q0",
-    )
-    q1 = QuestionMultipleChoice(
-        question_text="Why not?",
-        question_options=["killer bees in cafeteria", "other"],
-        question_name="q1",
-    )
-    q2 = QuestionMultipleChoice(
-        question_text="Why?",
-        question_options=["**lack*** of killer bees in cafeteria", "other"],
-        question_name="q2",
-    )
-    s = Survey(questions=[q0, q1, q2])
-    s = s.add_rule(q0, "q0 == 'yes'", q2)
-    # create an interview
-    a = Agent(traits=None)
-    def direct_question_answering_method(self, question, scenario):
-        raise Exception("Fuck you!")
-        # return "yes"
-    a.add_direct_question_answering_method(direct_question_answering_method)
-    scenario = Scenario()
-    m = LanguageModelOpenAIThreeFiveTurbo(use_cache=False)
-    I = Interview(agent=a, survey=s, scenario=scenario, model=m)
-    result = asyncio.run(I.async_conduct_interview())
-    # # conduct five interviews
-    # for _ in range(5):
-    #     I.conduct_interview(debug=True)
-    # # replace missing answers
-    # I
-    # repr(I)
-    # eval(repr(I))

edsl/jobs/JobsRunner.py DELETED Viewed

@@ -1,63 +0,0 @@
-from __future__ import annotations
-from collections import UserDict
-from abc import ABC, ABCMeta, abstractmethod
-from edsl.jobs import Jobs
-from edsl.results import Results
-class RegisterJobsRunnerMeta(ABCMeta):
-    "Metaclass to register output elements in a registry i.e., those that have a parent"
-    _registry = {}  # Initialize the registry as a dictionary
-    def __init__(cls, name, bases, dct):
-        super(RegisterJobsRunnerMeta, cls).__init__(name, bases, dct)
-        if name != "JobsRunner":
-            RegisterJobsRunnerMeta._registry[name] = cls
-    @classmethod
-    def get_registered_classes(cls):
-        return cls._registry
-    @classmethod
-    def lookup(cls):
-        d = {}
-        for classname, cls in cls._registry.items():
-            if hasattr(cls, "runner_name"):
-                d[cls.runner_name] = cls
-            else:
-                raise Exception(
-                    f"Class {classname} does not have a runner_name attribute"
-                )
-        return d
-class JobsRunner(ABC, metaclass=RegisterJobsRunnerMeta):
-    """ABC for JobRunners, which take in a job, conduct interviews, and return their results."""
-    def __init__(self, jobs: Jobs):
-        self.jobs = jobs
-        # create the interviews here so children can use them
-        self.interviews = jobs.interviews()
-        self.bucket_collection = jobs.bucket_collection
-        # self.bucket_collection = self.jobs.bucket_collection
-        # for model in self.jobs.models:
-        #    self.bucket_collection.add_model(model)
-    @abstractmethod
-    def run(
-        self,
-        n: int = 1,
-        debug: bool = False,
-        verbose: bool = False,
-        progress_bar: bool = True,
-    ) -> Results:  # pragma: no cover
-        """
-        Runs the job: conducts Interviews and returns their results.
-        - `n`: how many times to run each interview
-        - `debug`: prints debug messages
-        - `verbose`: prints messages
-        - `progress_bar`: shows a progress bar
-        """
-        raise NotImplementedError

edsl 0.1.15__py3-none-any.whl → 0.1.40__py3-none-any.whl

edsl 0.1.15py3-none-any.whl → 0.1.40py3-none-any.whl