edsl 0.1.14__py3-none-any.whl → 0.1.40__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- edsl/Base.py +348 -38
- edsl/BaseDiff.py +260 -0
- edsl/TemplateLoader.py +24 -0
- edsl/__init__.py +46 -10
- edsl/__version__.py +1 -0
- edsl/agents/Agent.py +842 -144
- edsl/agents/AgentList.py +521 -25
- edsl/agents/Invigilator.py +250 -374
- edsl/agents/InvigilatorBase.py +257 -0
- edsl/agents/PromptConstructor.py +272 -0
- edsl/agents/QuestionInstructionPromptBuilder.py +128 -0
- edsl/agents/QuestionTemplateReplacementsBuilder.py +137 -0
- edsl/agents/descriptors.py +43 -13
- edsl/agents/prompt_helpers.py +129 -0
- edsl/agents/question_option_processor.py +172 -0
- edsl/auto/AutoStudy.py +130 -0
- edsl/auto/StageBase.py +243 -0
- edsl/auto/StageGenerateSurvey.py +178 -0
- edsl/auto/StageLabelQuestions.py +125 -0
- edsl/auto/StagePersona.py +61 -0
- edsl/auto/StagePersonaDimensionValueRanges.py +88 -0
- edsl/auto/StagePersonaDimensionValues.py +74 -0
- edsl/auto/StagePersonaDimensions.py +69 -0
- edsl/auto/StageQuestions.py +74 -0
- edsl/auto/SurveyCreatorPipeline.py +21 -0
- edsl/auto/utilities.py +218 -0
- edsl/base/Base.py +279 -0
- edsl/config.py +121 -104
- edsl/conversation/Conversation.py +290 -0
- edsl/conversation/car_buying.py +59 -0
- edsl/conversation/chips.py +95 -0
- edsl/conversation/mug_negotiation.py +81 -0
- edsl/conversation/next_speaker_utilities.py +93 -0
- edsl/coop/CoopFunctionsMixin.py +15 -0
- edsl/coop/ExpectedParrotKeyHandler.py +125 -0
- edsl/coop/PriceFetcher.py +54 -0
- edsl/coop/__init__.py +1 -0
- edsl/coop/coop.py +1029 -134
- edsl/coop/utils.py +131 -0
- edsl/data/Cache.py +560 -89
- edsl/data/CacheEntry.py +230 -0
- edsl/data/CacheHandler.py +168 -0
- edsl/data/RemoteCacheSync.py +186 -0
- edsl/data/SQLiteDict.py +292 -0
- edsl/data/__init__.py +5 -3
- edsl/data/orm.py +6 -33
- edsl/data_transfer_models.py +74 -27
- edsl/enums.py +165 -8
- edsl/exceptions/BaseException.py +21 -0
- edsl/exceptions/__init__.py +52 -46
- edsl/exceptions/agents.py +33 -15
- edsl/exceptions/cache.py +5 -0
- edsl/exceptions/coop.py +8 -0
- edsl/exceptions/general.py +34 -0
- edsl/exceptions/inference_services.py +5 -0
- edsl/exceptions/jobs.py +15 -0
- edsl/exceptions/language_models.py +46 -1
- edsl/exceptions/questions.py +80 -5
- edsl/exceptions/results.py +16 -5
- edsl/exceptions/scenarios.py +29 -0
- edsl/exceptions/surveys.py +13 -10
- edsl/inference_services/AnthropicService.py +106 -0
- edsl/inference_services/AvailableModelCacheHandler.py +184 -0
- edsl/inference_services/AvailableModelFetcher.py +215 -0
- edsl/inference_services/AwsBedrock.py +118 -0
- edsl/inference_services/AzureAI.py +215 -0
- edsl/inference_services/DeepInfraService.py +18 -0
- edsl/inference_services/GoogleService.py +143 -0
- edsl/inference_services/GroqService.py +20 -0
- edsl/inference_services/InferenceServiceABC.py +80 -0
- edsl/inference_services/InferenceServicesCollection.py +138 -0
- edsl/inference_services/MistralAIService.py +120 -0
- edsl/inference_services/OllamaService.py +18 -0
- edsl/inference_services/OpenAIService.py +236 -0
- edsl/inference_services/PerplexityService.py +160 -0
- edsl/inference_services/ServiceAvailability.py +135 -0
- edsl/inference_services/TestService.py +90 -0
- edsl/inference_services/TogetherAIService.py +172 -0
- edsl/inference_services/data_structures.py +134 -0
- edsl/inference_services/models_available_cache.py +118 -0
- edsl/inference_services/rate_limits_cache.py +25 -0
- edsl/inference_services/registry.py +41 -0
- edsl/inference_services/write_available.py +10 -0
- edsl/jobs/AnswerQuestionFunctionConstructor.py +223 -0
- edsl/jobs/Answers.py +21 -20
- edsl/jobs/FetchInvigilator.py +47 -0
- edsl/jobs/InterviewTaskManager.py +98 -0
- edsl/jobs/InterviewsConstructor.py +50 -0
- edsl/jobs/Jobs.py +684 -204
- edsl/jobs/JobsChecks.py +172 -0
- edsl/jobs/JobsComponentConstructor.py +189 -0
- edsl/jobs/JobsPrompts.py +270 -0
- edsl/jobs/JobsRemoteInferenceHandler.py +311 -0
- edsl/jobs/JobsRemoteInferenceLogger.py +239 -0
- edsl/jobs/RequestTokenEstimator.py +30 -0
- edsl/jobs/async_interview_runner.py +138 -0
- edsl/jobs/buckets/BucketCollection.py +104 -0
- edsl/jobs/buckets/ModelBuckets.py +65 -0
- edsl/jobs/buckets/TokenBucket.py +283 -0
- edsl/jobs/buckets/TokenBucketAPI.py +211 -0
- edsl/jobs/buckets/TokenBucketClient.py +191 -0
- edsl/jobs/check_survey_scenario_compatibility.py +85 -0
- edsl/jobs/data_structures.py +120 -0
- edsl/jobs/decorators.py +35 -0
- edsl/jobs/interviews/Interview.py +392 -0
- edsl/jobs/interviews/InterviewExceptionCollection.py +99 -0
- edsl/jobs/interviews/InterviewExceptionEntry.py +186 -0
- edsl/jobs/interviews/InterviewStatistic.py +63 -0
- edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -0
- edsl/jobs/interviews/InterviewStatusDictionary.py +78 -0
- edsl/jobs/interviews/InterviewStatusLog.py +92 -0
- edsl/jobs/interviews/ReportErrors.py +66 -0
- edsl/jobs/interviews/interview_status_enum.py +9 -0
- edsl/jobs/jobs_status_enums.py +9 -0
- edsl/jobs/loggers/HTMLTableJobLogger.py +304 -0
- edsl/jobs/results_exceptions_handler.py +98 -0
- edsl/jobs/runners/JobsRunnerAsyncio.py +151 -110
- edsl/jobs/runners/JobsRunnerStatus.py +298 -0
- edsl/jobs/tasks/QuestionTaskCreator.py +244 -0
- edsl/jobs/tasks/TaskCreators.py +64 -0
- edsl/jobs/tasks/TaskHistory.py +470 -0
- edsl/jobs/tasks/TaskStatusLog.py +23 -0
- edsl/jobs/tasks/task_status_enum.py +161 -0
- edsl/jobs/tokens/InterviewTokenUsage.py +27 -0
- edsl/jobs/tokens/TokenUsage.py +34 -0
- edsl/language_models/ComputeCost.py +63 -0
- edsl/language_models/LanguageModel.py +507 -386
- edsl/language_models/ModelList.py +164 -0
- edsl/language_models/PriceManager.py +127 -0
- edsl/language_models/RawResponseHandler.py +106 -0
- edsl/language_models/RegisterLanguageModelsMeta.py +184 -0
- edsl/language_models/__init__.py +1 -8
- edsl/language_models/fake_openai_call.py +15 -0
- edsl/language_models/fake_openai_service.py +61 -0
- edsl/language_models/key_management/KeyLookup.py +63 -0
- edsl/language_models/key_management/KeyLookupBuilder.py +273 -0
- edsl/language_models/key_management/KeyLookupCollection.py +38 -0
- edsl/language_models/key_management/__init__.py +0 -0
- edsl/language_models/key_management/models.py +131 -0
- edsl/language_models/model.py +256 -0
- edsl/language_models/repair.py +109 -41
- edsl/language_models/utilities.py +65 -0
- edsl/notebooks/Notebook.py +263 -0
- edsl/notebooks/NotebookToLaTeX.py +142 -0
- edsl/notebooks/__init__.py +1 -0
- edsl/prompts/Prompt.py +222 -93
- edsl/prompts/__init__.py +1 -1
- edsl/questions/ExceptionExplainer.py +77 -0
- edsl/questions/HTMLQuestion.py +103 -0
- edsl/questions/QuestionBase.py +518 -0
- edsl/questions/QuestionBasePromptsMixin.py +221 -0
- edsl/questions/QuestionBudget.py +164 -67
- edsl/questions/QuestionCheckBox.py +281 -62
- edsl/questions/QuestionDict.py +343 -0
- edsl/questions/QuestionExtract.py +136 -50
- edsl/questions/QuestionFreeText.py +79 -55
- edsl/questions/QuestionFunctional.py +138 -41
- edsl/questions/QuestionList.py +184 -57
- edsl/questions/QuestionMatrix.py +265 -0
- edsl/questions/QuestionMultipleChoice.py +293 -69
- edsl/questions/QuestionNumerical.py +109 -56
- edsl/questions/QuestionRank.py +244 -49
- edsl/questions/Quick.py +41 -0
- edsl/questions/SimpleAskMixin.py +74 -0
- edsl/questions/__init__.py +9 -6
- edsl/questions/{AnswerValidatorMixin.py → answer_validator_mixin.py} +153 -38
- edsl/questions/compose_questions.py +13 -7
- edsl/questions/data_structures.py +20 -0
- edsl/questions/decorators.py +21 -0
- edsl/questions/derived/QuestionLikertFive.py +28 -26
- edsl/questions/derived/QuestionLinearScale.py +41 -28
- edsl/questions/derived/QuestionTopK.py +34 -26
- edsl/questions/derived/QuestionYesNo.py +40 -27
- edsl/questions/descriptors.py +228 -74
- edsl/questions/loop_processor.py +149 -0
- edsl/questions/prompt_templates/question_budget.jinja +13 -0
- edsl/questions/prompt_templates/question_checkbox.jinja +32 -0
- edsl/questions/prompt_templates/question_extract.jinja +11 -0
- edsl/questions/prompt_templates/question_free_text.jinja +3 -0
- edsl/questions/prompt_templates/question_linear_scale.jinja +11 -0
- edsl/questions/prompt_templates/question_list.jinja +17 -0
- edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -0
- edsl/questions/prompt_templates/question_numerical.jinja +37 -0
- edsl/questions/question_base_gen_mixin.py +168 -0
- edsl/questions/question_registry.py +130 -46
- edsl/questions/register_questions_meta.py +71 -0
- edsl/questions/response_validator_abc.py +188 -0
- edsl/questions/response_validator_factory.py +34 -0
- edsl/questions/settings.py +5 -2
- edsl/questions/templates/__init__.py +0 -0
- edsl/questions/templates/budget/__init__.py +0 -0
- edsl/questions/templates/budget/answering_instructions.jinja +7 -0
- edsl/questions/templates/budget/question_presentation.jinja +7 -0
- edsl/questions/templates/checkbox/__init__.py +0 -0
- edsl/questions/templates/checkbox/answering_instructions.jinja +10 -0
- edsl/questions/templates/checkbox/question_presentation.jinja +22 -0
- edsl/questions/templates/dict/__init__.py +0 -0
- edsl/questions/templates/dict/answering_instructions.jinja +21 -0
- edsl/questions/templates/dict/question_presentation.jinja +1 -0
- edsl/questions/templates/extract/__init__.py +0 -0
- edsl/questions/templates/extract/answering_instructions.jinja +7 -0
- edsl/questions/templates/extract/question_presentation.jinja +1 -0
- edsl/questions/templates/free_text/__init__.py +0 -0
- edsl/questions/templates/free_text/answering_instructions.jinja +0 -0
- edsl/questions/templates/free_text/question_presentation.jinja +1 -0
- edsl/questions/templates/likert_five/__init__.py +0 -0
- edsl/questions/templates/likert_five/answering_instructions.jinja +10 -0
- edsl/questions/templates/likert_five/question_presentation.jinja +12 -0
- edsl/questions/templates/linear_scale/__init__.py +0 -0
- edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -0
- edsl/questions/templates/linear_scale/question_presentation.jinja +5 -0
- edsl/questions/templates/list/__init__.py +0 -0
- edsl/questions/templates/list/answering_instructions.jinja +4 -0
- edsl/questions/templates/list/question_presentation.jinja +5 -0
- edsl/questions/templates/matrix/__init__.py +1 -0
- edsl/questions/templates/matrix/answering_instructions.jinja +5 -0
- edsl/questions/templates/matrix/question_presentation.jinja +20 -0
- edsl/questions/templates/multiple_choice/__init__.py +0 -0
- edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -0
- edsl/questions/templates/multiple_choice/html.jinja +0 -0
- edsl/questions/templates/multiple_choice/question_presentation.jinja +12 -0
- edsl/questions/templates/numerical/__init__.py +0 -0
- edsl/questions/templates/numerical/answering_instructions.jinja +7 -0
- edsl/questions/templates/numerical/question_presentation.jinja +7 -0
- edsl/questions/templates/rank/__init__.py +0 -0
- edsl/questions/templates/rank/answering_instructions.jinja +11 -0
- edsl/questions/templates/rank/question_presentation.jinja +15 -0
- edsl/questions/templates/top_k/__init__.py +0 -0
- edsl/questions/templates/top_k/answering_instructions.jinja +8 -0
- edsl/questions/templates/top_k/question_presentation.jinja +22 -0
- edsl/questions/templates/yes_no/__init__.py +0 -0
- edsl/questions/templates/yes_no/answering_instructions.jinja +6 -0
- edsl/questions/templates/yes_no/question_presentation.jinja +12 -0
- edsl/results/CSSParameterizer.py +108 -0
- edsl/results/Dataset.py +550 -19
- edsl/results/DatasetExportMixin.py +594 -0
- edsl/results/DatasetTree.py +295 -0
- edsl/results/MarkdownToDocx.py +122 -0
- edsl/results/MarkdownToPDF.py +111 -0
- edsl/results/Result.py +477 -173
- edsl/results/Results.py +987 -269
- edsl/results/ResultsExportMixin.py +28 -125
- edsl/results/ResultsGGMixin.py +83 -15
- edsl/results/TableDisplay.py +125 -0
- edsl/results/TextEditor.py +50 -0
- edsl/results/__init__.py +1 -1
- edsl/results/file_exports.py +252 -0
- edsl/results/results_fetch_mixin.py +33 -0
- edsl/results/results_selector.py +145 -0
- edsl/results/results_tools_mixin.py +98 -0
- edsl/results/smart_objects.py +96 -0
- edsl/results/table_data_class.py +12 -0
- edsl/results/table_display.css +78 -0
- edsl/results/table_renderers.py +118 -0
- edsl/results/tree_explore.py +115 -0
- edsl/scenarios/ConstructDownloadLink.py +109 -0
- edsl/scenarios/DocumentChunker.py +102 -0
- edsl/scenarios/DocxScenario.py +16 -0
- edsl/scenarios/FileStore.py +543 -0
- edsl/scenarios/PdfExtractor.py +40 -0
- edsl/scenarios/Scenario.py +431 -62
- edsl/scenarios/ScenarioHtmlMixin.py +65 -0
- edsl/scenarios/ScenarioList.py +1415 -45
- edsl/scenarios/ScenarioListExportMixin.py +45 -0
- edsl/scenarios/ScenarioListPdfMixin.py +239 -0
- edsl/scenarios/__init__.py +2 -0
- edsl/scenarios/directory_scanner.py +96 -0
- edsl/scenarios/file_methods.py +85 -0
- edsl/scenarios/handlers/__init__.py +13 -0
- edsl/scenarios/handlers/csv.py +49 -0
- edsl/scenarios/handlers/docx.py +76 -0
- edsl/scenarios/handlers/html.py +37 -0
- edsl/scenarios/handlers/json.py +111 -0
- edsl/scenarios/handlers/latex.py +5 -0
- edsl/scenarios/handlers/md.py +51 -0
- edsl/scenarios/handlers/pdf.py +68 -0
- edsl/scenarios/handlers/png.py +39 -0
- edsl/scenarios/handlers/pptx.py +105 -0
- edsl/scenarios/handlers/py.py +294 -0
- edsl/scenarios/handlers/sql.py +313 -0
- edsl/scenarios/handlers/sqlite.py +149 -0
- edsl/scenarios/handlers/txt.py +33 -0
- edsl/scenarios/scenario_join.py +131 -0
- edsl/scenarios/scenario_selector.py +156 -0
- edsl/shared.py +1 -0
- edsl/study/ObjectEntry.py +173 -0
- edsl/study/ProofOfWork.py +113 -0
- edsl/study/SnapShot.py +80 -0
- edsl/study/Study.py +521 -0
- edsl/study/__init__.py +4 -0
- edsl/surveys/ConstructDAG.py +92 -0
- edsl/surveys/DAG.py +92 -11
- edsl/surveys/EditSurvey.py +221 -0
- edsl/surveys/InstructionHandler.py +100 -0
- edsl/surveys/Memory.py +9 -4
- edsl/surveys/MemoryManagement.py +72 -0
- edsl/surveys/MemoryPlan.py +156 -35
- edsl/surveys/Rule.py +221 -74
- edsl/surveys/RuleCollection.py +241 -61
- edsl/surveys/RuleManager.py +172 -0
- edsl/surveys/Simulator.py +75 -0
- edsl/surveys/Survey.py +1079 -339
- edsl/surveys/SurveyCSS.py +273 -0
- edsl/surveys/SurveyExportMixin.py +235 -40
- edsl/surveys/SurveyFlowVisualization.py +181 -0
- edsl/surveys/SurveyQualtricsImport.py +284 -0
- edsl/surveys/SurveyToApp.py +141 -0
- edsl/surveys/__init__.py +4 -2
- edsl/surveys/base.py +19 -3
- edsl/surveys/descriptors.py +17 -6
- edsl/surveys/instructions/ChangeInstruction.py +48 -0
- edsl/surveys/instructions/Instruction.py +56 -0
- edsl/surveys/instructions/InstructionCollection.py +82 -0
- edsl/surveys/instructions/__init__.py +0 -0
- edsl/templates/error_reporting/base.html +24 -0
- edsl/templates/error_reporting/exceptions_by_model.html +35 -0
- edsl/templates/error_reporting/exceptions_by_question_name.html +17 -0
- edsl/templates/error_reporting/exceptions_by_type.html +17 -0
- edsl/templates/error_reporting/interview_details.html +116 -0
- edsl/templates/error_reporting/interviews.html +19 -0
- edsl/templates/error_reporting/overview.html +5 -0
- edsl/templates/error_reporting/performance_plot.html +2 -0
- edsl/templates/error_reporting/report.css +74 -0
- edsl/templates/error_reporting/report.html +118 -0
- edsl/templates/error_reporting/report.js +25 -0
- edsl/tools/__init__.py +1 -0
- edsl/tools/clusters.py +192 -0
- edsl/tools/embeddings.py +27 -0
- edsl/tools/embeddings_plotting.py +118 -0
- edsl/tools/plotting.py +112 -0
- edsl/tools/summarize.py +18 -0
- edsl/utilities/PrettyList.py +56 -0
- edsl/utilities/SystemInfo.py +5 -0
- edsl/utilities/__init__.py +21 -20
- edsl/utilities/ast_utilities.py +3 -0
- edsl/utilities/data/Registry.py +2 -0
- edsl/utilities/decorators.py +41 -0
- edsl/utilities/gcp_bucket/__init__.py +0 -0
- edsl/utilities/gcp_bucket/cloud_storage.py +96 -0
- edsl/utilities/interface.py +310 -60
- edsl/utilities/is_notebook.py +18 -0
- edsl/utilities/is_valid_variable_name.py +11 -0
- edsl/utilities/naming_utilities.py +263 -0
- edsl/utilities/remove_edsl_version.py +24 -0
- edsl/utilities/repair_functions.py +28 -0
- edsl/utilities/restricted_python.py +70 -0
- edsl/utilities/utilities.py +203 -13
- edsl-0.1.40.dist-info/METADATA +111 -0
- edsl-0.1.40.dist-info/RECORD +362 -0
- {edsl-0.1.14.dist-info → edsl-0.1.40.dist-info}/WHEEL +1 -1
- edsl/agents/AgentListExportMixin.py +0 -24
- edsl/coop/old.py +0 -31
- edsl/data/Database.py +0 -141
- edsl/data/crud.py +0 -121
- edsl/jobs/Interview.py +0 -417
- edsl/jobs/JobsRunner.py +0 -63
- edsl/jobs/JobsRunnerStatusMixin.py +0 -115
- edsl/jobs/base.py +0 -47
- edsl/jobs/buckets.py +0 -166
- edsl/jobs/runners/JobsRunnerDryRun.py +0 -19
- edsl/jobs/runners/JobsRunnerStreaming.py +0 -54
- edsl/jobs/task_management.py +0 -218
- edsl/jobs/token_tracking.py +0 -78
- edsl/language_models/DeepInfra.py +0 -69
- edsl/language_models/OpenAI.py +0 -98
- edsl/language_models/model_interfaces/GeminiPro.py +0 -66
- edsl/language_models/model_interfaces/LanguageModelOpenAIFour.py +0 -8
- edsl/language_models/model_interfaces/LanguageModelOpenAIThreeFiveTurbo.py +0 -8
- edsl/language_models/model_interfaces/LlamaTwo13B.py +0 -21
- edsl/language_models/model_interfaces/LlamaTwo70B.py +0 -21
- edsl/language_models/model_interfaces/Mixtral8x7B.py +0 -24
- edsl/language_models/registry.py +0 -81
- edsl/language_models/schemas.py +0 -15
- edsl/language_models/unused/ReplicateBase.py +0 -83
- edsl/prompts/QuestionInstructionsBase.py +0 -6
- edsl/prompts/library/agent_instructions.py +0 -29
- edsl/prompts/library/agent_persona.py +0 -17
- edsl/prompts/library/question_budget.py +0 -26
- edsl/prompts/library/question_checkbox.py +0 -32
- edsl/prompts/library/question_extract.py +0 -19
- edsl/prompts/library/question_freetext.py +0 -14
- edsl/prompts/library/question_linear_scale.py +0 -20
- edsl/prompts/library/question_list.py +0 -22
- edsl/prompts/library/question_multiple_choice.py +0 -44
- edsl/prompts/library/question_numerical.py +0 -31
- edsl/prompts/library/question_rank.py +0 -21
- edsl/prompts/prompt_config.py +0 -33
- edsl/prompts/registry.py +0 -185
- edsl/questions/Question.py +0 -240
- edsl/report/InputOutputDataTypes.py +0 -134
- edsl/report/RegressionMixin.py +0 -28
- edsl/report/ReportOutputs.py +0 -1228
- edsl/report/ResultsFetchMixin.py +0 -106
- edsl/report/ResultsOutputMixin.py +0 -14
- edsl/report/demo.ipynb +0 -645
- edsl/results/ResultsDBMixin.py +0 -184
- edsl/surveys/SurveyFlowVisualizationMixin.py +0 -92
- edsl/trackers/Tracker.py +0 -91
- edsl/trackers/TrackerAPI.py +0 -196
- edsl/trackers/TrackerTasks.py +0 -70
- edsl/utilities/pastebin.py +0 -141
- edsl-0.1.14.dist-info/METADATA +0 -69
- edsl-0.1.14.dist-info/RECORD +0 -141
- /edsl/{language_models/model_interfaces → inference_services}/__init__.py +0 -0
- /edsl/{report/__init__.py → jobs/runners/JobsRunnerStatusData.py} +0 -0
- /edsl/{trackers/__init__.py → language_models/ServiceDataSources.py} +0 -0
- {edsl-0.1.14.dist-info → edsl-0.1.40.dist-info}/LICENSE +0 -0
@@ -0,0 +1,63 @@
|
|
1
|
+
from collections import UserDict
|
2
|
+
from dataclasses import asdict
|
3
|
+
from edsl.enums import service_to_api_keyname
|
4
|
+
|
5
|
+
from edsl.language_models.key_management.models import LanguageModelInput
|
6
|
+
|
7
|
+
|
8
|
+
class KeyLookup(UserDict):
    """Mapping from a service name to that service's ``LanguageModelInput``.

    The mapping can be converted to and from plain dictionaries and rendered
    as the contents of a ``.env`` file.

    >>> from edsl.language_models.key_management.models import LanguageModelInput
    >>> lookup = KeyLookup()
    >>> lm_input = LanguageModelInput.example()
    >>> lookup['test'] = lm_input
    >>> lookup.to_dict()['test']['api_token']
    'sk-abcd123'
    >>> restored = KeyLookup.from_dict(lookup.to_dict())
    >>> restored['test'].api_token
    'sk-abcd123'
    """

    def to_dict(self):
        """Return ``{service: asdict(entry)}`` for every stored entry.

        >>> kl = KeyLookup.example()
        >>> kl2 = KeyLookup.from_dict(kl.to_dict())
        >>> kl2 == kl
        True
        >>> kl2 is kl
        False
        """
        serialized = {}
        for service, lm_input in self.data.items():
            serialized[service] = asdict(lm_input)
        return serialized

    @classmethod
    def from_dict(cls, d):
        """Rebuild a lookup from the mapping produced by ``to_dict``."""
        entries = {}
        for service, fields in d.items():
            entries[service] = LanguageModelInput(**fields)
        return cls(entries)

    @classmethod
    def example(cls):
        """Return a lookup holding example entries for ``test`` and ``openai``."""
        sample = {name: LanguageModelInput.example() for name in ("test", "openai")}
        return cls(sample)

    def to_dot_env(self):
        """Return a string representation of the key lookup collection for a .env file.

        The ``test`` service is skipped. Every other service contributes its
        RPM and TPM limits, its API token and, when present, its API id.
        """
        env_lines = []
        for service, lm_input in self.items():
            if service == "test":
                continue
            prefix = service.upper()
            env_lines.append(f"EDSL_SERVICE_RPM_{prefix}={lm_input.rpm}")
            env_lines.append(f"EDSL_SERVICE_TPM_{prefix}={lm_input.tpm}")
            # Fall back to the service name when no key name is registered.
            key_name = service_to_api_keyname.get(service, service)
            env_lines.append(f"{key_name.upper()}={lm_input.api_token}")
            if lm_input.api_id is not None:
                env_lines.append(f"{prefix}_API_ID={lm_input.api_id}")
        return "\n".join(env_lines)
|
58
|
+
|
59
|
+
|
60
|
+
if __name__ == "__main__":
    # Run the doctests embedded in this module when it is executed as a script.
    from doctest import ELLIPSIS, testmod

    testmod(optionflags=ELLIPSIS)
|
@@ -0,0 +1,273 @@
|
|
1
|
+
from typing import Optional, List
|
2
|
+
from collections import UserDict
|
3
|
+
import os
|
4
|
+
from functools import lru_cache
|
5
|
+
from dataclasses import dataclass, asdict
|
6
|
+
|
7
|
+
from edsl.enums import service_to_api_keyname
|
8
|
+
from edsl.exceptions.general import MissingAPIKeyError
|
9
|
+
|
10
|
+
from edsl.language_models.key_management.KeyLookup import KeyLookup
|
11
|
+
|
12
|
+
from edsl.language_models.key_management.models import (
|
13
|
+
APIKeyEntry,
|
14
|
+
LimitEntry,
|
15
|
+
APIIDEntry,
|
16
|
+
LanguageModelInput,
|
17
|
+
)
|
18
|
+
|
19
|
+
# Patch the key-name table imported from ``edsl.enums`` so that the Bedrock
# secret is looked up under ``AWS_SECRET_ACCESS_KEY``.
# NOTE: this mutates the imported dict in place, so the change is visible to
# every other user of that object.
service_to_api_keyname["bedrock"] = "AWS_SECRET_ACCESS_KEY"

# Services that need an identifier in addition to the secret key.
service_to_api_id = {"bedrock": "AWS_ACCESS_KEY_ID"}

# Reverse index: key name -> service. A service may register several accepted
# key names (a list); each of them maps back to that service. Built with a
# comprehension so no loop variables are left behind in the module namespace.
api_keyname_to_service = {
    name: svc
    for svc, names in service_to_api_keyname.items()
    for name in (names if isinstance(names, list) else [names])
}

# Reverse index for identifiers, derived from the forward map so the two
# cannot drift apart.
api_id_to_service = {name: svc for svc, name in service_to_api_id.items()}
|
32
|
+
|
33
|
+
|
34
|
+
class KeyLookupBuilder:
    """Collect API keys, API ids and rate limits, then build a ``KeyLookup``.

    Key/value pairs are read from the sources named in ``fetch_order``
    (any of ``"config"``, ``"env"`` and ``"coop"``). When the same key is
    present in several sources, the source listed later wins.

    >>> builder = KeyLookupBuilder(fetch_order=("config", "env"))
    >>> builder.DEFAULT_RPM
    10
    >>> builder.DEFAULT_TPM
    2000000
    >>> builder.fetch_order
    ('config', 'env')

    Test invalid fetch_order:
    >>> try:
    ...     KeyLookupBuilder(fetch_order=["config", "env"])  # Should be tuple
    ... except ValueError as e:
    ...     str(e)
    'fetch_order must be a tuple'

    Test service extraction:
    >>> builder.extract_service("EDSL_SERVICE_RPM_OPENAI")
    ('openai', 'rpm')
    """

    # Limits applied when a service has a key but no configured rate limit.
    DEFAULT_RPM = 10
    DEFAULT_TPM = 2000000

    def __init__(self, fetch_order: Optional[tuple[str, ...]] = None):
        """Read every configured source and index what was found.

        :param fetch_order: Source names to read, in order; defaults to
            ``("config", "env")``.
        :raises ValueError: If ``fetch_order`` is not a tuple.
        """
        if fetch_order is None:
            fetch_order = ("config", "env")
        if not isinstance(fetch_order, tuple):
            raise ValueError("fetch_order must be a tuple")
        self.fetch_order = fetch_order

        self.limit_data = {}  # service -> LimitEntry
        self.key_data = {}  # service -> list of APIKeyEntry
        self.id_data = {}  # service -> APIIDEntry
        self._cached_lookup = None  # result of the first build() call
        self.process_key_value_pairs()

    @property
    def known_services(self):
        """Get the set of known services.

        A service is known when it has either an API key or a rate limit.

        >>> builder = KeyLookupBuilder()
        >>> isinstance(builder.known_services, set)
        True
        """
        return set(self.key_data) | set(self.limit_data)

    def build(self) -> "KeyLookup":
        """Build a KeyLookup instance.

        The result is cached on the instance, so repeated calls return the
        same object. (A per-instance cache is used instead of ``lru_cache``
        on the method, which would keep every builder alive in a class-level
        cache.)

        >>> builder = KeyLookupBuilder()
        >>> lookup = builder.build()
        >>> isinstance(lookup, KeyLookup)
        True
        >>> lookup['test'].api_token  # Test service should always exist
        'test'
        """
        cached = getattr(self, "_cached_lookup", None)
        if cached is not None:
            return cached

        entries = {}
        for service in self.known_services:
            try:
                entries[service] = self.get_language_model_input(service)
            except MissingAPIKeyError:
                # A limit was configured for this service but no key: skip it.
                continue

        # The "test" service is always available, with fixed credentials.
        entries["test"] = LanguageModelInput(api_token="test", rpm=10, tpm=2000000)
        self._cached_lookup = KeyLookup(entries)
        return self._cached_lookup

    def get_language_model_input(self, service: str) -> "LanguageModelInput":
        """Get the language model input for a given service.

        When several key entries were recorded for the service, the most
        recently added one is used.

        :raises MissingAPIKeyError: If no key is recorded for ``service``.

        >>> builder = KeyLookupBuilder()
        >>> try:
        ...     builder.get_language_model_input("nonexistent_service")
        ... except MissingAPIKeyError as e:
        ...     str(e)
        "No key found for service 'nonexistent_service'"
        """
        key_entries = self.key_data.get(service)
        if not key_entries:
            raise MissingAPIKeyError(f"No key found for service '{service}'")

        # Previously only the single-entry case was handled; any other count
        # left the variable unbound and raised UnboundLocalError.
        api_key_entry = key_entries[-1]

        id_entry = self.id_data.get(service)
        id_source = id_entry.source if id_entry is not None else None
        api_id = id_entry.value if id_entry is not None else None

        limit_entry = self.limit_data.get(service)
        if limit_entry is None:
            limit_entry = LimitEntry(
                service=service,
                rpm=self.DEFAULT_RPM,
                tpm=self.DEFAULT_TPM,
                source="default",
            )

        # Only one of the two limits may have been configured; fill the gap.
        if limit_entry.rpm is None:
            limit_entry.rpm = self.DEFAULT_RPM
        if limit_entry.tpm is None:
            limit_entry.tpm = self.DEFAULT_TPM

        return LanguageModelInput(
            api_token=api_key_entry.value,
            rpm=int(limit_entry.rpm),
            tpm=int(limit_entry.tpm),
            api_id=api_id,
            token_source=api_key_entry.source,
            limit_source=limit_entry.source,
            id_source=id_source,
        )

    def __repr__(self):
        # NOTE(review): key_data holds the API key entries themselves, so this
        # representation can expose secret values if it is logged or printed.
        return f"DataSource(key_data={self.key_data}, limit_data={self.limit_data}, id_data={self.id_data})"

    def _os_env_key_value_pairs(self):
        """Return a snapshot of the process environment as a dict."""
        return dict(os.environ.items())

    def _coop_key_value_pairs(self):
        """Return the rate-limit config variables fetched through ``Coop``."""
        from edsl.coop import Coop

        c = Coop()
        return dict(c.fetch_rate_limit_config_vars().items())

    def _config_key_value_pairs(self):
        """Return the items of the EDSL ``CONFIG`` object as a dict."""
        from edsl.config import CONFIG

        return dict(CONFIG.items())

    @staticmethod
    def extract_service(key: str) -> tuple[str, str]:
        """Extract the service and limit type from the key.

        The key has the form ``EDSL_SERVICE_<LIMIT>_<SERVICE>``. Only the
        first underscore after the prefix separates the limit type from the
        service, so service names may contain underscores themselves.

        :returns: ``(service, limit_type)``, both lower-cased.
        :raises ValueError: If the limit type or the service part is missing.

        >>> KeyLookupBuilder.extract_service("EDSL_SERVICE_TPM_DEEP_INFRA")
        ('deep_infra', 'tpm')
        """
        remainder = key.removeprefix("EDSL_SERVICE_")
        limit_type, separator, service_raw = remainder.partition("_")
        if not (separator and limit_type and service_raw):
            raise ValueError(
                f"Malformed rate limit key {key!r}: "
                "expected EDSL_SERVICE_<LIMIT>_<SERVICE>"
            )
        return service_raw.lower(), limit_type.lower()

    def get_key_value_pairs(self) -> dict:
        """Get key-value pairs from configured sources.

        :returns: ``{key: (value, source)}``. Sources are read in
            ``fetch_order``, and a later source overwrites an earlier one
            for the same key.
        """
        fetching_functions = {
            "env": self._os_env_key_value_pairs,
            "coop": self._coop_key_value_pairs,
            "config": self._config_key_value_pairs,
        }
        merged = {}
        for source in self.fetch_order:
            fetch = fetching_functions[source]
            for k, v in fetch().items():
                merged[k] = (v, source)
        return merged

    def _entry_type(self, key, value) -> str:
        """Determine the type of entry from a key.

        ``value`` is accepted but not consulted.

        >>> builder = KeyLookupBuilder()
        >>> builder._entry_type("EDSL_SERVICE_RPM_OPENAI", "60")
        'limit'
        >>> builder._entry_type("OPENAI_API_KEY", "sk-1234")
        'api_key'
        >>> builder._entry_type("AWS_ACCESS_KEY_ID", "AKIA1234")
        'api_id'
        >>> builder._entry_type("UNKNOWN_KEY", "value")
        'unknown'
        """
        if key.startswith("EDSL_SERVICE_"):
            return "limit"
        if key in api_keyname_to_service:
            return "api_key"
        if key in api_id_to_service:
            return "api_id"
        return "unknown"

    def _add_id(self, key: str, value: str, source: str) -> None:
        """Add an API ID to the id_data dictionary.

        :raises ValueError: If an id is already recorded for the service.

        >>> builder = KeyLookupBuilder()
        >>> builder._add_id("AWS_ACCESS_KEY_ID", "AKIA1234", "env")
        >>> builder.id_data["bedrock"].value
        'AKIA1234'
        >>> try:
        ...     builder._add_id("AWS_ACCESS_KEY_ID", "AKIA5678", "env")
        ... except ValueError as e:
        ...     str(e)
        'Duplicate ID for service bedrock'
        """
        service = api_id_to_service[key]
        if service in self.id_data:
            raise ValueError(f"Duplicate ID for service {service}")
        self.id_data[service] = APIIDEntry(
            service=service, name=key, value=value, source=source
        )

    def _add_limit(self, key: str, value: str, source: str) -> None:
        """Add a rate limit entry to the limit_data dictionary.

        The value is stored as given (not converted to ``int`` here). The
        entry keeps the source of the first limit recorded for the service.

        >>> builder = KeyLookupBuilder()
        >>> builder._add_limit("EDSL_SERVICE_RPM_OPENAI", "60", "config")
        >>> builder.limit_data["openai"].rpm
        '60'
        >>> builder._add_limit("EDSL_SERVICE_TPM_OPENAI", "100000", "config")
        >>> builder.limit_data["openai"].tpm
        '100000'
        """
        service, limit_type = self.extract_service(key)
        limit_entry = self.limit_data.get(service)
        if limit_entry is None:
            limit_entry = LimitEntry(service=service, rpm=None, tpm=None, source=source)
            self.limit_data[service] = limit_entry
        setattr(limit_entry, limit_type.lower(), value)

    def _add_api_key(self, key: str, value: str, source: str) -> None:
        """Add an API key entry to the key_data dictionary.

        Entries for the same service accumulate in insertion order.

        >>> builder = KeyLookupBuilder()
        >>> builder._add_api_key("OPENAI_API_KEY", "sk-1234", "env")
        >>> 'sk-1234' == builder.key_data["openai"][-1].value
        True
        """
        service = api_keyname_to_service[key]
        new_entry = APIKeyEntry(service=service, name=key, value=value, source=source)
        self.key_data.setdefault(service, []).append(new_entry)

    def process_key_value_pairs(self) -> None:
        """Process all key-value pairs from the configured sources.

        Each pair is routed by its entry type; pairs of unknown type are
        ignored.
        """
        handlers = {
            "limit": self._add_limit,
            "api_key": self._add_api_key,
            "api_id": self._add_id,
        }
        for key, (value, source) in self.get_key_value_pairs().items():
            handler = handlers.get(self._entry_type(key, value))
            if handler is not None:
                handler(key, value, source)
|
@@ -0,0 +1,38 @@
|
|
1
|
+
from collections import UserDict
|
2
|
+
|
3
|
+
from edsl.language_models.key_management.KeyLookupBuilder import KeyLookupBuilder
|
4
|
+
|
5
|
+
|
6
|
+
class KeyLookupCollection(UserDict):
    """A singleton mapping from fetch orders to built key-lookup objects.

    Once a KeyLookup has been built for a given fetch order it is stored
    here, so it does not need to be re-created on later requests.

    >>> collection = KeyLookupCollection()
    >>> collection2 = KeyLookupCollection()
    >>> collection is collection2  # Test singleton pattern
    True
    >>> collection.add_key_lookup(("config", "env"))
    >>> ("config", "env") in collection.data
    True
    """

    _instance = None

    def __new__(cls, *args, **kwargs):
        """Return the shared instance, creating it on the first call."""
        if cls._instance is None:
            cls._instance = super().__new__(cls)
        return cls._instance

    def __init__(self, *args, **kwargs):
        """Initialise the underlying dict only on the first construction.

        ``__init__`` runs on every ``KeyLookupCollection()`` call even though
        ``__new__`` hands back the same object, so later calls must not
        reset ``data``.
        """
        if not hasattr(self, "_initialized"):
            self.data = {}
            self._initialized = True
            super().__init__(*args, **kwargs)

    def add_key_lookup(self, fetch_order=None):
        """Build and store the key lookup for ``fetch_order`` if not yet present.

        :param fetch_order: Sequence of source names used as the dictionary
            key; defaults to ``("config", "env")``. A list is converted to a
            tuple so it can be used as a key instead of raising ``TypeError``.
        """
        if fetch_order is None:
            fetch_order = ("config", "env")
        elif isinstance(fetch_order, list):
            # Lists are unhashable and cannot be dict keys; normalise them.
            fetch_order = tuple(fetch_order)
        if fetch_order not in self.data:
            self.data[fetch_order] = KeyLookupBuilder(fetch_order=fetch_order).build()
|
File without changes
|
@@ -0,0 +1,131 @@
|
|
1
|
+
from dataclasses import dataclass, asdict
|
2
|
+
from typing import Optional
|
3
|
+
|
4
|
+
|
5
|
+
@dataclass
class APIKeyEntry:
    """An API key for one service, together with where it was found.

    >>> entry = APIKeyEntry.example()
    >>> entry.service
    'openai'
    >>> entry.name
    'OPENAI_API_KEY'
    >>> entry.value
    'sk-abcd1234'
    >>> entry.source
    'env'
    """

    service: str  # service identifier, e.g. 'openai'
    name: str  # name of the variable holding the key, e.g. 'OPENAI_API_KEY'
    value: str  # the key itself
    source: Optional[str] = None  # where the key was read from, e.g. 'env'

    @classmethod
    def example(cls) -> "APIKeyEntry":
        """Return a sample entry.

        Built through ``cls`` so that a subclass gets an instance of itself.
        """
        return cls(
            service="openai", name="OPENAI_API_KEY", value="sk-abcd1234", source="env"
        )
|
30
|
+
|
31
|
+
|
32
|
+
@dataclass
class LimitEntry:
    """Rate-limit settings (requests and tokens per minute) for one service.

    >>> limit = LimitEntry.example()
    >>> limit.service
    'openai'
    >>> limit.rpm
    60
    >>> limit.tpm
    100000
    >>> limit.source
    'config'
    """

    service: str  # service identifier, e.g. 'openai'
    # Either limit may be None: an entry can be created before its values
    # are known and have them filled in afterwards.
    rpm: Optional[int]
    tpm: Optional[int]
    source: Optional[str] = None  # where the limit was read from, e.g. 'config'

    @classmethod
    def example(cls) -> "LimitEntry":
        """Return a sample entry.

        Built through ``cls`` so that a subclass gets an instance of itself.
        """
        return cls(service="openai", rpm=60, tpm=100000, source="config")
|
55
|
+
|
56
|
+
|
57
|
+
@dataclass
class APIIDEntry:
    """An API ID for one service, together with where it was found.

    >>> id_entry = APIIDEntry.example()
    >>> id_entry.service
    'bedrock'
    >>> id_entry.name
    'AWS_ACCESS_KEY_ID'
    >>> id_entry.value
    'AKIA1234'
    >>> id_entry.source
    'env'
    """

    service: str  # service identifier, e.g. 'bedrock'
    name: str  # name of the variable holding the ID, e.g. 'AWS_ACCESS_KEY_ID'
    value: str  # the ID itself
    source: Optional[str] = None  # where the ID was read from, e.g. 'env'

    @classmethod
    def example(cls) -> "APIIDEntry":
        """Return a sample entry.

        Built through ``cls`` so that a subclass gets an instance of itself.
        """
        return cls(
            service="bedrock", name="AWS_ACCESS_KEY_ID", value="AKIA1234", source="env"
        )
|
82
|
+
|
83
|
+
|
84
|
+
@dataclass
class LanguageModelInput:
    """Credentials and rate limits passed to a language model service.

    >>> lm_input = LanguageModelInput.example()
    >>> lm_input.api_token
    'sk-abcd123'
    >>> lm_input.rpm
    60
    >>> lm_input.tpm
    100000
    >>> lm_input.api_id


    Test dictionary conversion:
    >>> d = lm_input.to_dict()
    >>> isinstance(d, dict)
    True
    >>> LanguageModelInput.from_dict(d).api_token == lm_input.api_token
    True
    """

    api_token: str
    rpm: int
    tpm: int
    api_id: Optional[str] = None
    # The *_source fields record where the matching value was read from.
    token_source: Optional[str] = None
    limit_source: Optional[str] = None
    id_source: Optional[str] = None

    def to_dict(self) -> dict:
        """Return the fields as a plain dictionary (via ``dataclasses.asdict``)."""
        return asdict(self)

    @classmethod
    def from_dict(cls, d: dict) -> "LanguageModelInput":
        """Build an instance from a dictionary keyed by field name."""
        return cls(**d)

    @classmethod
    def example(cls) -> "LanguageModelInput":
        """Return a sample input.

        Built through ``cls``, like ``from_dict``, so that a subclass gets an
        instance of itself.
        """
        return cls(api_token="sk-abcd123", tpm=100000, rpm=60, api_id=None)
|
126
|
+
|
127
|
+
|
128
|
+
if __name__ == "__main__":
    # Run the doctests embedded in this module when executed as a script.
    from doctest import testmod

    testmod()
|