edsl 0.1.39.dev3__py3-none-any.whl → 0.1.39.dev5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- edsl/Base.py +413 -332
- edsl/BaseDiff.py +260 -260
- edsl/TemplateLoader.py +24 -24
- edsl/__init__.py +57 -49
- edsl/__version__.py +1 -1
- edsl/agents/Agent.py +1071 -867
- edsl/agents/AgentList.py +551 -413
- edsl/agents/Invigilator.py +284 -233
- edsl/agents/InvigilatorBase.py +257 -270
- edsl/agents/PromptConstructor.py +272 -354
- edsl/agents/QuestionInstructionPromptBuilder.py +128 -0
- edsl/agents/QuestionTemplateReplacementsBuilder.py +137 -0
- edsl/agents/__init__.py +2 -3
- edsl/agents/descriptors.py +99 -99
- edsl/agents/prompt_helpers.py +129 -129
- edsl/agents/question_option_processor.py +172 -0
- edsl/auto/AutoStudy.py +130 -117
- edsl/auto/StageBase.py +243 -230
- edsl/auto/StageGenerateSurvey.py +178 -178
- edsl/auto/StageLabelQuestions.py +125 -125
- edsl/auto/StagePersona.py +61 -61
- edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
- edsl/auto/StagePersonaDimensionValues.py +74 -74
- edsl/auto/StagePersonaDimensions.py +69 -69
- edsl/auto/StageQuestions.py +74 -73
- edsl/auto/SurveyCreatorPipeline.py +21 -21
- edsl/auto/utilities.py +218 -224
- edsl/base/Base.py +279 -279
- edsl/config.py +177 -157
- edsl/conversation/Conversation.py +290 -290
- edsl/conversation/car_buying.py +59 -58
- edsl/conversation/chips.py +95 -95
- edsl/conversation/mug_negotiation.py +81 -81
- edsl/conversation/next_speaker_utilities.py +93 -93
- edsl/coop/CoopFunctionsMixin.py +15 -0
- edsl/coop/ExpectedParrotKeyHandler.py +125 -0
- edsl/coop/PriceFetcher.py +54 -54
- edsl/coop/__init__.py +2 -2
- edsl/coop/coop.py +1106 -1028
- edsl/coop/utils.py +131 -131
- edsl/data/Cache.py +573 -555
- edsl/data/CacheEntry.py +230 -233
- edsl/data/CacheHandler.py +168 -149
- edsl/data/RemoteCacheSync.py +186 -78
- edsl/data/SQLiteDict.py +292 -292
- edsl/data/__init__.py +5 -4
- edsl/data/orm.py +10 -10
- edsl/data_transfer_models.py +74 -73
- edsl/enums.py +202 -175
- edsl/exceptions/BaseException.py +21 -21
- edsl/exceptions/__init__.py +54 -54
- edsl/exceptions/agents.py +54 -42
- edsl/exceptions/cache.py +5 -5
- edsl/exceptions/configuration.py +16 -16
- edsl/exceptions/coop.py +10 -10
- edsl/exceptions/data.py +14 -14
- edsl/exceptions/general.py +34 -34
- edsl/exceptions/inference_services.py +5 -0
- edsl/exceptions/jobs.py +33 -33
- edsl/exceptions/language_models.py +63 -63
- edsl/exceptions/prompts.py +15 -15
- edsl/exceptions/questions.py +109 -91
- edsl/exceptions/results.py +29 -29
- edsl/exceptions/scenarios.py +29 -22
- edsl/exceptions/surveys.py +37 -37
- edsl/inference_services/AnthropicService.py +106 -87
- edsl/inference_services/AvailableModelCacheHandler.py +184 -0
- edsl/inference_services/AvailableModelFetcher.py +215 -0
- edsl/inference_services/AwsBedrock.py +118 -120
- edsl/inference_services/AzureAI.py +215 -217
- edsl/inference_services/DeepInfraService.py +18 -18
- edsl/inference_services/GoogleService.py +143 -148
- edsl/inference_services/GroqService.py +20 -20
- edsl/inference_services/InferenceServiceABC.py +80 -147
- edsl/inference_services/InferenceServicesCollection.py +138 -97
- edsl/inference_services/MistralAIService.py +120 -123
- edsl/inference_services/OllamaService.py +18 -18
- edsl/inference_services/OpenAIService.py +236 -224
- edsl/inference_services/PerplexityService.py +160 -163
- edsl/inference_services/ServiceAvailability.py +135 -0
- edsl/inference_services/TestService.py +90 -89
- edsl/inference_services/TogetherAIService.py +172 -170
- edsl/inference_services/data_structures.py +134 -0
- edsl/inference_services/models_available_cache.py +118 -118
- edsl/inference_services/rate_limits_cache.py +25 -25
- edsl/inference_services/registry.py +41 -41
- edsl/inference_services/write_available.py +10 -10
- edsl/jobs/AnswerQuestionFunctionConstructor.py +223 -0
- edsl/jobs/Answers.py +43 -56
- edsl/jobs/FetchInvigilator.py +47 -0
- edsl/jobs/InterviewTaskManager.py +98 -0
- edsl/jobs/InterviewsConstructor.py +50 -0
- edsl/jobs/Jobs.py +823 -898
- edsl/jobs/JobsChecks.py +172 -147
- edsl/jobs/JobsComponentConstructor.py +189 -0
- edsl/jobs/JobsPrompts.py +270 -268
- edsl/jobs/JobsRemoteInferenceHandler.py +311 -239
- edsl/jobs/JobsRemoteInferenceLogger.py +239 -0
- edsl/jobs/RequestTokenEstimator.py +30 -0
- edsl/jobs/__init__.py +1 -1
- edsl/jobs/async_interview_runner.py +138 -0
- edsl/jobs/buckets/BucketCollection.py +104 -63
- edsl/jobs/buckets/ModelBuckets.py +65 -65
- edsl/jobs/buckets/TokenBucket.py +283 -251
- edsl/jobs/buckets/TokenBucketAPI.py +211 -0
- edsl/jobs/buckets/TokenBucketClient.py +191 -0
- edsl/jobs/check_survey_scenario_compatibility.py +85 -0
- edsl/jobs/data_structures.py +120 -0
- edsl/jobs/decorators.py +35 -0
- edsl/jobs/interviews/Interview.py +396 -661
- edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
- edsl/jobs/interviews/InterviewExceptionEntry.py +186 -186
- edsl/jobs/interviews/InterviewStatistic.py +63 -63
- edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
- edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
- edsl/jobs/interviews/InterviewStatusLog.py +92 -92
- edsl/jobs/interviews/ReportErrors.py +66 -66
- edsl/jobs/interviews/interview_status_enum.py +9 -9
- edsl/jobs/jobs_status_enums.py +9 -0
- edsl/jobs/loggers/HTMLTableJobLogger.py +304 -0
- edsl/jobs/results_exceptions_handler.py +98 -0
- edsl/jobs/runners/JobsRunnerAsyncio.py +151 -466
- edsl/jobs/runners/JobsRunnerStatus.py +297 -330
- edsl/jobs/tasks/QuestionTaskCreator.py +244 -242
- edsl/jobs/tasks/TaskCreators.py +64 -64
- edsl/jobs/tasks/TaskHistory.py +470 -450
- edsl/jobs/tasks/TaskStatusLog.py +23 -23
- edsl/jobs/tasks/task_status_enum.py +161 -163
- edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
- edsl/jobs/tokens/TokenUsage.py +34 -34
- edsl/language_models/ComputeCost.py +63 -0
- edsl/language_models/LanguageModel.py +626 -668
- edsl/language_models/ModelList.py +164 -155
- edsl/language_models/PriceManager.py +127 -0
- edsl/language_models/RawResponseHandler.py +106 -0
- edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
- edsl/language_models/ServiceDataSources.py +0 -0
- edsl/language_models/__init__.py +2 -3
- edsl/language_models/fake_openai_call.py +15 -15
- edsl/language_models/fake_openai_service.py +61 -61
- edsl/language_models/key_management/KeyLookup.py +63 -0
- edsl/language_models/key_management/KeyLookupBuilder.py +273 -0
- edsl/language_models/key_management/KeyLookupCollection.py +38 -0
- edsl/language_models/key_management/__init__.py +0 -0
- edsl/language_models/key_management/models.py +131 -0
- edsl/language_models/model.py +256 -0
- edsl/language_models/repair.py +156 -156
- edsl/language_models/utilities.py +65 -64
- edsl/notebooks/Notebook.py +263 -258
- edsl/notebooks/NotebookToLaTeX.py +142 -0
- edsl/notebooks/__init__.py +1 -1
- edsl/prompts/Prompt.py +352 -362
- edsl/prompts/__init__.py +2 -2
- edsl/questions/ExceptionExplainer.py +77 -0
- edsl/questions/HTMLQuestion.py +103 -0
- edsl/questions/QuestionBase.py +518 -664
- edsl/questions/QuestionBasePromptsMixin.py +221 -217
- edsl/questions/QuestionBudget.py +227 -227
- edsl/questions/QuestionCheckBox.py +359 -359
- edsl/questions/QuestionExtract.py +180 -182
- edsl/questions/QuestionFreeText.py +113 -114
- edsl/questions/QuestionFunctional.py +166 -166
- edsl/questions/QuestionList.py +223 -231
- edsl/questions/QuestionMatrix.py +265 -0
- edsl/questions/QuestionMultipleChoice.py +330 -286
- edsl/questions/QuestionNumerical.py +151 -153
- edsl/questions/QuestionRank.py +314 -324
- edsl/questions/Quick.py +41 -41
- edsl/questions/SimpleAskMixin.py +74 -73
- edsl/questions/__init__.py +27 -26
- edsl/questions/{AnswerValidatorMixin.py → answer_validator_mixin.py} +334 -289
- edsl/questions/compose_questions.py +98 -98
- edsl/questions/data_structures.py +20 -0
- edsl/questions/decorators.py +21 -21
- edsl/questions/derived/QuestionLikertFive.py +76 -76
- edsl/questions/derived/QuestionLinearScale.py +90 -87
- edsl/questions/derived/QuestionTopK.py +93 -93
- edsl/questions/derived/QuestionYesNo.py +82 -82
- edsl/questions/descriptors.py +427 -413
- edsl/questions/loop_processor.py +149 -0
- edsl/questions/prompt_templates/question_budget.jinja +13 -13
- edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
- edsl/questions/prompt_templates/question_extract.jinja +11 -11
- edsl/questions/prompt_templates/question_free_text.jinja +3 -3
- edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
- edsl/questions/prompt_templates/question_list.jinja +17 -17
- edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
- edsl/questions/prompt_templates/question_numerical.jinja +36 -36
- edsl/questions/{QuestionBaseGenMixin.py → question_base_gen_mixin.py} +168 -161
- edsl/questions/question_registry.py +177 -177
- edsl/questions/{RegisterQuestionsMeta.py → register_questions_meta.py} +71 -71
- edsl/questions/{ResponseValidatorABC.py → response_validator_abc.py} +188 -174
- edsl/questions/response_validator_factory.py +34 -0
- edsl/questions/settings.py +12 -12
- edsl/questions/templates/budget/answering_instructions.jinja +7 -7
- edsl/questions/templates/budget/question_presentation.jinja +7 -7
- edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
- edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
- edsl/questions/templates/extract/answering_instructions.jinja +7 -7
- edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
- edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
- edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
- edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
- edsl/questions/templates/list/answering_instructions.jinja +3 -3
- edsl/questions/templates/list/question_presentation.jinja +5 -5
- edsl/questions/templates/matrix/__init__.py +1 -0
- edsl/questions/templates/matrix/answering_instructions.jinja +5 -0
- edsl/questions/templates/matrix/question_presentation.jinja +20 -0
- edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
- edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
- edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
- edsl/questions/templates/numerical/question_presentation.jinja +6 -6
- edsl/questions/templates/rank/answering_instructions.jinja +11 -11
- edsl/questions/templates/rank/question_presentation.jinja +15 -15
- edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
- edsl/questions/templates/top_k/question_presentation.jinja +22 -22
- edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
- edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
- edsl/results/CSSParameterizer.py +108 -108
- edsl/results/Dataset.py +587 -424
- edsl/results/DatasetExportMixin.py +594 -731
- edsl/results/DatasetTree.py +295 -275
- edsl/results/MarkdownToDocx.py +122 -0
- edsl/results/MarkdownToPDF.py +111 -0
- edsl/results/Result.py +557 -465
- edsl/results/Results.py +1183 -1165
- edsl/results/ResultsExportMixin.py +45 -43
- edsl/results/ResultsGGMixin.py +121 -121
- edsl/results/TableDisplay.py +125 -198
- edsl/results/TextEditor.py +50 -0
- edsl/results/__init__.py +2 -2
- edsl/results/file_exports.py +252 -0
- edsl/results/{ResultsFetchMixin.py → results_fetch_mixin.py} +33 -33
- edsl/results/{Selector.py → results_selector.py} +145 -135
- edsl/results/{ResultsToolsMixin.py → results_tools_mixin.py} +98 -98
- edsl/results/smart_objects.py +96 -0
- edsl/results/table_data_class.py +12 -0
- edsl/results/table_display.css +77 -77
- edsl/results/table_renderers.py +118 -0
- edsl/results/tree_explore.py +115 -115
- edsl/scenarios/ConstructDownloadLink.py +109 -0
- edsl/scenarios/DocumentChunker.py +102 -0
- edsl/scenarios/DocxScenario.py +16 -0
- edsl/scenarios/FileStore.py +511 -632
- edsl/scenarios/PdfExtractor.py +40 -0
- edsl/scenarios/Scenario.py +498 -601
- edsl/scenarios/ScenarioHtmlMixin.py +65 -64
- edsl/scenarios/ScenarioList.py +1458 -1287
- edsl/scenarios/ScenarioListExportMixin.py +45 -52
- edsl/scenarios/ScenarioListPdfMixin.py +239 -261
- edsl/scenarios/__init__.py +3 -4
- edsl/scenarios/directory_scanner.py +96 -0
- edsl/scenarios/file_methods.py +85 -0
- edsl/scenarios/handlers/__init__.py +13 -0
- edsl/scenarios/handlers/csv.py +38 -0
- edsl/scenarios/handlers/docx.py +76 -0
- edsl/scenarios/handlers/html.py +37 -0
- edsl/scenarios/handlers/json.py +111 -0
- edsl/scenarios/handlers/latex.py +5 -0
- edsl/scenarios/handlers/md.py +51 -0
- edsl/scenarios/handlers/pdf.py +68 -0
- edsl/scenarios/handlers/png.py +39 -0
- edsl/scenarios/handlers/pptx.py +105 -0
- edsl/scenarios/handlers/py.py +294 -0
- edsl/scenarios/handlers/sql.py +313 -0
- edsl/scenarios/handlers/sqlite.py +149 -0
- edsl/scenarios/handlers/txt.py +33 -0
- edsl/scenarios/{ScenarioJoin.py → scenario_join.py} +131 -127
- edsl/scenarios/scenario_selector.py +156 -0
- edsl/shared.py +1 -1
- edsl/study/ObjectEntry.py +173 -173
- edsl/study/ProofOfWork.py +113 -113
- edsl/study/SnapShot.py +80 -80
- edsl/study/Study.py +521 -528
- edsl/study/__init__.py +4 -4
- edsl/surveys/ConstructDAG.py +92 -0
- edsl/surveys/DAG.py +148 -148
- edsl/surveys/EditSurvey.py +221 -0
- edsl/surveys/InstructionHandler.py +100 -0
- edsl/surveys/Memory.py +31 -31
- edsl/surveys/MemoryManagement.py +72 -0
- edsl/surveys/MemoryPlan.py +244 -244
- edsl/surveys/Rule.py +327 -326
- edsl/surveys/RuleCollection.py +385 -387
- edsl/surveys/RuleManager.py +172 -0
- edsl/surveys/Simulator.py +75 -0
- edsl/surveys/Survey.py +1280 -1801
- edsl/surveys/SurveyCSS.py +273 -261
- edsl/surveys/SurveyExportMixin.py +259 -259
- edsl/surveys/{SurveyFlowVisualizationMixin.py → SurveyFlowVisualization.py} +181 -179
- edsl/surveys/SurveyQualtricsImport.py +284 -284
- edsl/surveys/SurveyToApp.py +141 -0
- edsl/surveys/__init__.py +5 -3
- edsl/surveys/base.py +53 -53
- edsl/surveys/descriptors.py +60 -56
- edsl/surveys/instructions/ChangeInstruction.py +48 -49
- edsl/surveys/instructions/Instruction.py +56 -65
- edsl/surveys/instructions/InstructionCollection.py +82 -77
- edsl/templates/error_reporting/base.html +23 -23
- edsl/templates/error_reporting/exceptions_by_model.html +34 -34
- edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
- edsl/templates/error_reporting/exceptions_by_type.html +16 -16
- edsl/templates/error_reporting/interview_details.html +115 -115
- edsl/templates/error_reporting/interviews.html +19 -19
- edsl/templates/error_reporting/overview.html +4 -4
- edsl/templates/error_reporting/performance_plot.html +1 -1
- edsl/templates/error_reporting/report.css +73 -73
- edsl/templates/error_reporting/report.html +117 -117
- edsl/templates/error_reporting/report.js +25 -25
- edsl/tools/__init__.py +1 -1
- edsl/tools/clusters.py +192 -192
- edsl/tools/embeddings.py +27 -27
- edsl/tools/embeddings_plotting.py +118 -118
- edsl/tools/plotting.py +112 -112
- edsl/tools/summarize.py +18 -18
- edsl/utilities/PrettyList.py +56 -0
- edsl/utilities/SystemInfo.py +28 -28
- edsl/utilities/__init__.py +22 -22
- edsl/utilities/ast_utilities.py +25 -25
- edsl/utilities/data/Registry.py +6 -6
- edsl/utilities/data/__init__.py +1 -1
- edsl/utilities/data/scooter_results.json +1 -1
- edsl/utilities/decorators.py +77 -77
- edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
- edsl/utilities/interface.py +627 -627
- edsl/utilities/is_notebook.py +18 -0
- edsl/utilities/is_valid_variable_name.py +11 -0
- edsl/utilities/naming_utilities.py +263 -263
- edsl/utilities/remove_edsl_version.py +24 -0
- edsl/utilities/repair_functions.py +28 -28
- edsl/utilities/restricted_python.py +70 -70
- edsl/utilities/utilities.py +436 -424
- {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev5.dist-info}/LICENSE +21 -21
- {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev5.dist-info}/METADATA +13 -11
- edsl-0.1.39.dev5.dist-info/RECORD +358 -0
- {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev5.dist-info}/WHEEL +1 -1
- edsl/language_models/KeyLookup.py +0 -30
- edsl/language_models/registry.py +0 -190
- edsl/language_models/unused/ReplicateBase.py +0 -83
- edsl/results/ResultsDBMixin.py +0 -238
- edsl-0.1.39.dev3.dist-info/RECORD +0 -277
edsl/language_models/registry.py
DELETED
@@ -1,190 +0,0 @@
|
|
1
|
-
import textwrap
|
2
|
-
from random import random
|
3
|
-
from edsl.config import CONFIG
|
4
|
-
|
5
|
-
# if "EDSL_DEFAULT_MODEL" not in CONFIG:
|
6
|
-
# default_model = "test"
|
7
|
-
# else:
|
8
|
-
# default_model = CONFIG.get("EDSL_DEFAULT_MODEL")
|
9
|
-
|
10
|
-
from collections import UserList
|
11
|
-
|
12
|
-
|
13
|
-
class PrettyList(UserList):
|
14
|
-
def __init__(self, data=None, columns=None):
|
15
|
-
super().__init__(data)
|
16
|
-
self.columns = columns
|
17
|
-
|
18
|
-
def _repr_html_(self):
|
19
|
-
if isinstance(self[0], list) or isinstance(self[0], tuple):
|
20
|
-
num_cols = len(self[0])
|
21
|
-
else:
|
22
|
-
num_cols = 1
|
23
|
-
|
24
|
-
if self.columns:
|
25
|
-
columns = self.columns
|
26
|
-
else:
|
27
|
-
columns = list(range(num_cols))
|
28
|
-
|
29
|
-
if num_cols > 1:
|
30
|
-
return (
|
31
|
-
"<pre><table>"
|
32
|
-
+ "".join(["<th>" + str(column) + "</th>" for column in columns])
|
33
|
-
+ "".join(
|
34
|
-
[
|
35
|
-
"<tr>"
|
36
|
-
+ "".join(["<td>" + str(x) + "</td>" for x in row])
|
37
|
-
+ "</tr>"
|
38
|
-
for row in self
|
39
|
-
]
|
40
|
-
)
|
41
|
-
+ "</table></pre>"
|
42
|
-
)
|
43
|
-
else:
|
44
|
-
return (
|
45
|
-
"<pre><table>"
|
46
|
-
+ "".join(["<th>" + str(index) + "</th>" for index in columns])
|
47
|
-
+ "".join(
|
48
|
-
["<tr>" + "<td>" + str(row) + "</td>" + "</tr>" for row in self]
|
49
|
-
)
|
50
|
-
+ "</table></pre>"
|
51
|
-
)
|
52
|
-
|
53
|
-
|
54
|
-
def get_model_class(model_name, registry=None):
|
55
|
-
from edsl.inference_services.registry import default
|
56
|
-
|
57
|
-
registry = registry or default
|
58
|
-
factory = registry.create_model_factory(model_name)
|
59
|
-
return factory
|
60
|
-
|
61
|
-
|
62
|
-
class Meta(type):
|
63
|
-
def __repr__(cls):
|
64
|
-
return textwrap.dedent(
|
65
|
-
f"""\
|
66
|
-
Available models: {cls.available()}
|
67
|
-
|
68
|
-
To create an instance, you can do:
|
69
|
-
>>> m = Model('gpt-4-1106-preview', temperature=0.5, ...)
|
70
|
-
|
71
|
-
To get the default model, you can leave out the model name.
|
72
|
-
To see the available models, you can do:
|
73
|
-
>>> Model.available()
|
74
|
-
"""
|
75
|
-
)
|
76
|
-
|
77
|
-
|
78
|
-
class Model(metaclass=Meta):
|
79
|
-
default_model = CONFIG.get("EDSL_DEFAULT_MODEL")
|
80
|
-
|
81
|
-
def __new__(
|
82
|
-
cls, model_name=None, registry=None, service_name=None, *args, **kwargs
|
83
|
-
):
|
84
|
-
# Map index to the respective subclass
|
85
|
-
if model_name is None:
|
86
|
-
model_name = (
|
87
|
-
cls.default_model
|
88
|
-
) # when model_name is None, use the default model, set in the config file
|
89
|
-
from edsl.inference_services.registry import default
|
90
|
-
|
91
|
-
registry = registry or default
|
92
|
-
|
93
|
-
if isinstance(model_name, int): # can refer to a model by index
|
94
|
-
model_name = cls.available(name_only=True)[model_name]
|
95
|
-
|
96
|
-
factory = registry.create_model_factory(model_name, service_name=service_name)
|
97
|
-
return factory(*args, **kwargs)
|
98
|
-
|
99
|
-
@classmethod
|
100
|
-
def add_model(cls, service_name, model_name):
|
101
|
-
from edsl.inference_services.registry import default
|
102
|
-
|
103
|
-
registry = default
|
104
|
-
registry.add_model(service_name, model_name)
|
105
|
-
|
106
|
-
@classmethod
|
107
|
-
def services(cls, registry=None):
|
108
|
-
from edsl.inference_services.registry import default
|
109
|
-
|
110
|
-
registry = registry or default
|
111
|
-
return [r._inference_service_ for r in registry.services]
|
112
|
-
|
113
|
-
@classmethod
|
114
|
-
def available(cls, search_term=None, name_only=False, registry=None, service=None):
|
115
|
-
from edsl.inference_services.registry import default
|
116
|
-
|
117
|
-
registry = registry or default
|
118
|
-
full_list = registry.available()
|
119
|
-
|
120
|
-
if service is not None:
|
121
|
-
if service not in cls.services(registry=registry):
|
122
|
-
raise ValueError(f"Service {service} not found in available services.")
|
123
|
-
|
124
|
-
full_list = [m for m in full_list if m[1] == service]
|
125
|
-
|
126
|
-
if search_term is None:
|
127
|
-
if name_only:
|
128
|
-
return PrettyList(
|
129
|
-
[m[0] for m in full_list],
|
130
|
-
columns=["Model Name", "Service Name", "Code"],
|
131
|
-
)
|
132
|
-
else:
|
133
|
-
return PrettyList(
|
134
|
-
full_list, columns=["Model Name", "Service Name", "Code"]
|
135
|
-
)
|
136
|
-
else:
|
137
|
-
filtered_results = [
|
138
|
-
m for m in full_list if search_term in m[0] or search_term in m[1]
|
139
|
-
]
|
140
|
-
if name_only:
|
141
|
-
return PrettyList(
|
142
|
-
[m[0] for m in filtered_results],
|
143
|
-
columns=["Model Name", "Service Name", "Code"],
|
144
|
-
)
|
145
|
-
else:
|
146
|
-
return PrettyList(
|
147
|
-
filtered_results, columns=["Model Name", "Service Name", "Code"]
|
148
|
-
)
|
149
|
-
|
150
|
-
@classmethod
|
151
|
-
def check_models(cls, verbose=False):
|
152
|
-
print("Checking all available models...\n")
|
153
|
-
for model in cls.available(name_only=True):
|
154
|
-
print(f"Now checking: {model}")
|
155
|
-
try:
|
156
|
-
m = cls(model)
|
157
|
-
except Exception as e:
|
158
|
-
print(f"Error creating instance of {model}: {e}")
|
159
|
-
continue
|
160
|
-
try:
|
161
|
-
results = m.hello(verbose)
|
162
|
-
if verbose:
|
163
|
-
print(f"Results from model call: {results}")
|
164
|
-
except Exception as e:
|
165
|
-
print(f"Error calling 'hello' on {model}: {e}")
|
166
|
-
continue
|
167
|
-
print("OK!")
|
168
|
-
print("\n")
|
169
|
-
|
170
|
-
@classmethod
|
171
|
-
def example(cls, randomize: bool = False) -> "Model":
|
172
|
-
"""
|
173
|
-
Returns an example Model instance.
|
174
|
-
|
175
|
-
:param randomize: If True, the temperature is set to a random decimal between 0 and 1.
|
176
|
-
"""
|
177
|
-
temperature = 0.5 if not randomize else round(random(), 2)
|
178
|
-
model_name = cls.default_model
|
179
|
-
return cls(model_name, temperature=temperature)
|
180
|
-
|
181
|
-
|
182
|
-
if __name__ == "__main__":
|
183
|
-
import doctest
|
184
|
-
|
185
|
-
doctest.testmod(optionflags=doctest.ELLIPSIS)
|
186
|
-
|
187
|
-
available = Model.available()
|
188
|
-
m = Model("gpt-4-1106-preview")
|
189
|
-
results = m.execute_model_call("Hello world")
|
190
|
-
print(results)
|
@@ -1,83 +0,0 @@
|
|
1
|
-
import asyncio
|
2
|
-
import aiohttp
|
3
|
-
import json
|
4
|
-
from typing import Any
|
5
|
-
|
6
|
-
from edsl import CONFIG
|
7
|
-
|
8
|
-
from edsl.language_models.LanguageModel import LanguageModel
|
9
|
-
|
10
|
-
|
11
|
-
def replicate_model_factory(model_name, base_url, api_token):
|
12
|
-
class ReplicateLanguageModelBase(LanguageModel):
|
13
|
-
_model_ = (
|
14
|
-
model_name # Example model name, replace with actual model name if needed
|
15
|
-
)
|
16
|
-
_parameters_ = {
|
17
|
-
"temperature": 0.1,
|
18
|
-
"topK": 50,
|
19
|
-
"topP": 0.9,
|
20
|
-
"max_new_tokens": 500,
|
21
|
-
"min_new_tokens": -1,
|
22
|
-
"repetition_penalty": 1.15,
|
23
|
-
# "version": "5fe0a3d7ac2852264a25279d1dfb798acbc4d49711d126646594e212cb821749",
|
24
|
-
"use_cache": True,
|
25
|
-
}
|
26
|
-
_api_token = api_token
|
27
|
-
_base_url = base_url
|
28
|
-
|
29
|
-
async def async_execute_model_call(
|
30
|
-
self, user_prompt: str, system_prompt: str = ""
|
31
|
-
) -> dict[str, Any]:
|
32
|
-
self.api_token = self._api_token
|
33
|
-
self.headers = {
|
34
|
-
"Authorization": f"Token {self.api_token}",
|
35
|
-
"Content-Type": "application/json",
|
36
|
-
}
|
37
|
-
# combined_prompt = f"{system_prompt} {user_prompt}".strip()
|
38
|
-
# print(f"Prompt: {combined_prompt}")
|
39
|
-
data = {
|
40
|
-
# "version": self._parameters_["version"],
|
41
|
-
"input": {
|
42
|
-
"debug": False,
|
43
|
-
"top_k": self._parameters_["topK"],
|
44
|
-
"top_p": self._parameters_["topP"],
|
45
|
-
"prompt": user_prompt,
|
46
|
-
"system_prompt": system_prompt,
|
47
|
-
"temperature": self._parameters_["temperature"],
|
48
|
-
"max_new_tokens": self._parameters_["max_new_tokens"],
|
49
|
-
"min_new_tokens": self._parameters_["min_new_tokens"],
|
50
|
-
"prompt_template": "{prompt}",
|
51
|
-
"repetition_penalty": self._parameters_["repetition_penalty"],
|
52
|
-
},
|
53
|
-
}
|
54
|
-
|
55
|
-
async with aiohttp.ClientSession() as session:
|
56
|
-
async with session.post(
|
57
|
-
self._base_url, headers=self.headers, data=json.dumps(data)
|
58
|
-
) as response:
|
59
|
-
raw_response_text = await response.text()
|
60
|
-
data = json.loads(raw_response_text)
|
61
|
-
print(f"This was the data returned by the model:{data}")
|
62
|
-
prediction_url = data["urls"]["get"]
|
63
|
-
|
64
|
-
while True:
|
65
|
-
async with session.get(
|
66
|
-
prediction_url, headers=self.headers
|
67
|
-
) as get_response:
|
68
|
-
if get_response.status != 200:
|
69
|
-
# Handle non-success status codes appropriately
|
70
|
-
return None
|
71
|
-
|
72
|
-
get_data = await get_response.text()
|
73
|
-
get_data = json.loads(get_data)
|
74
|
-
if get_data["status"] == "succeeded":
|
75
|
-
return get_data
|
76
|
-
await asyncio.sleep(1)
|
77
|
-
|
78
|
-
def parse_response(self, raw_response: dict[str, Any]) -> str:
|
79
|
-
data = "".join(raw_response["output"])
|
80
|
-
print(f"This is what the model returned: {data}")
|
81
|
-
return data
|
82
|
-
|
83
|
-
return ReplicateLanguageModelBase
|
edsl/results/ResultsDBMixin.py
DELETED
@@ -1,238 +0,0 @@
|
|
1
|
-
"""Mixin for working with SQLite respresentation of a 'Results' object."""
|
2
|
-
|
3
|
-
import sqlite3
|
4
|
-
from enum import Enum
|
5
|
-
from typing import Literal, Union, Optional
|
6
|
-
|
7
|
-
|
8
|
-
class SQLDataShape(Enum):
|
9
|
-
"""Enum for the shape of the data in the SQL database."""
|
10
|
-
|
11
|
-
WIDE = "wide"
|
12
|
-
LONG = "long"
|
13
|
-
|
14
|
-
|
15
|
-
class ResultsDBMixin:
|
16
|
-
"""Mixin for interacting with a Results object as if it were a SQL database."""
|
17
|
-
|
18
|
-
def _rows(self):
|
19
|
-
"""Return the rows of the `Results` object as a list of tuples."""
|
20
|
-
for index, result in enumerate(self):
|
21
|
-
yield from result.rows(index)
|
22
|
-
|
23
|
-
def export_sql_dump(self, shape: Literal["wide", "long"], filename: str):
|
24
|
-
"""Export the SQL database to a file.
|
25
|
-
|
26
|
-
:param shape: The shape of the data in the database (wide or long)
|
27
|
-
:param filename: The filename to save the database to
|
28
|
-
"""
|
29
|
-
shape_enum = self._get_shape_enum(shape)
|
30
|
-
conn = self._db(shape=shape_enum)
|
31
|
-
|
32
|
-
with open(filename, "w") as f:
|
33
|
-
for line in conn.iterdump():
|
34
|
-
f.write(f"{line}\n")
|
35
|
-
|
36
|
-
conn.close()
|
37
|
-
|
38
|
-
def backup_db_to_file(self, shape: Literal["wide", "long"], filename: str):
|
39
|
-
"""Backup the in-memory database to a file.
|
40
|
-
|
41
|
-
|
42
|
-
:param shape: The shape of the data in the database (wide or long)
|
43
|
-
:param filename: The filename to save the database to
|
44
|
-
|
45
|
-
>>> from edsl.results import Results
|
46
|
-
>>> r = Results.example()
|
47
|
-
>>> r.backup_db_to_file(filename="backup.db", shape="long")
|
48
|
-
|
49
|
-
"""
|
50
|
-
shape_enum = self._get_shape_enum(shape)
|
51
|
-
# Source database connection (in-memory)
|
52
|
-
source_conn = self._db(shape=shape_enum)
|
53
|
-
|
54
|
-
# Destination database connection (file)
|
55
|
-
dest_conn = sqlite3.connect(filename)
|
56
|
-
|
57
|
-
# Backup in-memory database to file
|
58
|
-
with source_conn:
|
59
|
-
source_conn.backup(dest_conn)
|
60
|
-
|
61
|
-
# Close both connections
|
62
|
-
source_conn.close()
|
63
|
-
dest_conn.close()
|
64
|
-
|
65
|
-
def _db(self, shape: SQLDataShape, remove_prefix=False):
|
66
|
-
"""Create a SQLite database in memory and return the connection.
|
67
|
-
|
68
|
-
:param shape: The shape of the data in the database (wide or long)
|
69
|
-
:param remove_prefix: Whether to remove the prefix from the column names
|
70
|
-
|
71
|
-
"""
|
72
|
-
if shape == SQLDataShape.LONG:
|
73
|
-
conn = sqlite3.connect(":memory:")
|
74
|
-
|
75
|
-
create_table_query = """
|
76
|
-
CREATE TABLE self (
|
77
|
-
id INTEGER,
|
78
|
-
data_type TEXT,
|
79
|
-
key TEXT,
|
80
|
-
value TEXT
|
81
|
-
)
|
82
|
-
"""
|
83
|
-
conn.execute(create_table_query)
|
84
|
-
|
85
|
-
list_of_tuples = list(self._rows())
|
86
|
-
insert_query = (
|
87
|
-
"INSERT INTO self (id, data_type, key, value) VALUES (?, ?, ?, ?)"
|
88
|
-
)
|
89
|
-
conn.executemany(insert_query, list_of_tuples)
|
90
|
-
conn.commit()
|
91
|
-
return conn
|
92
|
-
elif shape == SQLDataShape.WIDE:
|
93
|
-
from sqlalchemy import create_engine
|
94
|
-
|
95
|
-
engine = create_engine("sqlite:///:memory:")
|
96
|
-
df = self.to_pandas(remove_prefix=remove_prefix, lists_as_strings=True)
|
97
|
-
df.to_sql("self", engine, index=False, if_exists="replace")
|
98
|
-
return engine.connect()
|
99
|
-
else:
|
100
|
-
raise Exception("Invalid SQLDataShape")
|
101
|
-
|
102
|
-
def _get_shape_enum(self, shape: Literal["wide", "long"]):
|
103
|
-
"""Convert the shape string to a SQLDataShape enum."""
|
104
|
-
if shape is None:
|
105
|
-
raise Exception("Must select either 'wide' or 'long' format")
|
106
|
-
elif shape == "wide":
|
107
|
-
return SQLDataShape.WIDE
|
108
|
-
elif shape == "long":
|
109
|
-
return SQLDataShape.LONG
|
110
|
-
else:
|
111
|
-
raise Exception("Invalid shape: must be either 'long' or 'wide'")
|
112
|
-
|
113
|
-
def sql(
|
114
|
-
self,
|
115
|
-
query: str,
|
116
|
-
shape: Literal["wide", "long"] = "wide",
|
117
|
-
remove_prefix: bool = True,
|
118
|
-
transpose: bool = None,
|
119
|
-
transpose_by: str = None,
|
120
|
-
csv: bool = False,
|
121
|
-
to_list=False,
|
122
|
-
to_latex=False,
|
123
|
-
filename: Optional[str] = None,
|
124
|
-
) -> Union["pd.DataFrame", str]:
|
125
|
-
"""Execute a SQL query and return the results as a DataFrame.
|
126
|
-
|
127
|
-
:param query: The SQL query to execute
|
128
|
-
:param shape: The shape of the data in the database (wide or long)
|
129
|
-
:param remove_prefix: Whether to remove the prefix from the column names
|
130
|
-
:param transpose: Whether to transpose the DataFrame
|
131
|
-
:param transpose_by: The column to use as the index when transposing
|
132
|
-
:param csv: Whether to return the DataFrame as a CSV string
|
133
|
-
|
134
|
-
|
135
|
-
Example usage:
|
136
|
-
|
137
|
-
>>> from edsl.results import Results
|
138
|
-
>>> r = Results.example()
|
139
|
-
>>> d = r.sql("select data_type, key, value from self where data_type = 'answer' order by value limit 3", shape="long")
|
140
|
-
>>> sorted(list(d['value']))
|
141
|
-
['Good', 'Great', 'Great']
|
142
|
-
|
143
|
-
We can also return the data in wide format.
|
144
|
-
Note the use of single quotes to escape the column names, as required by sql.
|
145
|
-
|
146
|
-
>>> from edsl.results import Results
|
147
|
-
>>> Results.example().sql("select how_feeling from self", shape = 'wide', remove_prefix=True)
|
148
|
-
how_feeling
|
149
|
-
0 OK
|
150
|
-
1 Great
|
151
|
-
2 Terrible
|
152
|
-
3 OK
|
153
|
-
"""
|
154
|
-
import pandas as pd
|
155
|
-
|
156
|
-
shape_enum = self._get_shape_enum(shape)
|
157
|
-
|
158
|
-
conn = self._db(shape=shape_enum, remove_prefix=remove_prefix)
|
159
|
-
df = pd.read_sql_query(query, conn)
|
160
|
-
|
161
|
-
# Transpose the DataFrame if transpose is True
|
162
|
-
if transpose or transpose_by:
|
163
|
-
df = pd.DataFrame(df)
|
164
|
-
if transpose_by:
|
165
|
-
df = df.set_index(transpose_by)
|
166
|
-
else:
|
167
|
-
df = df.set_index(df.columns[0])
|
168
|
-
df = df.transpose()
|
169
|
-
|
170
|
-
if csv and to_list:
|
171
|
-
raise Exception("Cannot return both CSV and list")
|
172
|
-
|
173
|
-
if to_list:
|
174
|
-
return df.values.tolist()
|
175
|
-
|
176
|
-
if to_latex:
|
177
|
-
df.columns = [col.replace("_", " ") for col in df.columns]
|
178
|
-
|
179
|
-
latex_output = df.to_latex(index=False)
|
180
|
-
if filename:
|
181
|
-
with open(filename, "w") as f:
|
182
|
-
f.write(latex_output)
|
183
|
-
return None
|
184
|
-
return latex_output
|
185
|
-
|
186
|
-
if csv:
|
187
|
-
if filename:
|
188
|
-
df.to_csv(filename, index=False)
|
189
|
-
return None
|
190
|
-
|
191
|
-
return df.to_csv(index=False)
|
192
|
-
|
193
|
-
return df
|
194
|
-
|
195
|
-
def show_schema(
|
196
|
-
self, shape: Literal["wide", "long"], remove_prefix: bool = False
|
197
|
-
) -> None:
|
198
|
-
"""Show the schema of the Results database.
|
199
|
-
|
200
|
-
:param shape: The shape of the data in the database (wide or long)
|
201
|
-
:param remove_prefix: Whether to remove the prefix from the column names
|
202
|
-
|
203
|
-
>>> from edsl.results import Results
|
204
|
-
>>> r = Results.example()
|
205
|
-
>>> r.show_schema(shape="long")
|
206
|
-
Type: table, Name: self, SQL: CREATE TABLE self (
|
207
|
-
...
|
208
|
-
<BLANKLINE>
|
209
|
-
"""
|
210
|
-
import pandas as pd
|
211
|
-
|
212
|
-
shape_enum = self._get_shape_enum(shape)
|
213
|
-
conn = self._db(shape=shape_enum, remove_prefix=remove_prefix)
|
214
|
-
|
215
|
-
if shape_enum == SQLDataShape.LONG:
|
216
|
-
# Query to get the schema of all tables
|
217
|
-
query = "SELECT type, name, sql FROM sqlite_master WHERE type='table'"
|
218
|
-
cursor = conn.execute(query)
|
219
|
-
schema = cursor.fetchall()
|
220
|
-
conn.close()
|
221
|
-
|
222
|
-
# Format and return the schema information
|
223
|
-
schema_info = ""
|
224
|
-
for row in schema:
|
225
|
-
schema_info += f"Type: {row[0]}, Name: {row[1]}, SQL: {row[2]}\n"
|
226
|
-
|
227
|
-
print(schema_info)
|
228
|
-
elif shape_enum == SQLDataShape.WIDE:
|
229
|
-
query = f"PRAGMA table_info(self)"
|
230
|
-
schema = pd.read_sql(query, conn)
|
231
|
-
# print(schema)
|
232
|
-
return schema
|
233
|
-
|
234
|
-
|
235
|
-
if __name__ == "__main__":
|
236
|
-
import doctest
|
237
|
-
|
238
|
-
doctest.testmod(optionflags=doctest.ELLIPSIS)
|