edsl 0.1.39.dev3__py3-none-any.whl → 0.1.39.dev4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (344) hide show
  1. edsl/Base.py +413 -332
  2. edsl/BaseDiff.py +260 -260
  3. edsl/TemplateLoader.py +24 -24
  4. edsl/__init__.py +57 -49
  5. edsl/__version__.py +1 -1
  6. edsl/agents/Agent.py +1071 -867
  7. edsl/agents/AgentList.py +551 -413
  8. edsl/agents/Invigilator.py +284 -233
  9. edsl/agents/InvigilatorBase.py +257 -270
  10. edsl/agents/PromptConstructor.py +272 -354
  11. edsl/agents/QuestionInstructionPromptBuilder.py +128 -0
  12. edsl/agents/QuestionTemplateReplacementsBuilder.py +137 -0
  13. edsl/agents/__init__.py +2 -3
  14. edsl/agents/descriptors.py +99 -99
  15. edsl/agents/prompt_helpers.py +129 -129
  16. edsl/agents/question_option_processor.py +172 -0
  17. edsl/auto/AutoStudy.py +130 -117
  18. edsl/auto/StageBase.py +243 -230
  19. edsl/auto/StageGenerateSurvey.py +178 -178
  20. edsl/auto/StageLabelQuestions.py +125 -125
  21. edsl/auto/StagePersona.py +61 -61
  22. edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
  23. edsl/auto/StagePersonaDimensionValues.py +74 -74
  24. edsl/auto/StagePersonaDimensions.py +69 -69
  25. edsl/auto/StageQuestions.py +74 -73
  26. edsl/auto/SurveyCreatorPipeline.py +21 -21
  27. edsl/auto/utilities.py +218 -224
  28. edsl/base/Base.py +279 -279
  29. edsl/config.py +177 -157
  30. edsl/conversation/Conversation.py +290 -290
  31. edsl/conversation/car_buying.py +59 -58
  32. edsl/conversation/chips.py +95 -95
  33. edsl/conversation/mug_negotiation.py +81 -81
  34. edsl/conversation/next_speaker_utilities.py +93 -93
  35. edsl/coop/CoopFunctionsMixin.py +15 -0
  36. edsl/coop/ExpectedParrotKeyHandler.py +125 -0
  37. edsl/coop/PriceFetcher.py +54 -54
  38. edsl/coop/__init__.py +2 -2
  39. edsl/coop/coop.py +1106 -1028
  40. edsl/coop/utils.py +131 -131
  41. edsl/data/Cache.py +573 -555
  42. edsl/data/CacheEntry.py +230 -233
  43. edsl/data/CacheHandler.py +168 -149
  44. edsl/data/RemoteCacheSync.py +186 -78
  45. edsl/data/SQLiteDict.py +292 -292
  46. edsl/data/__init__.py +5 -4
  47. edsl/data/hack.py +10 -0
  48. edsl/data/orm.py +10 -10
  49. edsl/data_transfer_models.py +74 -73
  50. edsl/enums.py +202 -175
  51. edsl/exceptions/BaseException.py +21 -21
  52. edsl/exceptions/__init__.py +54 -54
  53. edsl/exceptions/agents.py +54 -42
  54. edsl/exceptions/cache.py +5 -5
  55. edsl/exceptions/configuration.py +16 -16
  56. edsl/exceptions/coop.py +10 -10
  57. edsl/exceptions/data.py +14 -14
  58. edsl/exceptions/general.py +34 -34
  59. edsl/exceptions/inference_services.py +5 -0
  60. edsl/exceptions/jobs.py +33 -33
  61. edsl/exceptions/language_models.py +63 -63
  62. edsl/exceptions/prompts.py +15 -15
  63. edsl/exceptions/questions.py +109 -91
  64. edsl/exceptions/results.py +29 -29
  65. edsl/exceptions/scenarios.py +29 -22
  66. edsl/exceptions/surveys.py +37 -37
  67. edsl/inference_services/AnthropicService.py +106 -87
  68. edsl/inference_services/AvailableModelCacheHandler.py +184 -0
  69. edsl/inference_services/AvailableModelFetcher.py +215 -0
  70. edsl/inference_services/AwsBedrock.py +118 -120
  71. edsl/inference_services/AzureAI.py +215 -217
  72. edsl/inference_services/DeepInfraService.py +18 -18
  73. edsl/inference_services/GoogleService.py +143 -148
  74. edsl/inference_services/GroqService.py +20 -20
  75. edsl/inference_services/InferenceServiceABC.py +80 -147
  76. edsl/inference_services/InferenceServicesCollection.py +138 -97
  77. edsl/inference_services/MistralAIService.py +120 -123
  78. edsl/inference_services/OllamaService.py +18 -18
  79. edsl/inference_services/OpenAIService.py +236 -224
  80. edsl/inference_services/PerplexityService.py +160 -163
  81. edsl/inference_services/ServiceAvailability.py +135 -0
  82. edsl/inference_services/TestService.py +90 -89
  83. edsl/inference_services/TogetherAIService.py +172 -170
  84. edsl/inference_services/data_structures.py +134 -0
  85. edsl/inference_services/models_available_cache.py +118 -118
  86. edsl/inference_services/rate_limits_cache.py +25 -25
  87. edsl/inference_services/registry.py +41 -41
  88. edsl/inference_services/write_available.py +10 -10
  89. edsl/jobs/AnswerQuestionFunctionConstructor.py +223 -0
  90. edsl/jobs/Answers.py +43 -56
  91. edsl/jobs/FetchInvigilator.py +47 -0
  92. edsl/jobs/InterviewTaskManager.py +98 -0
  93. edsl/jobs/InterviewsConstructor.py +50 -0
  94. edsl/jobs/Jobs.py +823 -898
  95. edsl/jobs/JobsChecks.py +172 -147
  96. edsl/jobs/JobsComponentConstructor.py +189 -0
  97. edsl/jobs/JobsPrompts.py +270 -268
  98. edsl/jobs/JobsRemoteInferenceHandler.py +311 -239
  99. edsl/jobs/JobsRemoteInferenceLogger.py +239 -0
  100. edsl/jobs/RequestTokenEstimator.py +30 -0
  101. edsl/jobs/__init__.py +1 -1
  102. edsl/jobs/async_interview_runner.py +138 -0
  103. edsl/jobs/buckets/BucketCollection.py +104 -63
  104. edsl/jobs/buckets/ModelBuckets.py +65 -65
  105. edsl/jobs/buckets/TokenBucket.py +283 -251
  106. edsl/jobs/buckets/TokenBucketAPI.py +211 -0
  107. edsl/jobs/buckets/TokenBucketClient.py +191 -0
  108. edsl/jobs/check_survey_scenario_compatibility.py +85 -0
  109. edsl/jobs/data_structures.py +120 -0
  110. edsl/jobs/decorators.py +35 -0
  111. edsl/jobs/interviews/Interview.py +396 -661
  112. edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
  113. edsl/jobs/interviews/InterviewExceptionEntry.py +186 -186
  114. edsl/jobs/interviews/InterviewStatistic.py +63 -63
  115. edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
  116. edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
  117. edsl/jobs/interviews/InterviewStatusLog.py +92 -92
  118. edsl/jobs/interviews/ReportErrors.py +66 -66
  119. edsl/jobs/interviews/interview_status_enum.py +9 -9
  120. edsl/jobs/jobs_status_enums.py +9 -0
  121. edsl/jobs/loggers/HTMLTableJobLogger.py +304 -0
  122. edsl/jobs/results_exceptions_handler.py +98 -0
  123. edsl/jobs/runners/JobsRunnerAsyncio.py +151 -466
  124. edsl/jobs/runners/JobsRunnerStatus.py +297 -330
  125. edsl/jobs/tasks/QuestionTaskCreator.py +244 -242
  126. edsl/jobs/tasks/TaskCreators.py +64 -64
  127. edsl/jobs/tasks/TaskHistory.py +470 -450
  128. edsl/jobs/tasks/TaskStatusLog.py +23 -23
  129. edsl/jobs/tasks/task_status_enum.py +161 -163
  130. edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
  131. edsl/jobs/tokens/TokenUsage.py +34 -34
  132. edsl/language_models/ComputeCost.py +63 -0
  133. edsl/language_models/LanguageModel.py +626 -668
  134. edsl/language_models/ModelList.py +164 -155
  135. edsl/language_models/PriceManager.py +127 -0
  136. edsl/language_models/RawResponseHandler.py +106 -0
  137. edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
  138. edsl/language_models/ServiceDataSources.py +0 -0
  139. edsl/language_models/__init__.py +2 -3
  140. edsl/language_models/fake_openai_call.py +15 -15
  141. edsl/language_models/fake_openai_service.py +61 -61
  142. edsl/language_models/key_management/KeyLookup.py +63 -0
  143. edsl/language_models/key_management/KeyLookupBuilder.py +273 -0
  144. edsl/language_models/key_management/KeyLookupCollection.py +38 -0
  145. edsl/language_models/key_management/__init__.py +0 -0
  146. edsl/language_models/key_management/models.py +131 -0
  147. edsl/language_models/model.py +256 -0
  148. edsl/language_models/repair.py +156 -156
  149. edsl/language_models/utilities.py +65 -64
  150. edsl/notebooks/Notebook.py +263 -258
  151. edsl/notebooks/NotebookToLaTeX.py +142 -0
  152. edsl/notebooks/__init__.py +1 -1
  153. edsl/prompts/Prompt.py +352 -362
  154. edsl/prompts/__init__.py +2 -2
  155. edsl/questions/ExceptionExplainer.py +77 -0
  156. edsl/questions/HTMLQuestion.py +103 -0
  157. edsl/questions/QuestionBase.py +518 -664
  158. edsl/questions/QuestionBasePromptsMixin.py +221 -217
  159. edsl/questions/QuestionBudget.py +227 -227
  160. edsl/questions/QuestionCheckBox.py +359 -359
  161. edsl/questions/QuestionExtract.py +180 -182
  162. edsl/questions/QuestionFreeText.py +113 -114
  163. edsl/questions/QuestionFunctional.py +166 -166
  164. edsl/questions/QuestionList.py +223 -231
  165. edsl/questions/QuestionMatrix.py +265 -0
  166. edsl/questions/QuestionMultipleChoice.py +330 -286
  167. edsl/questions/QuestionNumerical.py +151 -153
  168. edsl/questions/QuestionRank.py +314 -324
  169. edsl/questions/Quick.py +41 -41
  170. edsl/questions/SimpleAskMixin.py +74 -73
  171. edsl/questions/__init__.py +27 -26
  172. edsl/questions/{AnswerValidatorMixin.py → answer_validator_mixin.py} +334 -289
  173. edsl/questions/compose_questions.py +98 -98
  174. edsl/questions/data_structures.py +20 -0
  175. edsl/questions/decorators.py +21 -21
  176. edsl/questions/derived/QuestionLikertFive.py +76 -76
  177. edsl/questions/derived/QuestionLinearScale.py +90 -87
  178. edsl/questions/derived/QuestionTopK.py +93 -93
  179. edsl/questions/derived/QuestionYesNo.py +82 -82
  180. edsl/questions/descriptors.py +427 -413
  181. edsl/questions/loop_processor.py +149 -0
  182. edsl/questions/prompt_templates/question_budget.jinja +13 -13
  183. edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
  184. edsl/questions/prompt_templates/question_extract.jinja +11 -11
  185. edsl/questions/prompt_templates/question_free_text.jinja +3 -3
  186. edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
  187. edsl/questions/prompt_templates/question_list.jinja +17 -17
  188. edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
  189. edsl/questions/prompt_templates/question_numerical.jinja +36 -36
  190. edsl/questions/{QuestionBaseGenMixin.py → question_base_gen_mixin.py} +168 -161
  191. edsl/questions/question_registry.py +177 -177
  192. edsl/questions/{RegisterQuestionsMeta.py → register_questions_meta.py} +71 -71
  193. edsl/questions/{ResponseValidatorABC.py → response_validator_abc.py} +188 -174
  194. edsl/questions/response_validator_factory.py +34 -0
  195. edsl/questions/settings.py +12 -12
  196. edsl/questions/templates/budget/answering_instructions.jinja +7 -7
  197. edsl/questions/templates/budget/question_presentation.jinja +7 -7
  198. edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
  199. edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
  200. edsl/questions/templates/extract/answering_instructions.jinja +7 -7
  201. edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
  202. edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
  203. edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
  204. edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
  205. edsl/questions/templates/list/answering_instructions.jinja +3 -3
  206. edsl/questions/templates/list/question_presentation.jinja +5 -5
  207. edsl/questions/templates/matrix/__init__.py +1 -0
  208. edsl/questions/templates/matrix/answering_instructions.jinja +5 -0
  209. edsl/questions/templates/matrix/question_presentation.jinja +20 -0
  210. edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
  211. edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
  212. edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
  213. edsl/questions/templates/numerical/question_presentation.jinja +6 -6
  214. edsl/questions/templates/rank/answering_instructions.jinja +11 -11
  215. edsl/questions/templates/rank/question_presentation.jinja +15 -15
  216. edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
  217. edsl/questions/templates/top_k/question_presentation.jinja +22 -22
  218. edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
  219. edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
  220. edsl/results/CSSParameterizer.py +108 -108
  221. edsl/results/Dataset.py +587 -424
  222. edsl/results/DatasetExportMixin.py +594 -731
  223. edsl/results/DatasetTree.py +295 -275
  224. edsl/results/MarkdownToDocx.py +122 -0
  225. edsl/results/MarkdownToPDF.py +111 -0
  226. edsl/results/Result.py +557 -465
  227. edsl/results/Results.py +1183 -1165
  228. edsl/results/ResultsExportMixin.py +45 -43
  229. edsl/results/ResultsGGMixin.py +121 -121
  230. edsl/results/TableDisplay.py +125 -198
  231. edsl/results/TextEditor.py +50 -0
  232. edsl/results/__init__.py +2 -2
  233. edsl/results/file_exports.py +252 -0
  234. edsl/results/{ResultsFetchMixin.py → results_fetch_mixin.py} +33 -33
  235. edsl/results/{Selector.py → results_selector.py} +145 -135
  236. edsl/results/{ResultsToolsMixin.py → results_tools_mixin.py} +98 -98
  237. edsl/results/smart_objects.py +96 -0
  238. edsl/results/table_data_class.py +12 -0
  239. edsl/results/table_display.css +77 -77
  240. edsl/results/table_renderers.py +118 -0
  241. edsl/results/tree_explore.py +115 -115
  242. edsl/scenarios/ConstructDownloadLink.py +109 -0
  243. edsl/scenarios/DocumentChunker.py +102 -0
  244. edsl/scenarios/DocxScenario.py +16 -0
  245. edsl/scenarios/FileStore.py +511 -632
  246. edsl/scenarios/PdfExtractor.py +40 -0
  247. edsl/scenarios/Scenario.py +498 -601
  248. edsl/scenarios/ScenarioHtmlMixin.py +65 -64
  249. edsl/scenarios/ScenarioList.py +1458 -1287
  250. edsl/scenarios/ScenarioListExportMixin.py +45 -52
  251. edsl/scenarios/ScenarioListPdfMixin.py +239 -261
  252. edsl/scenarios/__init__.py +3 -4
  253. edsl/scenarios/directory_scanner.py +96 -0
  254. edsl/scenarios/file_methods.py +85 -0
  255. edsl/scenarios/handlers/__init__.py +13 -0
  256. edsl/scenarios/handlers/csv.py +38 -0
  257. edsl/scenarios/handlers/docx.py +76 -0
  258. edsl/scenarios/handlers/html.py +37 -0
  259. edsl/scenarios/handlers/json.py +111 -0
  260. edsl/scenarios/handlers/latex.py +5 -0
  261. edsl/scenarios/handlers/md.py +51 -0
  262. edsl/scenarios/handlers/pdf.py +68 -0
  263. edsl/scenarios/handlers/png.py +39 -0
  264. edsl/scenarios/handlers/pptx.py +105 -0
  265. edsl/scenarios/handlers/py.py +294 -0
  266. edsl/scenarios/handlers/sql.py +313 -0
  267. edsl/scenarios/handlers/sqlite.py +149 -0
  268. edsl/scenarios/handlers/txt.py +33 -0
  269. edsl/scenarios/{ScenarioJoin.py → scenario_join.py} +131 -127
  270. edsl/scenarios/scenario_selector.py +156 -0
  271. edsl/shared.py +1 -1
  272. edsl/study/ObjectEntry.py +173 -173
  273. edsl/study/ProofOfWork.py +113 -113
  274. edsl/study/SnapShot.py +80 -80
  275. edsl/study/Study.py +521 -528
  276. edsl/study/__init__.py +4 -4
  277. edsl/surveys/ConstructDAG.py +92 -0
  278. edsl/surveys/DAG.py +148 -148
  279. edsl/surveys/EditSurvey.py +221 -0
  280. edsl/surveys/InstructionHandler.py +100 -0
  281. edsl/surveys/Memory.py +31 -31
  282. edsl/surveys/MemoryManagement.py +72 -0
  283. edsl/surveys/MemoryPlan.py +244 -244
  284. edsl/surveys/Rule.py +327 -326
  285. edsl/surveys/RuleCollection.py +385 -387
  286. edsl/surveys/RuleManager.py +172 -0
  287. edsl/surveys/Simulator.py +75 -0
  288. edsl/surveys/Survey.py +1280 -1801
  289. edsl/surveys/SurveyCSS.py +273 -261
  290. edsl/surveys/SurveyExportMixin.py +259 -259
  291. edsl/surveys/{SurveyFlowVisualizationMixin.py → SurveyFlowVisualization.py} +181 -179
  292. edsl/surveys/SurveyQualtricsImport.py +284 -284
  293. edsl/surveys/SurveyToApp.py +141 -0
  294. edsl/surveys/__init__.py +5 -3
  295. edsl/surveys/base.py +53 -53
  296. edsl/surveys/descriptors.py +60 -56
  297. edsl/surveys/instructions/ChangeInstruction.py +48 -49
  298. edsl/surveys/instructions/Instruction.py +56 -65
  299. edsl/surveys/instructions/InstructionCollection.py +82 -77
  300. edsl/templates/error_reporting/base.html +23 -23
  301. edsl/templates/error_reporting/exceptions_by_model.html +34 -34
  302. edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
  303. edsl/templates/error_reporting/exceptions_by_type.html +16 -16
  304. edsl/templates/error_reporting/interview_details.html +115 -115
  305. edsl/templates/error_reporting/interviews.html +19 -19
  306. edsl/templates/error_reporting/overview.html +4 -4
  307. edsl/templates/error_reporting/performance_plot.html +1 -1
  308. edsl/templates/error_reporting/report.css +73 -73
  309. edsl/templates/error_reporting/report.html +117 -117
  310. edsl/templates/error_reporting/report.js +25 -25
  311. edsl/test_h +1 -0
  312. edsl/tools/__init__.py +1 -1
  313. edsl/tools/clusters.py +192 -192
  314. edsl/tools/embeddings.py +27 -27
  315. edsl/tools/embeddings_plotting.py +118 -118
  316. edsl/tools/plotting.py +112 -112
  317. edsl/tools/summarize.py +18 -18
  318. edsl/utilities/PrettyList.py +56 -0
  319. edsl/utilities/SystemInfo.py +28 -28
  320. edsl/utilities/__init__.py +22 -22
  321. edsl/utilities/ast_utilities.py +25 -25
  322. edsl/utilities/data/Registry.py +6 -6
  323. edsl/utilities/data/__init__.py +1 -1
  324. edsl/utilities/data/scooter_results.json +1 -1
  325. edsl/utilities/decorators.py +77 -77
  326. edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
  327. edsl/utilities/gcp_bucket/example.py +50 -0
  328. edsl/utilities/interface.py +627 -627
  329. edsl/utilities/is_notebook.py +18 -0
  330. edsl/utilities/is_valid_variable_name.py +11 -0
  331. edsl/utilities/naming_utilities.py +263 -263
  332. edsl/utilities/remove_edsl_version.py +24 -0
  333. edsl/utilities/repair_functions.py +28 -28
  334. edsl/utilities/restricted_python.py +70 -70
  335. edsl/utilities/utilities.py +436 -424
  336. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev4.dist-info}/LICENSE +21 -21
  337. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev4.dist-info}/METADATA +13 -11
  338. edsl-0.1.39.dev4.dist-info/RECORD +361 -0
  339. edsl/language_models/KeyLookup.py +0 -30
  340. edsl/language_models/registry.py +0 -190
  341. edsl/language_models/unused/ReplicateBase.py +0 -83
  342. edsl/results/ResultsDBMixin.py +0 -238
  343. edsl-0.1.39.dev3.dist-info/RECORD +0 -277
  344. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev4.dist-info}/WHEEL +0 -0
@@ -1,190 +0,0 @@
1
- import textwrap
2
- from random import random
3
- from edsl.config import CONFIG
4
-
5
- # if "EDSL_DEFAULT_MODEL" not in CONFIG:
6
- # default_model = "test"
7
- # else:
8
- # default_model = CONFIG.get("EDSL_DEFAULT_MODEL")
9
-
10
- from collections import UserList
11
-
12
-
13
- class PrettyList(UserList):
14
- def __init__(self, data=None, columns=None):
15
- super().__init__(data)
16
- self.columns = columns
17
-
18
- def _repr_html_(self):
19
- if isinstance(self[0], list) or isinstance(self[0], tuple):
20
- num_cols = len(self[0])
21
- else:
22
- num_cols = 1
23
-
24
- if self.columns:
25
- columns = self.columns
26
- else:
27
- columns = list(range(num_cols))
28
-
29
- if num_cols > 1:
30
- return (
31
- "<pre><table>"
32
- + "".join(["<th>" + str(column) + "</th>" for column in columns])
33
- + "".join(
34
- [
35
- "<tr>"
36
- + "".join(["<td>" + str(x) + "</td>" for x in row])
37
- + "</tr>"
38
- for row in self
39
- ]
40
- )
41
- + "</table></pre>"
42
- )
43
- else:
44
- return (
45
- "<pre><table>"
46
- + "".join(["<th>" + str(index) + "</th>" for index in columns])
47
- + "".join(
48
- ["<tr>" + "<td>" + str(row) + "</td>" + "</tr>" for row in self]
49
- )
50
- + "</table></pre>"
51
- )
52
-
53
-
54
- def get_model_class(model_name, registry=None):
55
- from edsl.inference_services.registry import default
56
-
57
- registry = registry or default
58
- factory = registry.create_model_factory(model_name)
59
- return factory
60
-
61
-
62
- class Meta(type):
63
- def __repr__(cls):
64
- return textwrap.dedent(
65
- f"""\
66
- Available models: {cls.available()}
67
-
68
- To create an instance, you can do:
69
- >>> m = Model('gpt-4-1106-preview', temperature=0.5, ...)
70
-
71
- To get the default model, you can leave out the model name.
72
- To see the available models, you can do:
73
- >>> Model.available()
74
- """
75
- )
76
-
77
-
78
- class Model(metaclass=Meta):
79
- default_model = CONFIG.get("EDSL_DEFAULT_MODEL")
80
-
81
- def __new__(
82
- cls, model_name=None, registry=None, service_name=None, *args, **kwargs
83
- ):
84
- # Map index to the respective subclass
85
- if model_name is None:
86
- model_name = (
87
- cls.default_model
88
- ) # when model_name is None, use the default model, set in the config file
89
- from edsl.inference_services.registry import default
90
-
91
- registry = registry or default
92
-
93
- if isinstance(model_name, int): # can refer to a model by index
94
- model_name = cls.available(name_only=True)[model_name]
95
-
96
- factory = registry.create_model_factory(model_name, service_name=service_name)
97
- return factory(*args, **kwargs)
98
-
99
- @classmethod
100
- def add_model(cls, service_name, model_name):
101
- from edsl.inference_services.registry import default
102
-
103
- registry = default
104
- registry.add_model(service_name, model_name)
105
-
106
- @classmethod
107
- def services(cls, registry=None):
108
- from edsl.inference_services.registry import default
109
-
110
- registry = registry or default
111
- return [r._inference_service_ for r in registry.services]
112
-
113
- @classmethod
114
- def available(cls, search_term=None, name_only=False, registry=None, service=None):
115
- from edsl.inference_services.registry import default
116
-
117
- registry = registry or default
118
- full_list = registry.available()
119
-
120
- if service is not None:
121
- if service not in cls.services(registry=registry):
122
- raise ValueError(f"Service {service} not found in available services.")
123
-
124
- full_list = [m for m in full_list if m[1] == service]
125
-
126
- if search_term is None:
127
- if name_only:
128
- return PrettyList(
129
- [m[0] for m in full_list],
130
- columns=["Model Name", "Service Name", "Code"],
131
- )
132
- else:
133
- return PrettyList(
134
- full_list, columns=["Model Name", "Service Name", "Code"]
135
- )
136
- else:
137
- filtered_results = [
138
- m for m in full_list if search_term in m[0] or search_term in m[1]
139
- ]
140
- if name_only:
141
- return PrettyList(
142
- [m[0] for m in filtered_results],
143
- columns=["Model Name", "Service Name", "Code"],
144
- )
145
- else:
146
- return PrettyList(
147
- filtered_results, columns=["Model Name", "Service Name", "Code"]
148
- )
149
-
150
- @classmethod
151
- def check_models(cls, verbose=False):
152
- print("Checking all available models...\n")
153
- for model in cls.available(name_only=True):
154
- print(f"Now checking: {model}")
155
- try:
156
- m = cls(model)
157
- except Exception as e:
158
- print(f"Error creating instance of {model}: {e}")
159
- continue
160
- try:
161
- results = m.hello(verbose)
162
- if verbose:
163
- print(f"Results from model call: {results}")
164
- except Exception as e:
165
- print(f"Error calling 'hello' on {model}: {e}")
166
- continue
167
- print("OK!")
168
- print("\n")
169
-
170
- @classmethod
171
- def example(cls, randomize: bool = False) -> "Model":
172
- """
173
- Returns an example Model instance.
174
-
175
- :param randomize: If True, the temperature is set to a random decimal between 0 and 1.
176
- """
177
- temperature = 0.5 if not randomize else round(random(), 2)
178
- model_name = cls.default_model
179
- return cls(model_name, temperature=temperature)
180
-
181
-
182
- if __name__ == "__main__":
183
- import doctest
184
-
185
- doctest.testmod(optionflags=doctest.ELLIPSIS)
186
-
187
- available = Model.available()
188
- m = Model("gpt-4-1106-preview")
189
- results = m.execute_model_call("Hello world")
190
- print(results)
@@ -1,83 +0,0 @@
1
- import asyncio
2
- import aiohttp
3
- import json
4
- from typing import Any
5
-
6
- from edsl import CONFIG
7
-
8
- from edsl.language_models.LanguageModel import LanguageModel
9
-
10
-
11
- def replicate_model_factory(model_name, base_url, api_token):
12
- class ReplicateLanguageModelBase(LanguageModel):
13
- _model_ = (
14
- model_name # Example model name, replace with actual model name if needed
15
- )
16
- _parameters_ = {
17
- "temperature": 0.1,
18
- "topK": 50,
19
- "topP": 0.9,
20
- "max_new_tokens": 500,
21
- "min_new_tokens": -1,
22
- "repetition_penalty": 1.15,
23
- # "version": "5fe0a3d7ac2852264a25279d1dfb798acbc4d49711d126646594e212cb821749",
24
- "use_cache": True,
25
- }
26
- _api_token = api_token
27
- _base_url = base_url
28
-
29
- async def async_execute_model_call(
30
- self, user_prompt: str, system_prompt: str = ""
31
- ) -> dict[str, Any]:
32
- self.api_token = self._api_token
33
- self.headers = {
34
- "Authorization": f"Token {self.api_token}",
35
- "Content-Type": "application/json",
36
- }
37
- # combined_prompt = f"{system_prompt} {user_prompt}".strip()
38
- # print(f"Prompt: {combined_prompt}")
39
- data = {
40
- # "version": self._parameters_["version"],
41
- "input": {
42
- "debug": False,
43
- "top_k": self._parameters_["topK"],
44
- "top_p": self._parameters_["topP"],
45
- "prompt": user_prompt,
46
- "system_prompt": system_prompt,
47
- "temperature": self._parameters_["temperature"],
48
- "max_new_tokens": self._parameters_["max_new_tokens"],
49
- "min_new_tokens": self._parameters_["min_new_tokens"],
50
- "prompt_template": "{prompt}",
51
- "repetition_penalty": self._parameters_["repetition_penalty"],
52
- },
53
- }
54
-
55
- async with aiohttp.ClientSession() as session:
56
- async with session.post(
57
- self._base_url, headers=self.headers, data=json.dumps(data)
58
- ) as response:
59
- raw_response_text = await response.text()
60
- data = json.loads(raw_response_text)
61
- print(f"This was the data returned by the model:{data}")
62
- prediction_url = data["urls"]["get"]
63
-
64
- while True:
65
- async with session.get(
66
- prediction_url, headers=self.headers
67
- ) as get_response:
68
- if get_response.status != 200:
69
- # Handle non-success status codes appropriately
70
- return None
71
-
72
- get_data = await get_response.text()
73
- get_data = json.loads(get_data)
74
- if get_data["status"] == "succeeded":
75
- return get_data
76
- await asyncio.sleep(1)
77
-
78
- def parse_response(self, raw_response: dict[str, Any]) -> str:
79
- data = "".join(raw_response["output"])
80
- print(f"This is what the model returned: {data}")
81
- return data
82
-
83
- return ReplicateLanguageModelBase
@@ -1,238 +0,0 @@
1
- """Mixin for working with SQLite respresentation of a 'Results' object."""
2
-
3
- import sqlite3
4
- from enum import Enum
5
- from typing import Literal, Union, Optional
6
-
7
-
8
- class SQLDataShape(Enum):
9
- """Enum for the shape of the data in the SQL database."""
10
-
11
- WIDE = "wide"
12
- LONG = "long"
13
-
14
-
15
- class ResultsDBMixin:
16
- """Mixin for interacting with a Results object as if it were a SQL database."""
17
-
18
- def _rows(self):
19
- """Return the rows of the `Results` object as a list of tuples."""
20
- for index, result in enumerate(self):
21
- yield from result.rows(index)
22
-
23
- def export_sql_dump(self, shape: Literal["wide", "long"], filename: str):
24
- """Export the SQL database to a file.
25
-
26
- :param shape: The shape of the data in the database (wide or long)
27
- :param filename: The filename to save the database to
28
- """
29
- shape_enum = self._get_shape_enum(shape)
30
- conn = self._db(shape=shape_enum)
31
-
32
- with open(filename, "w") as f:
33
- for line in conn.iterdump():
34
- f.write(f"{line}\n")
35
-
36
- conn.close()
37
-
38
- def backup_db_to_file(self, shape: Literal["wide", "long"], filename: str):
39
- """Backup the in-memory database to a file.
40
-
41
-
42
- :param shape: The shape of the data in the database (wide or long)
43
- :param filename: The filename to save the database to
44
-
45
- >>> from edsl.results import Results
46
- >>> r = Results.example()
47
- >>> r.backup_db_to_file(filename="backup.db", shape="long")
48
-
49
- """
50
- shape_enum = self._get_shape_enum(shape)
51
- # Source database connection (in-memory)
52
- source_conn = self._db(shape=shape_enum)
53
-
54
- # Destination database connection (file)
55
- dest_conn = sqlite3.connect(filename)
56
-
57
- # Backup in-memory database to file
58
- with source_conn:
59
- source_conn.backup(dest_conn)
60
-
61
- # Close both connections
62
- source_conn.close()
63
- dest_conn.close()
64
-
65
- def _db(self, shape: SQLDataShape, remove_prefix=False):
66
- """Create a SQLite database in memory and return the connection.
67
-
68
- :param shape: The shape of the data in the database (wide or long)
69
- :param remove_prefix: Whether to remove the prefix from the column names
70
-
71
- """
72
- if shape == SQLDataShape.LONG:
73
- conn = sqlite3.connect(":memory:")
74
-
75
- create_table_query = """
76
- CREATE TABLE self (
77
- id INTEGER,
78
- data_type TEXT,
79
- key TEXT,
80
- value TEXT
81
- )
82
- """
83
- conn.execute(create_table_query)
84
-
85
- list_of_tuples = list(self._rows())
86
- insert_query = (
87
- "INSERT INTO self (id, data_type, key, value) VALUES (?, ?, ?, ?)"
88
- )
89
- conn.executemany(insert_query, list_of_tuples)
90
- conn.commit()
91
- return conn
92
- elif shape == SQLDataShape.WIDE:
93
- from sqlalchemy import create_engine
94
-
95
- engine = create_engine("sqlite:///:memory:")
96
- df = self.to_pandas(remove_prefix=remove_prefix, lists_as_strings=True)
97
- df.to_sql("self", engine, index=False, if_exists="replace")
98
- return engine.connect()
99
- else:
100
- raise Exception("Invalid SQLDataShape")
101
-
102
- def _get_shape_enum(self, shape: Literal["wide", "long"]):
103
- """Convert the shape string to a SQLDataShape enum."""
104
- if shape is None:
105
- raise Exception("Must select either 'wide' or 'long' format")
106
- elif shape == "wide":
107
- return SQLDataShape.WIDE
108
- elif shape == "long":
109
- return SQLDataShape.LONG
110
- else:
111
- raise Exception("Invalid shape: must be either 'long' or 'wide'")
112
-
113
- def sql(
114
- self,
115
- query: str,
116
- shape: Literal["wide", "long"] = "wide",
117
- remove_prefix: bool = True,
118
- transpose: bool = None,
119
- transpose_by: str = None,
120
- csv: bool = False,
121
- to_list=False,
122
- to_latex=False,
123
- filename: Optional[str] = None,
124
- ) -> Union["pd.DataFrame", str]:
125
- """Execute a SQL query and return the results as a DataFrame.
126
-
127
- :param query: The SQL query to execute
128
- :param shape: The shape of the data in the database (wide or long)
129
- :param remove_prefix: Whether to remove the prefix from the column names
130
- :param transpose: Whether to transpose the DataFrame
131
- :param transpose_by: The column to use as the index when transposing
132
- :param csv: Whether to return the DataFrame as a CSV string
133
-
134
-
135
- Example usage:
136
-
137
- >>> from edsl.results import Results
138
- >>> r = Results.example()
139
- >>> d = r.sql("select data_type, key, value from self where data_type = 'answer' order by value limit 3", shape="long")
140
- >>> sorted(list(d['value']))
141
- ['Good', 'Great', 'Great']
142
-
143
- We can also return the data in wide format.
144
- Note the use of single quotes to escape the column names, as required by sql.
145
-
146
- >>> from edsl.results import Results
147
- >>> Results.example().sql("select how_feeling from self", shape = 'wide', remove_prefix=True)
148
- how_feeling
149
- 0 OK
150
- 1 Great
151
- 2 Terrible
152
- 3 OK
153
- """
154
- import pandas as pd
155
-
156
- shape_enum = self._get_shape_enum(shape)
157
-
158
- conn = self._db(shape=shape_enum, remove_prefix=remove_prefix)
159
- df = pd.read_sql_query(query, conn)
160
-
161
- # Transpose the DataFrame if transpose is True
162
- if transpose or transpose_by:
163
- df = pd.DataFrame(df)
164
- if transpose_by:
165
- df = df.set_index(transpose_by)
166
- else:
167
- df = df.set_index(df.columns[0])
168
- df = df.transpose()
169
-
170
- if csv and to_list:
171
- raise Exception("Cannot return both CSV and list")
172
-
173
- if to_list:
174
- return df.values.tolist()
175
-
176
- if to_latex:
177
- df.columns = [col.replace("_", " ") for col in df.columns]
178
-
179
- latex_output = df.to_latex(index=False)
180
- if filename:
181
- with open(filename, "w") as f:
182
- f.write(latex_output)
183
- return None
184
- return latex_output
185
-
186
- if csv:
187
- if filename:
188
- df.to_csv(filename, index=False)
189
- return None
190
-
191
- return df.to_csv(index=False)
192
-
193
- return df
194
-
195
- def show_schema(
196
- self, shape: Literal["wide", "long"], remove_prefix: bool = False
197
- ) -> None:
198
- """Show the schema of the Results database.
199
-
200
- :param shape: The shape of the data in the database (wide or long)
201
- :param remove_prefix: Whether to remove the prefix from the column names
202
-
203
- >>> from edsl.results import Results
204
- >>> r = Results.example()
205
- >>> r.show_schema(shape="long")
206
- Type: table, Name: self, SQL: CREATE TABLE self (
207
- ...
208
- <BLANKLINE>
209
- """
210
- import pandas as pd
211
-
212
- shape_enum = self._get_shape_enum(shape)
213
- conn = self._db(shape=shape_enum, remove_prefix=remove_prefix)
214
-
215
- if shape_enum == SQLDataShape.LONG:
216
- # Query to get the schema of all tables
217
- query = "SELECT type, name, sql FROM sqlite_master WHERE type='table'"
218
- cursor = conn.execute(query)
219
- schema = cursor.fetchall()
220
- conn.close()
221
-
222
- # Format and return the schema information
223
- schema_info = ""
224
- for row in schema:
225
- schema_info += f"Type: {row[0]}, Name: {row[1]}, SQL: {row[2]}\n"
226
-
227
- print(schema_info)
228
- elif shape_enum == SQLDataShape.WIDE:
229
- query = f"PRAGMA table_info(self)"
230
- schema = pd.read_sql(query, conn)
231
- # print(schema)
232
- return schema
233
-
234
-
235
- if __name__ == "__main__":
236
- import doctest
237
-
238
- doctest.testmod(optionflags=doctest.ELLIPSIS)