edsl 0.1.15__py3-none-any.whl → 0.1.40__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (407) hide show
  1. edsl/Base.py +348 -38
  2. edsl/BaseDiff.py +260 -0
  3. edsl/TemplateLoader.py +24 -0
  4. edsl/__init__.py +45 -10
  5. edsl/__version__.py +1 -1
  6. edsl/agents/Agent.py +842 -144
  7. edsl/agents/AgentList.py +521 -25
  8. edsl/agents/Invigilator.py +250 -374
  9. edsl/agents/InvigilatorBase.py +257 -0
  10. edsl/agents/PromptConstructor.py +272 -0
  11. edsl/agents/QuestionInstructionPromptBuilder.py +128 -0
  12. edsl/agents/QuestionTemplateReplacementsBuilder.py +137 -0
  13. edsl/agents/descriptors.py +43 -13
  14. edsl/agents/prompt_helpers.py +129 -0
  15. edsl/agents/question_option_processor.py +172 -0
  16. edsl/auto/AutoStudy.py +130 -0
  17. edsl/auto/StageBase.py +243 -0
  18. edsl/auto/StageGenerateSurvey.py +178 -0
  19. edsl/auto/StageLabelQuestions.py +125 -0
  20. edsl/auto/StagePersona.py +61 -0
  21. edsl/auto/StagePersonaDimensionValueRanges.py +88 -0
  22. edsl/auto/StagePersonaDimensionValues.py +74 -0
  23. edsl/auto/StagePersonaDimensions.py +69 -0
  24. edsl/auto/StageQuestions.py +74 -0
  25. edsl/auto/SurveyCreatorPipeline.py +21 -0
  26. edsl/auto/utilities.py +218 -0
  27. edsl/base/Base.py +279 -0
  28. edsl/config.py +115 -113
  29. edsl/conversation/Conversation.py +290 -0
  30. edsl/conversation/car_buying.py +59 -0
  31. edsl/conversation/chips.py +95 -0
  32. edsl/conversation/mug_negotiation.py +81 -0
  33. edsl/conversation/next_speaker_utilities.py +93 -0
  34. edsl/coop/CoopFunctionsMixin.py +15 -0
  35. edsl/coop/ExpectedParrotKeyHandler.py +125 -0
  36. edsl/coop/PriceFetcher.py +54 -0
  37. edsl/coop/__init__.py +1 -0
  38. edsl/coop/coop.py +1029 -134
  39. edsl/coop/utils.py +131 -0
  40. edsl/data/Cache.py +560 -89
  41. edsl/data/CacheEntry.py +230 -0
  42. edsl/data/CacheHandler.py +168 -0
  43. edsl/data/RemoteCacheSync.py +186 -0
  44. edsl/data/SQLiteDict.py +292 -0
  45. edsl/data/__init__.py +5 -3
  46. edsl/data/orm.py +6 -33
  47. edsl/data_transfer_models.py +74 -27
  48. edsl/enums.py +165 -8
  49. edsl/exceptions/BaseException.py +21 -0
  50. edsl/exceptions/__init__.py +52 -46
  51. edsl/exceptions/agents.py +33 -15
  52. edsl/exceptions/cache.py +5 -0
  53. edsl/exceptions/coop.py +8 -0
  54. edsl/exceptions/general.py +34 -0
  55. edsl/exceptions/inference_services.py +5 -0
  56. edsl/exceptions/jobs.py +15 -0
  57. edsl/exceptions/language_models.py +46 -1
  58. edsl/exceptions/questions.py +80 -5
  59. edsl/exceptions/results.py +16 -5
  60. edsl/exceptions/scenarios.py +29 -0
  61. edsl/exceptions/surveys.py +13 -10
  62. edsl/inference_services/AnthropicService.py +106 -0
  63. edsl/inference_services/AvailableModelCacheHandler.py +184 -0
  64. edsl/inference_services/AvailableModelFetcher.py +215 -0
  65. edsl/inference_services/AwsBedrock.py +118 -0
  66. edsl/inference_services/AzureAI.py +215 -0
  67. edsl/inference_services/DeepInfraService.py +18 -0
  68. edsl/inference_services/GoogleService.py +143 -0
  69. edsl/inference_services/GroqService.py +20 -0
  70. edsl/inference_services/InferenceServiceABC.py +80 -0
  71. edsl/inference_services/InferenceServicesCollection.py +138 -0
  72. edsl/inference_services/MistralAIService.py +120 -0
  73. edsl/inference_services/OllamaService.py +18 -0
  74. edsl/inference_services/OpenAIService.py +236 -0
  75. edsl/inference_services/PerplexityService.py +160 -0
  76. edsl/inference_services/ServiceAvailability.py +135 -0
  77. edsl/inference_services/TestService.py +90 -0
  78. edsl/inference_services/TogetherAIService.py +172 -0
  79. edsl/inference_services/data_structures.py +134 -0
  80. edsl/inference_services/models_available_cache.py +118 -0
  81. edsl/inference_services/rate_limits_cache.py +25 -0
  82. edsl/inference_services/registry.py +41 -0
  83. edsl/inference_services/write_available.py +10 -0
  84. edsl/jobs/AnswerQuestionFunctionConstructor.py +223 -0
  85. edsl/jobs/Answers.py +21 -20
  86. edsl/jobs/FetchInvigilator.py +47 -0
  87. edsl/jobs/InterviewTaskManager.py +98 -0
  88. edsl/jobs/InterviewsConstructor.py +50 -0
  89. edsl/jobs/Jobs.py +684 -206
  90. edsl/jobs/JobsChecks.py +172 -0
  91. edsl/jobs/JobsComponentConstructor.py +189 -0
  92. edsl/jobs/JobsPrompts.py +270 -0
  93. edsl/jobs/JobsRemoteInferenceHandler.py +311 -0
  94. edsl/jobs/JobsRemoteInferenceLogger.py +239 -0
  95. edsl/jobs/RequestTokenEstimator.py +30 -0
  96. edsl/jobs/async_interview_runner.py +138 -0
  97. edsl/jobs/buckets/BucketCollection.py +104 -0
  98. edsl/jobs/buckets/ModelBuckets.py +65 -0
  99. edsl/jobs/buckets/TokenBucket.py +283 -0
  100. edsl/jobs/buckets/TokenBucketAPI.py +211 -0
  101. edsl/jobs/buckets/TokenBucketClient.py +191 -0
  102. edsl/jobs/check_survey_scenario_compatibility.py +85 -0
  103. edsl/jobs/data_structures.py +120 -0
  104. edsl/jobs/decorators.py +35 -0
  105. edsl/jobs/interviews/Interview.py +392 -0
  106. edsl/jobs/interviews/InterviewExceptionCollection.py +99 -0
  107. edsl/jobs/interviews/InterviewExceptionEntry.py +186 -0
  108. edsl/jobs/interviews/InterviewStatistic.py +63 -0
  109. edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -0
  110. edsl/jobs/interviews/InterviewStatusDictionary.py +78 -0
  111. edsl/jobs/interviews/InterviewStatusLog.py +92 -0
  112. edsl/jobs/interviews/ReportErrors.py +66 -0
  113. edsl/jobs/interviews/interview_status_enum.py +9 -0
  114. edsl/jobs/jobs_status_enums.py +9 -0
  115. edsl/jobs/loggers/HTMLTableJobLogger.py +304 -0
  116. edsl/jobs/results_exceptions_handler.py +98 -0
  117. edsl/jobs/runners/JobsRunnerAsyncio.py +151 -110
  118. edsl/jobs/runners/JobsRunnerStatus.py +298 -0
  119. edsl/jobs/tasks/QuestionTaskCreator.py +244 -0
  120. edsl/jobs/tasks/TaskCreators.py +64 -0
  121. edsl/jobs/tasks/TaskHistory.py +470 -0
  122. edsl/jobs/tasks/TaskStatusLog.py +23 -0
  123. edsl/jobs/tasks/task_status_enum.py +161 -0
  124. edsl/jobs/tokens/InterviewTokenUsage.py +27 -0
  125. edsl/jobs/tokens/TokenUsage.py +34 -0
  126. edsl/language_models/ComputeCost.py +63 -0
  127. edsl/language_models/LanguageModel.py +507 -386
  128. edsl/language_models/ModelList.py +164 -0
  129. edsl/language_models/PriceManager.py +127 -0
  130. edsl/language_models/RawResponseHandler.py +106 -0
  131. edsl/language_models/RegisterLanguageModelsMeta.py +184 -0
  132. edsl/language_models/__init__.py +1 -8
  133. edsl/language_models/fake_openai_call.py +15 -0
  134. edsl/language_models/fake_openai_service.py +61 -0
  135. edsl/language_models/key_management/KeyLookup.py +63 -0
  136. edsl/language_models/key_management/KeyLookupBuilder.py +273 -0
  137. edsl/language_models/key_management/KeyLookupCollection.py +38 -0
  138. edsl/language_models/key_management/__init__.py +0 -0
  139. edsl/language_models/key_management/models.py +131 -0
  140. edsl/language_models/model.py +256 -0
  141. edsl/language_models/repair.py +109 -41
  142. edsl/language_models/utilities.py +65 -0
  143. edsl/notebooks/Notebook.py +263 -0
  144. edsl/notebooks/NotebookToLaTeX.py +142 -0
  145. edsl/notebooks/__init__.py +1 -0
  146. edsl/prompts/Prompt.py +222 -93
  147. edsl/prompts/__init__.py +1 -1
  148. edsl/questions/ExceptionExplainer.py +77 -0
  149. edsl/questions/HTMLQuestion.py +103 -0
  150. edsl/questions/QuestionBase.py +518 -0
  151. edsl/questions/QuestionBasePromptsMixin.py +221 -0
  152. edsl/questions/QuestionBudget.py +164 -67
  153. edsl/questions/QuestionCheckBox.py +281 -62
  154. edsl/questions/QuestionDict.py +343 -0
  155. edsl/questions/QuestionExtract.py +136 -50
  156. edsl/questions/QuestionFreeText.py +79 -55
  157. edsl/questions/QuestionFunctional.py +138 -41
  158. edsl/questions/QuestionList.py +184 -57
  159. edsl/questions/QuestionMatrix.py +265 -0
  160. edsl/questions/QuestionMultipleChoice.py +293 -69
  161. edsl/questions/QuestionNumerical.py +109 -56
  162. edsl/questions/QuestionRank.py +244 -49
  163. edsl/questions/Quick.py +41 -0
  164. edsl/questions/SimpleAskMixin.py +74 -0
  165. edsl/questions/__init__.py +9 -6
  166. edsl/questions/{AnswerValidatorMixin.py → answer_validator_mixin.py} +153 -38
  167. edsl/questions/compose_questions.py +13 -7
  168. edsl/questions/data_structures.py +20 -0
  169. edsl/questions/decorators.py +21 -0
  170. edsl/questions/derived/QuestionLikertFive.py +28 -26
  171. edsl/questions/derived/QuestionLinearScale.py +41 -28
  172. edsl/questions/derived/QuestionTopK.py +34 -26
  173. edsl/questions/derived/QuestionYesNo.py +40 -27
  174. edsl/questions/descriptors.py +228 -74
  175. edsl/questions/loop_processor.py +149 -0
  176. edsl/questions/prompt_templates/question_budget.jinja +13 -0
  177. edsl/questions/prompt_templates/question_checkbox.jinja +32 -0
  178. edsl/questions/prompt_templates/question_extract.jinja +11 -0
  179. edsl/questions/prompt_templates/question_free_text.jinja +3 -0
  180. edsl/questions/prompt_templates/question_linear_scale.jinja +11 -0
  181. edsl/questions/prompt_templates/question_list.jinja +17 -0
  182. edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -0
  183. edsl/questions/prompt_templates/question_numerical.jinja +37 -0
  184. edsl/questions/question_base_gen_mixin.py +168 -0
  185. edsl/questions/question_registry.py +130 -46
  186. edsl/questions/register_questions_meta.py +71 -0
  187. edsl/questions/response_validator_abc.py +188 -0
  188. edsl/questions/response_validator_factory.py +34 -0
  189. edsl/questions/settings.py +5 -2
  190. edsl/questions/templates/__init__.py +0 -0
  191. edsl/questions/templates/budget/__init__.py +0 -0
  192. edsl/questions/templates/budget/answering_instructions.jinja +7 -0
  193. edsl/questions/templates/budget/question_presentation.jinja +7 -0
  194. edsl/questions/templates/checkbox/__init__.py +0 -0
  195. edsl/questions/templates/checkbox/answering_instructions.jinja +10 -0
  196. edsl/questions/templates/checkbox/question_presentation.jinja +22 -0
  197. edsl/questions/templates/dict/__init__.py +0 -0
  198. edsl/questions/templates/dict/answering_instructions.jinja +21 -0
  199. edsl/questions/templates/dict/question_presentation.jinja +1 -0
  200. edsl/questions/templates/extract/__init__.py +0 -0
  201. edsl/questions/templates/extract/answering_instructions.jinja +7 -0
  202. edsl/questions/templates/extract/question_presentation.jinja +1 -0
  203. edsl/questions/templates/free_text/__init__.py +0 -0
  204. edsl/questions/templates/free_text/answering_instructions.jinja +0 -0
  205. edsl/questions/templates/free_text/question_presentation.jinja +1 -0
  206. edsl/questions/templates/likert_five/__init__.py +0 -0
  207. edsl/questions/templates/likert_five/answering_instructions.jinja +10 -0
  208. edsl/questions/templates/likert_five/question_presentation.jinja +12 -0
  209. edsl/questions/templates/linear_scale/__init__.py +0 -0
  210. edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -0
  211. edsl/questions/templates/linear_scale/question_presentation.jinja +5 -0
  212. edsl/questions/templates/list/__init__.py +0 -0
  213. edsl/questions/templates/list/answering_instructions.jinja +4 -0
  214. edsl/questions/templates/list/question_presentation.jinja +5 -0
  215. edsl/questions/templates/matrix/__init__.py +1 -0
  216. edsl/questions/templates/matrix/answering_instructions.jinja +5 -0
  217. edsl/questions/templates/matrix/question_presentation.jinja +20 -0
  218. edsl/questions/templates/multiple_choice/__init__.py +0 -0
  219. edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -0
  220. edsl/questions/templates/multiple_choice/html.jinja +0 -0
  221. edsl/questions/templates/multiple_choice/question_presentation.jinja +12 -0
  222. edsl/questions/templates/numerical/__init__.py +0 -0
  223. edsl/questions/templates/numerical/answering_instructions.jinja +7 -0
  224. edsl/questions/templates/numerical/question_presentation.jinja +7 -0
  225. edsl/questions/templates/rank/__init__.py +0 -0
  226. edsl/questions/templates/rank/answering_instructions.jinja +11 -0
  227. edsl/questions/templates/rank/question_presentation.jinja +15 -0
  228. edsl/questions/templates/top_k/__init__.py +0 -0
  229. edsl/questions/templates/top_k/answering_instructions.jinja +8 -0
  230. edsl/questions/templates/top_k/question_presentation.jinja +22 -0
  231. edsl/questions/templates/yes_no/__init__.py +0 -0
  232. edsl/questions/templates/yes_no/answering_instructions.jinja +6 -0
  233. edsl/questions/templates/yes_no/question_presentation.jinja +12 -0
  234. edsl/results/CSSParameterizer.py +108 -0
  235. edsl/results/Dataset.py +550 -19
  236. edsl/results/DatasetExportMixin.py +594 -0
  237. edsl/results/DatasetTree.py +295 -0
  238. edsl/results/MarkdownToDocx.py +122 -0
  239. edsl/results/MarkdownToPDF.py +111 -0
  240. edsl/results/Result.py +477 -173
  241. edsl/results/Results.py +987 -269
  242. edsl/results/ResultsExportMixin.py +28 -125
  243. edsl/results/ResultsGGMixin.py +83 -15
  244. edsl/results/TableDisplay.py +125 -0
  245. edsl/results/TextEditor.py +50 -0
  246. edsl/results/__init__.py +1 -1
  247. edsl/results/file_exports.py +252 -0
  248. edsl/results/results_fetch_mixin.py +33 -0
  249. edsl/results/results_selector.py +145 -0
  250. edsl/results/results_tools_mixin.py +98 -0
  251. edsl/results/smart_objects.py +96 -0
  252. edsl/results/table_data_class.py +12 -0
  253. edsl/results/table_display.css +78 -0
  254. edsl/results/table_renderers.py +118 -0
  255. edsl/results/tree_explore.py +115 -0
  256. edsl/scenarios/ConstructDownloadLink.py +109 -0
  257. edsl/scenarios/DocumentChunker.py +102 -0
  258. edsl/scenarios/DocxScenario.py +16 -0
  259. edsl/scenarios/FileStore.py +543 -0
  260. edsl/scenarios/PdfExtractor.py +40 -0
  261. edsl/scenarios/Scenario.py +431 -62
  262. edsl/scenarios/ScenarioHtmlMixin.py +65 -0
  263. edsl/scenarios/ScenarioList.py +1415 -45
  264. edsl/scenarios/ScenarioListExportMixin.py +45 -0
  265. edsl/scenarios/ScenarioListPdfMixin.py +239 -0
  266. edsl/scenarios/__init__.py +2 -0
  267. edsl/scenarios/directory_scanner.py +96 -0
  268. edsl/scenarios/file_methods.py +85 -0
  269. edsl/scenarios/handlers/__init__.py +13 -0
  270. edsl/scenarios/handlers/csv.py +49 -0
  271. edsl/scenarios/handlers/docx.py +76 -0
  272. edsl/scenarios/handlers/html.py +37 -0
  273. edsl/scenarios/handlers/json.py +111 -0
  274. edsl/scenarios/handlers/latex.py +5 -0
  275. edsl/scenarios/handlers/md.py +51 -0
  276. edsl/scenarios/handlers/pdf.py +68 -0
  277. edsl/scenarios/handlers/png.py +39 -0
  278. edsl/scenarios/handlers/pptx.py +105 -0
  279. edsl/scenarios/handlers/py.py +294 -0
  280. edsl/scenarios/handlers/sql.py +313 -0
  281. edsl/scenarios/handlers/sqlite.py +149 -0
  282. edsl/scenarios/handlers/txt.py +33 -0
  283. edsl/scenarios/scenario_join.py +131 -0
  284. edsl/scenarios/scenario_selector.py +156 -0
  285. edsl/shared.py +1 -0
  286. edsl/study/ObjectEntry.py +173 -0
  287. edsl/study/ProofOfWork.py +113 -0
  288. edsl/study/SnapShot.py +80 -0
  289. edsl/study/Study.py +521 -0
  290. edsl/study/__init__.py +4 -0
  291. edsl/surveys/ConstructDAG.py +92 -0
  292. edsl/surveys/DAG.py +92 -11
  293. edsl/surveys/EditSurvey.py +221 -0
  294. edsl/surveys/InstructionHandler.py +100 -0
  295. edsl/surveys/Memory.py +9 -4
  296. edsl/surveys/MemoryManagement.py +72 -0
  297. edsl/surveys/MemoryPlan.py +156 -35
  298. edsl/surveys/Rule.py +221 -74
  299. edsl/surveys/RuleCollection.py +241 -61
  300. edsl/surveys/RuleManager.py +172 -0
  301. edsl/surveys/Simulator.py +75 -0
  302. edsl/surveys/Survey.py +1079 -339
  303. edsl/surveys/SurveyCSS.py +273 -0
  304. edsl/surveys/SurveyExportMixin.py +235 -40
  305. edsl/surveys/SurveyFlowVisualization.py +181 -0
  306. edsl/surveys/SurveyQualtricsImport.py +284 -0
  307. edsl/surveys/SurveyToApp.py +141 -0
  308. edsl/surveys/__init__.py +4 -2
  309. edsl/surveys/base.py +19 -3
  310. edsl/surveys/descriptors.py +17 -6
  311. edsl/surveys/instructions/ChangeInstruction.py +48 -0
  312. edsl/surveys/instructions/Instruction.py +56 -0
  313. edsl/surveys/instructions/InstructionCollection.py +82 -0
  314. edsl/surveys/instructions/__init__.py +0 -0
  315. edsl/templates/error_reporting/base.html +24 -0
  316. edsl/templates/error_reporting/exceptions_by_model.html +35 -0
  317. edsl/templates/error_reporting/exceptions_by_question_name.html +17 -0
  318. edsl/templates/error_reporting/exceptions_by_type.html +17 -0
  319. edsl/templates/error_reporting/interview_details.html +116 -0
  320. edsl/templates/error_reporting/interviews.html +19 -0
  321. edsl/templates/error_reporting/overview.html +5 -0
  322. edsl/templates/error_reporting/performance_plot.html +2 -0
  323. edsl/templates/error_reporting/report.css +74 -0
  324. edsl/templates/error_reporting/report.html +118 -0
  325. edsl/templates/error_reporting/report.js +25 -0
  326. edsl/tools/__init__.py +1 -0
  327. edsl/tools/clusters.py +192 -0
  328. edsl/tools/embeddings.py +27 -0
  329. edsl/tools/embeddings_plotting.py +118 -0
  330. edsl/tools/plotting.py +112 -0
  331. edsl/tools/summarize.py +18 -0
  332. edsl/utilities/PrettyList.py +56 -0
  333. edsl/utilities/SystemInfo.py +5 -0
  334. edsl/utilities/__init__.py +21 -20
  335. edsl/utilities/ast_utilities.py +3 -0
  336. edsl/utilities/data/Registry.py +2 -0
  337. edsl/utilities/decorators.py +41 -0
  338. edsl/utilities/gcp_bucket/__init__.py +0 -0
  339. edsl/utilities/gcp_bucket/cloud_storage.py +96 -0
  340. edsl/utilities/interface.py +310 -60
  341. edsl/utilities/is_notebook.py +18 -0
  342. edsl/utilities/is_valid_variable_name.py +11 -0
  343. edsl/utilities/naming_utilities.py +263 -0
  344. edsl/utilities/remove_edsl_version.py +24 -0
  345. edsl/utilities/repair_functions.py +28 -0
  346. edsl/utilities/restricted_python.py +70 -0
  347. edsl/utilities/utilities.py +203 -13
  348. edsl-0.1.40.dist-info/METADATA +111 -0
  349. edsl-0.1.40.dist-info/RECORD +362 -0
  350. {edsl-0.1.15.dist-info → edsl-0.1.40.dist-info}/WHEEL +1 -1
  351. edsl/agents/AgentListExportMixin.py +0 -24
  352. edsl/coop/old.py +0 -31
  353. edsl/data/Database.py +0 -141
  354. edsl/data/crud.py +0 -121
  355. edsl/jobs/Interview.py +0 -435
  356. edsl/jobs/JobsRunner.py +0 -63
  357. edsl/jobs/JobsRunnerStatusMixin.py +0 -115
  358. edsl/jobs/base.py +0 -47
  359. edsl/jobs/buckets.py +0 -178
  360. edsl/jobs/runners/JobsRunnerDryRun.py +0 -19
  361. edsl/jobs/runners/JobsRunnerStreaming.py +0 -54
  362. edsl/jobs/task_management.py +0 -215
  363. edsl/jobs/token_tracking.py +0 -78
  364. edsl/language_models/DeepInfra.py +0 -69
  365. edsl/language_models/OpenAI.py +0 -98
  366. edsl/language_models/model_interfaces/GeminiPro.py +0 -66
  367. edsl/language_models/model_interfaces/LanguageModelOpenAIFour.py +0 -8
  368. edsl/language_models/model_interfaces/LanguageModelOpenAIThreeFiveTurbo.py +0 -8
  369. edsl/language_models/model_interfaces/LlamaTwo13B.py +0 -21
  370. edsl/language_models/model_interfaces/LlamaTwo70B.py +0 -21
  371. edsl/language_models/model_interfaces/Mixtral8x7B.py +0 -24
  372. edsl/language_models/registry.py +0 -81
  373. edsl/language_models/schemas.py +0 -15
  374. edsl/language_models/unused/ReplicateBase.py +0 -83
  375. edsl/prompts/QuestionInstructionsBase.py +0 -6
  376. edsl/prompts/library/agent_instructions.py +0 -29
  377. edsl/prompts/library/agent_persona.py +0 -17
  378. edsl/prompts/library/question_budget.py +0 -26
  379. edsl/prompts/library/question_checkbox.py +0 -32
  380. edsl/prompts/library/question_extract.py +0 -19
  381. edsl/prompts/library/question_freetext.py +0 -14
  382. edsl/prompts/library/question_linear_scale.py +0 -20
  383. edsl/prompts/library/question_list.py +0 -22
  384. edsl/prompts/library/question_multiple_choice.py +0 -44
  385. edsl/prompts/library/question_numerical.py +0 -31
  386. edsl/prompts/library/question_rank.py +0 -21
  387. edsl/prompts/prompt_config.py +0 -33
  388. edsl/prompts/registry.py +0 -185
  389. edsl/questions/Question.py +0 -240
  390. edsl/report/InputOutputDataTypes.py +0 -134
  391. edsl/report/RegressionMixin.py +0 -28
  392. edsl/report/ReportOutputs.py +0 -1228
  393. edsl/report/ResultsFetchMixin.py +0 -106
  394. edsl/report/ResultsOutputMixin.py +0 -14
  395. edsl/report/demo.ipynb +0 -645
  396. edsl/results/ResultsDBMixin.py +0 -184
  397. edsl/surveys/SurveyFlowVisualizationMixin.py +0 -92
  398. edsl/trackers/Tracker.py +0 -91
  399. edsl/trackers/TrackerAPI.py +0 -196
  400. edsl/trackers/TrackerTasks.py +0 -70
  401. edsl/utilities/pastebin.py +0 -141
  402. edsl-0.1.15.dist-info/METADATA +0 -69
  403. edsl-0.1.15.dist-info/RECORD +0 -142
  404. /edsl/{language_models/model_interfaces → inference_services}/__init__.py +0 -0
  405. /edsl/{report/__init__.py → jobs/runners/JobsRunnerStatusData.py} +0 -0
  406. /edsl/{trackers/__init__.py → language_models/ServiceDataSources.py} +0 -0
  407. {edsl-0.1.15.dist-info → edsl-0.1.40.dist-info}/LICENSE +0 -0
@@ -0,0 +1,252 @@
1
+ from abc import ABC, abstractmethod
2
+ import io
3
+ import csv
4
+ import base64
5
+ from typing import Optional, Union, Tuple, List, Any, Dict
6
+ from openpyxl import Workbook
7
+
8
+ from edsl.scenarios.FileStore import FileStore
9
+
10
+
11
class FileExport(ABC):
    """Abstract base for exporters that serialize ``data`` into one file.

    Concrete subclasses are expected to define three class attributes --
    ``mime_type`` (str), ``suffix`` (str, no leading dot) and ``is_binary``
    (bool) -- and to implement :meth:`format_data`.

    Args:
        data: Object to export; its required shape is decided by the
            subclass's ``format_data``.
        filename: Destination path. When given, :meth:`export` writes the
            file and returns ``None``; when omitted, :meth:`export` returns
            the ``FileStore`` instead.
        remove_prefix: Stored for subclasses; unused by this base class.
        pretty_labels: Stored for subclasses; unused by this base class.
    """

    def __init__(
        self,
        data: Any,
        filename: Optional[str] = None,
        remove_prefix: bool = False,
        pretty_labels: Optional[Dict[str, str]] = None,
    ):
        self.data = data
        self.filename = filename
        self.remove_prefix = remove_prefix
        self.pretty_labels = pretty_labels

    # The three properties below are only reached when a subclass did NOT
    # shadow them with a plain class attribute. Returning
    # ``self.__class__.<name>`` in that situation would hand back the property
    # object itself, so fail loudly instead.

    @property
    def mime_type(self) -> str:
        """Return the MIME type for this export format."""
        raise NotImplementedError(
            f"{type(self).__name__} must define a 'mime_type' class attribute"
        )

    @property
    def suffix(self) -> str:
        """Return the file suffix for this format."""
        raise NotImplementedError(
            f"{type(self).__name__} must define a 'suffix' class attribute"
        )

    @property
    def is_binary(self) -> bool:
        """Whether the format is binary or text-based."""
        raise NotImplementedError(
            f"{type(self).__name__} must define an 'is_binary' class attribute"
        )

    def _get_default_filename(self) -> str:
        """Generate default filename for this format."""
        return f"results.{self.suffix}"

    def _create_filestore(self, data: Union[str, bytes]) -> Optional["FileStore"]:
        """Wrap ``data`` in a FileStore, writing it to disk if a filename was given.

        Args:
            data: Formatted payload; ``str`` is encoded with the default
                ``str.encode()`` codec before base64 encoding.

        Returns:
            ``None`` when ``self.filename`` is set (the FileStore is written
            to that path), otherwise the FileStore instance.
        """
        raw = data.encode() if isinstance(data, str) else data
        base64_string = base64.b64encode(raw).decode()

        from edsl.scenarios.FileStore import FileStore

        fs = FileStore(
            path=self.filename or self._get_default_filename(),
            mime_type=self.mime_type,
            binary=self.is_binary,
            suffix=self.suffix,
            base64_string=base64_string,
        )

        if self.filename is not None:
            fs.write(self.filename)
            return None
        return fs

    @abstractmethod
    def format_data(self) -> Union[str, bytes]:
        """Convert the input data to the target format."""

    def export(self) -> Optional["FileStore"]:
        """Format the data and hand it to :meth:`_create_filestore`.

        Returns:
            Whatever :meth:`_create_filestore` returns: ``None`` if a
            filename was supplied, otherwise a FileStore.
        """
        return self._create_filestore(self.format_data())
76
+
77
+
78
class JSONLExport(FileExport):
    """Export an iterable of mappings as JSON Lines text.

    ``self.data`` is iterated; for each entry only its first ``(key, value)``
    item is written, as one JSON object per line.
    """

    mime_type = "application/jsonl"
    suffix = "jsonl"
    is_binary = False

    def format_data(self) -> str:
        """Return the JSON Lines document, one ``{"key": value}`` per line.

        The value is serialized with ``json.dumps`` so every line is valid
        JSON. Interpolating the Python ``repr`` instead would emit single
        quotes, ``None`` and ``True``/``False``.

        Raises:
            IndexError: If an entry has no items.
        """
        import json

        output = io.StringIO()
        for entry in self.data:
            key, values = list(entry.items())[0]
            # str(key) mirrors the original f-string interpolation of the key.
            # default=str keeps the export best-effort for values json cannot
            # encode natively, since the repr-based version never raised.
            output.write(json.dumps({str(key): values}, default=str))
            output.write("\n")
        return output.getvalue()
89
+
90
+
91
class TabularExport(FileExport, ABC):
    """Shared base for exporters that work on a header plus rows."""

    def __init__(self, *args, **kwargs):
        """Initialise the base exporter, then cache the tabular view.

        ``self.data._get_tabular_data`` is called with this exporter's
        ``remove_prefix`` and ``pretty_labels`` and must return a
        ``(header, rows)`` pair, stored as ``self.header`` / ``self.rows``.
        """
        super().__init__(*args, **kwargs)
        tabular = self.data._get_tabular_data(
            remove_prefix=self.remove_prefix,
            pretty_labels=self.pretty_labels,
        )
        self.header, self.rows = tabular
99
+
100
+
101
class CSVExport(TabularExport):
    """Exporter that renders the tabular data as CSV text."""

    mime_type = "text/csv"
    suffix = "csv"
    is_binary = False

    def format_data(self) -> str:
        """Return the header line followed by every row, in CSV form."""
        with io.StringIO() as sink:
            csv_writer = csv.writer(sink)
            csv_writer.writerow(self.header)
            csv_writer.writerows(self.rows)
            return sink.getvalue()
112
+
113
+
114
class ExcelExport(TabularExport):
    """Exporter that renders the tabular data as a one-sheet .xlsx workbook."""

    mime_type = "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"
    suffix = "xlsx"
    is_binary = True

    def __init__(self, *args, sheet_name: Optional[str] = None, **kwargs):
        """Accept an optional ``sheet_name``; a falsy value becomes "Results"."""
        super().__init__(*args, **kwargs)
        self.sheet_name = sheet_name if sheet_name else "Results"

    def format_data(self) -> bytes:
        """Return the workbook bytes: header in row 1, data from row 2 on."""
        workbook = Workbook()
        sheet = workbook.active
        sheet.title = self.sheet_name

        # Row 1 holds the header; each data row follows in order.
        for row_number, record in enumerate([self.header, *self.rows], start=1):
            for column_number, cell_value in enumerate(record, start=1):
                sheet.cell(row=row_number, column=column_number, value=cell_value)

        stream = io.BytesIO()
        workbook.save(stream)
        return stream.getvalue()
142
+
143
+
144
+ import sqlite3
145
+ from typing import Any
146
+
147
+
148
class SQLiteExport(TabularExport):
    """Exporter that renders the tabular data as a SQLite database file."""

    mime_type = "application/x-sqlite3"
    suffix = "db"
    is_binary = True

    def __init__(
        self, *args, table_name: str = "results", if_exists: str = "replace", **kwargs
    ):
        """
        Initialize SQLite export.

        Args:
            table_name: Name of the table to create
            if_exists: How to handle existing table ('fail', 'replace', or 'append')

        Raises:
            ValueError: If ``if_exists`` or ``table_name`` is invalid.
        """
        super().__init__(*args, **kwargs)
        self.table_name = table_name
        self.if_exists = if_exists
        # Validate eagerly: table_name is interpolated into SQL text below.
        self._validate_params()

    @staticmethod
    def _quote_identifier(name: Any) -> str:
        """Return ``name`` as a double-quoted SQL identifier."""
        return '"' + str(name).replace('"', '""') + '"'

    def _get_column_types(self) -> list[tuple[str, str]]:
        """Infer SQL column types from the first data row.

        Returns:
            ``(header, sql_type)`` pairs. With no rows, every column is TEXT.
        """
        if not self.rows:
            return [(header, "TEXT") for header in self.header]

        column_types = []
        for header, value in zip(self.header, self.rows[0]):
            # bool must be tested before int because bool subclasses int.
            if isinstance(value, bool):
                sql_type = "BOOLEAN"
            elif isinstance(value, int):
                sql_type = "INTEGER"
            elif isinstance(value, float):
                sql_type = "REAL"
            else:
                sql_type = "TEXT"
            column_types.append((header, sql_type))
        return column_types

    def _create_table(self, cursor: sqlite3.Cursor) -> None:
        """Create the table with appropriate schema.

        Raises:
            ValueError: In 'fail' mode, if the table already exists.
        """
        table = self._quote_identifier(self.table_name)

        if self.if_exists == "replace":
            cursor.execute(f"DROP TABLE IF EXISTS {table}")
        elif self.if_exists == "fail":
            cursor.execute(
                "SELECT name FROM sqlite_master WHERE type='table' AND name=?",
                (self.table_name,),
            )
            if cursor.fetchone():
                raise ValueError(f"Table {self.table_name} already exists")

        columns = ", ".join(
            f"{self._quote_identifier(col)} {dtype}"
            for col, dtype in self._get_column_types()
        )
        cursor.execute(f"CREATE TABLE IF NOT EXISTS {table} ({columns})")

    def format_data(self) -> bytes:
        """Convert the data to a SQLite database file and return its bytes.

        ``sqlite3.connect`` only accepts a path, so the database is built in
        a temporary file, read back, and the file is removed afterwards.
        """
        import os
        import tempfile

        fd, db_path = tempfile.mkstemp(suffix=f".{self.suffix}")
        os.close(fd)
        try:
            conn = sqlite3.connect(db_path)
            try:
                cursor = conn.cursor()
                self._create_table(cursor)

                # Column names are quoted exactly as in CREATE TABLE so that
                # headers containing dots or spaces still match.
                column_list = ",".join(
                    self._quote_identifier(col) for col in self.header
                )
                placeholders = ",".join("?" for _ in self.header)
                table = self._quote_identifier(self.table_name)
                insert_sql = (
                    f"INSERT INTO {table} ({column_list}) VALUES ({placeholders})"
                )
                cursor.executemany(insert_sql, self.rows)
                conn.commit()
            finally:
                conn.close()

            with open(db_path, "rb") as db_file:
                return db_file.read()
        finally:
            os.remove(db_path)

    def _validate_params(self) -> None:
        """Validate initialization parameters.

        Raises:
            ValueError: If ``if_exists`` is not 'fail', 'replace' or 'append',
                or if ``table_name`` is empty or contains anything other than
                alphanumeric characters and underscores.
        """
        valid_if_exists = {"fail", "replace", "append"}
        if self.if_exists not in valid_if_exists:
            raise ValueError(
                f"if_exists must be one of {valid_if_exists}, got {self.if_exists}"
            )

        # Validate table name (basic SQLite identifier validation)
        name = self.table_name
        if not name or not all(c.isalnum() or c == "_" for c in name):
            raise ValueError(
                f"Invalid table name: {self.table_name}. Must contain only alphanumeric characters and underscores."
            )
@@ -0,0 +1,33 @@
1
+ """Mixin for fetching data from results."""
2
+
3
+ from functools import partial
4
+ from itertools import chain
5
+
6
+
7
class ResultsFetchMixin:
    """Mixin that pulls per-row values out of ``self.data``."""

    def _fetch_list(self, data_type: str, key: str) -> list:
        """
        Collect one value per row for the given data type and key.

        Each row's ``sub_dicts[data_type]`` is queried with ``.get(key)``, so
        a row lacking ``key`` contributes ``None``. Reads ``self.data`` (per
        the original author: the filtered data, not the original data).

        Example:

        >>> from edsl.results import Results
        >>> r = Results.example()
        >>> r._fetch_list('answer', 'how_feeling')
        ['OK', 'Great', 'Terrible', 'OK']
        """
        return [row.sub_dicts[data_type].get(key) for row in self.data]
28
+
29
+
30
if __name__ == "__main__":
    # Run this module's doctests when executed as a script.
    from doctest import ELLIPSIS, testmod

    testmod(optionflags=ELLIPSIS)
@@ -0,0 +1,145 @@
1
+ from typing import Union, List, Dict, Any, Optional
2
+ import sys
3
+ from collections import defaultdict
4
+ from edsl.results.Dataset import Dataset
5
+
6
+ from edsl.exceptions.results import ResultsColumnNotFoundError
7
+
8
+ from edsl.utilities.is_notebook import is_notebook
9
+
10
+
11
class Selector:
    """Resolve column specifications and fetch the matching columns.

    A column specification is either ``"data_type.key"``, a bare ``"key"``
    (or unambiguous prefix of one), or a wildcard form such as ``"*.*"`` or
    ``"answer.*"``.
    """

    def __init__(
        self,
        known_data_types: List[str],
        data_type_to_keys: Dict[str, List[str]],
        key_to_data_type: Dict[str, str],
        fetch_list_func,
        columns: List[str],
    ):
        """Selects columns from a Results object

        :param known_data_types: Data type names that may appear before the dot.
        :param data_type_to_keys: Keys available under each data type.
        :param key_to_data_type: Reverse lookup used for bare keys.
        :param fetch_list_func: Callable ``(data_type, key) -> list`` returning
            the values of one column.
        :param columns: All known column names in ``"data_type.key"`` form.
        """
        self.known_data_types = known_data_types
        self._data_type_to_keys = data_type_to_keys
        self._key_to_data_type = key_to_data_type
        self._fetch_list = fetch_list_func
        self.columns = columns
        # Fully qualified column names in the order they were requested;
        # rebuilt by every call to _get_columns_to_fetch.
        self.items_in_order: List[str] = []

    def select(self, *columns: Union[str, List[str]]) -> Optional["Dataset"]:
        """Return a Dataset holding the requested columns.

        In a notebook a missing or ambiguous column is reported on stderr and
        ``None`` is returned; elsewhere the ResultsColumnNotFoundError
        propagates to the caller.
        """
        try:
            columns = self._normalize_columns(columns)
            to_fetch = self._get_columns_to_fetch(columns)
            new_data = self._fetch_data(to_fetch)
        except ResultsColumnNotFoundError as e:
            if is_notebook():
                print("Error:", e, file=sys.stderr)
                return None
            raise
        return Dataset(new_data)

    def _normalize_columns(self, columns: Union[str, List[str]]) -> tuple:
        """Normalize the columns to a tuple of strings

        >>> s = Selector([], {}, {}, lambda x, y: x, [])
        >>> s._normalize_columns([["a", "b"], ])
        ('a', 'b')
        >>> s._normalize_columns(None)
        ('*.*',)
        >>> s._normalize_columns("a")
        ('a',)
        """
        if not columns or columns == ("*",) or columns == (None,):
            return ("*.*",)
        if isinstance(columns, str):
            # A bare string would otherwise be iterated character by character.
            return (columns,)
        if isinstance(columns[0], list):
            return tuple(columns[0])
        return tuple(columns)

    def _get_columns_to_fetch(self, columns: tuple) -> Dict[str, List[str]]:
        """Map each data type to the keys to fetch and record the request order.

        Resets ``self.items_in_order`` and fills it with the qualified names
        of the columns in the order they were resolved.
        """
        to_fetch = defaultdict(list)
        self.items_in_order = []

        for column in columns:
            matches = self._find_matching_columns(column)
            self._validate_matches(column, matches)

            if len(matches) == 1:
                # Expand an unambiguous prefix to the full column name.
                column = matches[0]

            data_type, key = self._parse_column(column)
            self._process_column(data_type, key, to_fetch)

        return to_fetch

    def _find_matching_columns(self, partial_name: str) -> list[str]:
        """Return the known names that start with ``partial_name``.

        Dotted input is matched against full column names, undotted input
        against the key part only. An exact match wins over longer names that
        merely share the prefix.
        """
        if "." in partial_name:
            search_in_list = self.columns
        else:
            # Split on the first dot only so keys that themselves contain a
            # dot stay intact; [-1] tolerates column names without any dot.
            search_in_list = [s.split(".", 1)[-1] for s in self.columns]
        matches = [s for s in search_in_list if s.startswith(partial_name)]
        return [partial_name] if partial_name in matches else matches

    def _validate_matches(self, column: str, matches: List[str]):
        """Raise ResultsColumnNotFoundError for ambiguous or unknown columns.

        Wildcard specifications (containing ``".*"``) are allowed to have no
        direct match; they are expanded later.
        """
        if len(matches) > 1:
            raise ResultsColumnNotFoundError(
                f"Column '{column}' is ambiguous. Did you mean one of {matches}?"
            )
        if len(matches) == 0 and ".*" not in column:
            raise ResultsColumnNotFoundError(f"Column '{column}' not found in data.")

    def _parse_column(self, column: str) -> tuple[str, str]:
        """Split a column specification into ``(data_type, key)``.

        Bare keys are looked up in the key-to-data-type mapping; an unknown
        bare key raises ResultsColumnNotFoundError.
        """
        if "." in column:
            # Only the first dot separates data type from key; a plain
            # split(".") yields three or more parts for dotted keys and makes
            # the caller's two-name unpacking fail.
            data_type, _, key = column.partition(".")
            return data_type, key
        try:
            return self._key_to_data_type[column], column
        except KeyError:
            self._raise_key_error(column)

    def _raise_key_error(self, column: str):
        """Raise ResultsColumnNotFoundError, suggesting close key names if any."""
        import difflib

        close_matches = difflib.get_close_matches(column, self._key_to_data_type.keys())
        if close_matches:
            suggestions = ", ".join(close_matches)
            raise ResultsColumnNotFoundError(
                f"Column '{column}' not found in data. Did you mean: {suggestions}?"
            )
        else:
            raise ResultsColumnNotFoundError(f"Column {column} not found in data")

    def _process_column(self, data_type: str, key: str, to_fetch: Dict[str, List[str]]):
        """Add every key matching ``data_type``/``key`` to ``to_fetch``.

        ``"*"`` as ``key`` selects all keys of the data type(s). Raises
        ResultsColumnNotFoundError when nothing matched.
        """
        data_types = self._get_data_types_to_return(data_type)
        found_once = False

        for dt in data_types:
            relevant_keys = self._data_type_to_keys[dt]
            for k in relevant_keys:
                if k == key or key == "*":
                    found_once = True
                    to_fetch[dt].append(k)
                    self.items_in_order.append(f"{dt}.{k}")

        if not found_once:
            raise ResultsColumnNotFoundError(f"Key {key} not found in data.")

    def _get_data_types_to_return(self, parsed_data_type: str) -> List[str]:
        """Expand ``"*"`` to all known data types, or validate a single one."""
        if parsed_data_type == "*":
            return self.known_data_types
        if parsed_data_type not in self.known_data_types:
            raise ResultsColumnNotFoundError(
                f"Data type {parsed_data_type} not found in data. Did you mean one of {self.known_data_types}"
            )
        return [parsed_data_type]

    def _fetch_data(self, to_fetch: Dict[str, List[str]]) -> List[Dict[str, Any]]:
        """Fetch the requested columns and return them in request order.

        Each distinct column is fetched once. The result has one
        single-entry dict per item in ``self.items_in_order``, so a column
        requested twice appears twice rather than once per
        (request, fetched copy) pair.
        """
        fetched: Dict[str, Any] = {}
        for data_type, keys in to_fetch.items():
            for key in keys:
                name = f"{data_type}.{key}"
                if name not in fetched:
                    fetched[name] = self._fetch_list(data_type, key)

        return [
            {name: fetched[name]} for name in self.items_in_order if name in fetched
        ]
140
+
141
+
142
if __name__ == "__main__":
    # Run this module's doctests when it is executed as a script.
    from doctest import testmod

    testmod()
@@ -0,0 +1,98 @@
1
class ResultsToolsMixin:
    """Mixin adding question-driven theme extraction and tagging helpers.

    The host class is expected to provide ``shuffle``, ``select`` and
    ``mutate``; these methods are called on ``self`` below.
    """

    def get_themes(
        self,
        field: str,
        context: str,
        max_values=100,
        num_themes: int = 10,
        seed=None,
        progress_bar=False,
        print_exceptions=False,
    ) -> list:
        """Ask a list question for themes that summarise the values of ``field``.

        :param field: The field whose values are sampled.
        :param context: Text placed at the top of the question.
        :param max_values: Maximum number of shuffled values included as examples.
        :param num_themes: Target number of themes stated in the question.
        :param seed: Seed passed to ``self.shuffle``.
        :param progress_bar: Passed through to ``run``.
        :param print_exceptions: Passed through to ``run``.
        :return: The first value of the ``themes`` column of the run's results.
        """
        # Each example is stringified and cut to 1000 characters to bound the
        # size of the question text.
        values = [
            str(txt)[:1000]
            for txt in self.shuffle(seed=seed).select(field).to_list()[:max_values]
        ]
        from edsl.questions import QuestionList

        q = QuestionList(
            question_text=f"""
        {context}
        Here are some examples: { values }.
        What are some 5-8 word themes that would mostly capture these examples?
        Please shoot for {num_themes} as target number of themes.
        """,
            question_name="themes",
        )
        results = q.run(print_exceptions=print_exceptions, progress_bar=progress_bar)
        return results.select("themes").first()

    def answers_to_themes(
        self,
        field,
        context: str,
        themes: list,
        progress_bar=False,
        print_exceptions=False,
    ) -> dict:
        """Tag every value of ``field`` with the themes that apply to it.

        One checkbox question is run per value, offering ``themes`` plus
        ``"None"`` and ``"Other"`` as options.

        :param field: The field whose values are tagged.
        :param context: Text placed at the top of each question.
        :param themes: Candidate themes offered as options.
        :param progress_bar: Passed through to ``run``.
        :param print_exceptions: Passed through to ``run``.
        :return: Mapping from each value to the selected themes.
        """
        from edsl import ScenarioList
        from edsl import QuestionCheckBox

        values = self.select(field).to_list()
        scenarios = ScenarioList.from_list("field", values).add_value(
            "context", context
        )
        q = QuestionCheckBox(
            question_text="""
        {{ context }}
        Consider the following response:

        " {{ field }} "

        Please check the themes that apply to these examples.
        If blank, please check 'None'.
        """,
            question_options=themes + ["None", "Other"],
            question_name="themes",
        )
        results = q.by(scenarios).run(
            progress_bar=progress_bar, print_exceptions=print_exceptions
        )
        # Presumably to_list() yields (field, themes) pairs when two columns
        # are selected -- confirm against Dataset.to_list.
        return dict(results.select("field", "themes").to_list())

    def apply_themes(self, field: str, new_field: str, answers_to_themes: dict):
        """Add ``new_field`` holding the themes looked up for each ``field`` value.

        Values missing from ``answers_to_themes`` map to ``"Other"``.

        :param field: Existing field whose values are looked up.
        :param new_field: Name of the field to create.
        :param answers_to_themes: Mapping from value to themes.
        :return: The object returned by ``mutate``, or ``self`` when ``mutate``
            returns ``None``.
        """

        def translate(x):
            return answers_to_themes.get(x, "Other")

        # NOTE(review): mutate appears to return a new object rather than
        # modifying self -- confirm. Its result used to be discarded, which
        # drops the new field in that case; returning it works either way.
        mutated = self.mutate(
            f"{new_field} = f({field})", functions_dict={"f": translate}
        )
        return self if mutated is None else mutated

    def auto_theme(
        self,
        field: str,
        context: str,
        themes: list[str],
        newfield: str = None,
        progress_bar=False,
        print_exceptions=False,
    ) -> tuple:
        """Tag ``field`` with ``themes`` and store the tags in a new field.

        :param field: The field to be themed.
        :param context: The context of the field.
        :param themes: The list of themes.
        :param newfield: The new field name; defaults to ``"<field>_themes"``.
        :param progress_bar: Passed through to ``answers_to_themes``.
        :param print_exceptions: Passed through to ``answers_to_themes``.
        :return: ``(result of apply_themes, themes)``.
        """

        if not newfield:
            newfield = f"{field}_themes"

        answers_to_themes = self.answers_to_themes(
            field=field,
            context=context,
            themes=themes,
            progress_bar=progress_bar,
            print_exceptions=print_exceptions,
        )
        return self.apply_themes(field, newfield, answers_to_themes), themes
@@ -0,0 +1,96 @@
1
+ from typing import Optional
2
+
3
+
4
class SmartInt(int):
    """An ``int`` subclass with no added behaviour."""
6
+
7
+
8
class SmartFloat(float):
    """A ``float`` subclass with no added behaviour."""
10
+
11
+
12
class SmartStr(str):
    """A ``str`` subclass with helpers for copying, saving, converting and editing."""

    def clipboard(self) -> None:
        """Copy the text to the system clipboard using ``pyperclip``.

        If ``pyperclip`` is not installed, an installation hint is printed and
        nothing is copied.
        """
        try:
            import pyperclip
        except ImportError:
            print(
                "pyperclip is not installed. Run `pip install pyperclip` to install it."
            )
            return None

        pyperclip.copy(self)
        print("Text copied to clipboard.")

    def write(self, filename: str):
        """Write the text to ``filename``, replacing any existing content.

        The file is written as UTF-8 so the result does not depend on the
        platform's default encoding.
        """
        with open(filename, "w", encoding="utf-8") as f:
            f.write(str(self))
        return None

    def _repr_html_(self):
        """Provide no HTML representation (returns ``None``)."""
        return None

    def markdown(self):
        """Return the text wrapped as a ``SmartMarkdown``."""
        return SmartMarkdown(self)

    def pdf(self, filename: Optional[str] = None):  # Markdown will have this as well
        """Render the text, treated as Markdown, to PDF and return the preview."""
        # renders the markdown as a pdf that can be downloaded
        from edsl.results.MarkdownToPDF import MarkdownToPDF

        return MarkdownToPDF(self, filename).preview()

    def docx(self, filename: Optional[str] = None):
        """Render the text, treated as Markdown, to DOCX and return the preview."""
        # renders the markdown as a docx that can be downloaded
        from edsl.results.MarkdownToDocx import MarkdownToDocx

        return MarkdownToDocx(self, filename).preview()

    def edit(self):
        """Open the text in the GUI editor and return the edited text.

        Strings are immutable, so the edit cannot be applied in place; the
        result is returned as a new instance of the same class.
        """
        from edsl.results.TextEditor import TextEditor

        editor = TextEditor(self)
        # Rebinding ``self`` here would only change a local name and lose the
        # edited text, so hand the new object back to the caller instead.
        return self.__class__(editor.edit_gui())
54
+
55
+
56
class SmartMarkdown(SmartStr):
    """A ``SmartStr`` whose content is presented as Markdown."""

    def _repr_markdown_(self):
        """Return the string itself as its Markdown representation."""
        return self

    def _repr_html_(self):
        """Display the text as Markdown through IPython; returns ``None``."""
        import IPython.display as ipy_display

        rendered = ipy_display.Markdown(self)
        ipy_display.display(rendered)
64
+
65
+
66
class SmartLaTeX(SmartStr):
    """A ``SmartStr`` whose content is LaTeX source."""

    def _repr_html_(self):
        """Print the raw LaTeX source; returns ``None``."""
        print(self)

    def pdf(self, filename: Optional[str] = None):
        """Render the LaTeX source to PDF and return the preview."""
        from edsl.results.LaTeXToPDF import LaTeXToPDF

        return LaTeXToPDF(self, filename).preview()

    def docx(self, filename: Optional[str] = None):
        """Render the LaTeX source to DOCX and return the preview."""
        from edsl.results.LaTeXToDocx import LaTeXToDocx

        return LaTeXToDocx(self, filename).preview()

    def edit(self):
        """Open the LaTeX source in the GUI editor and return the edited text.

        Strings are immutable, so the edit cannot be applied in place; the
        result is returned as a new instance of the same class.
        """
        from edsl.results.TextEditor import TextEditor

        editor = TextEditor(self)
        # Rebinding ``self`` here would only change a local name and lose the
        # edited text, so hand the new object back to the caller instead.
        return self.__class__(editor.edit_gui())
86
+
87
+
88
class FirstObject:
    """Factory that wraps a plain value in the matching ``Smart*`` type.

    Calling ``FirstObject(value)`` never returns a ``FirstObject`` instance:
    ints, floats and strings come back as ``SmartInt``, ``SmartFloat`` and
    ``SmartStr`` respectively, and every other value is returned unchanged.
    """

    def __new__(cls, value):
        # bool is a subclass of int; without this guard True/False would be
        # converted to SmartInt(1)/SmartInt(0) and stop printing as booleans.
        if isinstance(value, bool):
            return value
        if isinstance(value, int):
            return SmartInt(value)
        if isinstance(value, float):
            return SmartFloat(value)
        if isinstance(value, str):
            return SmartStr(value)
        return value
@@ -0,0 +1,12 @@
1
+ from dataclasses import dataclass
2
+ from typing import Any, List
3
+
4
+
5
@dataclass
class TableData:
    """Plain container for the pieces that describe a table.

    ``headers`` and ``data`` are required; ``parameters`` and
    ``raw_data_set`` are optional extras that default to ``None``.
    """

    # Column names.
    headers: List[str]
    # Table contents as a list of lists.
    data: List[List[Any]]
    # Optional dict of parameters; None when not supplied.
    parameters: dict = None
    # Optional extra object attached by the caller; None when not supplied.
    raw_data_set: Any = None