PyPI - edsl - Versions diffs - 0.1.14__py3-none-any.whl → 0.1.40__py3-none-any.whl - Mend

edsl 0.1.14-py3-none-any.whl → 0.1.40-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (407) hide show

edsl/Base.py +348 -38
edsl/BaseDiff.py +260 -0
edsl/TemplateLoader.py +24 -0
edsl/__init__.py +46 -10
edsl/__version__.py +1 -0
edsl/agents/Agent.py +842 -144
edsl/agents/AgentList.py +521 -25
edsl/agents/Invigilator.py +250 -374
edsl/agents/InvigilatorBase.py +257 -0
edsl/agents/PromptConstructor.py +272 -0
edsl/agents/QuestionInstructionPromptBuilder.py +128 -0
edsl/agents/QuestionTemplateReplacementsBuilder.py +137 -0
edsl/agents/descriptors.py +43 -13
edsl/agents/prompt_helpers.py +129 -0
edsl/agents/question_option_processor.py +172 -0
edsl/auto/AutoStudy.py +130 -0
edsl/auto/StageBase.py +243 -0
edsl/auto/StageGenerateSurvey.py +178 -0
edsl/auto/StageLabelQuestions.py +125 -0
edsl/auto/StagePersona.py +61 -0
edsl/auto/StagePersonaDimensionValueRanges.py +88 -0
edsl/auto/StagePersonaDimensionValues.py +74 -0
edsl/auto/StagePersonaDimensions.py +69 -0
edsl/auto/StageQuestions.py +74 -0
edsl/auto/SurveyCreatorPipeline.py +21 -0
edsl/auto/utilities.py +218 -0
edsl/base/Base.py +279 -0
edsl/config.py +121 -104
edsl/conversation/Conversation.py +290 -0
edsl/conversation/car_buying.py +59 -0
edsl/conversation/chips.py +95 -0
edsl/conversation/mug_negotiation.py +81 -0
edsl/conversation/next_speaker_utilities.py +93 -0
edsl/coop/CoopFunctionsMixin.py +15 -0
edsl/coop/ExpectedParrotKeyHandler.py +125 -0
edsl/coop/PriceFetcher.py +54 -0
edsl/coop/__init__.py +1 -0
edsl/coop/coop.py +1029 -134
edsl/coop/utils.py +131 -0
edsl/data/Cache.py +560 -89
edsl/data/CacheEntry.py +230 -0
edsl/data/CacheHandler.py +168 -0
edsl/data/RemoteCacheSync.py +186 -0
edsl/data/SQLiteDict.py +292 -0
edsl/data/__init__.py +5 -3
edsl/data/orm.py +6 -33
edsl/data_transfer_models.py +74 -27
edsl/enums.py +165 -8
edsl/exceptions/BaseException.py +21 -0
edsl/exceptions/__init__.py +52 -46
edsl/exceptions/agents.py +33 -15
edsl/exceptions/cache.py +5 -0
edsl/exceptions/coop.py +8 -0
edsl/exceptions/general.py +34 -0
edsl/exceptions/inference_services.py +5 -0
edsl/exceptions/jobs.py +15 -0
edsl/exceptions/language_models.py +46 -1
edsl/exceptions/questions.py +80 -5
edsl/exceptions/results.py +16 -5
edsl/exceptions/scenarios.py +29 -0
edsl/exceptions/surveys.py +13 -10
edsl/inference_services/AnthropicService.py +106 -0
edsl/inference_services/AvailableModelCacheHandler.py +184 -0
edsl/inference_services/AvailableModelFetcher.py +215 -0
edsl/inference_services/AwsBedrock.py +118 -0
edsl/inference_services/AzureAI.py +215 -0
edsl/inference_services/DeepInfraService.py +18 -0
edsl/inference_services/GoogleService.py +143 -0
edsl/inference_services/GroqService.py +20 -0
edsl/inference_services/InferenceServiceABC.py +80 -0
edsl/inference_services/InferenceServicesCollection.py +138 -0
edsl/inference_services/MistralAIService.py +120 -0
edsl/inference_services/OllamaService.py +18 -0
edsl/inference_services/OpenAIService.py +236 -0
edsl/inference_services/PerplexityService.py +160 -0
edsl/inference_services/ServiceAvailability.py +135 -0
edsl/inference_services/TestService.py +90 -0
edsl/inference_services/TogetherAIService.py +172 -0
edsl/inference_services/data_structures.py +134 -0
edsl/inference_services/models_available_cache.py +118 -0
edsl/inference_services/rate_limits_cache.py +25 -0
edsl/inference_services/registry.py +41 -0
edsl/inference_services/write_available.py +10 -0
edsl/jobs/AnswerQuestionFunctionConstructor.py +223 -0
edsl/jobs/Answers.py +21 -20
edsl/jobs/FetchInvigilator.py +47 -0
edsl/jobs/InterviewTaskManager.py +98 -0
edsl/jobs/InterviewsConstructor.py +50 -0
edsl/jobs/Jobs.py +684 -204
edsl/jobs/JobsChecks.py +172 -0
edsl/jobs/JobsComponentConstructor.py +189 -0
edsl/jobs/JobsPrompts.py +270 -0
edsl/jobs/JobsRemoteInferenceHandler.py +311 -0
edsl/jobs/JobsRemoteInferenceLogger.py +239 -0
edsl/jobs/RequestTokenEstimator.py +30 -0
edsl/jobs/async_interview_runner.py +138 -0
edsl/jobs/buckets/BucketCollection.py +104 -0
edsl/jobs/buckets/ModelBuckets.py +65 -0
edsl/jobs/buckets/TokenBucket.py +283 -0
edsl/jobs/buckets/TokenBucketAPI.py +211 -0
edsl/jobs/buckets/TokenBucketClient.py +191 -0
edsl/jobs/check_survey_scenario_compatibility.py +85 -0
edsl/jobs/data_structures.py +120 -0
edsl/jobs/decorators.py +35 -0
edsl/jobs/interviews/Interview.py +392 -0
edsl/jobs/interviews/InterviewExceptionCollection.py +99 -0
edsl/jobs/interviews/InterviewExceptionEntry.py +186 -0
edsl/jobs/interviews/InterviewStatistic.py +63 -0
edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -0
edsl/jobs/interviews/InterviewStatusDictionary.py +78 -0
edsl/jobs/interviews/InterviewStatusLog.py +92 -0
edsl/jobs/interviews/ReportErrors.py +66 -0
edsl/jobs/interviews/interview_status_enum.py +9 -0
edsl/jobs/jobs_status_enums.py +9 -0
edsl/jobs/loggers/HTMLTableJobLogger.py +304 -0
edsl/jobs/results_exceptions_handler.py +98 -0
edsl/jobs/runners/JobsRunnerAsyncio.py +151 -110
edsl/jobs/runners/JobsRunnerStatus.py +298 -0
edsl/jobs/tasks/QuestionTaskCreator.py +244 -0
edsl/jobs/tasks/TaskCreators.py +64 -0
edsl/jobs/tasks/TaskHistory.py +470 -0
edsl/jobs/tasks/TaskStatusLog.py +23 -0
edsl/jobs/tasks/task_status_enum.py +161 -0
edsl/jobs/tokens/InterviewTokenUsage.py +27 -0
edsl/jobs/tokens/TokenUsage.py +34 -0
edsl/language_models/ComputeCost.py +63 -0
edsl/language_models/LanguageModel.py +507 -386
edsl/language_models/ModelList.py +164 -0
edsl/language_models/PriceManager.py +127 -0
edsl/language_models/RawResponseHandler.py +106 -0
edsl/language_models/RegisterLanguageModelsMeta.py +184 -0
edsl/language_models/__init__.py +1 -8
edsl/language_models/fake_openai_call.py +15 -0
edsl/language_models/fake_openai_service.py +61 -0
edsl/language_models/key_management/KeyLookup.py +63 -0
edsl/language_models/key_management/KeyLookupBuilder.py +273 -0
edsl/language_models/key_management/KeyLookupCollection.py +38 -0
edsl/language_models/key_management/__init__.py +0 -0
edsl/language_models/key_management/models.py +131 -0
edsl/language_models/model.py +256 -0
edsl/language_models/repair.py +109 -41
edsl/language_models/utilities.py +65 -0
edsl/notebooks/Notebook.py +263 -0
edsl/notebooks/NotebookToLaTeX.py +142 -0
edsl/notebooks/__init__.py +1 -0
edsl/prompts/Prompt.py +222 -93
edsl/prompts/__init__.py +1 -1
edsl/questions/ExceptionExplainer.py +77 -0
edsl/questions/HTMLQuestion.py +103 -0
edsl/questions/QuestionBase.py +518 -0
edsl/questions/QuestionBasePromptsMixin.py +221 -0
edsl/questions/QuestionBudget.py +164 -67
edsl/questions/QuestionCheckBox.py +281 -62
edsl/questions/QuestionDict.py +343 -0
edsl/questions/QuestionExtract.py +136 -50
edsl/questions/QuestionFreeText.py +79 -55
edsl/questions/QuestionFunctional.py +138 -41
edsl/questions/QuestionList.py +184 -57
edsl/questions/QuestionMatrix.py +265 -0
edsl/questions/QuestionMultipleChoice.py +293 -69
edsl/questions/QuestionNumerical.py +109 -56
edsl/questions/QuestionRank.py +244 -49
edsl/questions/Quick.py +41 -0
edsl/questions/SimpleAskMixin.py +74 -0
edsl/questions/__init__.py +9 -6
edsl/questions/{AnswerValidatorMixin.py → answer_validator_mixin.py} +153 -38
edsl/questions/compose_questions.py +13 -7
edsl/questions/data_structures.py +20 -0
edsl/questions/decorators.py +21 -0
edsl/questions/derived/QuestionLikertFive.py +28 -26
edsl/questions/derived/QuestionLinearScale.py +41 -28
edsl/questions/derived/QuestionTopK.py +34 -26
edsl/questions/derived/QuestionYesNo.py +40 -27
edsl/questions/descriptors.py +228 -74
edsl/questions/loop_processor.py +149 -0
edsl/questions/prompt_templates/question_budget.jinja +13 -0
edsl/questions/prompt_templates/question_checkbox.jinja +32 -0
edsl/questions/prompt_templates/question_extract.jinja +11 -0
edsl/questions/prompt_templates/question_free_text.jinja +3 -0
edsl/questions/prompt_templates/question_linear_scale.jinja +11 -0
edsl/questions/prompt_templates/question_list.jinja +17 -0
edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -0
edsl/questions/prompt_templates/question_numerical.jinja +37 -0
edsl/questions/question_base_gen_mixin.py +168 -0
edsl/questions/question_registry.py +130 -46
edsl/questions/register_questions_meta.py +71 -0
edsl/questions/response_validator_abc.py +188 -0
edsl/questions/response_validator_factory.py +34 -0
edsl/questions/settings.py +5 -2
edsl/questions/templates/__init__.py +0 -0
edsl/questions/templates/budget/__init__.py +0 -0
edsl/questions/templates/budget/answering_instructions.jinja +7 -0
edsl/questions/templates/budget/question_presentation.jinja +7 -0
edsl/questions/templates/checkbox/__init__.py +0 -0
edsl/questions/templates/checkbox/answering_instructions.jinja +10 -0
edsl/questions/templates/checkbox/question_presentation.jinja +22 -0
edsl/questions/templates/dict/__init__.py +0 -0
edsl/questions/templates/dict/answering_instructions.jinja +21 -0
edsl/questions/templates/dict/question_presentation.jinja +1 -0
edsl/questions/templates/extract/__init__.py +0 -0
edsl/questions/templates/extract/answering_instructions.jinja +7 -0
edsl/questions/templates/extract/question_presentation.jinja +1 -0
edsl/questions/templates/free_text/__init__.py +0 -0
edsl/questions/templates/free_text/answering_instructions.jinja +0 -0
edsl/questions/templates/free_text/question_presentation.jinja +1 -0
edsl/questions/templates/likert_five/__init__.py +0 -0
edsl/questions/templates/likert_five/answering_instructions.jinja +10 -0
edsl/questions/templates/likert_five/question_presentation.jinja +12 -0
edsl/questions/templates/linear_scale/__init__.py +0 -0
edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -0
edsl/questions/templates/linear_scale/question_presentation.jinja +5 -0
edsl/questions/templates/list/__init__.py +0 -0
edsl/questions/templates/list/answering_instructions.jinja +4 -0
edsl/questions/templates/list/question_presentation.jinja +5 -0
edsl/questions/templates/matrix/__init__.py +1 -0
edsl/questions/templates/matrix/answering_instructions.jinja +5 -0
edsl/questions/templates/matrix/question_presentation.jinja +20 -0
edsl/questions/templates/multiple_choice/__init__.py +0 -0
edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -0
edsl/questions/templates/multiple_choice/html.jinja +0 -0
edsl/questions/templates/multiple_choice/question_presentation.jinja +12 -0
edsl/questions/templates/numerical/__init__.py +0 -0
edsl/questions/templates/numerical/answering_instructions.jinja +7 -0
edsl/questions/templates/numerical/question_presentation.jinja +7 -0
edsl/questions/templates/rank/__init__.py +0 -0
edsl/questions/templates/rank/answering_instructions.jinja +11 -0
edsl/questions/templates/rank/question_presentation.jinja +15 -0
edsl/questions/templates/top_k/__init__.py +0 -0
edsl/questions/templates/top_k/answering_instructions.jinja +8 -0
edsl/questions/templates/top_k/question_presentation.jinja +22 -0
edsl/questions/templates/yes_no/__init__.py +0 -0
edsl/questions/templates/yes_no/answering_instructions.jinja +6 -0
edsl/questions/templates/yes_no/question_presentation.jinja +12 -0
edsl/results/CSSParameterizer.py +108 -0
edsl/results/Dataset.py +550 -19
edsl/results/DatasetExportMixin.py +594 -0
edsl/results/DatasetTree.py +295 -0
edsl/results/MarkdownToDocx.py +122 -0
edsl/results/MarkdownToPDF.py +111 -0
edsl/results/Result.py +477 -173
edsl/results/Results.py +987 -269
edsl/results/ResultsExportMixin.py +28 -125
edsl/results/ResultsGGMixin.py +83 -15
edsl/results/TableDisplay.py +125 -0
edsl/results/TextEditor.py +50 -0
edsl/results/__init__.py +1 -1
edsl/results/file_exports.py +252 -0
edsl/results/results_fetch_mixin.py +33 -0
edsl/results/results_selector.py +145 -0
edsl/results/results_tools_mixin.py +98 -0
edsl/results/smart_objects.py +96 -0
edsl/results/table_data_class.py +12 -0
edsl/results/table_display.css +78 -0
edsl/results/table_renderers.py +118 -0
edsl/results/tree_explore.py +115 -0
edsl/scenarios/ConstructDownloadLink.py +109 -0
edsl/scenarios/DocumentChunker.py +102 -0
edsl/scenarios/DocxScenario.py +16 -0
edsl/scenarios/FileStore.py +543 -0
edsl/scenarios/PdfExtractor.py +40 -0
edsl/scenarios/Scenario.py +431 -62
edsl/scenarios/ScenarioHtmlMixin.py +65 -0
edsl/scenarios/ScenarioList.py +1415 -45
edsl/scenarios/ScenarioListExportMixin.py +45 -0
edsl/scenarios/ScenarioListPdfMixin.py +239 -0
edsl/scenarios/__init__.py +2 -0
edsl/scenarios/directory_scanner.py +96 -0
edsl/scenarios/file_methods.py +85 -0
edsl/scenarios/handlers/__init__.py +13 -0
edsl/scenarios/handlers/csv.py +49 -0
edsl/scenarios/handlers/docx.py +76 -0
edsl/scenarios/handlers/html.py +37 -0
edsl/scenarios/handlers/json.py +111 -0
edsl/scenarios/handlers/latex.py +5 -0
edsl/scenarios/handlers/md.py +51 -0
edsl/scenarios/handlers/pdf.py +68 -0
edsl/scenarios/handlers/png.py +39 -0
edsl/scenarios/handlers/pptx.py +105 -0
edsl/scenarios/handlers/py.py +294 -0
edsl/scenarios/handlers/sql.py +313 -0
edsl/scenarios/handlers/sqlite.py +149 -0
edsl/scenarios/handlers/txt.py +33 -0
edsl/scenarios/scenario_join.py +131 -0
edsl/scenarios/scenario_selector.py +156 -0
edsl/shared.py +1 -0
edsl/study/ObjectEntry.py +173 -0
edsl/study/ProofOfWork.py +113 -0
edsl/study/SnapShot.py +80 -0
edsl/study/Study.py +521 -0
edsl/study/__init__.py +4 -0
edsl/surveys/ConstructDAG.py +92 -0
edsl/surveys/DAG.py +92 -11
edsl/surveys/EditSurvey.py +221 -0
edsl/surveys/InstructionHandler.py +100 -0
edsl/surveys/Memory.py +9 -4
edsl/surveys/MemoryManagement.py +72 -0
edsl/surveys/MemoryPlan.py +156 -35
edsl/surveys/Rule.py +221 -74
edsl/surveys/RuleCollection.py +241 -61
edsl/surveys/RuleManager.py +172 -0
edsl/surveys/Simulator.py +75 -0
edsl/surveys/Survey.py +1079 -339
edsl/surveys/SurveyCSS.py +273 -0
edsl/surveys/SurveyExportMixin.py +235 -40
edsl/surveys/SurveyFlowVisualization.py +181 -0
edsl/surveys/SurveyQualtricsImport.py +284 -0
edsl/surveys/SurveyToApp.py +141 -0
edsl/surveys/__init__.py +4 -2
edsl/surveys/base.py +19 -3
edsl/surveys/descriptors.py +17 -6
edsl/surveys/instructions/ChangeInstruction.py +48 -0
edsl/surveys/instructions/Instruction.py +56 -0
edsl/surveys/instructions/InstructionCollection.py +82 -0
edsl/surveys/instructions/__init__.py +0 -0
edsl/templates/error_reporting/base.html +24 -0
edsl/templates/error_reporting/exceptions_by_model.html +35 -0
edsl/templates/error_reporting/exceptions_by_question_name.html +17 -0
edsl/templates/error_reporting/exceptions_by_type.html +17 -0
edsl/templates/error_reporting/interview_details.html +116 -0
edsl/templates/error_reporting/interviews.html +19 -0
edsl/templates/error_reporting/overview.html +5 -0
edsl/templates/error_reporting/performance_plot.html +2 -0
edsl/templates/error_reporting/report.css +74 -0
edsl/templates/error_reporting/report.html +118 -0
edsl/templates/error_reporting/report.js +25 -0
edsl/tools/__init__.py +1 -0
edsl/tools/clusters.py +192 -0
edsl/tools/embeddings.py +27 -0
edsl/tools/embeddings_plotting.py +118 -0
edsl/tools/plotting.py +112 -0
edsl/tools/summarize.py +18 -0
edsl/utilities/PrettyList.py +56 -0
edsl/utilities/SystemInfo.py +5 -0
edsl/utilities/__init__.py +21 -20
edsl/utilities/ast_utilities.py +3 -0
edsl/utilities/data/Registry.py +2 -0
edsl/utilities/decorators.py +41 -0
edsl/utilities/gcp_bucket/__init__.py +0 -0
edsl/utilities/gcp_bucket/cloud_storage.py +96 -0
edsl/utilities/interface.py +310 -60
edsl/utilities/is_notebook.py +18 -0
edsl/utilities/is_valid_variable_name.py +11 -0
edsl/utilities/naming_utilities.py +263 -0
edsl/utilities/remove_edsl_version.py +24 -0
edsl/utilities/repair_functions.py +28 -0
edsl/utilities/restricted_python.py +70 -0
edsl/utilities/utilities.py +203 -13
edsl-0.1.40.dist-info/METADATA +111 -0
edsl-0.1.40.dist-info/RECORD +362 -0
{edsl-0.1.14.dist-info → edsl-0.1.40.dist-info}/WHEEL +1 -1
edsl/agents/AgentListExportMixin.py +0 -24
edsl/coop/old.py +0 -31
edsl/data/Database.py +0 -141
edsl/data/crud.py +0 -121
edsl/jobs/Interview.py +0 -417
edsl/jobs/JobsRunner.py +0 -63
edsl/jobs/JobsRunnerStatusMixin.py +0 -115
edsl/jobs/base.py +0 -47
edsl/jobs/buckets.py +0 -166
edsl/jobs/runners/JobsRunnerDryRun.py +0 -19
edsl/jobs/runners/JobsRunnerStreaming.py +0 -54
edsl/jobs/task_management.py +0 -218
edsl/jobs/token_tracking.py +0 -78
edsl/language_models/DeepInfra.py +0 -69
edsl/language_models/OpenAI.py +0 -98
edsl/language_models/model_interfaces/GeminiPro.py +0 -66
edsl/language_models/model_interfaces/LanguageModelOpenAIFour.py +0 -8
edsl/language_models/model_interfaces/LanguageModelOpenAIThreeFiveTurbo.py +0 -8
edsl/language_models/model_interfaces/LlamaTwo13B.py +0 -21
edsl/language_models/model_interfaces/LlamaTwo70B.py +0 -21
edsl/language_models/model_interfaces/Mixtral8x7B.py +0 -24
edsl/language_models/registry.py +0 -81
edsl/language_models/schemas.py +0 -15
edsl/language_models/unused/ReplicateBase.py +0 -83
edsl/prompts/QuestionInstructionsBase.py +0 -6
edsl/prompts/library/agent_instructions.py +0 -29
edsl/prompts/library/agent_persona.py +0 -17
edsl/prompts/library/question_budget.py +0 -26
edsl/prompts/library/question_checkbox.py +0 -32
edsl/prompts/library/question_extract.py +0 -19
edsl/prompts/library/question_freetext.py +0 -14
edsl/prompts/library/question_linear_scale.py +0 -20
edsl/prompts/library/question_list.py +0 -22
edsl/prompts/library/question_multiple_choice.py +0 -44
edsl/prompts/library/question_numerical.py +0 -31
edsl/prompts/library/question_rank.py +0 -21
edsl/prompts/prompt_config.py +0 -33
edsl/prompts/registry.py +0 -185
edsl/questions/Question.py +0 -240
edsl/report/InputOutputDataTypes.py +0 -134
edsl/report/RegressionMixin.py +0 -28
edsl/report/ReportOutputs.py +0 -1228
edsl/report/ResultsFetchMixin.py +0 -106
edsl/report/ResultsOutputMixin.py +0 -14
edsl/report/demo.ipynb +0 -645
edsl/results/ResultsDBMixin.py +0 -184
edsl/surveys/SurveyFlowVisualizationMixin.py +0 -92
edsl/trackers/Tracker.py +0 -91
edsl/trackers/TrackerAPI.py +0 -196
edsl/trackers/TrackerTasks.py +0 -70
edsl/utilities/pastebin.py +0 -141
edsl-0.1.14.dist-info/METADATA +0 -69
edsl-0.1.14.dist-info/RECORD +0 -141
/edsl/{language_models/model_interfaces → inference_services}/__init__.py +0 -0
/edsl/{report/__init__.py → jobs/runners/JobsRunnerStatusData.py} +0 -0
/edsl/{trackers/__init__.py → language_models/ServiceDataSources.py} +0 -0
{edsl-0.1.14.dist-info → edsl-0.1.40.dist-info}/LICENSE +0 -0

edsl/results/ResultsDBMixin.py DELETED Viewed

@@ -1,184 +0,0 @@
-import pandas as pd
-import sqlite3
-from sqlalchemy import create_engine
-from enum import Enum
-class SQLDataShape(Enum):
-    WIDE = "wide"
-    LONG = "long"
-class ResultsDBMixin:
-    def rows(self):
-        for index, result in enumerate(self):
-            yield from result.rows(index)
-    def export_sql_dump(self, shape, filename):
-        shape_enum = self._get_shape_enum(shape)
-        conn = self.db(shape=shape_enum)
-        # Open file to write SQL dump
-        with open(filename, "w") as f:
-            for line in conn.iterdump():
-                f.write(f"{line}\n")
-        # Close the connection
-        conn.close()
-    def backup_db_to_file(self, shape, filename):
-        shape_enum = self._get_shape_enum(shape)
-        # Source database connection (in-memory)
-        source_conn = self.db(shape=shape_enum)
-        # Destination database connection (file)
-        dest_conn = sqlite3.connect(filename)
-        # Backup in-memory database to file
-        with source_conn:
-            source_conn.backup(dest_conn)
-        # Close both connections
-        source_conn.close()
-        dest_conn.close()
-    def db(self, shape: SQLDataShape, remove_prefix=False):
-        if shape == SQLDataShape.LONG:
-            # Step 2: Create a SQLite Database in Memory
-            conn = sqlite3.connect(":memory:")
-            create_table_query = """
-            CREATE TABLE self (
-                id INTEGER,
-                data_type TEXT,
-                key TEXT,
-                value TEXT
-            )
-            """
-            conn.execute(create_table_query)
-            # # Step 3: Insert the tuples into the table
-            list_of_tuples = list(self.rows())
-            insert_query = (
-                "INSERT INTO self (id, data_type, key, value) VALUES (?, ?, ?, ?)"
-            )
-            conn.executemany(insert_query, list_of_tuples)
-            conn.commit()
-            return conn
-        elif shape == SQLDataShape.WIDE:
-            db_uri = "sqlite:///:memory:"
-            # Create SQLAlchemy engine with the in-memory database connection string
-            engine = create_engine(db_uri)
-            # Convert DataFrame to SQLite in-memory database
-            df = self.to_pandas(remove_prefix=remove_prefix)
-            df.to_sql("self", engine, index=False, if_exists="replace")
-            # Create a connection to the SQLite database
-            conn = engine.connect()
-            return conn
-        else:
-            raise Exception("Invalid SQLDataShape")
-    def _get_shape_enum(self, shape: str):
-        if shape is None:
-            raise Exception("Must select either 'wide' or 'long' format")
-        elif shape == "wide":
-            return SQLDataShape.WIDE
-        elif shape == "long":
-            return SQLDataShape.LONG
-        else:
-            raise Exception("Invalid shape: must be either 'long' or 'wide'")
-    def sql(
-        self,
-        query: str,
-        shape: str,
-        remove_prefix: bool = False,
-        transpose: bool = None,
-        transpose_by: str = None,
-        csv: bool = False,
-    ):
-        """Execute a SQL query and return the results as a DataFrame.
-        :param query: The SQL query to execute
-        :param transpose: Transpose the DataFrame if True
-        :param transpose_by: Column to use as the index when transposing, otherwise the first column
-        :param csv: Return the DataFrame as a CSV string if True
-        """
-        shape_enum = self._get_shape_enum(shape)
-        conn = self.db(shape=shape_enum, remove_prefix=remove_prefix)
-        df = pd.read_sql_query(query, conn)
-        # Transpose the DataFrame if transpose is True
-        if transpose or transpose_by:
-            df = pd.DataFrame(df)
-            if transpose_by:
-                df = df.set_index(transpose_by)
-            else:
-                df = df.set_index(df.columns[0])
-            df = df.transpose()
-        # Return as CSV if output is "csv"
-        if csv:
-            return df.to_csv(index=False)
-        else:
-            return df
-    def show_schema(self, shape: str, remove_prefix: bool = False):
-        shape_enum = self._get_shape_enum(shape)
-        conn = self.db(shape=shape_enum, remove_prefix=remove_prefix)
-        if shape_enum == SQLDataShape.LONG:
-            # Query to get the schema of all tables
-            query = "SELECT type, name, sql FROM sqlite_master WHERE type='table'"
-            # Execute the query
-            cursor = conn.execute(query)
-            schema = cursor.fetchall()
-            # Close the connection
-            conn.close()
-            # Format and return the schema information
-            schema_info = ""
-            for row in schema:
-                schema_info += f"Type: {row[0]}, Name: {row[1]}, SQL: {row[2]}\n"
-            print(schema_info)
-        elif shape_enum == SQLDataShape.WIDE:
-            query = f"PRAGMA table_info(self)"
-            schema = pd.read_sql(query, conn)
-            print(schema)
-if __name__ == "__main__":
-    from edsl.results import Results
-    r = Results.example()
-    df = r.sql(
-        "select data_type, key, value from self where data_type = 'answer'",
-        shape="long",
-    )
-    print(df)
-    df = r.sql(
-        "select * from self",
-        shape="wide",
-    )
-    df = r.sql(
-        "select * from self",
-        shape="wide",
-    )
-    r.show_schema(shape="long")
-    df = r.sql(
-        "select * from self",
-        shape="wide",
-    )
-    print(df)

edsl/surveys/SurveyFlowVisualizationMixin.py DELETED Viewed

@@ -1,92 +0,0 @@
-import pydot
-import tempfile
-from IPython.display import Image
-from edsl.utilities import is_notebook
-from edsl.surveys.base import RulePriority, EndOfSurvey
-class SurveyFlowVisualizationMixin:
-    def show_flow(self):
-        "Creates an image showing the flow of users through the survey."
-        # Create a graph object
-        graph = pydot.Dot(graph_type="digraph")
-        # Add nodes
-        for index, question in enumerate(self.questions):
-            graph.add_node(
-                pydot.Node(
-                    f"Q{index}", label=f"{question.question_name}", shape="ellipse"
-                )
-            )
-        # Add an "EndOfSurvey" node
-        graph.add_node(
-            pydot.Node("EndOfSurvey", label="End of Survey", shape="rectangle")
-        )
-        # Add edges for normal flow
-        num_questions = len(self.questions)
-        for index in range(num_questions - 1):  # From Q1 to Q3
-            graph.add_edge(pydot.Edge(f"Q{index}", f"Q{index+1}"))
-        graph.add_edge(pydot.Edge(f"Q{num_questions-1}", "EndOfSurvey"))
-        relevant_rules = [
-            rule
-            for rule in self.rule_collection
-            if rule.priority > RulePriority.DEFAULT.value
-        ]
-        colors = [
-            "blue",
-            "red",
-            "purple",
-            "orange",
-            "pink",
-            "brown",
-            "grey",
-            "cyan",
-            "green",
-        ]
-        rule_colors = {
-            rule: colors[i % len(colors)] for i, rule in enumerate(relevant_rules)
-        }
-        for rule in relevant_rules:
-            color = rule_colors[rule]
-            edge_label = f"if {rule.expression}"
-            source_node = f"Q{rule.current_q}"
-            target_node = (
-                f"Q{rule.next_q}" if rule.next_q != EndOfSurvey else "EndOfSurvey"
-            )
-            edge = pydot.Edge(
-                source_node, target_node, label=edge_label, color=color, fontcolor=color
-            )
-            graph.add_edge(edge)
-        with tempfile.NamedTemporaryFile(delete=False, suffix=".png") as tmp_file:
-            try:
-                graph.write_png(tmp_file.name)
-            except FileNotFoundError:
-                print(
-                    """File not found. Most likely it's because you don't have graphviz installed. Please install it and try again.
-                        It's
-                        $ sudo apt-get install graphviz
-                        on Ubuntu.
-                    """
-                )
-            if is_notebook():
-                display(Image(tmp_file.name))
-            else:
-                import os
-                import sys
-                if os.name == "nt":  # Windows
-                    os.system(f"start {tmp_file.name}")
-                elif os.name == "posix":  # macOS, Linux, Unix, etc.
-                    os.system(
-                        f"open {tmp_file.name}"
-                        if sys.platform == "darwin"
-                        else f"xdg-open {tmp_file.name}"
-                    )

edsl/trackers/Tracker.py DELETED Viewed

@@ -1,91 +0,0 @@
-"""
-This an ABC for a tracker that monitors a Python queue.
-Contained within the namespace is a class called TrackerEvent, which is also an ABC.
-This is the kind of event that will be placed in the queue the tracker is monitoring.
-Each child class of TrackerEvent needs to know how to update the state of the tracker.
-Each child has to implement a tracked_values method which tells what values the
-tracker is tracking - this is so it can pretty-print them.
-All child classes have to implement an allowed_events class variable.
-"""
-import time
-from abc import ABC, abstractmethod
-from queue import Empty
-from edsl.utilities.interface import print_dict_with_rich
-class Tracker(ABC):
-    "Meant to be single-threaded"
-    class TrackerEvent(ABC):
-        "Each child event needs to know how to update the state of the tracker."
-        @abstractmethod
-        def apply(self, tracker):
-            pass
-    def __init__(self, event_queue, verbose=False):
-        self.event_queue = event_queue
-        self.observed_events = []
-        self.verbose = verbose
-        if self.verbose:
-            print("Tracker instantiated")
-    @abstractmethod
-    def allowed_events(self) -> set:
-        "What events (classes) are allowed to be placed in the queue?"
-        pass
-    @abstractmethod
-    def tracked_values(self) -> dict:
-        "What values are tracked by this tracker (should be flat dictionary)?"
-        pass
-    def get_from_queue(self):
-        """Gets events from the queue and stores them in a list.
-        It runs until the event_queue is empty.
-        """
-        while True:
-            try:
-                event = self.event_queue.get(block=False)
-            except Empty as e:
-                if self.verbose:
-                    print("The queue is empty.")
-                break
-            else:
-                self.observed_events.append(event)
-                self.process_event(event)
-                self.event_queue.task_done()
-    def __call__(self, all_done, interval=1):
-        if self.verbose:
-            print("Tracking thread is starting.")
-        while not all_done.is_set():
-            self.get_from_queue()
-            time.sleep(interval)
-        # Run one last time to get anything still left in the event_queue
-        self.get_from_queue()
-    def process_event(self, event):
-        """Processes an event from the event queue."""
-        ## diabling this for now as two error-prone:
-        # https://chat.openai.com/share/6e0e2ae2-30d7-4281-982a-a69a218c4e76
-        # if not isinstance(event, tuple(self.allowed_events())):
-        #    print(f"Event type: {type(event).__name__}")
-        #    print(f"Allowed events: {self.allowed_events()}")
-        #    raise ValueError(f"Invalid event type: {type(event).__name__}")
-        event.apply(self)
-        if self.verbose:
-            self.show_status()
-    def show_status(self):
-        """Prints the status of the interview manager."""
-        data = self.tracked_values()
-        print_dict_with_rich(data)

edsl/trackers/TrackerAPI.py DELETED Viewed

@@ -1,196 +0,0 @@
-"""This tracker tracks API calls."""
-import json
-import time
-from collections import namedtuple
-from threading import Lock, Event
-from edsl.trackers.Tracker import Tracker
-UsageRates = namedtuple(
-    "UsageRates",
-    [
-        "estimated_tokens_per_minute_k",
-        "pct_of_tpm_limit",
-        "estimated_requests_per_minute_k",
-        "pct_of_rpm_limit",
-    ],
-)
-class TrackerAPI(Tracker):
-    """ """
-    class APICallDetails(Tracker.TrackerEvent):
-        def __init__(self, details):
-            self.details = details
-        def apply(self, tracker):
-            with tracker.lock:
-                tracker.usage.append(self.details)
-    def __init__(
-        self, lock, monitored_queue, tokens_per_minute_k=90, requests_per_minute_k=2
-    ):
-        self.lock = lock
-        self.tokens_per_minute_k = tokens_per_minute_k
-        self.requests_per_minute_k = requests_per_minute_k
-        self.usage = []
-        super().__init__(monitored_queue)
-    def usage_rates(self, last_seconds=60):
-        with self.lock:
-            right_now = time.time()
-            relevant_usage = [
-                x
-                for x in self.usage
-                if (x["timestamp"] > right_now - last_seconds)
-                and not x["cached_response"]
-            ]
-            if relevant_usage == []:
-                return UsageRates(**{k: 0 for k in UsageRates._fields})
-            else:
-                elapsed_seconds = right_now - relevant_usage[0]["timestamp"]
-                total_tokens = sum([x["total_tokens"] for x in relevant_usage])
-                estimated_tokens_per_minute_k = round(
-                    total_tokens / (elapsed_seconds / 60.0) / 1000, 0
-                )
-                pct_of_tpm_limit = round(
-                    100 * estimated_tokens_per_minute_k / self.tokens_per_minute_k
-                )
-                estimated_requests_per_minute_k = round(
-                    len(relevant_usage) / (elapsed_seconds / 60.0) / 1000, 2
-                )
-                pct_of_rpm_limit = round(
-                    100 * estimated_requests_per_minute_k / self.requests_per_minute_k
-                )
-                usage_rates = UsageRates(
-                    estimated_tokens_per_minute_k=estimated_tokens_per_minute_k,
-                    pct_of_tpm_limit=pct_of_tpm_limit,
-                    estimated_requests_per_minute_k=estimated_requests_per_minute_k,
-                    pct_of_rpm_limit=pct_of_rpm_limit,
-                )
-                return usage_rates
-    def tracked_values(self) -> dict:
-        return {
-            "Calls": len(self.usage),
-        }
-    def allowed_events(self):
-        return set([TrackerAPI.APICallDetails])
-    @classmethod
-    def fromJSON(cls, filename):
-        """This loads a tracker from a JSON file. Just for testing purposes"""
-        with open(filename, "r") as f:
-            json_dict = f.read()
-        usage = json.loads(json_dict)
-        # pretend responses are not cached for each testing, as the
-        # usage_rate methods only compute w/ non-cached responses
-        [x.update({"cached_response": False}) for x in usage]
-        instance = cls(Lock(), None)
-        instance.usage = usage
-        return instance
-    def toJSON(self, filename="sample_data.json"):
-        with open(filename, "w") as f:
-            json.dump(self.usage, f)
-    def status(self):
-        """This prints the status of the interview manager, while interviews are doing on."""
-        estimated_length = 100
-        completed = self.status_tracker.complete
-        pct_completed = self.status_tracker.percentage_complete
-        usage_rates = self.current_tpm(10)
-        heartbeat = next(self.status_tracker.hearbeat)
-        status_str = (
-            f"{heartbeat} Completed: {completed} ({pct_completed} of total); "
-            f"Est. TPM (k): {usage_rates.estimated_tokens_per_minute_k: ,} ({usage_rates.frac_of_tpm_limit}% of lim.); "
-            f"Est. RPM (k): {usage_rates.estimated_requests_per_minute_k:,} ({usage_rates.frac_of_rpm_limit}% of lim.)); "
-        )
-        # Pad with spaces to reach the estimated length
-        padded_status_str = status_str.ljust(estimated_length)
-        print(f"\r{padded_status_str}", end="", flush=True)
-if __name__ == "__main__":
-    import textwrap
-    from language_models import LanguageModelOpenAIThreeFiveTurbo
-    m = LanguageModelOpenAIThreeFiveTurbo(use_cache=True)
-    # the language model is attached to the queue
-    print(m.api_queue)
-    # the tracker expects a lock and an event
-    lock = Lock()
-    all_done = Event()
-    # tracker attached to the queue
-    tracker = TrackerAPI(lock=lock, monitored_queue=m.api_queue)
-    # the queue is empty to start
-    print(f"Queue size: {m.api_queue.qsize()}")
-    # a call is made to the language model
-    raw = m.get_raw_response(
-        prompt="What is your favorite color?",
-        system_prompt=textwrap.dedent(
-            """\
-                            You are pretending to be a human taking a survey.
-                            Do not break character.
-                            """
-        ),
-    )
-    # sleep for a second, as queue puts are non-blocking
-    import time
-    print("Sleeping for 1 second")
-    time.sleep(1)
-    # see that the queue updated
-    print(f"Queue size: {m.api_queue.qsize()}")
-    print(m.parse_response(raw))
-    # indicate we are all done
-    all_done.set()
-    # have the tracker finish up
-    tracker(all_done, interval=1)
-    # how many calls did the API observe?
-    print(tracker.tracked_values())
-    # what is in the tracker queue?
-    print(tracker.usage)
-    # confirm that the API queue is empty
-    print(f"Queue size: {m.api_queue.qsize()}")
-    ## Next example - compute queue statistics
-    all_done = Event()
-    tracker_two = TrackerAPI(lock=lock, monitored_queue=m.api_queue)
-    for i in range(10):
-        raw = m.get_raw_response(
-            prompt=f"What emotions are associated with {i}?",
-            system_prompt=textwrap.dedent(
-                """\
-                                You are pretending to be a human taking a survey.
-                                Do not break character.
-                                """
-            ),
-        )
-    time.sleep(1)
-    all_done.set()
-    # have the tracker finish up
-    tracker(all_done, interval=1)
-    # print(tracker.usage)
-    tracker.toJSON(filename="sample_data.json")
-    # from .example_api_call_data import sample_data
-    tracker = TrackerAPI.fromJSON("sample_data.json")
-    print(tracker.usage)
-    print(tracker.usage_rates(1000000))

edsl/trackers/TrackerTasks.py DELETED Viewed

@@ -1,70 +0,0 @@
-from edsl.trackers.Tracker import Tracker
-from edsl.utilities.interface import heartbeat_generator, human_readable_labeler_creator
-class TrackerTasks(Tracker):
-    """ """
-    class WorkerActivated(Tracker.TrackerEvent):
-        def apply(self, tracker):
-            with tracker.lock:
-                tracker.active_workers += 1
-    class WorkerDeactivated(Tracker.TrackerEvent):
-        def apply(self, tracker):
-            with tracker.lock:
-                tracker.active_workers -= 1
-    class TaskStarted(Tracker.TrackerEvent):
-        def apply(self, tracker):
-            with tracker.lock:
-                tracker.interviews_started += 1
-    class TaskCompleted(Tracker.TrackerEvent):
-        def apply(self, tracker):
-            with tracker.lock:
-                tracker.interviews_completed += 1
-    class ThreadStatus(Tracker.TrackerEvent):
-        def __init__(self, thread_id, status):
-            self.thread_id = thread_id
-            self.status = status
-        def apply(self, tracker):
-            with tracker.lock:
-                tracker.thread_status[self.thread_id] = self.status
-    def __init__(self, num_interviews, lock, monitored_queue):
-        self.num_interviews = num_interviews  # how many interviews are there in total
-        self.lock = lock
-        self.hearbeat = heartbeat_generator()  # generator to show responses coming in
-        self.active_workers = 0
-        self.interviews_started = 0
-        self.interviews_completed = 0
-        self.thread_status = dict()
-        # this is a function that takes thread IDs and turns them into successive integers
-        self.human_readable_labeler = human_readable_labeler_creator()
-        super().__init__(monitored_queue)
-    def tracked_values(self) -> dict:
-        return {
-            "Active Workers": self.active_workers,
-            "Interviews Started": self.interviews_started,
-            "Completed Interviews": self.interviews_completed,
-        }
-    def allowed_events(self):
-        return set(
-            [
-                TrackerTasks.WorkerActivated,
-                TrackerTasks.WorkerDeactivated,
-                TrackerTasks.TaskStarted,
-                TrackerTasks.TaskCompleted,
-                TrackerTasks.ThreadStatus,
-            ]
-        )
-    @property
-    def percentage_complete(self):
-        return round(100 * self.interviews_completed / self.num_interviews, 2)

edsl 0.1.14__py3-none-any.whl → 0.1.40__py3-none-any.whl

edsl 0.1.14py3-none-any.whl → 0.1.40py3-none-any.whl