edsl 0.1.14__py3-none-any.whl → 0.1.40__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- edsl/Base.py +348 -38
- edsl/BaseDiff.py +260 -0
- edsl/TemplateLoader.py +24 -0
- edsl/__init__.py +46 -10
- edsl/__version__.py +1 -0
- edsl/agents/Agent.py +842 -144
- edsl/agents/AgentList.py +521 -25
- edsl/agents/Invigilator.py +250 -374
- edsl/agents/InvigilatorBase.py +257 -0
- edsl/agents/PromptConstructor.py +272 -0
- edsl/agents/QuestionInstructionPromptBuilder.py +128 -0
- edsl/agents/QuestionTemplateReplacementsBuilder.py +137 -0
- edsl/agents/descriptors.py +43 -13
- edsl/agents/prompt_helpers.py +129 -0
- edsl/agents/question_option_processor.py +172 -0
- edsl/auto/AutoStudy.py +130 -0
- edsl/auto/StageBase.py +243 -0
- edsl/auto/StageGenerateSurvey.py +178 -0
- edsl/auto/StageLabelQuestions.py +125 -0
- edsl/auto/StagePersona.py +61 -0
- edsl/auto/StagePersonaDimensionValueRanges.py +88 -0
- edsl/auto/StagePersonaDimensionValues.py +74 -0
- edsl/auto/StagePersonaDimensions.py +69 -0
- edsl/auto/StageQuestions.py +74 -0
- edsl/auto/SurveyCreatorPipeline.py +21 -0
- edsl/auto/utilities.py +218 -0
- edsl/base/Base.py +279 -0
- edsl/config.py +121 -104
- edsl/conversation/Conversation.py +290 -0
- edsl/conversation/car_buying.py +59 -0
- edsl/conversation/chips.py +95 -0
- edsl/conversation/mug_negotiation.py +81 -0
- edsl/conversation/next_speaker_utilities.py +93 -0
- edsl/coop/CoopFunctionsMixin.py +15 -0
- edsl/coop/ExpectedParrotKeyHandler.py +125 -0
- edsl/coop/PriceFetcher.py +54 -0
- edsl/coop/__init__.py +1 -0
- edsl/coop/coop.py +1029 -134
- edsl/coop/utils.py +131 -0
- edsl/data/Cache.py +560 -89
- edsl/data/CacheEntry.py +230 -0
- edsl/data/CacheHandler.py +168 -0
- edsl/data/RemoteCacheSync.py +186 -0
- edsl/data/SQLiteDict.py +292 -0
- edsl/data/__init__.py +5 -3
- edsl/data/orm.py +6 -33
- edsl/data_transfer_models.py +74 -27
- edsl/enums.py +165 -8
- edsl/exceptions/BaseException.py +21 -0
- edsl/exceptions/__init__.py +52 -46
- edsl/exceptions/agents.py +33 -15
- edsl/exceptions/cache.py +5 -0
- edsl/exceptions/coop.py +8 -0
- edsl/exceptions/general.py +34 -0
- edsl/exceptions/inference_services.py +5 -0
- edsl/exceptions/jobs.py +15 -0
- edsl/exceptions/language_models.py +46 -1
- edsl/exceptions/questions.py +80 -5
- edsl/exceptions/results.py +16 -5
- edsl/exceptions/scenarios.py +29 -0
- edsl/exceptions/surveys.py +13 -10
- edsl/inference_services/AnthropicService.py +106 -0
- edsl/inference_services/AvailableModelCacheHandler.py +184 -0
- edsl/inference_services/AvailableModelFetcher.py +215 -0
- edsl/inference_services/AwsBedrock.py +118 -0
- edsl/inference_services/AzureAI.py +215 -0
- edsl/inference_services/DeepInfraService.py +18 -0
- edsl/inference_services/GoogleService.py +143 -0
- edsl/inference_services/GroqService.py +20 -0
- edsl/inference_services/InferenceServiceABC.py +80 -0
- edsl/inference_services/InferenceServicesCollection.py +138 -0
- edsl/inference_services/MistralAIService.py +120 -0
- edsl/inference_services/OllamaService.py +18 -0
- edsl/inference_services/OpenAIService.py +236 -0
- edsl/inference_services/PerplexityService.py +160 -0
- edsl/inference_services/ServiceAvailability.py +135 -0
- edsl/inference_services/TestService.py +90 -0
- edsl/inference_services/TogetherAIService.py +172 -0
- edsl/inference_services/data_structures.py +134 -0
- edsl/inference_services/models_available_cache.py +118 -0
- edsl/inference_services/rate_limits_cache.py +25 -0
- edsl/inference_services/registry.py +41 -0
- edsl/inference_services/write_available.py +10 -0
- edsl/jobs/AnswerQuestionFunctionConstructor.py +223 -0
- edsl/jobs/Answers.py +21 -20
- edsl/jobs/FetchInvigilator.py +47 -0
- edsl/jobs/InterviewTaskManager.py +98 -0
- edsl/jobs/InterviewsConstructor.py +50 -0
- edsl/jobs/Jobs.py +684 -204
- edsl/jobs/JobsChecks.py +172 -0
- edsl/jobs/JobsComponentConstructor.py +189 -0
- edsl/jobs/JobsPrompts.py +270 -0
- edsl/jobs/JobsRemoteInferenceHandler.py +311 -0
- edsl/jobs/JobsRemoteInferenceLogger.py +239 -0
- edsl/jobs/RequestTokenEstimator.py +30 -0
- edsl/jobs/async_interview_runner.py +138 -0
- edsl/jobs/buckets/BucketCollection.py +104 -0
- edsl/jobs/buckets/ModelBuckets.py +65 -0
- edsl/jobs/buckets/TokenBucket.py +283 -0
- edsl/jobs/buckets/TokenBucketAPI.py +211 -0
- edsl/jobs/buckets/TokenBucketClient.py +191 -0
- edsl/jobs/check_survey_scenario_compatibility.py +85 -0
- edsl/jobs/data_structures.py +120 -0
- edsl/jobs/decorators.py +35 -0
- edsl/jobs/interviews/Interview.py +392 -0
- edsl/jobs/interviews/InterviewExceptionCollection.py +99 -0
- edsl/jobs/interviews/InterviewExceptionEntry.py +186 -0
- edsl/jobs/interviews/InterviewStatistic.py +63 -0
- edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -0
- edsl/jobs/interviews/InterviewStatusDictionary.py +78 -0
- edsl/jobs/interviews/InterviewStatusLog.py +92 -0
- edsl/jobs/interviews/ReportErrors.py +66 -0
- edsl/jobs/interviews/interview_status_enum.py +9 -0
- edsl/jobs/jobs_status_enums.py +9 -0
- edsl/jobs/loggers/HTMLTableJobLogger.py +304 -0
- edsl/jobs/results_exceptions_handler.py +98 -0
- edsl/jobs/runners/JobsRunnerAsyncio.py +151 -110
- edsl/jobs/runners/JobsRunnerStatus.py +298 -0
- edsl/jobs/tasks/QuestionTaskCreator.py +244 -0
- edsl/jobs/tasks/TaskCreators.py +64 -0
- edsl/jobs/tasks/TaskHistory.py +470 -0
- edsl/jobs/tasks/TaskStatusLog.py +23 -0
- edsl/jobs/tasks/task_status_enum.py +161 -0
- edsl/jobs/tokens/InterviewTokenUsage.py +27 -0
- edsl/jobs/tokens/TokenUsage.py +34 -0
- edsl/language_models/ComputeCost.py +63 -0
- edsl/language_models/LanguageModel.py +507 -386
- edsl/language_models/ModelList.py +164 -0
- edsl/language_models/PriceManager.py +127 -0
- edsl/language_models/RawResponseHandler.py +106 -0
- edsl/language_models/RegisterLanguageModelsMeta.py +184 -0
- edsl/language_models/__init__.py +1 -8
- edsl/language_models/fake_openai_call.py +15 -0
- edsl/language_models/fake_openai_service.py +61 -0
- edsl/language_models/key_management/KeyLookup.py +63 -0
- edsl/language_models/key_management/KeyLookupBuilder.py +273 -0
- edsl/language_models/key_management/KeyLookupCollection.py +38 -0
- edsl/language_models/key_management/__init__.py +0 -0
- edsl/language_models/key_management/models.py +131 -0
- edsl/language_models/model.py +256 -0
- edsl/language_models/repair.py +109 -41
- edsl/language_models/utilities.py +65 -0
- edsl/notebooks/Notebook.py +263 -0
- edsl/notebooks/NotebookToLaTeX.py +142 -0
- edsl/notebooks/__init__.py +1 -0
- edsl/prompts/Prompt.py +222 -93
- edsl/prompts/__init__.py +1 -1
- edsl/questions/ExceptionExplainer.py +77 -0
- edsl/questions/HTMLQuestion.py +103 -0
- edsl/questions/QuestionBase.py +518 -0
- edsl/questions/QuestionBasePromptsMixin.py +221 -0
- edsl/questions/QuestionBudget.py +164 -67
- edsl/questions/QuestionCheckBox.py +281 -62
- edsl/questions/QuestionDict.py +343 -0
- edsl/questions/QuestionExtract.py +136 -50
- edsl/questions/QuestionFreeText.py +79 -55
- edsl/questions/QuestionFunctional.py +138 -41
- edsl/questions/QuestionList.py +184 -57
- edsl/questions/QuestionMatrix.py +265 -0
- edsl/questions/QuestionMultipleChoice.py +293 -69
- edsl/questions/QuestionNumerical.py +109 -56
- edsl/questions/QuestionRank.py +244 -49
- edsl/questions/Quick.py +41 -0
- edsl/questions/SimpleAskMixin.py +74 -0
- edsl/questions/__init__.py +9 -6
- edsl/questions/{AnswerValidatorMixin.py → answer_validator_mixin.py} +153 -38
- edsl/questions/compose_questions.py +13 -7
- edsl/questions/data_structures.py +20 -0
- edsl/questions/decorators.py +21 -0
- edsl/questions/derived/QuestionLikertFive.py +28 -26
- edsl/questions/derived/QuestionLinearScale.py +41 -28
- edsl/questions/derived/QuestionTopK.py +34 -26
- edsl/questions/derived/QuestionYesNo.py +40 -27
- edsl/questions/descriptors.py +228 -74
- edsl/questions/loop_processor.py +149 -0
- edsl/questions/prompt_templates/question_budget.jinja +13 -0
- edsl/questions/prompt_templates/question_checkbox.jinja +32 -0
- edsl/questions/prompt_templates/question_extract.jinja +11 -0
- edsl/questions/prompt_templates/question_free_text.jinja +3 -0
- edsl/questions/prompt_templates/question_linear_scale.jinja +11 -0
- edsl/questions/prompt_templates/question_list.jinja +17 -0
- edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -0
- edsl/questions/prompt_templates/question_numerical.jinja +37 -0
- edsl/questions/question_base_gen_mixin.py +168 -0
- edsl/questions/question_registry.py +130 -46
- edsl/questions/register_questions_meta.py +71 -0
- edsl/questions/response_validator_abc.py +188 -0
- edsl/questions/response_validator_factory.py +34 -0
- edsl/questions/settings.py +5 -2
- edsl/questions/templates/__init__.py +0 -0
- edsl/questions/templates/budget/__init__.py +0 -0
- edsl/questions/templates/budget/answering_instructions.jinja +7 -0
- edsl/questions/templates/budget/question_presentation.jinja +7 -0
- edsl/questions/templates/checkbox/__init__.py +0 -0
- edsl/questions/templates/checkbox/answering_instructions.jinja +10 -0
- edsl/questions/templates/checkbox/question_presentation.jinja +22 -0
- edsl/questions/templates/dict/__init__.py +0 -0
- edsl/questions/templates/dict/answering_instructions.jinja +21 -0
- edsl/questions/templates/dict/question_presentation.jinja +1 -0
- edsl/questions/templates/extract/__init__.py +0 -0
- edsl/questions/templates/extract/answering_instructions.jinja +7 -0
- edsl/questions/templates/extract/question_presentation.jinja +1 -0
- edsl/questions/templates/free_text/__init__.py +0 -0
- edsl/questions/templates/free_text/answering_instructions.jinja +0 -0
- edsl/questions/templates/free_text/question_presentation.jinja +1 -0
- edsl/questions/templates/likert_five/__init__.py +0 -0
- edsl/questions/templates/likert_five/answering_instructions.jinja +10 -0
- edsl/questions/templates/likert_five/question_presentation.jinja +12 -0
- edsl/questions/templates/linear_scale/__init__.py +0 -0
- edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -0
- edsl/questions/templates/linear_scale/question_presentation.jinja +5 -0
- edsl/questions/templates/list/__init__.py +0 -0
- edsl/questions/templates/list/answering_instructions.jinja +4 -0
- edsl/questions/templates/list/question_presentation.jinja +5 -0
- edsl/questions/templates/matrix/__init__.py +1 -0
- edsl/questions/templates/matrix/answering_instructions.jinja +5 -0
- edsl/questions/templates/matrix/question_presentation.jinja +20 -0
- edsl/questions/templates/multiple_choice/__init__.py +0 -0
- edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -0
- edsl/questions/templates/multiple_choice/html.jinja +0 -0
- edsl/questions/templates/multiple_choice/question_presentation.jinja +12 -0
- edsl/questions/templates/numerical/__init__.py +0 -0
- edsl/questions/templates/numerical/answering_instructions.jinja +7 -0
- edsl/questions/templates/numerical/question_presentation.jinja +7 -0
- edsl/questions/templates/rank/__init__.py +0 -0
- edsl/questions/templates/rank/answering_instructions.jinja +11 -0
- edsl/questions/templates/rank/question_presentation.jinja +15 -0
- edsl/questions/templates/top_k/__init__.py +0 -0
- edsl/questions/templates/top_k/answering_instructions.jinja +8 -0
- edsl/questions/templates/top_k/question_presentation.jinja +22 -0
- edsl/questions/templates/yes_no/__init__.py +0 -0
- edsl/questions/templates/yes_no/answering_instructions.jinja +6 -0
- edsl/questions/templates/yes_no/question_presentation.jinja +12 -0
- edsl/results/CSSParameterizer.py +108 -0
- edsl/results/Dataset.py +550 -19
- edsl/results/DatasetExportMixin.py +594 -0
- edsl/results/DatasetTree.py +295 -0
- edsl/results/MarkdownToDocx.py +122 -0
- edsl/results/MarkdownToPDF.py +111 -0
- edsl/results/Result.py +477 -173
- edsl/results/Results.py +987 -269
- edsl/results/ResultsExportMixin.py +28 -125
- edsl/results/ResultsGGMixin.py +83 -15
- edsl/results/TableDisplay.py +125 -0
- edsl/results/TextEditor.py +50 -0
- edsl/results/__init__.py +1 -1
- edsl/results/file_exports.py +252 -0
- edsl/results/results_fetch_mixin.py +33 -0
- edsl/results/results_selector.py +145 -0
- edsl/results/results_tools_mixin.py +98 -0
- edsl/results/smart_objects.py +96 -0
- edsl/results/table_data_class.py +12 -0
- edsl/results/table_display.css +78 -0
- edsl/results/table_renderers.py +118 -0
- edsl/results/tree_explore.py +115 -0
- edsl/scenarios/ConstructDownloadLink.py +109 -0
- edsl/scenarios/DocumentChunker.py +102 -0
- edsl/scenarios/DocxScenario.py +16 -0
- edsl/scenarios/FileStore.py +543 -0
- edsl/scenarios/PdfExtractor.py +40 -0
- edsl/scenarios/Scenario.py +431 -62
- edsl/scenarios/ScenarioHtmlMixin.py +65 -0
- edsl/scenarios/ScenarioList.py +1415 -45
- edsl/scenarios/ScenarioListExportMixin.py +45 -0
- edsl/scenarios/ScenarioListPdfMixin.py +239 -0
- edsl/scenarios/__init__.py +2 -0
- edsl/scenarios/directory_scanner.py +96 -0
- edsl/scenarios/file_methods.py +85 -0
- edsl/scenarios/handlers/__init__.py +13 -0
- edsl/scenarios/handlers/csv.py +49 -0
- edsl/scenarios/handlers/docx.py +76 -0
- edsl/scenarios/handlers/html.py +37 -0
- edsl/scenarios/handlers/json.py +111 -0
- edsl/scenarios/handlers/latex.py +5 -0
- edsl/scenarios/handlers/md.py +51 -0
- edsl/scenarios/handlers/pdf.py +68 -0
- edsl/scenarios/handlers/png.py +39 -0
- edsl/scenarios/handlers/pptx.py +105 -0
- edsl/scenarios/handlers/py.py +294 -0
- edsl/scenarios/handlers/sql.py +313 -0
- edsl/scenarios/handlers/sqlite.py +149 -0
- edsl/scenarios/handlers/txt.py +33 -0
- edsl/scenarios/scenario_join.py +131 -0
- edsl/scenarios/scenario_selector.py +156 -0
- edsl/shared.py +1 -0
- edsl/study/ObjectEntry.py +173 -0
- edsl/study/ProofOfWork.py +113 -0
- edsl/study/SnapShot.py +80 -0
- edsl/study/Study.py +521 -0
- edsl/study/__init__.py +4 -0
- edsl/surveys/ConstructDAG.py +92 -0
- edsl/surveys/DAG.py +92 -11
- edsl/surveys/EditSurvey.py +221 -0
- edsl/surveys/InstructionHandler.py +100 -0
- edsl/surveys/Memory.py +9 -4
- edsl/surveys/MemoryManagement.py +72 -0
- edsl/surveys/MemoryPlan.py +156 -35
- edsl/surveys/Rule.py +221 -74
- edsl/surveys/RuleCollection.py +241 -61
- edsl/surveys/RuleManager.py +172 -0
- edsl/surveys/Simulator.py +75 -0
- edsl/surveys/Survey.py +1079 -339
- edsl/surveys/SurveyCSS.py +273 -0
- edsl/surveys/SurveyExportMixin.py +235 -40
- edsl/surveys/SurveyFlowVisualization.py +181 -0
- edsl/surveys/SurveyQualtricsImport.py +284 -0
- edsl/surveys/SurveyToApp.py +141 -0
- edsl/surveys/__init__.py +4 -2
- edsl/surveys/base.py +19 -3
- edsl/surveys/descriptors.py +17 -6
- edsl/surveys/instructions/ChangeInstruction.py +48 -0
- edsl/surveys/instructions/Instruction.py +56 -0
- edsl/surveys/instructions/InstructionCollection.py +82 -0
- edsl/surveys/instructions/__init__.py +0 -0
- edsl/templates/error_reporting/base.html +24 -0
- edsl/templates/error_reporting/exceptions_by_model.html +35 -0
- edsl/templates/error_reporting/exceptions_by_question_name.html +17 -0
- edsl/templates/error_reporting/exceptions_by_type.html +17 -0
- edsl/templates/error_reporting/interview_details.html +116 -0
- edsl/templates/error_reporting/interviews.html +19 -0
- edsl/templates/error_reporting/overview.html +5 -0
- edsl/templates/error_reporting/performance_plot.html +2 -0
- edsl/templates/error_reporting/report.css +74 -0
- edsl/templates/error_reporting/report.html +118 -0
- edsl/templates/error_reporting/report.js +25 -0
- edsl/tools/__init__.py +1 -0
- edsl/tools/clusters.py +192 -0
- edsl/tools/embeddings.py +27 -0
- edsl/tools/embeddings_plotting.py +118 -0
- edsl/tools/plotting.py +112 -0
- edsl/tools/summarize.py +18 -0
- edsl/utilities/PrettyList.py +56 -0
- edsl/utilities/SystemInfo.py +5 -0
- edsl/utilities/__init__.py +21 -20
- edsl/utilities/ast_utilities.py +3 -0
- edsl/utilities/data/Registry.py +2 -0
- edsl/utilities/decorators.py +41 -0
- edsl/utilities/gcp_bucket/__init__.py +0 -0
- edsl/utilities/gcp_bucket/cloud_storage.py +96 -0
- edsl/utilities/interface.py +310 -60
- edsl/utilities/is_notebook.py +18 -0
- edsl/utilities/is_valid_variable_name.py +11 -0
- edsl/utilities/naming_utilities.py +263 -0
- edsl/utilities/remove_edsl_version.py +24 -0
- edsl/utilities/repair_functions.py +28 -0
- edsl/utilities/restricted_python.py +70 -0
- edsl/utilities/utilities.py +203 -13
- edsl-0.1.40.dist-info/METADATA +111 -0
- edsl-0.1.40.dist-info/RECORD +362 -0
- {edsl-0.1.14.dist-info → edsl-0.1.40.dist-info}/WHEEL +1 -1
- edsl/agents/AgentListExportMixin.py +0 -24
- edsl/coop/old.py +0 -31
- edsl/data/Database.py +0 -141
- edsl/data/crud.py +0 -121
- edsl/jobs/Interview.py +0 -417
- edsl/jobs/JobsRunner.py +0 -63
- edsl/jobs/JobsRunnerStatusMixin.py +0 -115
- edsl/jobs/base.py +0 -47
- edsl/jobs/buckets.py +0 -166
- edsl/jobs/runners/JobsRunnerDryRun.py +0 -19
- edsl/jobs/runners/JobsRunnerStreaming.py +0 -54
- edsl/jobs/task_management.py +0 -218
- edsl/jobs/token_tracking.py +0 -78
- edsl/language_models/DeepInfra.py +0 -69
- edsl/language_models/OpenAI.py +0 -98
- edsl/language_models/model_interfaces/GeminiPro.py +0 -66
- edsl/language_models/model_interfaces/LanguageModelOpenAIFour.py +0 -8
- edsl/language_models/model_interfaces/LanguageModelOpenAIThreeFiveTurbo.py +0 -8
- edsl/language_models/model_interfaces/LlamaTwo13B.py +0 -21
- edsl/language_models/model_interfaces/LlamaTwo70B.py +0 -21
- edsl/language_models/model_interfaces/Mixtral8x7B.py +0 -24
- edsl/language_models/registry.py +0 -81
- edsl/language_models/schemas.py +0 -15
- edsl/language_models/unused/ReplicateBase.py +0 -83
- edsl/prompts/QuestionInstructionsBase.py +0 -6
- edsl/prompts/library/agent_instructions.py +0 -29
- edsl/prompts/library/agent_persona.py +0 -17
- edsl/prompts/library/question_budget.py +0 -26
- edsl/prompts/library/question_checkbox.py +0 -32
- edsl/prompts/library/question_extract.py +0 -19
- edsl/prompts/library/question_freetext.py +0 -14
- edsl/prompts/library/question_linear_scale.py +0 -20
- edsl/prompts/library/question_list.py +0 -22
- edsl/prompts/library/question_multiple_choice.py +0 -44
- edsl/prompts/library/question_numerical.py +0 -31
- edsl/prompts/library/question_rank.py +0 -21
- edsl/prompts/prompt_config.py +0 -33
- edsl/prompts/registry.py +0 -185
- edsl/questions/Question.py +0 -240
- edsl/report/InputOutputDataTypes.py +0 -134
- edsl/report/RegressionMixin.py +0 -28
- edsl/report/ReportOutputs.py +0 -1228
- edsl/report/ResultsFetchMixin.py +0 -106
- edsl/report/ResultsOutputMixin.py +0 -14
- edsl/report/demo.ipynb +0 -645
- edsl/results/ResultsDBMixin.py +0 -184
- edsl/surveys/SurveyFlowVisualizationMixin.py +0 -92
- edsl/trackers/Tracker.py +0 -91
- edsl/trackers/TrackerAPI.py +0 -196
- edsl/trackers/TrackerTasks.py +0 -70
- edsl/utilities/pastebin.py +0 -141
- edsl-0.1.14.dist-info/METADATA +0 -69
- edsl-0.1.14.dist-info/RECORD +0 -141
- /edsl/{language_models/model_interfaces → inference_services}/__init__.py +0 -0
- /edsl/{report/__init__.py → jobs/runners/JobsRunnerStatusData.py} +0 -0
- /edsl/{trackers/__init__.py → language_models/ServiceDataSources.py} +0 -0
- {edsl-0.1.14.dist-info → edsl-0.1.40.dist-info}/LICENSE +0 -0
edsl/study/Study.py
ADDED
@@ -0,0 +1,521 @@
|
|
1
|
+
import copy
|
2
|
+
import inspect
|
3
|
+
import json
|
4
|
+
import os
|
5
|
+
import platform
|
6
|
+
import socket
|
7
|
+
from datetime import datetime
|
8
|
+
from typing import Dict, Optional, Union
|
9
|
+
from uuid import UUID, uuid4
|
10
|
+
|
11
|
+
from edsl.data.Cache import Cache
|
12
|
+
from edsl import set_session_cache, unset_session_cache
|
13
|
+
from edsl.utilities.utilities import dict_hash
|
14
|
+
from edsl.study.ObjectEntry import ObjectEntry
|
15
|
+
from edsl.study.ProofOfWork import ProofOfWork
|
16
|
+
from edsl.study.SnapShot import SnapShot
|
17
|
+
|
18
|
+
|
19
|
+
class Study:
|
20
|
+
"""A study organizes a series of EDSL objects.
|
21
|
+
|
22
|
+
```python
|
23
|
+
with Study(name = "cool_study") as study:
|
24
|
+
q = QuestionFreeText.example()
|
25
|
+
results = q.run()
|
26
|
+
```
|
27
|
+
|
28
|
+
The `study` object is a context manager.
|
29
|
+
It lets you group a series of events and objects together.
|
30
|
+
|
31
|
+
>>> with Study(name = "cool_study", verbose = False) as study:
|
32
|
+
... from edsl import QuestionFreeText
|
33
|
+
... q = QuestionFreeText.example()
|
34
|
+
>>> len(study.objects)
|
35
|
+
1
|
36
|
+
>>> _ = os.system("rm cool_study.json")
|
37
|
+
|
38
|
+
|
39
|
+
It records all the edsl objects that are created during the study.
|
40
|
+
On exit, it saves them to a study file.
|
41
|
+
|
42
|
+
"""
|
43
|
+
|
44
|
+
def __init__(
    self,
    name: Optional[str] = None,
    filename: Optional[str] = None,
    description: Optional[str] = None,
    objects: Optional[Dict[str, ObjectEntry]] = None,
    cache: Optional[Cache] = None,
    coop: bool = False,
    use_study_cache=True,
    overwrite_on_change=True,
    proof_of_work=None,
    proof_of_work_difficulty: int = None,
    namespace: Optional[dict] = None,
    verbose: Optional[bool] = True,
):
    """Create a study, resuming from ``<filename>.json`` when that file exists.

    When a non-empty ``<filename>.json`` is found, the saved state is loaded
    via ``_load_from_file`` and ``name``, ``description``, ``objects``,
    ``cache`` and ``proof_of_work`` are not applied from the arguments.
    Otherwise a fresh study is initialised from the arguments.

    :param name: The name of the study; also used as the file stem when
        ``filename`` is not given.
    :param filename: The path to the study file, without the ``.json`` suffix.
    :param description: A description of the study.
    :param objects: A dictionary of objects to add to the study.
    :param cache: A cache object to (potentially) use for the study.
    :param coop: Whether to push the study to coop.
    :param use_study_cache: Whether to use the study cache.
    :param overwrite_on_change: Whether to overwrite the study file if it has changed.
    :param proof_of_work: Proof-of-work object for a fresh study; a new
        ``ProofOfWork()`` is created when this is falsy.
    :param proof_of_work_difficulty: Stored on the instance as given.
    :param namespace: Stored as ``_namespace`` (``None`` when falsy).
    :param verbose: Whether to print progress messages.
    :raises ValueError: If neither ``name`` nor ``filename`` is provided.

    >>> s = Study()
    Traceback (most recent call last):
    ...
    ValueError: You must provide a name or a filename for the study.

    """
    self.verbose = verbose

    if name is None and filename is None:
        raise ValueError("You must provide a name or a filename for the study.")

    # Without an explicit filename, the study name doubles as the file stem.
    self.filename = name if filename is None else filename

    # Resume only from a study file that exists and is not empty.
    resume_from_disk = False
    if self.filename:
        study_path = self.filename + ".json"
        resume_from_disk = (
            os.path.exists(study_path) and os.path.getsize(study_path) > 0
        )

    if resume_from_disk:
        if self.verbose:
            print(f"Using existing study file {self.filename}.json")
        self._load_from_file()
    else:
        self.name = name
        self.description = description
        self.objects = objects or {}
        self.cache = cache or Cache()
        self.proof_of_work = proof_of_work or ProofOfWork()

    # These always overwrite the saved study
    self.coop = coop
    self.use_study_cache = use_study_cache
    self.overwrite_on_change = overwrite_on_change
    self.proof_of_work_difficulty = proof_of_work_difficulty

    # Baseline of the objects present at construction time.
    self.starting_objects = copy.deepcopy(self.objects)

    self._namespace = namespace if namespace else None

    self._create_mapping_dicts()
|
114
|
+
|
115
|
+
@property
def namespace(self):
    """Return the variables visible from the frames that can see ``Study``.

    The value is recomputed by ``_find_stack`` on every access.
    """
    visible_variables = self._find_stack()
    return visible_variables
|
118
|
+
|
119
|
+
def _find_stack(self) -> dict:
    """Collect the variables visible from every frame that can see ``Study``.

    Walks the call stack from this method outward. A frame is a candidate
    when the name ``"Study"`` is present in its globals. For each candidate
    the globals and then the locals are merged into the result, so values
    from outer frames override values from inner frames.

    This helper's own locals are deliberately left out: they would inject
    live frame objects (and the result dict itself) into the returned
    namespace, creating reference cycles.

    :return: A dict of variable name -> value gathered from the candidate frames.
    """
    own_frame = inspect.currentframe()
    frame = own_frame
    found_variables = {}
    try:
        while frame is not None:
            if "Study" in frame.f_globals:
                found_variables.update(frame.f_globals)
                if frame is not own_frame:
                    found_variables.update(frame.f_locals)
            frame = frame.f_back
    finally:
        # Drop frame references promptly, as the ``inspect`` docs recommend,
        # so the stack is not kept alive through a reference cycle.
        del own_frame, frame
    return found_variables
|
137
|
+
|
138
|
+
def explore_stacks(self):
    """Debugging aid: print the globals and locals of every frame on the stack.

    Walks from this method's own frame outward. For each frame it prints the
    module ``__name__`` from the frame's globals, the global names and the
    local names.

    :return: A dict mapping frame depth (0 is this method's own frame) to
        whether the name ``"Study"`` is present in that frame's globals.
    """
    frame = inspect.currentframe()
    count = 0
    d = {}
    while frame:
        d[count] = "Study" in frame.f_globals.keys()
        count += 1
        # Function-scope import; it is executed on each loop iteration.
        from rich import print as rprint

        print("Globals:")
        rprint(frame.f_globals["__name__"])
        rprint(frame.f_globals.keys())
        print("Locals:")
        rprint(frame.f_locals.keys())
        print("\n")
        # Step outward to the caller's frame.
        frame = frame.f_back
    return d
|
155
|
+
|
156
|
+
def _create_mapping_dicts(self):
    """Rebuild the name lookups from ``self.objects``.

    ``_name_to_object`` maps a study-level name to the stored object and
    ``_hash_to_name`` maps an object hash to that study-level name. The
    first entry for a variable name keeps the name as is; each later entry
    with the same variable name gets ``_<n>`` appended, where ``n`` is its
    occurrence count (so the second one ends in ``_2``).
    ``_name_to_oe`` is reset to an empty dict and not populated here.
    """
    self._name_to_object = {}
    self._hash_to_name = {}
    self._name_to_oe = {}
    occurrences = {}
    for obj_hash, entry in self.objects.items():
        base_name = entry.variable_name
        seen_so_far = occurrences.get(base_name, 0) + 1
        occurrences[base_name] = seen_so_far
        if seen_so_far == 1:
            study_name = base_name
        else:
            study_name = base_name + "_" + str(seen_so_far)
        self._name_to_object[study_name] = entry.object
        self._hash_to_name[obj_hash] = study_name
|
170
|
+
|
171
|
+
def __len__(self):
    """Return the number of object entries held by the study."""
    tracked_objects = self.objects
    return len(tracked_objects)
|
173
|
+
|
174
|
+
def __eq__(self, other):
    """Compare two studies by the set of object hashes they hold.

    :param other: The object to compare against.
    :return: ``True``/``False`` when ``other`` exposes ``objects.keys()``;
        ``NotImplemented`` otherwise, so that comparing a study with an
        unrelated value (e.g. ``study == 5``) falls back to Python's default
        handling instead of raising ``AttributeError``.
    """
    try:
        other_keys = other.objects.keys()
    except AttributeError:
        return NotImplemented
    return self.objects.keys() == other_keys
|
176
|
+
|
177
|
+
@property
def name_to_object(self):
    """Map each study-level name to its stored object.

    The mappings are rebuilt from ``self.objects`` on every access.

    >>> s = Study.example()
    >>> s.name_to_object
    {'q': Question('free_text', question_name = \"""how_are_you\""", question_text = \"""How are you?\""")}
    """
    self._create_mapping_dicts()
    objects_by_name = self._name_to_object
    return objects_by_name
|
186
|
+
|
187
|
+
@property
def hash_to_name(self):
    """Map each object hash to its study-level name.

    The mappings are rebuilt from ``self.objects`` on every access.
    """
    self._create_mapping_dicts()
    names_by_hash = self._hash_to_name
    return names_by_hash
|
191
|
+
|
192
|
+
def __getattr__(self, name):
|
193
|
+
return self.name_to_object[name]
|
194
|
+
|
195
|
+
@classmethod
def from_file(cls, filename: str):
    """Load a study from a file.

    :param filename: Path to the study file; a trailing ``.json`` is
        stripped because the constructor expects the path without it.
    :return: A new instance built with ``cls(filename=...)``.
    """
    suffix = ".json"
    stem = filename[: -len(suffix)] if filename.endswith(suffix) else filename
    return cls(filename=stem)
|
201
|
+
|
202
|
+
def _load_from_file(self):
    """Restore the study's state from ``<self.filename>.json``.

    The JSON payload's ``cache``, ``proof_of_work`` and ``objects`` entries
    are rebuilt with the ``from_dict`` constructors of ``Cache``,
    ``ProofOfWork`` and ``ObjectEntry``. Every key of the payload is then
    copied onto the instance.

    >>> import tempfile
    >>> filename = tempfile.NamedTemporaryFile(delete=False)
    >>> study = Study(name = "poo", filename = filename.name)
    >>> study.save()
    Saving study to ...
    >>> study2 = Study(filename = filename.name)
    Using existing study file ...
    >>> study2.name
    'poo'
    """
    study_path = self.filename + ".json"
    with open(study_path, "r") as handle:
        saved_state = json.load(handle)

    saved_state["cache"] = Cache.from_dict(saved_state["cache"])
    saved_state["proof_of_work"] = ProofOfWork.from_dict(
        saved_state["proof_of_work"]
    )

    restored_objects = {}
    for obj_hash, obj_dict in saved_state["objects"].items():
        restored_objects[obj_hash] = ObjectEntry.from_dict(obj_dict)
    saved_state["objects"] = restored_objects

    # Copies every saved key (including "filename") onto the instance.
    self.__dict__.update(saved_state)
|
224
|
+
|
225
|
+
def __enter__(self):
    """Start the study context and return the study.

    The visible namespace is checked first: if it already contains EDSL
    objects the study cannot tell which ones belong to it, so a
    ``ValueError`` is raised. Only after that check passes is the study
    cache installed as the session cache. ``__exit__`` is not run when
    ``__enter__`` raises, so installing the cache earlier would leave it set.

    :return: ``self``.
    :raises ValueError: If EDSL objects are already present in the namespace.

    >>> s = Study(name = "temp", use_study_cache = True, verbose = False)
    >>> _ = s.__enter__()
    >>> from edsl.config import CONFIG
    >>> hasattr(CONFIG, "EDSL_SESSION_CACHE")
    True
    >>> _ = s.__exit__(None, None, None)
    >>> len(s.objects)
    0
    >>> os.remove("temp.json")

    """
    if self.verbose:
        print("Existing objects in study:")
        self.print()

    snapshot = SnapShot(self.namespace, exclude=[self])

    # Validate before touching session state (see docstring).
    if snapshot.edsl_objects:
        raise ValueError(
            "You have EDSL objects in the global namespace. "
            "Please remove them before starting a study or put under the "
            "'Study' context manager. "
            f"Objects found: {snapshot.edsl_objects}"
        )

    if self.use_study_cache:
        if self.verbose:
            print("Using study cache.")
        set_session_cache(self.cache)

    return self
|
255
|
+
|
256
|
+
def __hash__(self) -> int:
    """Return ``dict_hash`` of the list of object hashes, in stored order."""
    object_hashes = list(self.objects.keys())
    return dict_hash(object_hashes)
|
258
|
+
|
259
|
+
def study_diff(self):
    """Placeholder for a study-level diff; not implemented yet.

    :raises NotImplementedError: Always.
    """
    # TODO: also report missing objects.
    from edsl.BaseDiff import BaseDiff

    message = "Need to implement this."
    raise NotImplementedError(message)
|
264
|
+
|
265
|
+
def print(self):
    """Print the study's objects, plus its cache, as a ``rich`` table.

    One row is written per entry in ``self.objects``, followed by a final
    row describing the study cache.
    """
    from rich.console import Console
    from rich.table import Table

    console = Console()
    table = Table(title="Study")
    for heading in (
        "Original Name",
        "Study Name",
        "Class",
        "Description",
        "Hash",
        "Coop info",
        "Created",
    ):
        table.add_column(heading)

    # ``hash_to_name`` rebuilds every mapping on each access, so read it once
    # instead of once per row.
    study_names = self.hash_to_name

    for obj_hash, entry in self.objects.items():
        coop_info = getattr(entry, "coop_info", None)
        url = "" if coop_info is None else coop_info.get("url", "")
        created = datetime.fromtimestamp(entry.created_at).strftime(
            "%Y-%m-%d %H:%M:%S"
        )
        table.add_row(
            entry.variable_name,
            study_names[obj_hash],
            entry.edsl_class_name,
            entry.description,
            entry.hash,
            url,
            created,
        )

    # Add cache at the end
    table.add_row(
        "N/A - Study Cache",
        "cache",
        "Cache",
        f"Cache of study, entries: {len(self.cache)}",
        str(hash(self.cache)),
        "N/A",
        "N/A",
    )
    console.print(table)
|
305
|
+
|
306
|
+
def __exit__(self, exc_type, exc_val, exc_tb):
    """Close the study context: record new objects, compare, and save.

    Steps, in order: snapshot the visible namespace, unset the session cache
    (if the study cache was in use), add every EDSL object found to the
    study, compare the object hashes with those present at construction,
    optionally push to coop, and optionally add a proof of work.

    The three ``exc_*`` arguments are not used. Nothing is returned, so an
    exception raised inside the ``with`` body is not suppressed.

    NOTE(review): the nesting below was reconstructed from a listing whose
    indentation had been stripped - confirm against the packaged file.

    :raises ValueError: If ``coop`` is set but ``overwrite_on_change`` is not.
    """
    snapshot = SnapShot(namespace=self.namespace, exclude=[self])
    if self.use_study_cache:
        unset_session_cache()

    # Register everything the snapshot classified as an EDSL object.
    for variable_name, object in snapshot.edsl_objects.items():
        self._add_edsl_object(object=object, variable_name=variable_name)

    # A study that started with no objects is always written out.
    if not self.starting_objects:
        if self.verbose:
            print(f"New study saved to {self.filename}.json")
        self.save()

    # Replication check: same hashes, in the same order, as at construction.
    if self.starting_objects and list(self.starting_objects.keys()) == list(
        self.objects.keys()
    ):
        if self.verbose:
            print("Study perfectly replicated.")
    else:
        if self.verbose:
            print("Starting hashes:", self.starting_objects.keys())
            print("Current hashes:", self.objects.keys())
        if self.starting_objects:
            missing = set(self.starting_objects.keys()) - set(self.objects.keys())
            added = set(self.objects.keys()) - set(self.starting_objects.keys())
            # The messages in this branch are printed regardless of ``verbose``.
            print("Study did not perfectly replicate.")
            for hash in missing:
                print(f"Missing object: {self.starting_objects[hash]}")
            for hash in added:
                print(f"Added object: {self.objects[hash]}")
            if self.overwrite_on_change:
                print("Overwriting study file.")
                self.save()
            else:
                print(
                    "Please save the study file with a new name or call study iwth 'overwrite_on_change=True' to overwrite the existing study file."
                )

    if self.coop:
        # NOTE(review): the push happens before the overwrite check, so the
        # ValueError below is raised after the study was already pushed.
        self.push()
        if self.overwrite_on_change:
            self.save()
        else:
            raise ValueError(
                "If you want to push to coop, you must save the study file with a new name or call study iwth 'overwrite_on_change=True' to overwrite the existing study file."
            )

    if self.verbose:
        print("Objects in study now:")
        self.print()

    if self.proof_of_work_difficulty:
        print("Adding proof of work to study...")
        # NOTE(review): this function-scope import is not referenced in the
        # rest of this method.
        from edsl.study.ProofOfWork import ProofOfWork

        # TODO: Need to check if hashes are the same.
        # Seed the proof of work with the study hash only if it has no input yet.
        if not self.proof_of_work.input_data:
            self.proof_of_work.add_input_data(str(self.__hash__()))
        self.proof_of_work.add_proof(self.proof_of_work_difficulty)
        print(
            "Proof of work added to study with difficulty ",
            self.proof_of_work_difficulty,
        )
        print(self.proof_of_work)
        self.save()
|
374
|
+
|
375
|
+
def to_dict(self):
    """Serialize the study into a dictionary.

    The stored object entries, the cache and the proof of work are converted
    through their own ``to_dict`` methods; the other fields are copied from
    the instance as they are.

    :return: A dict with the keys ``name``, ``description``, ``objects``,
        ``filename``, ``cache``, ``use_study_cache``, ``overwrite_on_change``
        and ``proof_of_work``, in that order.
    """
    payload = {"name": self.name, "description": self.description}

    # Entries stay keyed by the same hash they are stored under.
    serialized_entries = {}
    for object_hash, entry in self.objects.items():
        serialized_entries[object_hash] = entry.to_dict()
    payload["objects"] = serialized_entries

    payload["filename"] = self.filename
    payload["cache"] = self.cache.to_dict()
    payload["use_study_cache"] = self.use_study_cache
    payload["overwrite_on_change"] = self.overwrite_on_change
    payload["proof_of_work"] = self.proof_of_work.to_dict()
    return payload
|
386
|
+
|
387
|
+
def versions(self):
    """Group the stored object entries by the variable name they carry.

    :return: A dict mapping each variable name to the list of its entries,
        in the order the entries appear in ``self.objects``.
    """
    grouped = {}
    for entry in self.objects.values():
        # The first entry seen for a name creates its list.
        grouped.setdefault(entry.variable_name, []).append(entry)
    return grouped
|
397
|
+
|
398
|
+
def diff(self, variable_name: str, index1: int, index2: int):
    """Subtract one recorded version of a variable's object from another.

    :param variable_name: Key into the mapping returned by ``self.versions()``.
    :param index1: Position of the version that is subtracted.
    :param index2: Position of the version that is subtracted from.
    :return: ``object`` at ``index2`` minus ``object`` at ``index1``.
    """
    history = self.versions()[variable_name]
    later = history[index2].object
    earlier = history[index1].object
    return later - earlier
|
403
|
+
|
404
|
+
@classmethod
def example(cls, verbose=False, randomize=False):
    """Return an example study created inside a ``with`` block.

    :param verbose: Passed to the study constructor.
    :param randomize: Passed to ``QuestionFreeText.example``.
    :return: The study object bound by the ``with`` statement.
    """
    import tempfile

    # Only the temporary file's name is used; it becomes the study's filename.
    study_file = tempfile.NamedTemporaryFile()
    with cls(filename=study_file.name, verbose=verbose) as study:
        from edsl.questions.QuestionFreeText import QuestionFreeText

        # NOTE(review): `q` is never read in this method. Presumably the study's
        # context manager picks it up by variable name when the block exits --
        # confirm before renaming or removing it.
        q = QuestionFreeText.example(randomize=randomize)
    return study
|
414
|
+
|
415
|
+
@classmethod
def from_dict(cls, d):
    """Build a study from a dictionary such as the one ``to_dict`` returns.

    The ``cache``, ``objects`` and ``proof_of_work`` values are rebuilt with
    ``Cache.from_dict``, ``ObjectEntry.from_dict`` and
    ``ProofOfWork.from_dict``; every other item is passed to the constructor
    unchanged.

    The conversions are applied to a shallow copy, so the caller's dictionary
    is not modified and can be reused (for example, to build a second study
    from the same data).

    :param d: Mapping with at least the keys ``cache``, ``objects`` and
        ``proof_of_work``.
    :return: ``cls(**kwargs)`` built from the converted values.
    """
    kwargs = dict(d)
    kwargs["cache"] = Cache.from_dict(d["cache"])
    # Keys are normalized to strings.
    kwargs["objects"] = {
        str(object_hash): ObjectEntry.from_dict(obj_dict)
        for object_hash, obj_dict in d["objects"].items()
    }
    kwargs["proof_of_work"] = ProofOfWork.from_dict(d["proof_of_work"])
    return cls(**kwargs)
|
424
|
+
|
425
|
+
def save(self):
    """Write the study, as JSON, to ``self.filename + ".json"``.

    The study is serialized completely before the file is opened. Opening in
    ``"w"`` mode truncates the file, so serializing first means a failure in
    ``to_dict()`` or in JSON encoding leaves a previously saved study file
    untouched instead of empty or half-written.

    :raises TypeError: If ``to_dict()`` returns something ``json`` cannot
        encode.
    """
    if self.verbose:
        print(f"Saving study to {self.filename}.json")

    serialized = json.dumps(self.to_dict(), indent=4)
    with open(self.filename + ".json", "w") as f:
        f.write(serialized)
|
430
|
+
|
431
|
+
def _get_system_info(self):
|
432
|
+
return {
|
433
|
+
"platform": platform.platform(),
|
434
|
+
"system": platform.system(),
|
435
|
+
"processor": platform.processor(),
|
436
|
+
"hostname": socket.gethostname(),
|
437
|
+
}
|
438
|
+
|
439
|
+
@staticmethod
|
440
|
+
def _get_description(object):
|
441
|
+
text = ""
|
442
|
+
if hasattr(object, "__len__"):
|
443
|
+
text += f"Num. entries: {len(object)}"
|
444
|
+
if hasattr(object, "question_name"):
|
445
|
+
text += f"Question name: {object.question_name}"
|
446
|
+
return text
|
447
|
+
|
448
|
+
def _add_edsl_object(self, object, variable_name, description=None) -> None:
    """Store an object in the study unless an entry with the same hash exists.

    :param object: The object to wrap in an ``ObjectEntry``.
    :param variable_name: The variable name recorded on the entry.
    :param description: Optional description; when ``None`` it is generated
        with ``self._get_description(object)``.

    >>> s = Study.example()
    >>> from edsl import QuestionLinearScale
    >>> s._add_edsl_object(QuestionLinearScale.example(), 'q')
    >>> len(s)
    2
    """
    entry = ObjectEntry(
        variable_name=variable_name,
        object=object,
        description=(
            self._get_description(object) if description is None else description
        ),
    )
    # An entry whose hash is already stored is left as it is.
    if entry.hash not in self.objects:
        self.objects[entry.hash] = entry
|
465
|
+
|
466
|
+
def push(self) -> dict:
    """Create this study on coop, passing its description along.

    :return: Whatever ``Coop.create`` returns.
    """
    # Imported here rather than at module level, as in the original.
    from edsl.coop.coop import Coop

    return Coop().create(self, description=self.description)
|
473
|
+
|
474
|
+
def delete_object(self, identifier: Union[str, UUID]):
    """
    Remove one EDSL object from the study.

    A string identifier is compared against each entry's variable name and
    against the key it is stored under; the first entry that matches either
    one is removed. A ``UUID`` identifier is converted to a string and used
    directly as the key.

    :param identifier: Either the variable name or the hash of the object to delete
    :raises ValueError: If the object is not found in the study
    :raises TypeError: If the identifier is neither a string nor a UUID
    """
    if not isinstance(identifier, (str, UUID)):
        raise TypeError(
            "Identifier must be either a string (variable name or hash) or a UUID object"
        )

    if isinstance(identifier, UUID):
        hash_str = str(identifier)
        if hash_str not in self.objects:
            raise ValueError(f"No object found with hash: {hash_str}")
        del self.objects[hash_str]
        self._create_mapping_dicts()  # Update internal mappings
        if self.verbose:
            print(f"Deleted object with hash: {hash_str}")
        return

    # String identifier: find the first entry matching by variable name or key.
    for stored_key, entry in self.objects.items():
        if entry.variable_name == identifier or stored_key == identifier:
            break
    else:
        raise ValueError(f"No object found with identifier: {identifier}")

    del self.objects[stored_key]
    self._create_mapping_dicts()  # Update internal mappings
    if self.verbose:
        print(f"Deleted object with identifier: {identifier}")
|
505
|
+
|
506
|
+
@classmethod
def pull(cls, uuid: Optional[Union[str, UUID]] = None, url: Optional[str] = None):
    """Fetch a study from coop.

    :param uuid: Identifier forwarded to ``Coop.get``.
    :param url: URL forwarded to ``Coop.get``.
    :return: Whatever ``Coop.get`` returns for the ``"study"`` object type.
    """
    from edsl.coop import Coop

    client = Coop()
    return client.get(uuid, url, "study")
|
513
|
+
|
514
|
+
def __repr__(self):
|
515
|
+
return f"""Study(name = "{self.name}", description = "{self.description}", objects = {self.objects}, cache = {self.cache}, filename = "{self.filename}", coop = {self.coop}, use_study_cache = {self.use_study_cache}, overwrite_on_change = {self.overwrite_on_change})"""
|
516
|
+
|
517
|
+
|
518
|
+
if __name__ == "__main__":
    # When the module is executed as a script, run the doctests in its docstrings.
    import doctest

    # ELLIPSIS allows "..." in expected output to match any substring.
    doctest.testmod(optionflags=doctest.ELLIPSIS)
|
edsl/study/__init__.py
ADDED
@@ -0,0 +1,92 @@
|
|
1
|
+
from edsl.surveys.base import EndOfSurvey
|
2
|
+
from edsl.surveys.DAG import DAG
|
3
|
+
from edsl.exceptions.surveys import SurveyError
|
4
|
+
|
5
|
+
|
6
|
+
class ConstructDAG:
    """Build the dependency graph between the questions of a survey.

    Three sources are combined: the DAG of the survey's memory plan, the DAG
    of its rule collection, and the piping dependencies derived from the
    parameters of each question.
    """

    def __init__(self, survey):
        """Keep the survey and the lookups the DAG construction reads.

        :param survey: Object providing ``questions``,
            ``parameters_by_question``, ``question_name_to_index``,
            ``memory_plan`` and ``rule_collection``.
        """
        self.survey = survey
        self.questions = survey.questions

        self.parameters_by_question = self.survey.parameters_by_question
        self.question_name_to_index = self.survey.question_name_to_index

    def dag(self, textify: bool = False) -> DAG:
        """Return the sum of the memory, rule and piping DAGs.

        :param textify: When True, each DAG is first converted from question
            indices to question names and wrapped in ``DAG``.
        """
        memory_dag = self.survey.memory_plan.dag
        rule_dag = self.survey.rule_collection.dag
        piping_dag = self.piping_dag
        if textify:
            memory_dag = DAG(self.textify(memory_dag))
            rule_dag = DAG(self.textify(rule_dag))
            piping_dag = DAG(self.textify(piping_dag))
        return memory_dag + rule_dag + piping_dag

    @property
    def piping_dag(self) -> DAG:
        """Figures out the DAG of piping dependencies.

        The result is a plain dict mapping a question index to the set of
        indices of the questions it references. Parameters that are not the
        name of a question in the survey are ignored.

        >>> from edsl import Survey
        >>> from edsl import QuestionFreeText
        >>> q0 = QuestionFreeText(question_text="Here is a question", question_name="q0")
        >>> q1 = QuestionFreeText(question_text="You previously answered {{ q0 }}---how do you feel now?", question_name="q1")
        >>> s = Survey([q0, q1])
        >>> ConstructDAG(s).piping_dag
        {1: {0}}
        """
        d = {}
        for question_name, dependencies in self.parameters_by_question.items():
            if not dependencies:
                continue
            question_index = self.question_name_to_index[question_name]
            for dependency in dependencies:
                # Only parameters naming another question create an edge.
                if dependency in self.question_name_to_index:
                    dependency_index = self.question_name_to_index[dependency]
                    d.setdefault(question_index, set()).add(dependency_index)
        return d

    def textify(self, index_dag: DAG) -> DAG:
        """Convert the DAG of question indices to a DAG of question names.

        Indices at or beyond the number of questions are mapped to
        ``EndOfSurvey``. The result is a plain dict.

        :param index_dag: The DAG of question indices.
        :raises SurveyError: If an index cannot be resolved to a question.

        Example:

        >>> from edsl import Survey
        >>> s = Survey.example()
        >>> d = s.dag()
        >>> d
        {1: {0}, 2: {0}}
        >>> ConstructDAG(s).textify(d)
        {'q1': {'q0'}, 'q2': {'q0'}}
        """

        def get_name(index: int):
            """Return the name of the question given the index."""
            if index >= len(self.questions):
                return EndOfSurvey
            try:
                return self.questions[index].question_name
            except IndexError as error:
                # Carry the diagnostic in the exception instead of printing it,
                # and keep the original IndexError as the cause.
                raise SurveyError(
                    f"The index is {index} but the length of the questions is {len(self.questions)}"
                ) from error

        text_dag = {}
        for child_index, parent_indices in index_dag.items():
            parent_names = {get_name(index) for index in parent_indices}
            child_name = get_name(child_index)
            text_dag[child_name] = parent_names
        return text_dag
|
87
|
+
|
88
|
+
|
89
|
+
if __name__ == "__main__":
    # When the module is executed as a script, run the doctests in its docstrings.
    import doctest

    doctest.testmod()
|