edsl 0.1.37.dev2__py3-none-any.whl → 0.1.37.dev3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- edsl/Base.py +303 -303
- edsl/BaseDiff.py +260 -260
- edsl/TemplateLoader.py +24 -24
- edsl/__init__.py +48 -48
- edsl/__version__.py +1 -1
- edsl/agents/Agent.py +804 -804
- edsl/agents/AgentList.py +345 -345
- edsl/agents/Invigilator.py +222 -222
- edsl/agents/InvigilatorBase.py +305 -305
- edsl/agents/PromptConstructor.py +312 -312
- edsl/agents/__init__.py +3 -3
- edsl/agents/descriptors.py +86 -86
- edsl/agents/prompt_helpers.py +129 -129
- edsl/auto/AutoStudy.py +117 -117
- edsl/auto/StageBase.py +230 -230
- edsl/auto/StageGenerateSurvey.py +178 -178
- edsl/auto/StageLabelQuestions.py +125 -125
- edsl/auto/StagePersona.py +61 -61
- edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
- edsl/auto/StagePersonaDimensionValues.py +74 -74
- edsl/auto/StagePersonaDimensions.py +69 -69
- edsl/auto/StageQuestions.py +73 -73
- edsl/auto/SurveyCreatorPipeline.py +21 -21
- edsl/auto/utilities.py +224 -224
- edsl/base/Base.py +289 -289
- edsl/config.py +149 -149
- edsl/conjure/AgentConstructionMixin.py +152 -152
- edsl/conjure/Conjure.py +62 -62
- edsl/conjure/InputData.py +659 -659
- edsl/conjure/InputDataCSV.py +48 -48
- edsl/conjure/InputDataMixinQuestionStats.py +182 -182
- edsl/conjure/InputDataPyRead.py +91 -91
- edsl/conjure/InputDataSPSS.py +8 -8
- edsl/conjure/InputDataStata.py +8 -8
- edsl/conjure/QuestionOptionMixin.py +76 -76
- edsl/conjure/QuestionTypeMixin.py +23 -23
- edsl/conjure/RawQuestion.py +65 -65
- edsl/conjure/SurveyResponses.py +7 -7
- edsl/conjure/__init__.py +9 -9
- edsl/conjure/naming_utilities.py +263 -263
- edsl/conjure/utilities.py +201 -201
- edsl/conversation/Conversation.py +238 -238
- edsl/conversation/car_buying.py +58 -58
- edsl/conversation/mug_negotiation.py +81 -81
- edsl/conversation/next_speaker_utilities.py +93 -93
- edsl/coop/PriceFetcher.py +54 -54
- edsl/coop/__init__.py +2 -2
- edsl/coop/coop.py +824 -824
- edsl/coop/utils.py +131 -131
- edsl/data/Cache.py +527 -527
- edsl/data/CacheEntry.py +228 -228
- edsl/data/CacheHandler.py +149 -149
- edsl/data/RemoteCacheSync.py +97 -97
- edsl/data/SQLiteDict.py +292 -292
- edsl/data/__init__.py +4 -4
- edsl/data/orm.py +10 -10
- edsl/data_transfer_models.py +73 -73
- edsl/enums.py +173 -173
- edsl/exceptions/__init__.py +50 -50
- edsl/exceptions/agents.py +40 -40
- edsl/exceptions/configuration.py +16 -16
- edsl/exceptions/coop.py +10 -10
- edsl/exceptions/data.py +14 -14
- edsl/exceptions/general.py +34 -34
- edsl/exceptions/jobs.py +33 -33
- edsl/exceptions/language_models.py +63 -63
- edsl/exceptions/prompts.py +15 -15
- edsl/exceptions/questions.py +91 -91
- edsl/exceptions/results.py +26 -26
- edsl/exceptions/surveys.py +34 -34
- edsl/inference_services/AnthropicService.py +87 -87
- edsl/inference_services/AwsBedrock.py +115 -115
- edsl/inference_services/AzureAI.py +217 -217
- edsl/inference_services/DeepInfraService.py +18 -18
- edsl/inference_services/GoogleService.py +156 -156
- edsl/inference_services/GroqService.py +20 -20
- edsl/inference_services/InferenceServiceABC.py +147 -147
- edsl/inference_services/InferenceServicesCollection.py +74 -74
- edsl/inference_services/MistralAIService.py +123 -123
- edsl/inference_services/OllamaService.py +18 -18
- edsl/inference_services/OpenAIService.py +224 -224
- edsl/inference_services/TestService.py +89 -89
- edsl/inference_services/TogetherAIService.py +170 -170
- edsl/inference_services/models_available_cache.py +118 -118
- edsl/inference_services/rate_limits_cache.py +25 -25
- edsl/inference_services/registry.py +39 -39
- edsl/inference_services/write_available.py +10 -10
- edsl/jobs/Answers.py +56 -56
- edsl/jobs/Jobs.py +1121 -1112
- edsl/jobs/__init__.py +1 -1
- edsl/jobs/buckets/BucketCollection.py +63 -63
- edsl/jobs/buckets/ModelBuckets.py +65 -65
- edsl/jobs/buckets/TokenBucket.py +248 -248
- edsl/jobs/interviews/Interview.py +661 -661
- edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
- edsl/jobs/interviews/InterviewExceptionEntry.py +182 -182
- edsl/jobs/interviews/InterviewStatistic.py +63 -63
- edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
- edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
- edsl/jobs/interviews/InterviewStatusLog.py +92 -92
- edsl/jobs/interviews/ReportErrors.py +66 -66
- edsl/jobs/interviews/interview_status_enum.py +9 -9
- edsl/jobs/runners/JobsRunnerAsyncio.py +338 -338
- edsl/jobs/runners/JobsRunnerStatus.py +332 -332
- edsl/jobs/tasks/QuestionTaskCreator.py +242 -242
- edsl/jobs/tasks/TaskCreators.py +64 -64
- edsl/jobs/tasks/TaskHistory.py +441 -441
- edsl/jobs/tasks/TaskStatusLog.py +23 -23
- edsl/jobs/tasks/task_status_enum.py +163 -163
- edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
- edsl/jobs/tokens/TokenUsage.py +34 -34
- edsl/language_models/LanguageModel.py +718 -718
- edsl/language_models/ModelList.py +102 -102
- edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
- edsl/language_models/__init__.py +2 -2
- edsl/language_models/fake_openai_call.py +15 -15
- edsl/language_models/fake_openai_service.py +61 -61
- edsl/language_models/registry.py +137 -137
- edsl/language_models/repair.py +156 -156
- edsl/language_models/unused/ReplicateBase.py +83 -83
- edsl/language_models/utilities.py +64 -64
- edsl/notebooks/Notebook.py +259 -259
- edsl/notebooks/__init__.py +1 -1
- edsl/prompts/Prompt.py +353 -353
- edsl/prompts/__init__.py +2 -2
- edsl/questions/AnswerValidatorMixin.py +289 -289
- edsl/questions/QuestionBase.py +616 -616
- edsl/questions/QuestionBaseGenMixin.py +161 -161
- edsl/questions/QuestionBasePromptsMixin.py +266 -266
- edsl/questions/QuestionBudget.py +227 -227
- edsl/questions/QuestionCheckBox.py +359 -359
- edsl/questions/QuestionExtract.py +183 -183
- edsl/questions/QuestionFreeText.py +114 -114
- edsl/questions/QuestionFunctional.py +159 -159
- edsl/questions/QuestionList.py +231 -231
- edsl/questions/QuestionMultipleChoice.py +286 -286
- edsl/questions/QuestionNumerical.py +153 -153
- edsl/questions/QuestionRank.py +324 -324
- edsl/questions/Quick.py +41 -41
- edsl/questions/RegisterQuestionsMeta.py +71 -71
- edsl/questions/ResponseValidatorABC.py +174 -174
- edsl/questions/SimpleAskMixin.py +73 -73
- edsl/questions/__init__.py +26 -26
- edsl/questions/compose_questions.py +98 -98
- edsl/questions/decorators.py +21 -21
- edsl/questions/derived/QuestionLikertFive.py +76 -76
- edsl/questions/derived/QuestionLinearScale.py +87 -87
- edsl/questions/derived/QuestionTopK.py +91 -91
- edsl/questions/derived/QuestionYesNo.py +82 -82
- edsl/questions/descriptors.py +418 -418
- edsl/questions/prompt_templates/question_budget.jinja +13 -13
- edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
- edsl/questions/prompt_templates/question_extract.jinja +11 -11
- edsl/questions/prompt_templates/question_free_text.jinja +3 -3
- edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
- edsl/questions/prompt_templates/question_list.jinja +17 -17
- edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
- edsl/questions/prompt_templates/question_numerical.jinja +36 -36
- edsl/questions/question_registry.py +147 -147
- edsl/questions/settings.py +12 -12
- edsl/questions/templates/budget/answering_instructions.jinja +7 -7
- edsl/questions/templates/budget/question_presentation.jinja +7 -7
- edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
- edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
- edsl/questions/templates/extract/answering_instructions.jinja +7 -7
- edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
- edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
- edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
- edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
- edsl/questions/templates/list/answering_instructions.jinja +3 -3
- edsl/questions/templates/list/question_presentation.jinja +5 -5
- edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
- edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
- edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
- edsl/questions/templates/numerical/question_presentation.jinja +6 -6
- edsl/questions/templates/rank/answering_instructions.jinja +11 -11
- edsl/questions/templates/rank/question_presentation.jinja +15 -15
- edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
- edsl/questions/templates/top_k/question_presentation.jinja +22 -22
- edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
- edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
- edsl/results/Dataset.py +293 -293
- edsl/results/DatasetExportMixin.py +693 -693
- edsl/results/DatasetTree.py +145 -145
- edsl/results/Result.py +435 -435
- edsl/results/Results.py +1160 -1160
- edsl/results/ResultsDBMixin.py +238 -238
- edsl/results/ResultsExportMixin.py +43 -43
- edsl/results/ResultsFetchMixin.py +33 -33
- edsl/results/ResultsGGMixin.py +121 -121
- edsl/results/ResultsToolsMixin.py +98 -98
- edsl/results/Selector.py +118 -118
- edsl/results/__init__.py +2 -2
- edsl/results/tree_explore.py +115 -115
- edsl/scenarios/FileStore.py +458 -458
- edsl/scenarios/Scenario.py +510 -510
- edsl/scenarios/ScenarioHtmlMixin.py +59 -59
- edsl/scenarios/ScenarioList.py +1101 -1101
- edsl/scenarios/ScenarioListExportMixin.py +52 -52
- edsl/scenarios/ScenarioListPdfMixin.py +261 -261
- edsl/scenarios/__init__.py +4 -4
- edsl/shared.py +1 -1
- edsl/study/ObjectEntry.py +173 -173
- edsl/study/ProofOfWork.py +113 -113
- edsl/study/SnapShot.py +80 -80
- edsl/study/Study.py +528 -528
- edsl/study/__init__.py +4 -4
- edsl/surveys/DAG.py +148 -148
- edsl/surveys/Memory.py +31 -31
- edsl/surveys/MemoryPlan.py +244 -244
- edsl/surveys/Rule.py +324 -324
- edsl/surveys/RuleCollection.py +387 -387
- edsl/surveys/Survey.py +1772 -1772
- edsl/surveys/SurveyCSS.py +261 -261
- edsl/surveys/SurveyExportMixin.py +259 -259
- edsl/surveys/SurveyFlowVisualizationMixin.py +121 -121
- edsl/surveys/SurveyQualtricsImport.py +284 -284
- edsl/surveys/__init__.py +3 -3
- edsl/surveys/base.py +53 -53
- edsl/surveys/descriptors.py +56 -56
- edsl/surveys/instructions/ChangeInstruction.py +47 -47
- edsl/surveys/instructions/Instruction.py +51 -51
- edsl/surveys/instructions/InstructionCollection.py +77 -77
- edsl/templates/error_reporting/base.html +23 -23
- edsl/templates/error_reporting/exceptions_by_model.html +34 -34
- edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
- edsl/templates/error_reporting/exceptions_by_type.html +16 -16
- edsl/templates/error_reporting/interview_details.html +115 -115
- edsl/templates/error_reporting/interviews.html +9 -9
- edsl/templates/error_reporting/overview.html +4 -4
- edsl/templates/error_reporting/performance_plot.html +1 -1
- edsl/templates/error_reporting/report.css +73 -73
- edsl/templates/error_reporting/report.html +117 -117
- edsl/templates/error_reporting/report.js +25 -25
- edsl/tools/__init__.py +1 -1
- edsl/tools/clusters.py +192 -192
- edsl/tools/embeddings.py +27 -27
- edsl/tools/embeddings_plotting.py +118 -118
- edsl/tools/plotting.py +112 -112
- edsl/tools/summarize.py +18 -18
- edsl/utilities/SystemInfo.py +28 -28
- edsl/utilities/__init__.py +22 -22
- edsl/utilities/ast_utilities.py +25 -25
- edsl/utilities/data/Registry.py +6 -6
- edsl/utilities/data/__init__.py +1 -1
- edsl/utilities/data/scooter_results.json +1 -1
- edsl/utilities/decorators.py +77 -77
- edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
- edsl/utilities/interface.py +627 -627
- edsl/utilities/repair_functions.py +28 -28
- edsl/utilities/restricted_python.py +70 -70
- edsl/utilities/utilities.py +391 -391
- {edsl-0.1.37.dev2.dist-info → edsl-0.1.37.dev3.dist-info}/LICENSE +21 -21
- {edsl-0.1.37.dev2.dist-info → edsl-0.1.37.dev3.dist-info}/METADATA +1 -1
- edsl-0.1.37.dev3.dist-info/RECORD +279 -0
- edsl-0.1.37.dev2.dist-info/RECORD +0 -279
- {edsl-0.1.37.dev2.dist-info → edsl-0.1.37.dev3.dist-info}/WHEEL +0 -0
edsl/results/ResultsGGMixin.py
CHANGED
@@ -1,121 +1,121 @@
|
|
1
|
-
"""Mixin class for ggplot2 plotting."""
|
2
|
-
|
3
|
-
import subprocess
|
4
|
-
import tempfile
|
5
|
-
from typing import Optional
|
6
|
-
|
7
|
-
|
8
|
-
class ResultsGGMixin:
    """Mixin that renders ggplot2 plots by piping a generated script to ``Rscript``.

    The host class must supply a ``sql`` method: ``ggplot2`` calls it as
    ``self.sql(query, shape=...)`` and then calls ``to_csv(index=False)`` on
    whatever it returns.
    """

    @staticmethod
    def _escape_r_string(value, quote: str) -> str:
        """Escape ``value`` for use inside an R string literal.

        :param value: The value to embed; it is converted with ``str``.
        :param quote: The quote character that delimits the R literal.
        :return: The text with backslashes, newlines and ``quote`` escaped.
        """
        # Backslashes are doubled first so the escapes added below survive.
        text = str(value).replace("\\", "\\\\")
        return text.replace("\n", "\\n").replace(quote, "\\" + quote)

    def ggplot2(
        self,
        ggplot_code: str,
        filename: Optional[str] = None,
        shape="wide",
        sql: Optional[str] = None,
        remove_prefix: bool = True,
        debug: bool = False,
        height=4,
        width=6,
        format="svg",
        factor_orders: Optional[dict] = None,
    ):
        """Create a ggplot2 plot from a DataFrame.

        The data returned by ``self.sql`` is embedded as CSV text in an R
        script, which binds it to the R variable ``self``, runs
        ``ggplot_code`` and saves the last plot with ``ggsave``.

        :param ggplot_code: The ggplot2 code to execute.
        :param filename: The filename to save the plot to; a temporary file is used when omitted.
        :param shape: The shape of the data in the DataFrame (wide or long).
        :param sql: The SQL query to execute beforehand to manipulate the data.
        :param remove_prefix: Whether to remove the prefix from the column names.
        :param debug: Whether to print the R code instead of executing it.
        :param height: The height of the plot in inches.
        :param width: The width of the plot in inches.
        :param format: The format to save the plot in (png or svg).
        :param factor_orders: A dictionary of factor columns and their order.
        :raises ValueError: If ``shape`` is neither ``"wide"`` nor ``"long"``.
        :raises RuntimeError: If ``Rscript`` cannot be started or exits with a non-zero status.
        """
        import os  # local import: only used to discard the reserved temp file

        if sql is None:
            sql = "select * from self"

        if shape == "long":
            df = self.sql(sql, shape="long")
        elif shape == "wide":
            df = self.sql(sql, shape="wide", remove_prefix=remove_prefix)
        else:
            # Previously fell through and failed later with UnboundLocalError.
            raise ValueError(f"shape must be 'wide' or 'long', got {shape!r}")

        # Embed the CSV data within the R script as a single-quoted literal.
        csv_literal = self._escape_r_string(df.to_csv(index=False), "'")
        script_parts = [
            "library(ggplot2)\n",
            f"self <- read.csv(text = '{csv_literal}', sep = ',')\n",
        ]

        if factor_orders is not None:
            for factor, order in factor_orders.items():
                level_string = ", ".join(
                    f'"{self._escape_r_string(level, chr(34))}"' for level in order
                )
                script_parts.append(
                    f"self${factor} <- factor(self${factor}, levels=c({level_string}))\n"
                )

        # Reserve a real temporary file instead of the race-prone mktemp().
        placeholder_created = False
        if not filename:
            with tempfile.NamedTemporaryFile(
                suffix=f".{format}", delete=False
            ) as handle:
                filename = handle.name
            placeholder_created = True

        def discard_placeholder():
            # Drop the reserved temp file when no plot will be written to it.
            if placeholder_created and os.path.exists(filename):
                os.remove(filename)

        # Combine all R script parts and add the command that saves the plot.
        r_filename = self._escape_r_string(filename, '"')
        full_r_code = "".join(script_parts) + ggplot_code
        full_r_code += f'\nggsave("{r_filename}", plot = last_plot(), width = {width}, height = {height}, device = "{format}")'

        if debug:
            print(full_r_code)
            discard_placeholder()
            return

        try:
            result = subprocess.run(
                ["Rscript", "-"],
                input=full_r_code,
                text=True,
                stdout=subprocess.PIPE,
                stderr=subprocess.PIPE,
            )
        except FileNotFoundError as exc:
            # With an argument list (no shell) a missing executable surfaces
            # here rather than as exit status 127.
            discard_placeholder()
            raise RuntimeError(
                "Rscript is probably not installed. Please install R from https://cran.r-project.org/"
            ) from exc

        if result.returncode != 0:
            discard_placeholder()
            if result.returncode == 127:  # 'command not found'
                raise RuntimeError(
                    "Rscript is probably not installed. Please install R from https://cran.r-project.org/"
                )
            raise RuntimeError(
                f"An error occurred while running Rscript: {result.stderr}"
            )

        # Exit status 0 means the script ran to completion, so the plot is
        # shown even when R wrote to stderr; that output is still reported.
        if result.stderr:
            print("Error in R script:", result.stderr)
        self._display_plot(filename, width, height)

    def _display_plot(self, filename: str, width: float, height: float):
        """Display the plot in the notebook.

        :param filename: Path of the saved plot; its extension selects the viewer.
        :param width: Figure width in inches (used for PNG only).
        :param height: Figure height in inches (used for PNG only).
        """
        if filename.endswith(".png"):
            # Imported lazily so SVG display does not require matplotlib.
            import matplotlib.image as mpimg
            import matplotlib.pyplot as plt

            img = mpimg.imread(filename)
            plt.figure(figsize=(width, height))
            plt.imshow(img)
            plt.axis("off")
            plt.show()
        elif filename.endswith(".svg"):
            from IPython.display import SVG, display

            display(SVG(filename=filename))
        else:
            print("Unsupported file format. Please provide a PNG or SVG file.")
|
edsl/results/ResultsToolsMixin.py
CHANGED
@@ -1,98 +1,98 @@
|
|
1
|
-
class ResultsToolsMixin:
    """Mixin with helpers that derive themes from a field and tag answers with them.

    The host class must supply ``shuffle``, ``select`` and ``mutate``, which
    the methods below call on ``self``.
    """

    def get_themes(
        self,
        field: str,
        context: str,
        max_values=100,
        num_themes: int = 10,
        seed=None,
        progress_bar=False,
        print_exceptions=False,
    ) -> list:
        """Ask a ``QuestionList`` to propose themes for a sample of ``field``.

        :param field: The field whose values are sampled.
        :param context: Text placed at the top of the question.
        :param max_values: Maximum number of shuffled values to include.
        :param num_themes: Target number of themes stated in the question.
        :param seed: Seed passed to ``self.shuffle``.
        :param progress_bar: Forwarded to the question's ``run``.
        :param print_exceptions: Forwarded to the question's ``run``.
        :return: ``first()`` of the ``themes`` selection from the run results.
        """
        from edsl.questions import QuestionList

        sampled = self.shuffle(seed=seed).select(field).to_list()[:max_values]
        # Each example is cut to 1000 characters before it goes in the prompt.
        values = [str(txt)[:1000] for txt in sampled]

        q = QuestionList(
            question_text=f"""
        {context}
        Here are some examples: { values }.
        What are some 5-8 word themes that would mostly capture these examples?
        Please shoot for {num_themes} as target number of themes.
        """,
            question_name="themes",
        )
        results = q.run(print_exceptions=print_exceptions, progress_bar=progress_bar)
        return results.select("themes").first()

    def answers_to_themes(
        self,
        field,
        context: str,
        themes: list,
        progress_bar=False,
        print_exceptions=False,
    ) -> dict:
        """Ask a ``QuestionCheckBox`` which themes apply to each value of ``field``.

        :param field: The field whose values are classified.
        :param context: Text placed at the top of each question.
        :param themes: Candidate themes; "None" and "Other" are appended as options.
        :param progress_bar: Forwarded to ``run``.
        :param print_exceptions: Forwarded to ``run``.
        :return: A dict built from the ``("field", "themes")`` pairs in the results.
        """
        from edsl import QuestionCheckBox, ScenarioList

        values = self.select(field).to_list()
        # NOTE(review): presumably one scenario per value, keyed "field" - confirm.
        scenarios = ScenarioList.from_list("field", values).add_value(
            "context", context
        )
        q = QuestionCheckBox(
            question_text="""
        {{ context }}
        Consider the following response:

        " {{ field }} "

        Please check the themes that apply to these examples.
        If blank, please check 'None'.
        """,
            # list(...) lets callers pass a tuple or other sequence of themes.
            question_options=list(themes) + ["None", "Other"],
            question_name="themes",
        )
        results = q.by(scenarios).run(
            progress_bar=progress_bar, print_exceptions=print_exceptions
        )
        return dict(results.select("field", "themes").to_list())

    def apply_themes(self, field: str, new_field: str, answers_to_themes: dict):
        """Add ``new_field`` by mapping ``field`` through ``answers_to_themes``.

        :param field: The existing field to look up.
        :param new_field: The name of the field to create.
        :param answers_to_themes: Mapping from field values to themes.
        :return: The object returned by ``self.mutate``, or ``self`` when it returns ``None``.
        """

        def translate(x):
            # Values missing from the mapping are labelled "Other".
            return answers_to_themes.get(x, "Other")

        mutated = self.mutate(
            f"{new_field} = f({field})", functions_dict={"f": translate}
        )
        # NOTE(review): mutate appears to return a new object rather than
        # changing self in place - confirm; falling back to self keeps the
        # previous result for an in-place mutate that returns None.
        return self if mutated is None else mutated

    def auto_theme(
        self,
        field: str,
        context: str,
        themes: list[str],
        newfield: str = None,
        progress_bar=False,
        print_exceptions=False,
    ) -> tuple:
        """Classify ``field`` into ``themes`` and attach the result as a new field.

        :param field: The field to be themed.
        :param context: The context of the field.
        :param themes: The list of themes.
        :param newfield: The new field name; defaults to ``"<field>_themes"``.
        :param progress_bar: Forwarded to ``answers_to_themes``.
        :param print_exceptions: Forwarded to ``answers_to_themes``.
        :return: A tuple of the ``apply_themes`` result and ``themes``.
        """
        if not newfield:
            newfield = f"{field}_themes"

        # Named "mapping" so it does not shadow the answers_to_themes method.
        mapping = self.answers_to_themes(
            field=field,
            context=context,
            themes=themes,
            progress_bar=progress_bar,
            print_exceptions=print_exceptions,
        )
        return self.apply_themes(field, newfield, mapping), themes
|