PyPI - edsl - Versions diffs - 0.1.39__py3-none-any.whl → 0.1.39.dev1__py3-none-any.whl - Mend

edsl 0.1.39__py3-none-any.whl → 0.1.39.dev1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (212) hide show

edsl/Base.py +116 -197
edsl/__init__.py +7 -15
edsl/__version__.py +1 -1
edsl/agents/Agent.py +147 -351
edsl/agents/AgentList.py +73 -211
edsl/agents/Invigilator.py +50 -101
edsl/agents/InvigilatorBase.py +70 -62
edsl/agents/PromptConstructor.py +225 -143
edsl/agents/__init__.py +1 -0
edsl/agents/prompt_helpers.py +3 -3
edsl/auto/AutoStudy.py +5 -18
edsl/auto/StageBase.py +40 -53
edsl/auto/StageQuestions.py +1 -2
edsl/auto/utilities.py +6 -0
edsl/config.py +2 -22
edsl/conversation/car_buying.py +1 -2
edsl/coop/PriceFetcher.py +1 -1
edsl/coop/coop.py +47 -125
edsl/coop/utils.py +14 -14
edsl/data/Cache.py +27 -45
edsl/data/CacheEntry.py +15 -12
edsl/data/CacheHandler.py +12 -31
edsl/data/RemoteCacheSync.py +46 -154
edsl/data/__init__.py +3 -4
edsl/data_transfer_models.py +1 -2
edsl/enums.py +0 -27
edsl/exceptions/__init__.py +50 -50
edsl/exceptions/agents.py +0 -12
edsl/exceptions/questions.py +6 -24
edsl/exceptions/scenarios.py +0 -7
edsl/inference_services/AnthropicService.py +19 -38
edsl/inference_services/AwsBedrock.py +2 -0
edsl/inference_services/AzureAI.py +2 -0
edsl/inference_services/GoogleService.py +12 -7
edsl/inference_services/InferenceServiceABC.py +85 -18
edsl/inference_services/InferenceServicesCollection.py +79 -120
edsl/inference_services/MistralAIService.py +3 -0
edsl/inference_services/OpenAIService.py +35 -47
edsl/inference_services/PerplexityService.py +3 -0
edsl/inference_services/TestService.py +10 -11
edsl/inference_services/TogetherAIService.py +3 -5
edsl/jobs/Answers.py +14 -1
edsl/jobs/Jobs.py +431 -356
edsl/jobs/JobsChecks.py +10 -35
edsl/jobs/JobsPrompts.py +4 -6
edsl/jobs/JobsRemoteInferenceHandler.py +133 -205
edsl/jobs/buckets/BucketCollection.py +3 -44
edsl/jobs/buckets/TokenBucket.py +21 -53
edsl/jobs/interviews/Interview.py +408 -143
edsl/jobs/runners/JobsRunnerAsyncio.py +403 -88
edsl/jobs/runners/JobsRunnerStatus.py +165 -133
edsl/jobs/tasks/QuestionTaskCreator.py +19 -21
edsl/jobs/tasks/TaskHistory.py +18 -38
edsl/jobs/tasks/task_status_enum.py +2 -0
edsl/language_models/KeyLookup.py +30 -0
edsl/language_models/LanguageModel.py +236 -194
edsl/language_models/ModelList.py +19 -28
edsl/language_models/__init__.py +2 -1
edsl/language_models/registry.py +190 -0
edsl/language_models/repair.py +2 -2
edsl/language_models/unused/ReplicateBase.py +83 -0
edsl/language_models/utilities.py +4 -5
edsl/notebooks/Notebook.py +14 -19
edsl/prompts/Prompt.py +39 -29
edsl/questions/{answer_validator_mixin.py → AnswerValidatorMixin.py} +2 -47
edsl/questions/QuestionBase.py +214 -68
edsl/questions/{question_base_gen_mixin.py → QuestionBaseGenMixin.py} +50 -57
edsl/questions/QuestionBasePromptsMixin.py +3 -7
edsl/questions/QuestionBudget.py +1 -1
edsl/questions/QuestionCheckBox.py +3 -3
edsl/questions/QuestionExtract.py +7 -5
edsl/questions/QuestionFreeText.py +3 -2
edsl/questions/QuestionList.py +18 -10
edsl/questions/QuestionMultipleChoice.py +23 -67
edsl/questions/QuestionNumerical.py +4 -2
edsl/questions/QuestionRank.py +17 -7
edsl/questions/{response_validator_abc.py → ResponseValidatorABC.py} +26 -40
edsl/questions/SimpleAskMixin.py +3 -4
edsl/questions/__init__.py +1 -2
edsl/questions/derived/QuestionLinearScale.py +3 -6
edsl/questions/derived/QuestionTopK.py +1 -1
edsl/questions/descriptors.py +3 -17
edsl/questions/question_registry.py +1 -1
edsl/results/CSSParameterizer.py +1 -1
edsl/results/Dataset.py +7 -170
edsl/results/DatasetExportMixin.py +305 -168
edsl/results/DatasetTree.py +8 -28
edsl/results/Result.py +206 -298
edsl/results/Results.py +131 -149
edsl/results/ResultsDBMixin.py +238 -0
edsl/results/ResultsExportMixin.py +0 -2
edsl/results/{results_selector.py → Selector.py} +13 -23
edsl/results/TableDisplay.py +171 -98
edsl/results/__init__.py +1 -1
edsl/scenarios/FileStore.py +239 -150
edsl/scenarios/Scenario.py +193 -90
edsl/scenarios/ScenarioHtmlMixin.py +3 -4
edsl/scenarios/{scenario_join.py → ScenarioJoin.py} +6 -10
edsl/scenarios/ScenarioList.py +244 -415
edsl/scenarios/ScenarioListExportMixin.py +7 -0
edsl/scenarios/ScenarioListPdfMixin.py +37 -15
edsl/scenarios/__init__.py +2 -1
edsl/study/ObjectEntry.py +1 -1
edsl/study/SnapShot.py +1 -1
edsl/study/Study.py +12 -5
edsl/surveys/Rule.py +4 -5
edsl/surveys/RuleCollection.py +27 -25
edsl/surveys/Survey.py +791 -270
edsl/surveys/SurveyCSS.py +8 -20
edsl/surveys/{SurveyFlowVisualization.py → SurveyFlowVisualizationMixin.py} +9 -11
edsl/surveys/__init__.py +2 -4
edsl/surveys/descriptors.py +2 -6
edsl/surveys/instructions/ChangeInstruction.py +2 -1
edsl/surveys/instructions/Instruction.py +13 -4
edsl/surveys/instructions/InstructionCollection.py +6 -11
edsl/templates/error_reporting/interview_details.html +1 -1
edsl/templates/error_reporting/report.html +1 -1
edsl/tools/plotting.py +1 -1
edsl/utilities/utilities.py +23 -35
{edsl-0.1.39.dist-info → edsl-0.1.39.dev1.dist-info}/METADATA +10 -12
edsl-0.1.39.dev1.dist-info/RECORD +277 -0
{edsl-0.1.39.dist-info → edsl-0.1.39.dev1.dist-info}/WHEEL +1 -1
edsl/agents/QuestionInstructionPromptBuilder.py +0 -128
edsl/agents/QuestionTemplateReplacementsBuilder.py +0 -137
edsl/agents/question_option_processor.py +0 -172
edsl/coop/CoopFunctionsMixin.py +0 -15
edsl/coop/ExpectedParrotKeyHandler.py +0 -125
edsl/exceptions/inference_services.py +0 -5
edsl/inference_services/AvailableModelCacheHandler.py +0 -184
edsl/inference_services/AvailableModelFetcher.py +0 -215
edsl/inference_services/ServiceAvailability.py +0 -135
edsl/inference_services/data_structures.py +0 -134
edsl/jobs/AnswerQuestionFunctionConstructor.py +0 -223
edsl/jobs/FetchInvigilator.py +0 -47
edsl/jobs/InterviewTaskManager.py +0 -98
edsl/jobs/InterviewsConstructor.py +0 -50
edsl/jobs/JobsComponentConstructor.py +0 -189
edsl/jobs/JobsRemoteInferenceLogger.py +0 -239
edsl/jobs/RequestTokenEstimator.py +0 -30
edsl/jobs/async_interview_runner.py +0 -138
edsl/jobs/buckets/TokenBucketAPI.py +0 -211
edsl/jobs/buckets/TokenBucketClient.py +0 -191
edsl/jobs/check_survey_scenario_compatibility.py +0 -85
edsl/jobs/data_structures.py +0 -120
edsl/jobs/decorators.py +0 -35
edsl/jobs/jobs_status_enums.py +0 -9
edsl/jobs/loggers/HTMLTableJobLogger.py +0 -304
edsl/jobs/results_exceptions_handler.py +0 -98
edsl/language_models/ComputeCost.py +0 -63
edsl/language_models/PriceManager.py +0 -127
edsl/language_models/RawResponseHandler.py +0 -106
edsl/language_models/ServiceDataSources.py +0 -0
edsl/language_models/key_management/KeyLookup.py +0 -63
edsl/language_models/key_management/KeyLookupBuilder.py +0 -273
edsl/language_models/key_management/KeyLookupCollection.py +0 -38
edsl/language_models/key_management/__init__.py +0 -0
edsl/language_models/key_management/models.py +0 -131
edsl/language_models/model.py +0 -256
edsl/notebooks/NotebookToLaTeX.py +0 -142
edsl/questions/ExceptionExplainer.py +0 -77
edsl/questions/HTMLQuestion.py +0 -103
edsl/questions/QuestionMatrix.py +0 -265
edsl/questions/data_structures.py +0 -20
edsl/questions/loop_processor.py +0 -149
edsl/questions/response_validator_factory.py +0 -34
edsl/questions/templates/matrix/__init__.py +0 -1
edsl/questions/templates/matrix/answering_instructions.jinja +0 -5
edsl/questions/templates/matrix/question_presentation.jinja +0 -20
edsl/results/MarkdownToDocx.py +0 -122
edsl/results/MarkdownToPDF.py +0 -111
edsl/results/TextEditor.py +0 -50
edsl/results/file_exports.py +0 -252
edsl/results/smart_objects.py +0 -96
edsl/results/table_data_class.py +0 -12
edsl/results/table_renderers.py +0 -118
edsl/scenarios/ConstructDownloadLink.py +0 -109
edsl/scenarios/DocumentChunker.py +0 -102
edsl/scenarios/DocxScenario.py +0 -16
edsl/scenarios/PdfExtractor.py +0 -40
edsl/scenarios/directory_scanner.py +0 -96
edsl/scenarios/file_methods.py +0 -85
edsl/scenarios/handlers/__init__.py +0 -13
edsl/scenarios/handlers/csv.py +0 -49
edsl/scenarios/handlers/docx.py +0 -76
edsl/scenarios/handlers/html.py +0 -37
edsl/scenarios/handlers/json.py +0 -111
edsl/scenarios/handlers/latex.py +0 -5
edsl/scenarios/handlers/md.py +0 -51
edsl/scenarios/handlers/pdf.py +0 -68
edsl/scenarios/handlers/png.py +0 -39
edsl/scenarios/handlers/pptx.py +0 -105
edsl/scenarios/handlers/py.py +0 -294
edsl/scenarios/handlers/sql.py +0 -313
edsl/scenarios/handlers/sqlite.py +0 -149
edsl/scenarios/handlers/txt.py +0 -33
edsl/scenarios/scenario_selector.py +0 -156
edsl/surveys/ConstructDAG.py +0 -92
edsl/surveys/EditSurvey.py +0 -221
edsl/surveys/InstructionHandler.py +0 -100
edsl/surveys/MemoryManagement.py +0 -72
edsl/surveys/RuleManager.py +0 -172
edsl/surveys/Simulator.py +0 -75
edsl/surveys/SurveyToApp.py +0 -141
edsl/utilities/PrettyList.py +0 -56
edsl/utilities/is_notebook.py +0 -18
edsl/utilities/is_valid_variable_name.py +0 -11
edsl/utilities/remove_edsl_version.py +0 -24
edsl-0.1.39.dist-info/RECORD +0 -358
/edsl/questions/{register_questions_meta.py → RegisterQuestionsMeta.py} +0 -0
/edsl/results/{results_fetch_mixin.py → ResultsFetchMixin.py} +0 -0
/edsl/results/{results_tools_mixin.py → ResultsToolsMixin.py} +0 -0
{edsl-0.1.39.dist-info → edsl-0.1.39.dev1.dist-info}/LICENSE +0 -0

edsl/scenarios/Scenario.py CHANGED Viewed

@@ -2,65 +2,54 @@
 from __future__ import annotations
 import copy
+import hashlib
 import os
 import json
 from collections import UserDict
-from typing import Union, List, Optional, TYPE_CHECKING, Collection
+from typing import Union, List, Optional, Generator
 from uuid import uuid4
 from edsl.Base import Base
 from edsl.scenarios.ScenarioHtmlMixin import ScenarioHtmlMixin
-from edsl.utilities.remove_edsl_version import remove_edsl_version
+from edsl.utilities.decorators import add_edsl_version, remove_edsl_version
 from edsl.exceptions.scenarios import ScenarioError
-if TYPE_CHECKING:
-    from edsl.scenarios.ScenarioList import ScenarioList
-    from edsl.results.Dataset import Dataset
 class DisplayJSON:
-    """Display a dictionary as JSON."""
-    def __init__(self, input_dict: dict):
-        self.text = json.dumps(input_dict, indent=4)
+    def __init__(self, dict):
+        self.text = json.dumps(dict, indent=4)
     def __repr__(self):
         return self.text
 class DisplayYAML:
-    """Display a dictionary as YAML."""
-    def __init__(self, input_dict: dict):
+    def __init__(self, dict):
         import yaml
-        self.text = yaml.dump(input_dict)
+        self.text = yaml.dump(dict)
     def __repr__(self):
         return self.text
 class Scenario(Base, UserDict, ScenarioHtmlMixin):
-    """A Scenario is a dictionary of keys/values that can be used to parameterize questions."""
+    """A Scenario is a dictionary of keys/values.
+    They can be used parameterize EDSL questions."""
     __documentation__ = "https://docs.expectedparrot.com/en/latest/scenarios.html"
-    def __init__(self, data: Optional[dict] = None, name: Optional[str] = None):
+    def __init__(self, data: Union[dict, None] = None, name: str = None):
         """Initialize a new Scenario.
-        :param data: A dictionary of keys/values for parameterizing questions.
-        :param name: The name of the scenario.
-        """
+        # :param data: A dictionary of keys/values for parameterizing questions.
+        #"""
         if not isinstance(data, dict) and data is not None:
-            try:
-                data = dict(data)
-            except Exception as e:
-                raise ScenarioError(
-                    f"You must pass in a dictionary to initialize a Scenario. You passed in {data}",
-                    "Exception message:" + str(e),
-                )
+            raise EDSLScenarioError(
+                "You must pass in a dictionary to initialize a Scenario."
+            )
-        super().__init__()
         self.data = data if data is not None else {}
         self.name = name
@@ -70,6 +59,7 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
         :param n: The number of times to replicate the scenario.
         Example:
         >>> s = Scenario({"food": "wood chips"})
         >>> s.replicate(2)
         ScenarioList([Scenario({'food': 'wood chips'}), Scenario({'food': 'wood chips'})])
@@ -92,13 +82,13 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
                     return True
         return False
-    def _convert_jinja_braces(
-        self, replacement_left: str = "<<", replacement_right: str = ">>"
+    def convert_jinja_braces(
+        self, replacement_left="<<", replacement_right=">>"
     ) -> Scenario:
         """Convert Jinja braces to some other character.
         >>> s = Scenario({"food": "I love {{wood chips}}"})
-        >>> s._convert_jinja_braces()
+        >>> s.convert_jinja_braces()
         Scenario({'food': 'I love <<wood chips>>'})
         """
@@ -112,7 +102,7 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
                 new_scenario[key] = value
         return new_scenario
-    def __add__(self, other_scenario: Scenario) -> Scenario:
+    def __add__(self, other_scenario: "Scenario") -> "Scenario":
         """Combine two scenarios by taking the union of their keys
         If the other scenario is None, then just return self.
@@ -137,14 +127,11 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
             return s
     def rename(
-        self,
-        old_name_or_replacement_dict: Union[str, dict[str, str]],
-        new_name: Optional[str] = None,
-    ) -> Scenario:
+        self, old_name_or_replacement_dict: dict, new_name: Optional[str] = None
+    ) -> "Scenario":
         """Rename the keys of a scenario.
-        :param old_name_or_replacement_dict: A dictionary of old keys to new keys *OR* a string of the old key.
-        :param new_name: The new name of the key.
+        :param replacement_dict: A dictionary of old keys to new keys.
         Example:
@@ -169,26 +156,13 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
                 new_scenario[key] = value
         return new_scenario
-    def new_column_names(self, new_names: List[str]) -> Scenario:
-        """Rename the keys of a scenario.
-        >>> s = Scenario({"food": "wood chips"})
-        >>> s.new_column_names(["food_preference"])
-        Scenario({'food_preference': 'wood chips'})
-        """
-        try:
-            assert len(new_names) == len(self.keys())
-        except AssertionError:
-            print("The number of new names must match the number of keys.")
-        new_scenario = Scenario()
-        for new_names, value in zip(new_names, self.values()):
-            new_scenario[new_names] = value
-        return new_scenario
     def table(self, tablefmt: str = "grid") -> str:
-        """Display a scenario as a table."""
-        return self.to_dataset().table(tablefmt=tablefmt)
+        from edsl.results.Dataset import Dataset
+        keys = [key for key, value in self.items()]
+        values = [value for key, value in self.items()]
+        d = Dataset([{"key": keys}, {"value": values}])
+        return d.table(tablefmt=tablefmt)
     def json(self):
         return DisplayJSON(self.to_dict(add_edsl_version=False))
@@ -198,7 +172,7 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
         return DisplayYAML(self.to_dict(add_edsl_version=False))
-    def to_dict(self, add_edsl_version: bool = True) -> dict:
+    def to_dict(self, add_edsl_version=True) -> dict:
         """Convert a scenario to a dictionary.
         Example:
@@ -226,7 +200,8 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
         return d
     def __hash__(self) -> int:
-        """Return a hash of the scenario.
+        """
+        Return a hash of the scenario.
         Example:
@@ -238,23 +213,44 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
         return dict_hash(self.to_dict(add_edsl_version=False))
+    def print(self):
+        from rich import print_json
+        import json
+        print_json(json.dumps(self.to_dict()))
     def __repr__(self):
         return "Scenario(" + repr(self.data) + ")"
     def to_dataset(self) -> "Dataset":
-        """Convert a scenario to a dataset.
-        >>> s = Scenario({"food": "wood chips"})
-        >>> s.to_dataset()
-        Dataset([{'key': ['food']}, {'value': ['wood chips']}])
-        """
+        # d = Dataset([{'a.b':[1,2,3,4]}])
         from edsl.results.Dataset import Dataset
-        keys = list(self.keys())
-        values = list(self.values())
+        keys = [key for key, value in self.items()]
+        values = [value for key, value in self.items()]
         return Dataset([{"key": keys}, {"value": values}])
-    def select(self, list_of_keys: Collection[str]) -> "Scenario":
+    def _repr_html_(self):
+        from tabulate import tabulate
+        import reprlib
+        d = self.to_dict(add_edsl_version=False)
+        # return self.to_dataset()
+        r = reprlib.Repr()
+        r.maxstring = 70
+        data = [[k, r.repr(v)] for k, v in d.items()]
+        from tabulate import tabulate
+        if hasattr(self, "__documentation__"):
+            footer = f"<a href='{self.__documentation__}'>(docs)</a></p>"
+        else:
+            footer = ""
+        table = str(tabulate(data, headers=["keys", "values"], tablefmt="html"))
+        return f"<pre>{table}</pre>" + footer
+    def select(self, list_of_keys: List[str]) -> "Scenario":
         """Select a subset of keys from a scenario.
         :param list_of_keys: The keys to select.
@@ -270,7 +266,7 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
             new_scenario[key] = self[key]
         return new_scenario
-    def drop(self, list_of_keys: Collection[str]) -> "Scenario":
+    def drop(self, list_of_keys: List[str]) -> "Scenario":
         """Drop a subset of keys from a scenario.
         :param list_of_keys: The keys to drop.
@@ -324,7 +320,7 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
         ...     _ = f.flush()
         ...     s = Scenario.from_file(f.name, "file")
         >>> s
-        Scenario({'file': FileStore(path='...', ...)})
+        Scenario({'file': FileStore(path='...')})
         """
         from edsl.scenarios.FileStore import FileStore
@@ -355,10 +351,35 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
         return cls.from_file(image_path, image_name)
     @classmethod
-    def from_pdf(cls, pdf_path: str):
-        from edsl.scenarios.PdfExtractor import PdfExtractor
+    def from_pdf(cls, pdf_path):
+        # Ensure the file exists
+        import fitz
+        if not os.path.exists(pdf_path):
+            raise FileNotFoundError(f"The file {pdf_path} does not exist.")
+        # Open the PDF file
+        document = fitz.open(pdf_path)
+        # Get the filename from the path
+        filename = os.path.basename(pdf_path)
-        return PdfExtractor(pdf_path, cls).get_object()
+        # Iterate through each page and extract text
+        text = ""
+        for page_num in range(len(document)):
+            page = document.load_page(page_num)
+            blocks = page.get_text("blocks")  # Extract text blocks
+            # Sort blocks by their vertical position (y0) to maintain reading order
+            blocks.sort(key=lambda b: (b[1], b[0]))  # Sort by y0 first, then x0
+            # Combine the text blocks in order
+            for block in blocks:
+                text += block[4] + "\n"
+        # Create a dictionary for the combined text
+        page_info = {"filename": filename, "text": text}
+        return Scenario(page_info)
     @classmethod
     def from_docx(cls, docx_path: str) -> "Scenario":
@@ -378,9 +399,52 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
         Scenario({'file_path': 'test.docx', 'text': 'EDSL Survey\\nThis is a test.'})
         >>> import os; os.remove("test.docx")
         """
-        from edsl.scenarios.DocxScenario import DocxScenario
+        from docx import Document
+        doc = Document(docx_path)
-        return Scenario(DocxScenario(docx_path).get_scenario_dict())
+        # Extract all text
+        full_text = []
+        for para in doc.paragraphs:
+            full_text.append(para.text)
+        # Join the text from all paragraphs
+        text = "\n".join(full_text)
+        return Scenario({"file_path": docx_path, "text": text})
+    @staticmethod
+    def _line_chunks(text, num_lines: int) -> Generator[str, None, None]:
+        """Split a text into chunks of a given size.
+        :param text: The text to split.
+        :param num_lines: The number of lines in each chunk.
+        Example:
+        >>> list(Scenario._line_chunks("This is a test.\\nThis is a test. This is a test.", 1))
+        ['This is a test.', 'This is a test. This is a test.']
+        """
+        lines = text.split("\n")
+        for i in range(0, len(lines), num_lines):
+            chunk = "\n".join(lines[i : i + num_lines])
+            yield chunk
+    @staticmethod
+    def _word_chunks(text, num_words: int) -> Generator[str, None, None]:
+        """Split a text into chunks of a given size.
+        :param text: The text to split.
+        :param num_words: The number of words in each chunk.
+        Example:
+        >>> list(Scenario._word_chunks("This is a test.", 2))
+        ['This is', 'a test.']
+        """
+        words = text.split()
+        for i in range(0, len(words), num_words):
+            chunk = " ".join(words[i : i + num_words])
+            yield chunk
     def chunk(
         self,
@@ -431,11 +495,36 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
         ...
         ValueError: You must specify either num_words or num_lines, but not both.
         """
-        from edsl.scenarios.DocumentChunker import DocumentChunker
+        from edsl.scenarios.ScenarioList import ScenarioList
-        return DocumentChunker(self).chunk(
-            field, num_words, num_lines, include_original, hash_original
-        )
+        if num_words is not None:
+            chunks = list(self._word_chunks(self[field], num_words))
+        if num_lines is not None:
+            chunks = list(self._line_chunks(self[field], num_lines))
+        if num_words is None and num_lines is None:
+            raise ValueError("You must specify either num_words or num_lines.")
+        if num_words is not None and num_lines is not None:
+            raise ValueError(
+                "You must specify either num_words or num_lines, but not both."
+            )
+        scenarios = []
+        for i, chunk in enumerate(chunks):
+            new_scenario = copy.deepcopy(self)
+            new_scenario[field] = chunk
+            new_scenario[field + "_chunk"] = i
+            if include_original:
+                if hash_original:
+                    new_scenario[field + "_original"] = hashlib.md5(
+                        self[field].encode()
+                    ).hexdigest()
+                else:
+                    new_scenario[field + "_original"] = self[field]
+            scenarios.append(new_scenario)
+        return ScenarioList(scenarios)
     @classmethod
     @remove_edsl_version
@@ -458,30 +547,44 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
         return cls(d)
     def _table(self) -> tuple[dict, list]:
-        """Prepare generic table data.
-        >>> s = Scenario({"food": "wood chips"})
-        >>> s._table()
-        ([{'Attribute': 'data', 'Value': "{'food': 'wood chips'}"}, {'Attribute': 'name', 'Value': 'None'}], ['Attribute', 'Value'])
-        """
+        """Prepare generic table data."""
         table_data = []
         for attr_name, attr_value in self.__dict__.items():
             table_data.append({"Attribute": attr_name, "Value": repr(attr_value)})
         column_names = ["Attribute", "Value"]
         return table_data, column_names
+    def rich_print(self) -> "Table":
+        """Display an object as a rich table."""
+        from rich.table import Table
+        table_data, column_names = self._table()
+        table = Table(title=f"{self.__class__.__name__} Attributes")
+        for column in column_names:
+            table.add_column(column, style="bold")
+        for row in table_data:
+            row_data = [row[column] for column in column_names]
+            table.add_row(*row_data)
+        return table
     @classmethod
-    def example(cls, randomize: bool = False) -> Scenario:
+    def example(cls, randomize: bool = False, has_image=False) -> Scenario:
         """
         Returns an example Scenario instance.
         :param randomize: If True, adds a random string to the value of the example key.
         """
-        addition = "" if not randomize else str(uuid4())
-        return cls(
-            {
-                "persona": f"A reseacher studying whether LLMs can be used to generate surveys.{addition}",
-            }
-        )
+        if not has_image:
+            addition = "" if not randomize else str(uuid4())
+            return cls(
+                {
+                    "persona": f"A reseacher studying whether LLMs can be used to generate surveys.{addition}",
+                }
+            )
+        else:
+            return cls.from_image(cls.example_image())
     def code(self) -> List[str]:
         """Return the code for the scenario."""

edsl/scenarios/ScenarioHtmlMixin.py CHANGED Viewed

@@ -1,4 +1,7 @@
+import requests
 from typing import Optional
+from requests.adapters import HTTPAdapter
+from requests.packages.urllib3.util.retry import Retry
 class ScenarioHtmlMixin:
@@ -19,10 +22,6 @@ class ScenarioHtmlMixin:
     def fetch_html(url):
         # Define the user-agent to mimic a browser
-        import requests
-        from requests.adapters import HTTPAdapter
-        from requests.packages.urllib3.util.retry import Retry
         headers = {
             "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
         }

edsl/scenarios/{scenario_join.py → ScenarioJoin.py} RENAMED Viewed

@@ -1,9 +1,9 @@
 from __future__ import annotations
 from typing import Union, TYPE_CHECKING
-if TYPE_CHECKING:
-    from edsl.scenarios.ScenarioList import ScenarioList
-    from edsl.scenarios.Scenario import Scenario
+# if TYPE_CHECKING:
+from edsl.scenarios.ScenarioList import ScenarioList
+from edsl.scenarios.Scenario import Scenario
 class ScenarioJoin:
@@ -23,7 +23,7 @@ class ScenarioJoin:
         self.left = left
         self.right = right
-    def left_join(self, by: Union[str, list[str]]) -> "ScenarioList":
+    def left_join(self, by: Union[str, list[str]]) -> ScenarioList:
         """Perform a left join between the two ScenarioLists.
         Args:
@@ -35,8 +35,6 @@ class ScenarioJoin:
         Raises:
             ValueError: If by is empty or if any join keys don't exist in both ScenarioLists
         """
-        from edsl.scenarios.ScenarioList import ScenarioList
         self._validate_join_keys(by)
         by_keys = [by] if isinstance(by, str) else by
@@ -88,8 +86,6 @@ class ScenarioJoin:
         self, by_keys: list[str], other_dict: dict, all_keys: set
     ) -> list[Scenario]:
         """Create the joined scenarios."""
-        from edsl.scenarios.Scenario import Scenario
         new_scenarios = []
         for scenario in self.left:
@@ -109,8 +105,8 @@ class ScenarioJoin:
     def _handle_matching_scenario(
         self,
         new_scenario: dict,
-        left_scenario: "Scenario",
-        right_scenario: "Scenario",
+        left_scenario: Scenario,
+        right_scenario: Scenario,
         by_keys: list[str],
     ) -> None:
         """Handle merging of matching scenarios and conflict warnings."""

edsl 0.1.39__py3-none-any.whl → 0.1.39.dev1__py3-none-any.whl

edsl 0.1.39__py3-none-any.whl → 0.1.39.dev1__py3-none-any.whl