PyPI - edsl - Versions diffs - 0.1.27.dev2__py3-none-any.whl → 0.1.28__py3-none-any.whl - Mend

edsl 0.1.27.dev2__py3-none-any.whl → 0.1.28__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (88) hide show

edsl/Base.py +99 -22
edsl/BaseDiff.py +260 -0
edsl/__init__.py +4 -0
edsl/__version__.py +1 -1
edsl/agents/Agent.py +26 -5
edsl/agents/AgentList.py +62 -7
edsl/agents/Invigilator.py +4 -9
edsl/agents/InvigilatorBase.py +5 -5
edsl/agents/descriptors.py +3 -1
edsl/conjure/AgentConstructionMixin.py +152 -0
edsl/conjure/Conjure.py +56 -0
edsl/conjure/InputData.py +628 -0
edsl/conjure/InputDataCSV.py +48 -0
edsl/conjure/InputDataMixinQuestionStats.py +182 -0
edsl/conjure/InputDataPyRead.py +91 -0
edsl/conjure/InputDataSPSS.py +8 -0
edsl/conjure/InputDataStata.py +8 -0
edsl/conjure/QuestionOptionMixin.py +76 -0
edsl/conjure/QuestionTypeMixin.py +23 -0
edsl/conjure/RawQuestion.py +65 -0
edsl/conjure/SurveyResponses.py +7 -0
edsl/conjure/__init__.py +9 -4
edsl/conjure/examples/placeholder.txt +0 -0
edsl/conjure/naming_utilities.py +263 -0
edsl/conjure/utilities.py +165 -28
edsl/conversation/Conversation.py +238 -0
edsl/conversation/car_buying.py +58 -0
edsl/conversation/mug_negotiation.py +81 -0
edsl/conversation/next_speaker_utilities.py +93 -0
edsl/coop/coop.py +191 -12
edsl/coop/utils.py +20 -2
edsl/data/Cache.py +55 -17
edsl/data/CacheHandler.py +10 -9
edsl/inference_services/AnthropicService.py +1 -0
edsl/inference_services/DeepInfraService.py +20 -13
edsl/inference_services/GoogleService.py +7 -1
edsl/inference_services/InferenceServicesCollection.py +33 -7
edsl/inference_services/OpenAIService.py +17 -10
edsl/inference_services/models_available_cache.py +69 -0
edsl/inference_services/rate_limits_cache.py +25 -0
edsl/inference_services/write_available.py +10 -0
edsl/jobs/Jobs.py +240 -36
edsl/jobs/buckets/BucketCollection.py +9 -3
edsl/jobs/interviews/Interview.py +4 -1
edsl/jobs/interviews/InterviewTaskBuildingMixin.py +24 -10
edsl/jobs/interviews/retry_management.py +4 -4
edsl/jobs/runners/JobsRunnerAsyncio.py +87 -45
edsl/jobs/runners/JobsRunnerStatusData.py +3 -3
edsl/jobs/tasks/QuestionTaskCreator.py +4 -2
edsl/language_models/LanguageModel.py +37 -44
edsl/language_models/ModelList.py +96 -0
edsl/language_models/registry.py +14 -0
edsl/language_models/repair.py +95 -24
edsl/notebooks/Notebook.py +119 -31
edsl/questions/QuestionBase.py +109 -12
edsl/questions/descriptors.py +5 -2
edsl/questions/question_registry.py +7 -0
edsl/results/Result.py +20 -8
edsl/results/Results.py +85 -11
edsl/results/ResultsDBMixin.py +3 -6
edsl/results/ResultsExportMixin.py +47 -16
edsl/results/ResultsToolsMixin.py +5 -5
edsl/scenarios/Scenario.py +59 -5
edsl/scenarios/ScenarioList.py +97 -40
edsl/study/ObjectEntry.py +97 -0
edsl/study/ProofOfWork.py +110 -0
edsl/study/SnapShot.py +77 -0
edsl/study/Study.py +491 -0
edsl/study/__init__.py +2 -0
edsl/surveys/Survey.py +79 -31
edsl/surveys/SurveyExportMixin.py +21 -3
edsl/utilities/__init__.py +1 -0
edsl/utilities/gcp_bucket/__init__.py +0 -0
edsl/utilities/gcp_bucket/cloud_storage.py +96 -0
edsl/utilities/gcp_bucket/simple_example.py +9 -0
edsl/utilities/interface.py +24 -28
edsl/utilities/repair_functions.py +28 -0
edsl/utilities/utilities.py +57 -2
{edsl-0.1.27.dev2.dist-info → edsl-0.1.28.dist-info}/METADATA +43 -17
{edsl-0.1.27.dev2.dist-info → edsl-0.1.28.dist-info}/RECORD +83 -55
edsl-0.1.28.dist-info/entry_points.txt +3 -0
edsl/conjure/RawResponseColumn.py +0 -327
edsl/conjure/SurveyBuilder.py +0 -308
edsl/conjure/SurveyBuilderCSV.py +0 -78
edsl/conjure/SurveyBuilderSPSS.py +0 -118
edsl/data/RemoteDict.py +0 -103
{edsl-0.1.27.dev2.dist-info → edsl-0.1.28.dist-info}/LICENSE +0 -0
{edsl-0.1.27.dev2.dist-info → edsl-0.1.28.dist-info}/WHEEL +0 -0

edsl/conjure/naming_utilities.py ADDED Viewed

@@ -0,0 +1,263 @@
+import re
+import keyword
+# English stop words (function words and contraction fragments) that
+# sanitize_string filters out before joining the remaining words.
+stop_words = {
+    "into", "mustn't", "there", "you'll", "don",
+    "have", "at", "if", "on", "some",
+    "with", "in", "can", "mightn", "off",
+    "few", "not", "d", "hadn", "shan't",
+    "t", "re", "where", "s", "won't",
+    "mustn", "wasn't", "didn't", "has", "same",
+    "too", "will", "you've", "all", "haven't",
+    "isn't", "over", "of", "about", "its",
+    "being", "it", "her", "should", "himself",
+    "wasn", "out", "theirs", "aren", "that",
+    "our", "shouldn't", "you'd", "such", "above",
+    "my", "the", "any", "been", "as",
+    "very", "herself", "o", "weren", "until",
+    "their", "shouldn", "up", "wouldn", "couldn't",
+    "hasn't", "no", "than", "hadn't", "had",
+    "you", "here", "yourself", "yourselves", "during",
+    "ain", "once", "aren't", "what", "so",
+    "hers", "that'll", "other", "ours", "yours",
+    "nor", "him", "doesn", "doesn't", "he",
+    "them", "for", "ll", "isn", "this",
+    "or", "who", "only", "itself", "they",
+    "between", "against", "under", "me", "now",
+    "mightn't", "those", "needn't", "these", "when",
+    "before", "his", "she's", "having", "be",
+    "don't", "haven", "won", "while", "both",
+    "didn", "by", "ourselves", "m", "your",
+    "then", "myself", "we", "it's", "should've",
+    "through", "why", "from", "and", "hasn",
+    "more", "how", "ve", "most", "because",
+    "did", "y", "i", "an", "but",
+    "whom", "below", "further", "am", "which",
+    "just", "ma", "you're", "couldn", "do",
+    "shan", "own", "again", "are", "weren't",
+    "down", "is", "were", "each", "needn",
+    "themselves", "she", "after", "does", "wouldn't",
+    "to", "a", "was", "doing",
+}
+def sanitize_string(input_string, max_length=35):
+    """Return a sanitized, lower-case version of the input string that can be used as a variable name.
+    Non-word characters become separators, stop words are dropped, the remaining
+    words are joined with underscores, and the result is shortened to at most
+    ``max_length`` characters. Python keywords get a ``_modified`` suffix.
+    >>> candidate_names = ["How are you doing this morning, Dave? What is your favorite kind of coffee?", "class", "def", "here_is_some_text"]
+    >>> [sanitize_string(name) for name in candidate_names]
+    ['morning_dave_favorite_kind_coffee', 'class_modified', 'def_modified', 'here_is_some_text']
+    >>> sanitize_string("Class")
+    'class_modified'
+    """
+    # Replace every run of non-word characters with a space and split into words
+    words = re.sub(r"\W+", " ", input_string).split()
+    # Remove stopwords (the list is hard-coded at module level, so nltk is not required)
+    important_words = [word for word in words if word.lower() not in stop_words]
+    # Join words with underscores
+    sanitized_string = "_".join(important_words)
+    # Ensure the length is at most max_length characters
+    if len(sanitized_string) > max_length:
+        # Cut at the limit, then drop the last (possibly partial) word
+        words = sanitized_string[:max_length].split("_")
+        if len(words) == 1:
+            # A single long word cannot be shortened by dropping words; keep the cut prefix
+            sanitized_string = words[0]
+        else:
+            sanitized_string = "_".join(words[:-1])
+    # Remove leading and trailing underscores
+    sanitized_string = sanitized_string.strip("_")
+    result = sanitized_string.lower()
+    # Check both spellings: lower-casing can turn a non-keyword ("Class") into a
+    # keyword ("class"), while "None"/"True"/"False" are keywords only when capitalised.
+    if keyword.iskeyword(sanitized_string) or keyword.iskeyword(result):
+        result += "_modified"
+    return result
+# Example usage
+# input_string = "This is a sample variable-name@123 for testing"
+# sanitized_string = sanitize_string(input_string)
+# print(sanitized_string)  # Output might be: sample_variable_name_123
+# if __name__ == "__main__":
+#     candidate_names = [
+#         "How are you doing this morning, Dave? What is your favorite kind of coffee?",
+#         "class",
+#         "def",
+#         "here_is_some_text",
+#     ]
+#     for name in candidate_names:
+#         print(f"Original: {name}")
+#         print(f"Sanitized: {sanitize_string(name)}")
+#         print()
+# Run this module's doctests when the file is executed directly as a script.
+if __name__ == "__main__":
+    # NOTE(review): InputDataABC is not referenced in this block; presumably a leftover import -- confirm before removing.
+    from edsl.conjure.InputData import InputDataABC
+    import doctest
+    # ELLIPSIS lets "..." in expected doctest output match arbitrary text
+    doctest.testmod(optionflags=doctest.ELLIPSIS)

edsl/conjure/utilities.py CHANGED Viewed

@@ -1,9 +1,59 @@
+import requests
 import subprocess
 from io import StringIO
+import os
 import pandas as pd
+class ValidFilename:
+    """A descriptor that only accepts the path of an existing file.
+    Assigning a value that is not a string, or a path for which
+    os.path.exists() is false, raises ValueError. The accepted value is stored
+    in the owning instance's __dict__ under the attribute's own name.
+    >>> class Holder:
+    ...     filename = ValidFilename()
+    >>> isinstance(Holder.filename, ValidFilename)
+    True
+    >>> Holder().filename is None
+    True
+    """
+    def __set_name__(self, owner, name):
+        # Remember the attribute name this descriptor was bound to on the owner class
+        self.name = name
+    def __get__(self, instance, owner):
+        # Class-level access (Owner.attr) passes instance=None; return the
+        # descriptor itself instead of failing on None.__dict__
+        if instance is None:
+            return self
+        # Unset attributes read as None rather than raising AttributeError
+        return instance.__dict__.get(self.name, None)
+    def __set__(self, instance, value):
+        if not isinstance(value, str):
+            raise ValueError(
+                f"The filename must be a string, not {type(value).__name__}"
+            )
+        if not os.path.exists(value):
+            raise ValueError(f"The file '{value}' does not exist.")
+        instance.__dict__[self.name] = value
+class DummyClassToTestDescriptor:
+    """Minimal holder class whose doctests exercise the ValidFilename descriptor.
+    >>> d = DummyClassToTestDescriptor(1)
+    Traceback (most recent call last):
+    ...
+    ValueError: The filename must be a string, not int
+    >>> d = DummyClassToTestDescriptor("hello")
+    Traceback (most recent call last):
+    ...
+    ValueError: The file 'hello' does not exist.
+    """
+    filename = ValidFilename()
+    def __init__(self, filename):
+        # The assignment is routed through the descriptor, which validates the value
+        setattr(self, "filename", filename)
+    def __repr__(self):
+        return "DummyClassToTestDescriptor({})".format(self.filename)
 class Missing:
     def __repr__(self):
         return "Missing()"
@@ -16,6 +66,18 @@ class Missing:
 def convert_value(x):
+    """Takes a string and tries to convert it.
+    >>> convert_value('1')
+    1
+    >>> convert_value('1.2')
+    1.2
+    >>> convert_value("how are you?")
+    'how are you?'
+    >>> convert_value("")
+    'missing'
+    """
     try:
         float_val = float(x)
         if float_val.is_integer():
@@ -29,36 +91,111 @@ def convert_value(x):
             return str(x)
-class RCodeSnippet:
-    def __init__(self, r_code):
-        self.r_code = r_code
+# class RCodeSnippet:
+#     def __init__(self, r_code):
+#         self.r_code = r_code
-    def __call__(self, data_file_name):
-        return self.run_R_stdin(self.r_code, data_file_name)
+#     def __call__(self, data_file_name):
+#         return self.run_R_stdin(self.r_code, data_file_name)
-    def __add__(self, other):
-        return RCodeSnippet(self.r_code + other.r_code)
+#     def __add__(self, other):
+#         return RCodeSnippet(self.r_code + other.r_code)
-    def write_to_file(self, filename) -> None:
-        """Writes the R code to a file; useful for debugging."""
-        if filename.endswith(".R") or filename.endswith(".r"):
-            pass
-        else:
-            filename += ".R"
+#     def write_to_file(self, filename) -> None:
+#         """Writes the R code to a file; useful for debugging."""
+#         if filename.endswith(".R") or filename.endswith(".r"):
+#             pass
+#         else:
+#             filename += ".R"
-        with open(filename, "w") as f:
-            f.write(self.r_code)
+#         with open(filename, "w") as f:
+#             f.write(self.r_code)
-    @staticmethod
-    def run_R_stdin(r_code, data_file_name, transform_func=lambda x: pd.read_csv(x)):
-        """Runs an R script and returns the stdout as a string."""
-        cmd = ["Rscript", "-e", r_code, data_file_name]
-        process = subprocess.Popen(
-            cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True
+#     @staticmethod
+#     def run_R_stdin(r_code, data_file_name, transform_func=lambda x: pd.read_csv(x)):
+#         """Runs an R script and returns the stdout as a string."""
+#         cmd = ["Rscript", "-e", r_code, data_file_name]
+#         process = subprocess.Popen(
+#             cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True
+#         )
+#         stdout, stderr = process.communicate()
+#         if stderr != "":
+#             print("Warning: stderr is not empty.")
+#             print(f"Problem running: {r_code}")
+#             raise Exception(stderr)
+#         return transform_func(StringIO(stdout))
+def infer_question_type(question_text, responses, sample_size=15):
+    """Infer the question type of a survey question from its text and a sample of responses.
+    Builds an edsl QuestionMultipleChoice whose options are the candidate
+    question-type names, runs it as a one-question survey with the question
+    text, the first ``sample_size`` responses and the total response count as
+    template values, and returns the first selected "infer_question_type" value.
+    Parameters:
+    question_text (str): The text of the survey question being classified.
+    responses: Sliceable, sized collection of observed responses (presumably a list -- confirm against callers).
+    sample_size (int): How many leading responses to include in the prompt.
+    """
+    from edsl.questions import QuestionMultipleChoice
+    q = QuestionMultipleChoice(
+        question_text="""We have a survey question and we are trying to infer its type.
+                        The question text is: '{{question_text}}'.
+                        The first {{ sample_size }} responses are: '{{responses}}'.
+                        There are {{ total }} responses in total.
+                        If a response is a comma-separated list, it is likely a checkbox question.
+                        """,
+        question_name="infer_question_type",
+        question_options=[
+            "budget",
+            "checkbox",
+            "extract",
+            "free_text",
+            "likert_five",
+            "linear_scale",
+            "list",
+            "multiple_choice",
+            "numerical",
+            "rank",
+            "top_k",
+            "yes_no",
+        ],
+    )
+    # Keyword names must match the template placeholders above
+    # (question_text, sample_size, total, responses)
+    response = (
+        q.to_survey()(
+            question_text=question_text,
+            sample_size=sample_size,
+            total=len(responses),
+            responses=responses[:sample_size],
         )
-        stdout, stderr = process.communicate()
-        if stderr != "":
-            print("Warning: stderr is not empty.")
-            print(f"Problem running: {r_code}")
-            raise Exception(stderr)
-        return transform_func(StringIO(stdout))
+        .select("infer_question_type")
+        .first()
+    )
+    return response
+def download_file(url, filename, timeout=30):
+    """
+    Downloads a file from a given URL and saves it to the specified filename.
+    Parameters:
+    url (str): The URL of the file to download.
+    filename (str): The name of the file to save the downloaded content.
+    timeout (float or tuple): Seconds to wait for the server, passed to requests.get. Defaults to 30.
+    Returns:
+    str or None: The path to the saved file, or None if the response status code is not 200.
+    """
+    # Browser-like User-Agent sent with the request
+    headers = {
+        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
+    }
+    # Sending the GET request; without a timeout requests can wait forever on an unresponsive server
+    response = requests.get(url, headers=headers, timeout=timeout)
+    # Checking if the request was successful
+    if response.status_code == 200:
+        # Writing the content to the specified file
+        with open(filename, "wb") as file:
+            file.write(response.content)
+        print(f"File downloaded successfully and saved to {filename}")
+        return filename
+    else:
+        print(f"Failed to download file: {response.status_code}")
+        return None
+# Run this module's doctests when the file is executed directly as a script
+if __name__ == "__main__":
+    import doctest
+    # ELLIPSIS lets "..." in expected doctest output match arbitrary text
+    doctest.testmod(optionflags=doctest.ELLIPSIS)

edsl 0.1.27.dev2__py3-none-any.whl → 0.1.28__py3-none-any.whl

edsl 0.1.27.dev2__py3-none-any.whl → 0.1.28__py3-none-any.whl