PyPI - edsl - Versions diffs - 0.1.50__py3-none-any.whl → 0.1.51__py3-none-any.whl - Mend

edsl 0.1.50__py3-none-any.whl → 0.1.51__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (109)

edsl/__version__.py +1 -1
edsl/base/base_exception.py +2 -2
edsl/buckets/bucket_collection.py +1 -1
edsl/buckets/exceptions.py +32 -0
edsl/buckets/token_bucket_api.py +26 -10
edsl/caching/cache.py +5 -2
edsl/caching/remote_cache_sync.py +5 -5
edsl/caching/sql_dict.py +12 -11
edsl/config/__init__.py +1 -1
edsl/config/config_class.py +4 -2
edsl/conversation/Conversation.py +7 -4
edsl/conversation/car_buying.py +1 -3
edsl/conversation/mug_negotiation.py +2 -6
edsl/coop/__init__.py +11 -8
edsl/coop/coop.py +13 -13
edsl/coop/coop_functions.py +1 -1
edsl/coop/ep_key_handling.py +1 -1
edsl/coop/price_fetcher.py +2 -2
edsl/coop/utils.py +2 -2
edsl/dataset/dataset.py +144 -63
edsl/dataset/dataset_operations_mixin.py +14 -6
edsl/dataset/dataset_tree.py +3 -3
edsl/dataset/display/table_renderers.py +6 -3
edsl/dataset/file_exports.py +4 -4
edsl/dataset/r/ggplot.py +3 -3
edsl/inference_services/available_model_fetcher.py +2 -2
edsl/inference_services/data_structures.py +5 -5
edsl/inference_services/inference_service_abc.py +1 -1
edsl/inference_services/inference_services_collection.py +1 -1
edsl/inference_services/service_availability.py +3 -3
edsl/inference_services/services/azure_ai.py +3 -3
edsl/inference_services/services/google_service.py +1 -1
edsl/inference_services/services/test_service.py +1 -1
edsl/instructions/change_instruction.py +5 -4
edsl/instructions/instruction.py +1 -0
edsl/instructions/instruction_collection.py +5 -4
edsl/instructions/instruction_handler.py +10 -8
edsl/interviews/exception_tracking.py +1 -1
edsl/interviews/interview.py +1 -1
edsl/interviews/interview_status_dictionary.py +1 -1
edsl/interviews/interview_task_manager.py +2 -2
edsl/interviews/request_token_estimator.py +3 -2
edsl/interviews/statistics.py +2 -2
edsl/invigilators/invigilators.py +2 -2
edsl/jobs/__init__.py +39 -2
edsl/jobs/async_interview_runner.py +1 -1
edsl/jobs/check_survey_scenario_compatibility.py +5 -5
edsl/jobs/data_structures.py +2 -2
edsl/jobs/jobs.py +2 -2
edsl/jobs/jobs_checks.py +5 -5
edsl/jobs/jobs_component_constructor.py +2 -2
edsl/jobs/jobs_pricing_estimation.py +1 -1
edsl/jobs/jobs_runner_asyncio.py +2 -2
edsl/jobs/remote_inference.py +1 -1
edsl/jobs/results_exceptions_handler.py +2 -2
edsl/language_models/language_model.py +5 -1
edsl/notebooks/__init__.py +24 -1
edsl/notebooks/exceptions.py +82 -0
edsl/notebooks/notebook.py +7 -3
edsl/notebooks/notebook_to_latex.py +1 -1
edsl/prompts/__init__.py +23 -2
edsl/prompts/prompt.py +1 -1
edsl/questions/__init__.py +4 -4
edsl/questions/answer_validator_mixin.py +0 -5
edsl/questions/compose_questions.py +2 -2
edsl/questions/descriptors.py +1 -1
edsl/questions/question_base.py +32 -3
edsl/questions/question_base_prompts_mixin.py +4 -4
edsl/questions/question_budget.py +503 -102
edsl/questions/question_check_box.py +658 -156
edsl/questions/question_dict.py +176 -2
edsl/questions/question_extract.py +401 -61
edsl/questions/question_free_text.py +77 -9
edsl/questions/question_functional.py +118 -9
edsl/questions/{derived/question_likert_five.py → question_likert_five.py} +2 -2
edsl/questions/{derived/question_linear_scale.py → question_linear_scale.py} +3 -4
edsl/questions/question_list.py +246 -26
edsl/questions/question_matrix.py +586 -73
edsl/questions/question_multiple_choice.py +213 -47
edsl/questions/question_numerical.py +360 -29
edsl/questions/question_rank.py +401 -124
edsl/questions/question_registry.py +3 -3
edsl/questions/{derived/question_top_k.py → question_top_k.py} +3 -3
edsl/questions/{derived/question_yes_no.py → question_yes_no.py} +3 -4
edsl/questions/register_questions_meta.py +2 -1
edsl/questions/response_validator_abc.py +6 -2
edsl/questions/response_validator_factory.py +10 -12
edsl/results/report.py +1 -1
edsl/results/result.py +7 -4
edsl/results/results.py +471 -271
edsl/results/results_selector.py +2 -2
edsl/scenarios/construct_download_link.py +3 -3
edsl/scenarios/scenario.py +1 -2
edsl/scenarios/scenario_list.py +41 -23
edsl/surveys/survey_css.py +3 -3
edsl/surveys/survey_simulator.py +2 -1
edsl/tasks/__init__.py +22 -2
edsl/tasks/exceptions.py +72 -0
edsl/tasks/task_history.py +3 -3
edsl/tokens/__init__.py +27 -1
edsl/tokens/exceptions.py +37 -0
edsl/tokens/interview_token_usage.py +3 -2
edsl/tokens/token_usage.py +4 -3
{edsl-0.1.50.dist-info → edsl-0.1.51.dist-info}/METADATA +1 -1
{edsl-0.1.50.dist-info → edsl-0.1.51.dist-info}/RECORD +108 -106
edsl/questions/derived/__init__.py +0 -0
{edsl-0.1.50.dist-info → edsl-0.1.51.dist-info}/LICENSE +0 -0
{edsl-0.1.50.dist-info → edsl-0.1.51.dist-info}/WHEEL +0 -0
{edsl-0.1.50.dist-info → edsl-0.1.51.dist-info}/entry_points.txt +0 -0

edsl/questions/question_multiple_choice.py (changed)

@@ -9,6 +9,29 @@ from .descriptors import QuestionOptionsDescriptor
 from .decorators import inject_exception
 from .response_validator_abc import ResponseValidatorABC
+class BaseMultipleChoiceResponse(BaseModel):
+    """
+    Base model for multiple choice responses.
+    Attributes:
+        answer: The selected choice
+        comment: Optional comment field
+        generated_tokens: Optional raw tokens generated by the model
+    """
+    answer: Any = Field(..., description="Selected choice")
+    comment: Optional[str] = Field(None, description="Optional comment field")
+    generated_tokens: Optional[Any] = Field(None, description="Generated tokens")
+    """
+    Examples:
+        >>> model = BaseMultipleChoiceResponse(answer="Option A", comment="My reasoning")
+        >>> model.answer
+        'Option A'
+        >>> model.comment
+        'My reasoning'
+    """
 def create_response_model(choices: List[str], permissive: bool = False):
     """
     Create a ChoiceResponse model class with a predefined list of choices.
@@ -16,95 +39,238 @@ def create_response_model(choices: List[str], permissive: bool = False):
     :param choices: A list of allowed values for the answer field.
     :param permissive: If True, any value will be accepted as an answer.
     :return: A new Pydantic model class.
+    Examples:
+        >>> model = create_response_model(["Red", "Green", "Blue"], permissive=False)
+        >>> response = model(answer="Red")
+        >>> response.answer
+        'Red'
+        >>> try:
+        ...     model(answer="Purple")
+        ... except Exception:
+        ...     print("Invalid value")
+        Invalid value
+        >>> permissive_model = create_response_model(["Red", "Green", "Blue"], permissive=True)
+        >>> response = permissive_model(answer="Purple")
+        >>> response.answer
+        'Purple'
     """
     choice_tuple = tuple(choices)
     if not permissive:
-        class ChoiceResponse(BaseModel):
+        class ChoiceResponse(BaseMultipleChoiceResponse):
+            """
+            A model for multiple choice responses with strict validation.
+            Attributes:
+                answer: Must be one of the predefined choices
+            Examples:
+                >>> choices = ["Option A", "Option B", "Option C"]
+                >>> model = create_response_model(choices, permissive=False)
+                >>> response = model(answer="Option A")
+                >>> response.answer
+                'Option A'
+            """
             answer: Literal[choice_tuple] = Field(description="Selected choice")
-            comment: Optional[str] = Field(None, description="Optional comment field")
-            generated_tokens: Optional[Any] = Field(
-                None, description="Generated tokens"
-            )
-            class Config:
-                @staticmethod
-                def json_schema_extra(schema: dict, model: BaseModel) -> None:
-                    for prop in schema.get("properties", {}).values():
-                        if prop.get("title") == "answer":
-                            prop["enum"] = choices
+            model_config = {
+                "json_schema_extra": {
+                    "properties": {
+                        "answer": {
+                            "enum": choices
+                        }
+                    }
+                }
+            }
     else:
+        class ChoiceResponse(BaseMultipleChoiceResponse):
+            """
+            A model for multiple choice responses with permissive validation.
+            Attributes:
+                answer: Can be any value, with suggested choices provided
+            Examples:
+                >>> choices = ["Option A", "Option B", "Option C"]
+                >>> model = create_response_model(choices, permissive=True)
+                >>> response = model(answer="Something Else")
+                >>> response.answer
+                'Something Else'
+            """
+            answer: Any = Field(description=f"Selected choice (can be any value). Suggested choices are: {choices}")
-        class ChoiceResponse(BaseModel):
-            answer: Any = Field(description="Selected choice (can be any value)")
-            comment: Optional[str] = Field(None, description="Optional comment field")
-            generated_tokens: Optional[Any] = Field(
-                None, description="Generated tokens"
-            )
-            class Config:
-                @staticmethod
-                def json_schema_extra(schema: dict, model: BaseModel) -> None:
-                    for prop in schema.get("properties", {}).values():
-                        if prop.get("title") == "answer":
-                            prop["description"] += f". Suggested choices are: {choices}"
-                    schema["title"] += " (Permissive)"
+            model_config = {
+                "title": "PermissiveChoiceResponse"
+            }
     return ChoiceResponse
 class MultipleChoiceResponseValidator(ResponseValidatorABC):
+    """
+    Validator for multiple choice responses.
+    This validator ensures that the answer is one of the allowed options.
+    In permissive mode, any answer is accepted.
+    Examples:
+        >>> from edsl.questions import QuestionMultipleChoice
+        >>> q = QuestionMultipleChoice(
+        ...     question_name="feeling",
+        ...     question_text="How are you feeling?",
+        ...     question_options=["Good", "Bad", "Neutral"]
+        ... )
+        >>> validator = q.response_validator
+        >>> result = validator.validate({"answer": "Good"})
+        >>> sorted(result.keys())
+        ['answer', 'comment', 'generated_tokens']
+        >>> result["answer"]
+        'Good'
+    """
     required_params = ["question_options", "use_code"]
     def fix(self, response, verbose=False):
-        response_text = str(response.get("answer"))
-        if response_text is None:
-            response_text = response.get("generated_tokens", "")
+        """
+        Attempt to fix an invalid multiple choice response.
+        Strategies:
+        1. Extract an option mentioned in the generated text
+        2. Check for exact matches in the text
+        3. Look for substring matches
+        4. Normalize whitespace and check for matches
+        5. Check if the answer is a prefix of any option (ignoring trailing spaces/punctuation)
+        Parameters:
+            response: The invalid response to fix
+            verbose: Whether to print debug information
+        Returns:
+            A fixed response dict if possible, otherwise the original response
+        Examples:
+            >>> from edsl.questions import QuestionMultipleChoice
+            >>> q = QuestionMultipleChoice.example()
+            >>> validator = q.response_validator
+            >>> result = validator.fix({"answer": "I'm feeling Good today"})
+            >>> sorted(result.keys())
+            ['answer', 'comment', 'generated_tokens']
+            >>> result["answer"]
+            'Good'
+        """
+        # Don't attempt to fix None values - they should be properly rejected
+        if response.get("answer") is None:
+            if verbose:
+                print("Not attempting to fix None answer value")
+            return response
+        # Get the raw text to analyze
+        response_text = str(response.get("answer", ""))
+        if not response_text:
+            response_text = str(response.get("generated_tokens", ""))
         if verbose:
-            print(f"Invalid generated tokens was: {response_text}")
+            print(f"Invalid response text: {response_text}")
+            print(f"Looking for options among: {self.question_options}")
+        # Strategy 1: Look for exact options in the text
         matches = []
-        for idx, option in enumerate(self.question_options):
-            if verbose:
-                print("The options are: ", self.question_options)
-            if str(option) in response_text:
+        for option in self.question_options:
+            option_str = str(option)
+            if option_str in response_text:
                 if verbose:
-                    print("Match found with option ", option)
+                    print(f"Match found with option: {option_str}")
                 if option not in matches:
                     matches.append(option)
-        if verbose:
-            print("The matches are: ", matches)
+        # If we have exactly one match, use it
         if len(matches) == 1:
+            fixed_answer = matches[0]
             proposed_data = {
-                "answer": matches[0],
-                "generated_tokens": response.get("generated_tokens", None),
+                "answer": fixed_answer,
+                "comment": response.get("comment"),
+                "generated_tokens": response.get("generated_tokens"),
             }
             try:
-                self.response_model(**proposed_data)
+                # Validate the fixed answer
+                self.response_model.model_validate(proposed_data)
+                if verbose:
+                    print(f"Fixed answer: {fixed_answer}")
                 return proposed_data
             except Exception as e:
                 if verbose:
-                    print(f"Proposed solution {proposed_data} is invalid. Error: {e}")
-            return response
+                    print(f"Validation failed for fixed answer: {e}")
+        # Strategy 2: Check if the answer is a match when normalized (strip whitespace)
+        response_text_normalized = response_text.strip()
+        for option in self.question_options:
+            option_str = str(option).strip()
+            if option_str == response_text_normalized:
+                if verbose:
+                    print(f"Normalized match found with option: {option}")
+                proposed_data = {
+                    "answer": option,  # Use the exact option from the list
+                    "comment": response.get("comment"),
+                    "generated_tokens": response.get("generated_tokens"),
+                }
+                try:
+                    self.response_model.model_validate(proposed_data)
+                    if verbose:
+                        print(f"Fixed answer with normalization: {option}")
+                    return proposed_data
+                except Exception as e:
+                    if verbose:
+                        print(f"Validation failed for normalized answer: {e}")
+        # Strategy 3: Check if the answer is a prefix of any option
+        # This handles cases where the model returns a partial answer
+        # Only apply this strategy if we have a meaningful response text
+        if response_text_normalized and not response_text_normalized.lower() == "none":
+            for option in self.question_options:
+                option_str = str(option).strip()
+                if option_str.startswith(response_text_normalized) or response_text_normalized.startswith(option_str):
+                    if verbose:
+                        print(f"Prefix match found with option: {option}")
+                    proposed_data = {
+                        "answer": option,  # Use the exact option from the list
+                        "comment": response.get("comment"),
+                        "generated_tokens": response.get("generated_tokens"),
+                    }
+                    try:
+                        self.response_model.model_validate(proposed_data)
+                        if verbose:
+                            print(f"Fixed answer with prefix matching: {option}")
+                        return proposed_data
+                    except Exception as e:
+                        if verbose:
+                            print(f"Validation failed for prefix answer: {e}")
+        # If multiple or no matches, return original response
+        if verbose:
+            if len(matches) > 1:
+                print(f"Multiple matches found: {matches}, cannot determine correct option")
+            else:
+                print("No matches found in response text")
+        return response
     valid_examples = [
-        ({"answer": 1}, {"question_options": ["Good", "Great", "OK", "Bad"]})
+        ({"answer": "Good"}, {"question_options": ["Good", "Great", "OK", "Bad"]})
     ]
     invalid_examples = [
         (
-            {"answer": -1},
+            {"answer": "Terrible"},
             {"question_options": ["Good", "Great", "OK", "Bad"]},
-            "Answer code must be a non-negative integer",
+            "Value error, Permitted values are 'Good', 'Great', 'OK', 'Bad'",
         ),
         (
             {"answer": None},
             {"question_options": ["Good", "Great", "OK", "Bad"]},
-            "Answer code must not be missing.",
+            "Answer must not be null",
         ),
     ]

edsl 0.1.50__py3-none-any.whl → 0.1.51__py3-none-any.whl

edsl 0.1.50__py3-none-any.whl → 0.1.51__py3-none-any.whl