edsl 0.1.33__py3-none-any.whl → 0.1.33.dev1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- edsl/Base.py +3 -9
- edsl/__init__.py +3 -8
- edsl/__version__.py +1 -1
- edsl/agents/Agent.py +8 -40
- edsl/agents/AgentList.py +0 -43
- edsl/agents/Invigilator.py +219 -135
- edsl/agents/InvigilatorBase.py +59 -148
- edsl/agents/{PromptConstructor.py → PromptConstructionMixin.py} +89 -138
- edsl/agents/__init__.py +0 -1
- edsl/config.py +56 -47
- edsl/coop/coop.py +7 -50
- edsl/data/Cache.py +1 -35
- edsl/data_transfer_models.py +38 -73
- edsl/enums.py +0 -4
- edsl/exceptions/language_models.py +1 -25
- edsl/exceptions/questions.py +5 -62
- edsl/exceptions/results.py +0 -4
- edsl/inference_services/AnthropicService.py +11 -13
- edsl/inference_services/AwsBedrock.py +17 -19
- edsl/inference_services/AzureAI.py +20 -37
- edsl/inference_services/GoogleService.py +12 -16
- edsl/inference_services/GroqService.py +0 -2
- edsl/inference_services/InferenceServiceABC.py +3 -58
- edsl/inference_services/OpenAIService.py +54 -48
- edsl/inference_services/models_available_cache.py +6 -0
- edsl/inference_services/registry.py +0 -6
- edsl/jobs/Answers.py +12 -10
- edsl/jobs/Jobs.py +21 -36
- edsl/jobs/buckets/BucketCollection.py +15 -24
- edsl/jobs/buckets/TokenBucket.py +14 -93
- edsl/jobs/interviews/Interview.py +78 -366
- edsl/jobs/interviews/InterviewExceptionEntry.py +19 -85
- edsl/jobs/interviews/InterviewTaskBuildingMixin.py +286 -0
- edsl/jobs/interviews/{InterviewExceptionCollection.py → interview_exception_tracking.py} +68 -14
- edsl/jobs/interviews/retry_management.py +37 -0
- edsl/jobs/runners/JobsRunnerAsyncio.py +175 -146
- edsl/jobs/runners/JobsRunnerStatusMixin.py +333 -0
- edsl/jobs/tasks/QuestionTaskCreator.py +23 -30
- edsl/jobs/tasks/TaskHistory.py +213 -148
- edsl/language_models/LanguageModel.py +156 -261
- edsl/language_models/ModelList.py +2 -2
- edsl/language_models/RegisterLanguageModelsMeta.py +29 -14
- edsl/language_models/registry.py +6 -23
- edsl/language_models/repair.py +19 -0
- edsl/prompts/Prompt.py +2 -52
- edsl/questions/AnswerValidatorMixin.py +26 -23
- edsl/questions/QuestionBase.py +249 -329
- edsl/questions/QuestionBudget.py +41 -99
- edsl/questions/QuestionCheckBox.py +35 -227
- edsl/questions/QuestionExtract.py +27 -98
- edsl/questions/QuestionFreeText.py +29 -52
- edsl/questions/QuestionFunctional.py +0 -7
- edsl/questions/QuestionList.py +22 -141
- edsl/questions/QuestionMultipleChoice.py +65 -159
- edsl/questions/QuestionNumerical.py +46 -88
- edsl/questions/QuestionRank.py +24 -182
- edsl/questions/RegisterQuestionsMeta.py +12 -31
- edsl/questions/__init__.py +4 -3
- edsl/questions/derived/QuestionLikertFive.py +5 -10
- edsl/questions/derived/QuestionLinearScale.py +2 -15
- edsl/questions/derived/QuestionTopK.py +1 -10
- edsl/questions/derived/QuestionYesNo.py +3 -24
- edsl/questions/descriptors.py +7 -43
- edsl/questions/question_registry.py +2 -6
- edsl/results/Dataset.py +0 -20
- edsl/results/DatasetExportMixin.py +48 -46
- edsl/results/Result.py +5 -32
- edsl/results/Results.py +46 -135
- edsl/results/ResultsDBMixin.py +3 -3
- edsl/scenarios/FileStore.py +10 -71
- edsl/scenarios/Scenario.py +25 -96
- edsl/scenarios/ScenarioImageMixin.py +2 -2
- edsl/scenarios/ScenarioList.py +39 -361
- edsl/scenarios/ScenarioListExportMixin.py +0 -9
- edsl/scenarios/ScenarioListPdfMixin.py +4 -150
- edsl/study/SnapShot.py +1 -8
- edsl/study/Study.py +0 -32
- edsl/surveys/Rule.py +1 -10
- edsl/surveys/RuleCollection.py +5 -21
- edsl/surveys/Survey.py +310 -636
- edsl/surveys/SurveyExportMixin.py +9 -71
- edsl/surveys/SurveyFlowVisualizationMixin.py +1 -2
- edsl/surveys/SurveyQualtricsImport.py +4 -75
- edsl/utilities/gcp_bucket/simple_example.py +9 -0
- edsl/utilities/utilities.py +1 -9
- {edsl-0.1.33.dist-info → edsl-0.1.33.dev1.dist-info}/METADATA +2 -5
- edsl-0.1.33.dev1.dist-info/RECORD +209 -0
- edsl/TemplateLoader.py +0 -24
- edsl/auto/AutoStudy.py +0 -117
- edsl/auto/StageBase.py +0 -230
- edsl/auto/StageGenerateSurvey.py +0 -178
- edsl/auto/StageLabelQuestions.py +0 -125
- edsl/auto/StagePersona.py +0 -61
- edsl/auto/StagePersonaDimensionValueRanges.py +0 -88
- edsl/auto/StagePersonaDimensionValues.py +0 -74
- edsl/auto/StagePersonaDimensions.py +0 -69
- edsl/auto/StageQuestions.py +0 -73
- edsl/auto/SurveyCreatorPipeline.py +0 -21
- edsl/auto/utilities.py +0 -224
- edsl/coop/PriceFetcher.py +0 -58
- edsl/inference_services/MistralAIService.py +0 -120
- edsl/inference_services/TestService.py +0 -80
- edsl/inference_services/TogetherAIService.py +0 -170
- edsl/jobs/FailedQuestion.py +0 -78
- edsl/jobs/runners/JobsRunnerStatus.py +0 -331
- edsl/language_models/fake_openai_call.py +0 -15
- edsl/language_models/fake_openai_service.py +0 -61
- edsl/language_models/utilities.py +0 -61
- edsl/questions/QuestionBaseGenMixin.py +0 -133
- edsl/questions/QuestionBasePromptsMixin.py +0 -266
- edsl/questions/Quick.py +0 -41
- edsl/questions/ResponseValidatorABC.py +0 -170
- edsl/questions/decorators.py +0 -21
- edsl/questions/prompt_templates/question_budget.jinja +0 -13
- edsl/questions/prompt_templates/question_checkbox.jinja +0 -32
- edsl/questions/prompt_templates/question_extract.jinja +0 -11
- edsl/questions/prompt_templates/question_free_text.jinja +0 -3
- edsl/questions/prompt_templates/question_linear_scale.jinja +0 -11
- edsl/questions/prompt_templates/question_list.jinja +0 -17
- edsl/questions/prompt_templates/question_multiple_choice.jinja +0 -33
- edsl/questions/prompt_templates/question_numerical.jinja +0 -37
- edsl/questions/templates/__init__.py +0 -0
- edsl/questions/templates/budget/__init__.py +0 -0
- edsl/questions/templates/budget/answering_instructions.jinja +0 -7
- edsl/questions/templates/budget/question_presentation.jinja +0 -7
- edsl/questions/templates/checkbox/__init__.py +0 -0
- edsl/questions/templates/checkbox/answering_instructions.jinja +0 -10
- edsl/questions/templates/checkbox/question_presentation.jinja +0 -22
- edsl/questions/templates/extract/__init__.py +0 -0
- edsl/questions/templates/extract/answering_instructions.jinja +0 -7
- edsl/questions/templates/extract/question_presentation.jinja +0 -1
- edsl/questions/templates/free_text/__init__.py +0 -0
- edsl/questions/templates/free_text/answering_instructions.jinja +0 -0
- edsl/questions/templates/free_text/question_presentation.jinja +0 -1
- edsl/questions/templates/likert_five/__init__.py +0 -0
- edsl/questions/templates/likert_five/answering_instructions.jinja +0 -10
- edsl/questions/templates/likert_five/question_presentation.jinja +0 -12
- edsl/questions/templates/linear_scale/__init__.py +0 -0
- edsl/questions/templates/linear_scale/answering_instructions.jinja +0 -5
- edsl/questions/templates/linear_scale/question_presentation.jinja +0 -5
- edsl/questions/templates/list/__init__.py +0 -0
- edsl/questions/templates/list/answering_instructions.jinja +0 -4
- edsl/questions/templates/list/question_presentation.jinja +0 -5
- edsl/questions/templates/multiple_choice/__init__.py +0 -0
- edsl/questions/templates/multiple_choice/answering_instructions.jinja +0 -9
- edsl/questions/templates/multiple_choice/html.jinja +0 -0
- edsl/questions/templates/multiple_choice/question_presentation.jinja +0 -12
- edsl/questions/templates/numerical/__init__.py +0 -0
- edsl/questions/templates/numerical/answering_instructions.jinja +0 -8
- edsl/questions/templates/numerical/question_presentation.jinja +0 -7
- edsl/questions/templates/rank/__init__.py +0 -0
- edsl/questions/templates/rank/answering_instructions.jinja +0 -11
- edsl/questions/templates/rank/question_presentation.jinja +0 -15
- edsl/questions/templates/top_k/__init__.py +0 -0
- edsl/questions/templates/top_k/answering_instructions.jinja +0 -8
- edsl/questions/templates/top_k/question_presentation.jinja +0 -22
- edsl/questions/templates/yes_no/__init__.py +0 -0
- edsl/questions/templates/yes_no/answering_instructions.jinja +0 -6
- edsl/questions/templates/yes_no/question_presentation.jinja +0 -12
- edsl/results/DatasetTree.py +0 -145
- edsl/results/Selector.py +0 -118
- edsl/results/tree_explore.py +0 -115
- edsl/surveys/instructions/ChangeInstruction.py +0 -47
- edsl/surveys/instructions/Instruction.py +0 -34
- edsl/surveys/instructions/InstructionCollection.py +0 -77
- edsl/surveys/instructions/__init__.py +0 -0
- edsl/templates/error_reporting/base.html +0 -24
- edsl/templates/error_reporting/exceptions_by_model.html +0 -35
- edsl/templates/error_reporting/exceptions_by_question_name.html +0 -17
- edsl/templates/error_reporting/exceptions_by_type.html +0 -17
- edsl/templates/error_reporting/interview_details.html +0 -116
- edsl/templates/error_reporting/interviews.html +0 -10
- edsl/templates/error_reporting/overview.html +0 -5
- edsl/templates/error_reporting/performance_plot.html +0 -2
- edsl/templates/error_reporting/report.css +0 -74
- edsl/templates/error_reporting/report.html +0 -118
- edsl/templates/error_reporting/report.js +0 -25
- edsl-0.1.33.dist-info/RECORD +0 -295
- {edsl-0.1.33.dist-info → edsl-0.1.33.dev1.dist-info}/LICENSE +0 -0
- {edsl-0.1.33.dist-info → edsl-0.1.33.dev1.dist-info}/WHEEL +0 -0
edsl/inference_services/AwsBedrock.py
CHANGED
@@ -16,18 +16,6 @@ class AwsBedrockService(InferenceServiceABC):
     _env_key_name_ = (
         "AWS_ACCESS_KEY_ID"  # or any other environment key for AWS credentials
     )
-    key_sequence = ["output", "message", "content", 0, "text"]
-    input_token_name = "inputTokens"
-    output_token_name = "outputTokens"
-    usage_sequence = ["usage"]
-    model_exclude_list = [
-        "ai21.j2-grande-instruct",
-        "ai21.j2-jumbo-instruct",
-        "ai21.j2-mid",
-        "ai21.j2-mid-v1",
-        "ai21.j2-ultra",
-        "ai21.j2-ultra-v1",
-    ]
 
     @classmethod
     def available(cls):
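The attributes removed above are the machinery 0.1.33 uses for generic response handling: LanguageModel walks key_sequence into the raw API response to find the generated text, and usage_sequence plus the two token-name attributes to find token counts. A minimal sketch of that key-path traversal, assuming plain indexing at each step (the helper is illustrative, not edsl's actual implementation):

    from functools import reduce
    from typing import Any, Sequence

    def follow_key_sequence(response: dict, key_sequence: Sequence[Any]) -> Any:
        """Walk a mixed path of dict keys and list indices into a nested response."""
        return reduce(lambda node, key: node[key], key_sequence, response)

    # The Bedrock key_sequence from the hunk above:
    raw = {"output": {"message": {"content": [{"text": "Hello"}]}}}
    assert follow_key_sequence(raw, ["output", "message", "content", 0, "text"]) == "Hello"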
@@ -40,7 +28,7 @@ class AwsBedrockService(InferenceServiceABC):
         else:
             all_models_ids = cls._models_list_cache
 
-        return
+        return all_models_ids
 
     @classmethod
     def create_model(
@@ -54,8 +42,6 @@ class AwsBedrockService(InferenceServiceABC):
            Child class of LanguageModel for interacting with AWS Bedrock models.
            """
 
-            key_sequence = cls.key_sequence
-            usage_sequence = cls.usage_sequence
            _inference_service_ = cls._inference_service_
            _model_ = model_name
            _parameters_ = {
@@ -63,10 +49,6 @@ class AwsBedrockService(InferenceServiceABC):
                "max_tokens": 512,
                "top_p": 0.9,
            }
-            input_token_name = cls.input_token_name
-            output_token_name = cls.output_token_name
-            _rpm = cls.get_rpm(cls)
-            _tpm = cls.get_tpm(cls)
 
            async def async_execute_model_call(
                self, user_prompt: str, system_prompt: str = ""
@@ -107,6 +89,22 @@ class AwsBedrockService(InferenceServiceABC):
                    print(e)
                    return {"error": str(e)}
 
+            @staticmethod
+            def parse_response(raw_response: dict[str, Any]) -> str:
+                """Parses the API response and returns the response text."""
+                if "output" in raw_response and "message" in raw_response["output"]:
+                    response = raw_response["output"]["message"]["content"][0]["text"]
+                    pattern = r"^```json(?:\\n|\n)(.+?)(?:\\n|\n)```$"
+                    match = re.match(pattern, response, re.DOTALL)
+                    if match:
+                        return match.group(1)
+                    else:
+                        out = fix_partial_correct_response(response)
+                        if "error" not in out:
+                            response = out["extracted_json"]
+                        return response
+                return "Error parsing response"
+
        LLM.__name__ = model_class_name
 
        return LLM
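The parse_response restored above (and its Azure and OpenAI counterparts later in this diff) shares one unwrapping step: if the model returned its JSON inside a ```json fence, the regex strips the fence, accepting either a real newline or a literal backslash-n around the payload; anything else is handed to fix_partial_correct_response (imported from edsl.utilities.utilities) to salvage embedded JSON. A standalone check of just the regex step:

    import re

    pattern = r"^```json(?:\\n|\n)(.+?)(?:\\n|\n)```$"

    fenced = '```json\n{"answer": "yes"}\n```'
    match = re.match(pattern, fenced, re.DOTALL)  # DOTALL lets .+? span lines
    assert match and match.group(1) == '{"answer": "yes"}'

    # The \\n alternative also accepts a literal two-character "\n" sequence:
    escaped = '```json\\n{"answer": "yes"}\\n```'
    assert re.match(pattern, escaped, re.DOTALL).group(1) == '{"answer": "yes"}'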
edsl/inference_services/AzureAI.py
CHANGED
@@ -25,22 +25,11 @@ def json_handle_none(value: Any) -> Any:
 class AzureAIService(InferenceServiceABC):
     """Azure AI service class."""
 
-    # key_sequence = ["content", 0, "text"]  # ["content"][0]["text"]
-    key_sequence = ["choices", 0, "message", "content"]
-    usage_sequence = ["usage"]
-    input_token_name = "prompt_tokens"
-    output_token_name = "completion_tokens"
-
     _inference_service_ = "azure"
     _env_key_name_ = (
         "AZURE_ENDPOINT_URL_AND_KEY"  # Environment variable for Azure API key
     )
     _model_id_to_endpoint_and_key = {}
-    model_exclude_list = [
-        "Cohere-command-r-plus-xncmg",
-        "Mistral-Nemo-klfsi",
-        "Mistral-large-2407-ojfld",
-    ]
 
     @classmethod
     def available(cls):
@@ -93,7 +82,7 @@ class AzureAIService(InferenceServiceABC):
 
         except Exception as e:
             raise e
-        return
+        return out
 
     @classmethod
     def create_model(
@@ -107,10 +96,6 @@ class AzureAIService(InferenceServiceABC):
            Child class of LanguageModel for interacting with Azure OpenAI models.
            """
 
-            key_sequence = cls.key_sequence
-            usage_sequence = cls.usage_sequence
-            input_token_name = cls.input_token_name
-            output_token_name = cls.output_token_name
            _inference_service_ = cls._inference_service_
            _model_ = model_name
            _parameters_ = {
@@ -118,8 +103,6 @@ class AzureAIService(InferenceServiceABC):
                "max_tokens": 512,
                "top_p": 0.9,
            }
-            _rpm = cls.get_rpm(cls)
-            _tpm = cls.get_tpm(cls)
 
            async def async_execute_model_call(
                self, user_prompt: str, system_prompt: str = ""
@@ -189,25 +172,25 @@ class AzureAIService(InferenceServiceABC):
            )
            return response.model_dump()
 
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
+            @staticmethod
+            def parse_response(raw_response: dict[str, Any]) -> str:
+                """Parses the API response and returns the response text."""
+                if (
+                    raw_response
+                    and "choices" in raw_response
+                    and raw_response["choices"]
+                ):
+                    response = raw_response["choices"][0]["message"]["content"]
+                    pattern = r"^```json(?:\\n|\n)(.+?)(?:\\n|\n)```$"
+                    match = re.match(pattern, response, re.DOTALL)
+                    if match:
+                        return match.group(1)
+                    else:
+                        out = fix_partial_correct_response(response)
+                        if "error" not in out:
+                            response = out["extracted_json"]
+                        return response
+                return "Error parsing response"
 
        LLM.__name__ = model_class_name
 
edsl/inference_services/GoogleService.py
CHANGED
@@ -10,16 +10,10 @@ from edsl.inference_services.InferenceServiceABC import InferenceServiceABC
 
 class GoogleService(InferenceServiceABC):
     _inference_service_ = "google"
-    key_sequence = ["candidates", 0, "content", "parts", 0, "text"]
-    usage_sequence = ["usageMetadata"]
-    input_token_name = "promptTokenCount"
-    output_token_name = "candidatesTokenCount"
-
-    model_exclude_list = []
 
     @classmethod
     def available(cls):
-        return ["gemini-pro"
+        return ["gemini-pro"]
 
     @classmethod
     def create_model(
@@ -30,15 +24,7 @@ class GoogleService(InferenceServiceABC):
 
        class LLM(LanguageModel):
            _model_ = model_name
-            key_sequence = cls.key_sequence
-            usage_sequence = cls.usage_sequence
-            input_token_name = cls.input_token_name
-            output_token_name = cls.output_token_name
            _inference_service_ = cls._inference_service_
-
-            _tpm = cls.get_tpm(cls)
-            _rpm = cls.get_rpm(cls)
-
            _parameters_ = {
                "temperature": 0.5,
                "topP": 1,
@@ -64,7 +50,7 @@ class GoogleService(InferenceServiceABC):
                        "stopSequences": self.stopSequences,
                    },
                }
-
+
                async with aiohttp.ClientSession() as session:
                    async with session.post(
                        url, headers=headers, data=json.dumps(data)
@@ -72,6 +58,16 @@ class GoogleService(InferenceServiceABC):
                        raw_response_text = await response.text()
                        return json.loads(raw_response_text)
 
+            def parse_response(self, raw_response: dict[str, Any]) -> str:
+                data = raw_response
+                try:
+                    return data["candidates"][0]["content"]["parts"][0]["text"]
+                except KeyError as e:
+                    print(
+                        f"The data return was {data}, which was missing the key 'candidates'"
+                    )
+                    raise e
+
        LLM.__name__ = model_name
 
        return LLM
edsl/inference_services/GroqService.py
CHANGED
@@ -13,8 +13,6 @@ class GroqService(OpenAIService):
     _sync_client_ = groq.Groq
     _async_client_ = groq.AsyncGroq
 
-    model_exclude_list = ["whisper-large-v3", "distil-whisper-large-v3-en"]
-
     # _base_url_ = "https://api.deepinfra.com/v1/openai"
     _base_url_ = None
     _models_list_cache: List[str] = []
edsl/inference_services/InferenceServiceABC.py
CHANGED
@@ -1,77 +1,22 @@
 from abc import abstractmethod, ABC
-import os
+from typing import Any
 import re
-from edsl.config import CONFIG
 
 
 class InferenceServiceABC(ABC):
-    """
-    Abstract class for inference services.
-    Anthropic: https://docs.anthropic.com/en/api/rate-limits
-    """
-
-    default_levels = {
-        "google": {"tpm": 2_000_000, "rpm": 15},
-        "openai": {"tpm": 2_000_000, "rpm": 10_000},
-        "anthropic": {"tpm": 2_000_000, "rpm": 500},
-    }
-
-    def __init_subclass__(cls):
-        """
-        Check that the subclass has the required attributes.
-        - `key_sequence` attribute determines...
-        - `model_exclude_list` attribute determines...
-        """
-        if not hasattr(cls, "key_sequence"):
-            raise NotImplementedError(
-                f"Class {cls.__name__} must have a 'key_sequence' attribute."
-            )
-        if not hasattr(cls, "model_exclude_list"):
-            raise NotImplementedError(
-                f"Class {cls.__name__} must have a 'model_exclude_list' attribute."
-            )
-
-    @classmethod
-    def _get_limt(cls, limit_type: str) -> int:
-        key = f"EDSL_SERVICE_{limit_type.upper()}_{cls._inference_service_.upper()}"
-        if key in os.environ:
-            return int(os.getenv(key))
-
-        if cls._inference_service_ in cls.default_levels:
-            return int(cls.default_levels[cls._inference_service_][limit_type])
-
-        return int(CONFIG.get(f"EDSL_SERVICE_{limit_type.upper()}_BASELINE"))
-
-    def get_tpm(cls) -> int:
-        """
-        Returns the TPM for the service. If the service is not defined in the environment variables, it will return the baseline TPM.
-        """
-        return cls._get_limt(limit_type="tpm")
-
-    def get_rpm(cls):
-        """
-        Returns the RPM for the service. If the service is not defined in the environment variables, it will return the baseline RPM.
-        """
-        return cls._get_limt(limit_type="rpm")
+    """Abstract class for inference services."""
 
     @abstractmethod
     def available() -> list[str]:
-        """
-        Returns a list of available models for the service.
-        """
        pass
 
     @abstractmethod
     def create_model():
-        """
-        Returns a LanguageModel object.
-        """
        pass
 
     @staticmethod
     def to_class_name(s):
-        """
-        Converts a string to a valid class name.
+        """Convert a string to a valid class name.
 
        >>> InferenceServiceABC.to_class_name("hello world")
        'HelloWorld'
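The 0.1.33 side of this file is also where per-service rate limits come from: get_tpm and get_rpm resolve a limit from a service-specific environment variable if one is set, then from default_levels, then from a baseline stored in edsl's CONFIG. A standalone sketch of that resolution order (the BASELINE dict is a stand-in for the EDSL_SERVICE_*_BASELINE values that CONFIG would supply):

    import os

    # Copied from the removed InferenceServiceABC.default_levels above.
    DEFAULT_LEVELS = {
        "google": {"tpm": 2_000_000, "rpm": 15},
        "openai": {"tpm": 2_000_000, "rpm": 10_000},
        "anthropic": {"tpm": 2_000_000, "rpm": 500},
    }
    # Stand-in values; the real ones come from CONFIG.get("EDSL_SERVICE_..._BASELINE").
    BASELINE = {"tpm": 2_000_000, "rpm": 100}

    def get_limit(service: str, limit_type: str) -> int:
        """Env var first, then the per-service default, then the global baseline."""
        env_key = f"EDSL_SERVICE_{limit_type.upper()}_{service.upper()}"
        if env_key in os.environ:
            return int(os.environ[env_key])
        if service in DEFAULT_LEVELS:
            return int(DEFAULT_LEVELS[service][limit_type])
        return BASELINE[limit_type]

    print(get_limit("anthropic", "rpm"))  # 500, unless EDSL_SERVICE_RPM_ANTHROPIC overrides it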
edsl/inference_services/OpenAIService.py
CHANGED
@@ -1,7 +1,8 @@
-from typing import Any, List, Optional
-
+from typing import Any, List
+import re
 import os
 
+# from openai import AsyncOpenAI
 import openai
 
 from edsl.inference_services.InferenceServiceABC import InferenceServiceABC
@@ -9,8 +10,6 @@ from edsl.language_models import LanguageModel
 from edsl.inference_services.rate_limits_cache import rate_limits
 from edsl.utilities.utilities import fix_partial_correct_response
 
-from edsl.config import CONFIG
-
 
 class OpenAIService(InferenceServiceABC):
     """OpenAI service class."""
@@ -22,36 +21,19 @@ class OpenAIService(InferenceServiceABC):
     _sync_client_ = openai.OpenAI
     _async_client_ = openai.AsyncOpenAI
 
-    _sync_client_instance = None
-    _async_client_instance = None
-
-    key_sequence = ["choices", 0, "message", "content"]
-    usage_sequence = ["usage"]
-    input_token_name = "prompt_tokens"
-    output_token_name = "completion_tokens"
-
-    def __init_subclass__(cls, **kwargs):
-        super().__init_subclass__(**kwargs)
-        # so subclasses have to create their own instances of the clients
-        cls._sync_client_instance = None
-        cls._async_client_instance = None
-
     @classmethod
     def sync_client(cls):
-        if cls._sync_client_instance is None:
-            cls._sync_client_instance = cls._sync_client_(
-                api_key=os.getenv(cls._env_key_name_), base_url=cls._base_url_
-            )
-        return cls._sync_client_instance
+        return cls._sync_client_(
+            api_key=os.getenv(cls._env_key_name_), base_url=cls._base_url_
+        )
 
     @classmethod
     def async_client(cls):
-        if cls._async_client_instance is None:
-            cls._async_client_instance = cls._async_client_(
-                api_key=os.getenv(cls._env_key_name_), base_url=cls._base_url_
-            )
-        return cls._async_client_instance
+        return cls._async_client_(
+            api_key=os.getenv(cls._env_key_name_), base_url=cls._base_url_
+        )
 
+    # TODO: Make this a coop call
     model_exclude_list = [
        "whisper-1",
        "davinci-002",
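The 0.1.33 side caches one client object per service subclass, which is why the removed __init_subclass__ resets the cache so subclasses do not share a client; the dev1 side simply builds a fresh client on every call. A sketch of the caching pattern, reconstructed from the removed lines (the class name and env key here are illustrative, not edsl's):

    import os
    import openai

    class CachedClientService:
        _env_key_name_ = "OPENAI_API_KEY"  # illustrative; each service defines its own
        _base_url_ = None
        _sync_client_instance = None

        def __init_subclass__(cls, **kwargs):
            super().__init_subclass__(**kwargs)
            # Reset the cache so each subclass builds its own client.
            cls._sync_client_instance = None

        @classmethod
        def sync_client(cls):
            if cls._sync_client_instance is None:
                cls._sync_client_instance = openai.OpenAI(
                    api_key=os.getenv(cls._env_key_name_), base_url=cls._base_url_
                )
            return cls._sync_client_instance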
@@ -66,8 +48,6 @@ class OpenAIService(InferenceServiceABC):
        "text-embedding-3-small",
        "text-embedding-ada-002",
        "ft:davinci-002:mit-horton-lab::8OfuHgoo",
-        "gpt-3.5-turbo-instruct-0914",
-        "gpt-3.5-turbo-instruct",
    ]
    _models_list_cache: List[str] = []
 
@@ -81,8 +61,11 @@ class OpenAIService(InferenceServiceABC):
 
    @classmethod
    def available(cls) -> List[str]:
+        # from openai import OpenAI
+
        if not cls._models_list_cache:
            try:
+                # client = OpenAI(api_key = os.getenv(cls._env_key_name_), base_url = cls._base_url_)
                cls._models_list_cache = [
                    m.id
                    for m in cls.get_model_list()
@@ -90,6 +73,15 @@ class OpenAIService(InferenceServiceABC):
                ]
            except Exception as e:
                raise
+                # print(
+                #     f"""Error retrieving models: {e}.
+                #     See instructions about storing your API keys: https://docs.expectedparrot.com/en/latest/api_keys.html"""
+                # )
+                # cls._models_list_cache = [
+                #     "gpt-3.5-turbo",
+                #     "gpt-4-1106-preview",
+                #     "gpt-4",
+                # ]  # Fallback list
        return cls._models_list_cache
 
    @classmethod
@@ -102,14 +94,6 @@ class OpenAIService(InferenceServiceABC):
            Child class of LanguageModel for interacting with OpenAI models
            """
 
-            key_sequence = cls.key_sequence
-            usage_sequence = cls.usage_sequence
-            input_token_name = cls.input_token_name
-            output_token_name = cls.output_token_name
-
-            _rpm = cls.get_rpm(cls)
-            _tpm = cls.get_tpm(cls)
-
            _inference_service_ = cls._inference_service_
            _model_ = model_name
            _parameters_ = {
@@ -130,9 +114,15 @@ class OpenAIService(InferenceServiceABC):
 
            @classmethod
            def available(cls) -> list[str]:
+                # import openai
+                # client = openai.OpenAI(api_key = os.getenv(cls._env_key_name_), base_url = cls._base_url_)
+                # return client.models.list()
                return cls.sync_client().models.list()
 
            def get_headers(self) -> dict[str, Any]:
+                # from openai import OpenAI
+
+                # client = OpenAI(api_key = os.getenv(cls._env_key_name_), base_url = cls._base_url_)
                client = self.sync_client()
                response = client.chat.completions.with_raw_response.create(
                    messages=[
@@ -169,9 +159,6 @@ class OpenAIService(InferenceServiceABC):
                user_prompt: str,
                system_prompt: str = "",
                encoded_image=None,
-                invigilator: Optional[
-                    "InvigilatorAI"
-                ] = None,  # TBD - can eventually be used for function-calling
            ) -> dict[str, Any]:
                """Calls the OpenAI API and returns the API response."""
                if encoded_image:
@@ -186,16 +173,17 @@ class OpenAIService(InferenceServiceABC):
                    )
                else:
                    content = user_prompt
+                # self.client = AsyncOpenAI(
+                #     api_key = os.getenv(cls._env_key_name_),
+                #     base_url = cls._base_url_
+                # )
                client = self.async_client()
-                messages = [
-                    {"role": "system", "content": system_prompt},
-                    {"role": "user", "content": content},
-                ]
-                if system_prompt == "" and self.omit_system_prompt_if_empty:
-                    messages = messages[1:]
                params = {
                    "model": self.model,
-                    "messages": messages,
+                    "messages": [
+                        {"role": "system", "content": system_prompt},
+                        {"role": "user", "content": content},
+                    ],
                    "temperature": self.temperature,
                    "max_tokens": self.max_tokens,
                    "top_p": self.top_p,
@@ -207,6 +195,24 @@ class OpenAIService(InferenceServiceABC):
                response = await client.chat.completions.create(**params)
                return response.model_dump()
 
+            @staticmethod
+            def parse_response(raw_response: dict[str, Any]) -> str:
+                """Parses the API response and returns the response text."""
+                try:
+                    response = raw_response["choices"][0]["message"]["content"]
+                except KeyError:
+                    print("Tried to parse response but failed:")
+                    print(raw_response)
+                pattern = r"^```json(?:\\n|\n)(.+?)(?:\\n|\n)```$"
+                match = re.match(pattern, response, re.DOTALL)
+                if match:
+                    return match.group(1)
+                else:
+                    out = fix_partial_correct_response(response)
+                    if "error" not in out:
+                        response = out["extracted_json"]
+                    return response
+
        LLM.__name__ = "LanguageModel"
 
        return LLM
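One behavioral difference buried in the messages hunk earlier in this file's diff: 0.1.33 can drop an empty system message when the model sets omit_system_prompt_if_empty, whereas the dev1 side always sends both roles. A minimal illustration of the 0.1.33 branch:

    # Illustrative; omit_system_prompt_if_empty is a model-level flag in 0.1.33.
    system_prompt, content = "", "Hi"
    omit_system_prompt_if_empty = True

    messages = [
        {"role": "system", "content": system_prompt},
        {"role": "user", "content": content},
    ]
    if system_prompt == "" and omit_system_prompt_if_empty:
        messages = messages[1:]  # drop the empty system message

    assert messages == [{"role": "user", "content": "Hi"}]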
edsl/inference_services/models_available_cache.py
CHANGED
@@ -70,6 +70,12 @@ models_available = {
        "amazon.titan-tg1-large",
        "amazon.titan-text-lite-v1",
        "amazon.titan-text-express-v1",
+        "ai21.j2-grande-instruct",
+        "ai21.j2-jumbo-instruct",
+        "ai21.j2-mid",
+        "ai21.j2-mid-v1",
+        "ai21.j2-ultra",
+        "ai21.j2-ultra-v1",
        "anthropic.claude-instant-v1",
        "anthropic.claude-v2:1",
        "anthropic.claude-v2",
edsl/inference_services/registry.py
CHANGED
@@ -10,9 +10,6 @@ from edsl.inference_services.GroqService import GroqService
 from edsl.inference_services.AwsBedrock import AwsBedrockService
 from edsl.inference_services.AzureAI import AzureAIService
 from edsl.inference_services.OllamaService import OllamaService
-from edsl.inference_services.TestService import TestService
-from edsl.inference_services.MistralAIService import MistralAIService
-from edsl.inference_services.TogetherAIService import TogetherAIService
 
 default = InferenceServicesCollection(
     [
@@ -24,8 +21,5 @@ default = InferenceServicesCollection(
        AwsBedrockService,
        AzureAIService,
        OllamaService,
-        TestService,
-        MistralAIService,
-        TogetherAIService,
    ]
 )
edsl/jobs/Answers.py
CHANGED
@@ -2,22 +2,24 @@
 
 from collections import UserDict
 from rich.table import Table
-from edsl.data_transfer_models import EDSLResultObjectInput
 
 
 class Answers(UserDict):
     """Helper class to hold the answers to a survey."""
 
-    def add_answer(
-        self, response: EDSLResultObjectInput, question: "QuestionBase"
-    ) -> None:
-        """Add a response to the answers dictionary."""
-        answer = response.answer
-        comment = response.comment
-        generated_tokens = response.generated_tokens
+    def add_answer(self, response, question) -> None:
+        """Add a response to the answers dictionary.
+
+        >>> from edsl import QuestionFreeText
+        >>> q = QuestionFreeText.example()
+        >>> answers = Answers()
+        >>> answers.add_answer({"answer": "yes"}, q)
+        >>> answers[q.question_name]
+        'yes'
+        """
+        answer = response.get("answer")
+        comment = response.pop("comment", None)
        # record the answer
-        if generated_tokens:
-            self[question.question_name + "_generated_tokens"] = generated_tokens
        self[question.question_name] = answer
        if comment:
            self[question.question_name + "_comment"] = comment
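The calling convention changes with this hunk: 0.1.33 expects a typed result object read by attribute, while 0.1.33.dev1 accepts a plain dict. Side by side (the dataclass is a stand-in for edsl.data_transfer_models.EDSLResultObjectInput, with fields inferred from the removed lines):

    from dataclasses import dataclass
    from typing import Optional

    @dataclass
    class FakeResult:  # stand-in, not edsl's actual EDSLResultObjectInput
        answer: str
        comment: Optional[str] = None
        generated_tokens: Optional[str] = None

    # answers.add_answer(FakeResult(answer="yes"), q)   # 0.1.33: attribute access
    # answers.add_answer({"answer": "yes"}, q)          # 0.1.33.dev1: plain dict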