PyPI - edsl - Versions diffs - 0.1.27.dev2__py3-none-any.whl → 0.1.28__py3-none-any.whl - Mend

edsl 0.1.27.dev2__py3-none-any.whl → 0.1.28__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (88)

edsl/Base.py +99 -22
edsl/BaseDiff.py +260 -0
edsl/__init__.py +4 -0
edsl/__version__.py +1 -1
edsl/agents/Agent.py +26 -5
edsl/agents/AgentList.py +62 -7
edsl/agents/Invigilator.py +4 -9
edsl/agents/InvigilatorBase.py +5 -5
edsl/agents/descriptors.py +3 -1
edsl/conjure/AgentConstructionMixin.py +152 -0
edsl/conjure/Conjure.py +56 -0
edsl/conjure/InputData.py +628 -0
edsl/conjure/InputDataCSV.py +48 -0
edsl/conjure/InputDataMixinQuestionStats.py +182 -0
edsl/conjure/InputDataPyRead.py +91 -0
edsl/conjure/InputDataSPSS.py +8 -0
edsl/conjure/InputDataStata.py +8 -0
edsl/conjure/QuestionOptionMixin.py +76 -0
edsl/conjure/QuestionTypeMixin.py +23 -0
edsl/conjure/RawQuestion.py +65 -0
edsl/conjure/SurveyResponses.py +7 -0
edsl/conjure/__init__.py +9 -4
edsl/conjure/examples/placeholder.txt +0 -0
edsl/conjure/naming_utilities.py +263 -0
edsl/conjure/utilities.py +165 -28
edsl/conversation/Conversation.py +238 -0
edsl/conversation/car_buying.py +58 -0
edsl/conversation/mug_negotiation.py +81 -0
edsl/conversation/next_speaker_utilities.py +93 -0
edsl/coop/coop.py +191 -12
edsl/coop/utils.py +20 -2
edsl/data/Cache.py +55 -17
edsl/data/CacheHandler.py +10 -9
edsl/inference_services/AnthropicService.py +1 -0
edsl/inference_services/DeepInfraService.py +20 -13
edsl/inference_services/GoogleService.py +7 -1
edsl/inference_services/InferenceServicesCollection.py +33 -7
edsl/inference_services/OpenAIService.py +17 -10
edsl/inference_services/models_available_cache.py +69 -0
edsl/inference_services/rate_limits_cache.py +25 -0
edsl/inference_services/write_available.py +10 -0
edsl/jobs/Jobs.py +240 -36
edsl/jobs/buckets/BucketCollection.py +9 -3
edsl/jobs/interviews/Interview.py +4 -1
edsl/jobs/interviews/InterviewTaskBuildingMixin.py +24 -10
edsl/jobs/interviews/retry_management.py +4 -4
edsl/jobs/runners/JobsRunnerAsyncio.py +87 -45
edsl/jobs/runners/JobsRunnerStatusData.py +3 -3
edsl/jobs/tasks/QuestionTaskCreator.py +4 -2
edsl/language_models/LanguageModel.py +37 -44
edsl/language_models/ModelList.py +96 -0
edsl/language_models/registry.py +14 -0
edsl/language_models/repair.py +95 -24
edsl/notebooks/Notebook.py +119 -31
edsl/questions/QuestionBase.py +109 -12
edsl/questions/descriptors.py +5 -2
edsl/questions/question_registry.py +7 -0
edsl/results/Result.py +20 -8
edsl/results/Results.py +85 -11
edsl/results/ResultsDBMixin.py +3 -6
edsl/results/ResultsExportMixin.py +47 -16
edsl/results/ResultsToolsMixin.py +5 -5
edsl/scenarios/Scenario.py +59 -5
edsl/scenarios/ScenarioList.py +97 -40
edsl/study/ObjectEntry.py +97 -0
edsl/study/ProofOfWork.py +110 -0
edsl/study/SnapShot.py +77 -0
edsl/study/Study.py +491 -0
edsl/study/__init__.py +2 -0
edsl/surveys/Survey.py +79 -31
edsl/surveys/SurveyExportMixin.py +21 -3
edsl/utilities/__init__.py +1 -0
edsl/utilities/gcp_bucket/__init__.py +0 -0
edsl/utilities/gcp_bucket/cloud_storage.py +96 -0
edsl/utilities/gcp_bucket/simple_example.py +9 -0
edsl/utilities/interface.py +24 -28
edsl/utilities/repair_functions.py +28 -0
edsl/utilities/utilities.py +57 -2
{edsl-0.1.27.dev2.dist-info → edsl-0.1.28.dist-info}/METADATA +43 -17
{edsl-0.1.27.dev2.dist-info → edsl-0.1.28.dist-info}/RECORD +83 -55
edsl-0.1.28.dist-info/entry_points.txt +3 -0
edsl/conjure/RawResponseColumn.py +0 -327
edsl/conjure/SurveyBuilder.py +0 -308
edsl/conjure/SurveyBuilderCSV.py +0 -78
edsl/conjure/SurveyBuilderSPSS.py +0 -118
edsl/data/RemoteDict.py +0 -103
{edsl-0.1.27.dev2.dist-info → edsl-0.1.28.dist-info}/LICENSE +0 -0
{edsl-0.1.27.dev2.dist-info → edsl-0.1.28.dist-info}/WHEEL +0 -0

edsl/inference_services/DeepInfraService.py CHANGED Viewed

@@ -1,7 +1,7 @@
 import aiohttp
 import json
 import requests
-from typing import Any
+from typing import Any, List
 from edsl.inference_services.InferenceServiceABC import InferenceServiceABC
 from edsl.language_models import LanguageModel
@@ -12,6 +12,8 @@ class DeepInfraService(InferenceServiceABC):
     _inference_service_ = "deep_infra"
     _env_key_name_ = "DEEP_INFRA_API_KEY"
+    _models_list_cache: List[str] = []
     @classmethod
     def available(cls):
         text_models = cls.full_details_available()
@@ -19,20 +21,25 @@ class DeepInfraService(InferenceServiceABC):
     @classmethod
     def full_details_available(cls, verbose=False):
-        url = "https://api.deepinfra.com/models/list"
-        response = requests.get(url)
-        if response.status_code == 200:
-            text_generation_models = [
-                r for r in response.json() if r["type"] == "text-generation"
-            ]
-            from rich import print_json
-            import json
+        if not cls._models_list_cache:
+            url = "https://api.deepinfra.com/models/list"
+            response = requests.get(url)
+            if response.status_code == 200:
+                text_generation_models = [
+                    r for r in response.json() if r["type"] == "text-generation"
+                ]
+                cls._models_list_cache = text_generation_models
+                from rich import print_json
+                import json
-            if verbose:
-                print_json(json.dumps(text_generation_models))
-            return text_generation_models
+                if verbose:
+                    print_json(json.dumps(text_generation_models))
+                return text_generation_models
+            else:
+                return f"Failed to fetch data: Status code {response.status_code}"
         else:
-            return f"Failed to fetch data: Status code {response.status_code}"
+            return cls._models_list_cache
     @classmethod
     def create_model(cls, model_name: str, model_class_name=None) -> LanguageModel:

edsl/inference_services/GoogleService.py CHANGED Viewed

@@ -60,7 +60,13 @@ class GoogleService(InferenceServiceABC):
             def parse_response(self, raw_response: dict[str, Any]) -> str:
                 data = raw_response
-                return data["candidates"][0]["content"]["parts"][0]["text"]
+                try:
+                    return data["candidates"][0]["content"]["parts"][0]["text"]
+                except KeyError as e:
+                    print(
+                        f"The data return was {data}, which was missing the key 'candidates'"
+                    )
+                    raise e
         LLM.__name__ = model_name

edsl/inference_services/InferenceServicesCollection.py CHANGED Viewed

@@ -1,21 +1,47 @@
 from edsl.inference_services.InferenceServiceABC import InferenceServiceABC
+import warnings
 class InferenceServicesCollection:
+    added_models = {}
     def __init__(self, services: list[InferenceServiceABC] = None):
         self.services = services or []
+    @classmethod
+    def add_model(cls, service_name, model_name):
+        if service_name not in cls.added_models:
+            cls.added_models[service_name] = []
+        cls.added_models[service_name].append(model_name)
+    @staticmethod
+    def _get_service_available(service) -> list[str]:
+        from_api = True
+        try:
+            service_models = service.available()
+        except Exception as e:
+            warnings.warn(
+                f"Error getting models for {service._inference_service_}. Relying on cache.",
+                UserWarning,
+            )
+            from edsl.inference_services.models_available_cache import models_available
+            service_models = models_available.get(service._inference_service_, [])
+            # cache results
+            service._models_list_cache = service_models
+            from_api = False
+        return service_models  # , from_api
     def available(self):
         total_models = []
         for service in self.services:
-            try:
-                service_models = service.available()
-            except Exception as e:
-                print(f"Error getting models for {service._inference_service_}: {e}")
-                service_models = []
-                continue
+            service_models = self._get_service_available(service)
             for model in service_models:
                 total_models.append([model, service._inference_service_, -1])
+            for model in self.added_models.get(service._inference_service_, []):
+                total_models.append([model, service._inference_service_, -1])
         sorted_models = sorted(total_models)
         for i, model in enumerate(sorted_models):
             model[2] = i
@@ -27,7 +53,7 @@ class InferenceServicesCollection:
     def create_model_factory(self, model_name: str, service_name=None, index=None):
         for service in self.services:
-            if model_name in service.available():
+            if model_name in self._get_service_available(service):
                 if service_name is None or service_name == service._inference_service_:
                     return service.create_model(model_name)

edsl/inference_services/OpenAIService.py CHANGED Viewed

@@ -4,6 +4,7 @@ from openai import AsyncOpenAI
 from edsl.inference_services.InferenceServiceABC import InferenceServiceABC
 from edsl.language_models import LanguageModel
+from edsl.inference_services.rate_limits_cache import rate_limits
 class OpenAIService(InferenceServiceABC):
@@ -43,15 +44,16 @@ class OpenAIService(InferenceServiceABC):
                     if m.id not in cls.model_exclude_list
                 ]
             except Exception as e:
-                print(
-                    f"""Error retrieving models: {e}.
-                    See instructions about storing your API keys: https://docs.expectedparrot.com/en/latest/api_keys.html"""
-                )
-                cls._models_list_cache = [
-                    "gpt-3.5-turbo",
-                    "gpt-4-1106-preview",
-                    "gpt-4",
-                ]  # Fallback list
+                raise
+                # print(
+                #     f"""Error retrieving models: {e}.
+                #     See instructions about storing your API keys: https://docs.expectedparrot.com/en/latest/api_keys.html"""
+                # )
+                # cls._models_list_cache = [
+                #     "gpt-3.5-turbo",
+                #     "gpt-4-1106-preview",
+                #     "gpt-4",
+                # ]  # Fallback list
         return cls._models_list_cache
     @classmethod
@@ -98,7 +100,12 @@ class OpenAIService(InferenceServiceABC):
             def get_rate_limits(self) -> dict[str, Any]:
                 try:
-                    headers = self.get_headers()
+                    if "openai" in rate_limits:
+                        headers = rate_limits["openai"]
+                    else:
+                        headers = self.get_headers()
                 except Exception as e:
                     return {
                         "rpm": 10_000,

edsl/inference_services/models_available_cache.py ADDED Viewed

@@ -0,0 +1,69 @@
+models_available = {
+    "openai": [
+        "gpt-3.5-turbo-1106",
+        "gpt-4-0125-preview",
+        "gpt-4-turbo-preview",
+        "gpt-3.5-turbo-16k",
+        "gpt-4-1106-preview",
+        "gpt-4-turbo-2024-04-09",
+        "gpt-3.5-turbo-16k-0613",
+        "gpt-4o-2024-05-13",
+        "gpt-4-turbo",
+        "gpt-3.5-turbo-0613",
+        "gpt-4",
+        "gpt-4-0613",
+        "gpt-3.5-turbo-0125",
+        "gpt-3.5-turbo",
+        "gpt-3.5-turbo-instruct",
+        "gpt-3.5-turbo-instruct-0914",
+        "gpt-3.5-turbo-0301",
+        "gpt-4-vision-preview",
+        "gpt-4-1106-vision-preview",
+        "gpt-4o",
+    ],
+    "anthropic": [
+        "claude-3-5-sonnet-20240620",
+        "claude-3-opus-20240229",
+        "claude-3-sonnet-20240229",
+        "claude-3-haiku-20240307",
+    ],
+    "deep_infra": [
+        "meta-llama/Llama-2-13b-chat-hf",
+        "mistralai/Mixtral-8x22B-Instruct-v0.1",
+        "Gryphe/MythoMax-L2-13b-turbo",
+        "mistralai/Mistral-7B-Instruct-v0.1",
+        "Austism/chronos-hermes-13b-v2",
+        "meta-llama/Llama-2-70b-chat-hf",
+        "mistralai/Mistral-7B-Instruct-v0.3",
+        "meta-llama/Llama-2-7b-chat-hf",
+        "Qwen/Qwen2-72B-Instruct",
+        "HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1",
+        "cognitivecomputations/dolphin-2.6-mixtral-8x7b",
+        "bigcode/starcoder2-15b",
+        "microsoft/WizardLM-2-8x22B",
+        "codellama/CodeLlama-70b-Instruct-hf",
+        "Gryphe/MythoMax-L2-13b",
+        "microsoft/WizardLM-2-7B",
+        "01-ai/Yi-34B-Chat",
+        "bigcode/starcoder2-15b-instruct-v0.1",
+        "mistralai/Mixtral-8x7B-Instruct-v0.1",
+        "openchat/openchat-3.6-8b",
+        "meta-llama/Meta-Llama-3-8B-Instruct",
+        "microsoft/Phi-3-medium-4k-instruct",
+        "Phind/Phind-CodeLlama-34B-v2",
+        "google/codegemma-7b-it",
+        "mistralai/Mistral-7B-Instruct-v0.2",
+        "deepinfra/airoboros-70b",
+        "mistralai/Mixtral-8x22B-v0.1",
+        "llava-hf/llava-1.5-7b-hf",
+        "codellama/CodeLlama-34b-Instruct-hf",
+        "google/gemma-1.1-7b-it",
+        "lizpreciatior/lzlv_70b_fp16_hf",
+        "databricks/dbrx-instruct",
+        "nvidia/Nemotron-4-340B-Instruct",
+        "Qwen/Qwen2-7B-Instruct",
+        "meta-llama/Meta-Llama-3-70B-Instruct",
+        "openchat/openchat_3.5",
+    ],
+    "google": ["gemini-pro"],
+}

edsl/inference_services/rate_limits_cache.py ADDED Viewed

@@ -0,0 +1,25 @@
+rate_limits = {
+    "openai": {
+        "date": "Tue, 02 Jul 2024 15:25:28 GMT",
+        "content-type": "application/json",
+        "transfer-encoding": "chunked",
+        "connection": "keep-alive",
+        "openai-organization": "user-wmu32omw8ulzzutk6mjhtqgk",
+        "openai-processing-ms": "760",
+        "openai-version": "2020-10-01",
+        "strict-transport-security": "max-age=31536000; includeSubDomains",
+        "x-ratelimit-limit-requests": "5000",
+        "x-ratelimit-limit-tokens": "600000",
+        "x-ratelimit-remaining-requests": "4999",
+        "x-ratelimit-remaining-tokens": "599978",
+        "x-ratelimit-reset-requests": "12ms",
+        "x-ratelimit-reset-tokens": "2ms",
+        "x-request-id": "req_971608f3647f660a0cd6537fbe21f69c",
+        "cf-cache-status": "DYNAMIC",
+        "set-cookie": "__cf_bm=MJfUk.0TXdjtiNkUUqlUO2gaN3wzm0iHsRQRWExy52o-1719933928-1.0.1.1-0xk9gFxy_mD1KzAsKQ_HpL2pdQJ90D4B5frt65xU.c9k9QwD0oTBILqXB0rykXNh04Pm1UB1.H_W9sFJVOcSaw; path=/; expires=Tue, 02-Jul-24 15:55:28 GMT; domain=.api.openai.com; HttpOnly; Secure; SameSite=None, _cfuvid=GbheRct_iw9_I8iLWmt5ZRcLYZ_QVnroCrAt8QMVsUg-1719933928399-0.0.1.1-604800000; path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None",
+        "server": "cloudflare",
+        "cf-ray": "89cfa6059bb9b68f-OTP",
+        "content-encoding": "gzip",
+        "alt-svc": 'h3=":443"; ma=86400',
+    }
+}

edsl/inference_services/write_available.py ADDED Viewed

@@ -0,0 +1,10 @@
+from edsl.inference_services.registry import default
+def write_available():
+    d = {}
+    for service in default.services:
+        d[service._inference_service_] = service.available()
+    with open("models_available_cache.py", "w") as f:
+        f.write(f"models_available = {d}")

edsl 0.1.27.dev2__py3-none-any.whl → 0.1.28__py3-none-any.whl

edsl 0.1.27.dev2__py3-none-any.whl → 0.1.28__py3-none-any.whl