ragaai-catalyst 2.0.5__py3-none-any.whl → 2.0.6__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- ragaai_catalyst/__init__.py +3 -1
- ragaai_catalyst/dataset.py +50 -61
- ragaai_catalyst/evaluation.py +48 -30
- ragaai_catalyst/guard_executor.py +97 -0
- ragaai_catalyst/guardrails_manager.py +259 -0
- ragaai_catalyst/internal_api_completion.py +83 -0
- ragaai_catalyst/prompt_manager.py +1 -1
- ragaai_catalyst/proxy_call.py +1 -1
- ragaai_catalyst/ragaai_catalyst.py +1 -1
- ragaai_catalyst/synthetic_data_generation.py +206 -77
- ragaai_catalyst/tracers/llamaindex_callback.py +361 -0
- ragaai_catalyst/tracers/tracer.py +62 -28
- ragaai_catalyst-2.0.6.dist-info/METADATA +386 -0
- ragaai_catalyst-2.0.6.dist-info/RECORD +29 -0
- {ragaai_catalyst-2.0.5.dist-info → ragaai_catalyst-2.0.6.dist-info}/WHEEL +1 -1
- ragaai_catalyst-2.0.5.dist-info/METADATA +0 -228
- ragaai_catalyst-2.0.5.dist-info/RECORD +0 -25
- {ragaai_catalyst-2.0.5.dist-info → ragaai_catalyst-2.0.6.dist-info}/top_level.txt +0 -0
ragaai_catalyst/internal_api_completion.py ADDED
@@ -0,0 +1,83 @@
+import requests
+import json
+import subprocess
+import logging
+import traceback
+import pandas as pd
+
+logger = logging.getLogger(__name__)
+
+def api_completion(messages, model_config, kwargs):
+    attempts = 0
+    while attempts < 3:
+
+        user_id = kwargs.get('user_id', '1')
+        internal_llm_proxy = kwargs.get('internal_llm_proxy', -1)
+
+
+        job_id = model_config.get('job_id',-1)
+        converted_message = convert_input(messages,model_config, user_id)
+        payload = json.dumps(converted_message)
+        headers = {
+            'Content-Type': 'application/json',
+            # 'Wd-PCA-Feature-Key':f'your_feature_key, $(whoami)'
+        }
+        try:
+            response = requests.request("POST", internal_llm_proxy, headers=headers, data=payload)
+            if model_config.get('log_level','')=='debug':
+                logger.info(f'Model response Job ID {job_id} {response.text}')
+            if response.status_code!=200:
+                # logger.error(f'Error in model response Job ID {job_id}:',str(response.text))
+                raise ValueError(str(response.text))
+
+            if response.status_code==200:
+                response = response.json()
+                if "error" in response:
+                    raise ValueError(response["error"]["message"])
+                else:
+                    result = response["choices"][0]["message"]["content"]
+                    response1 = result.replace('\n', '')
+                    try:
+                        json_data = json.loads(response1)
+                        df = pd.DataFrame(json_data)
+                        return(df)
+                    except json.JSONDecodeError:
+                        attempts += 1  # Increment attempts if JSON parsing fails
+                        if attempts == 3:
+                            raise Exception("Failed to generate a valid response after multiple attempts.")
+
+        except Exception as e:
+            raise ValueError(f"{e}")
+
+
+def get_username():
+    result = subprocess.run(['whoami'], capture_output=True, text=True)
+    result = result.stdout
+    return result
+
+
+def convert_input(messages, model_config, user_id):
+    doc_input = {
+        "model": model_config.get('model'),
+        **model_config,
+        "messages": messages,
+        "user_id": user_id
+    }
+    return doc_input
+
+
+if __name__=='__main__':
+    messages = [
+        {
+            "role": "system",
+            "content": "you are a poet well versed in shakespeare literature"
+        },
+        {
+            "role": "user",
+            "content": "write a poem on pirates and penguins"
+        }
+    ]
+    kwargs = {"internal_llm_proxy": "http://13.200.11.66:4000/chat/completions", "user_id": 1}
+    model_config = {"model": "workday_gateway", "provider":"openai", "max_tokens": 10}
+    answer = api_completion(messages, model_config, kwargs)
+    print(answer)
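Note on the new helper: api_completion() only returns a DataFrame when the proxy replies with an OpenAI-style chat-completions payload whose assistant message content is itself a JSON array of records. A minimal sketch of that contract (the payload below is illustrative, not taken from the package):

import json
import pandas as pd

# Hypothetical proxy payload, shaped like an OpenAI chat-completions response.
proxy_response = {
    "choices": [{
        "message": {
            "content": '[{"Question": "Who wrote Hamlet?", "Answer": "William Shakespeare"}]'
        }
    }]
}

# Mirrors what api_completion() does with a 200 response:
content = proxy_response["choices"][0]["message"]["content"].replace("\n", "")
df = pd.DataFrame(json.loads(content))
print(df)  # one row per generated record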
ragaai_catalyst/prompt_manager.py CHANGED
@@ -23,7 +23,7 @@ class PromptManager:
         self.project_name = project_name
         self.base_url = f"{RagaAICatalyst.BASE_URL}/playground/prompt"
         self.timeout = 10
-        self.size =
+        self.size = 99999 #Number of projects to fetch
 
         try:
             response = requests.get(
ragaai_catalyst/proxy_call.py CHANGED
@@ -23,7 +23,7 @@ def api_completion(model,messages, api_base='http://127.0.0.1:8000',
         if model_config.get('log_level','')=='debug':
             logger.info(f'Model response Job ID {job_id} {response.text}')
         if response.status_code!=200:
-            logger.error(f'Error in model response Job ID {job_id}:',str(response.text))
+            # logger.error(f'Error in model response Job ID {job_id}:',str(response.text))
             raise ValueError(str(response.text))
     except Exception as e:
         logger.error(f'Error in calling api Job ID {job_id}:',str(e))
ragaai_catalyst/ragaai_catalyst.py CHANGED
@@ -287,7 +287,7 @@ class RagaAICatalyst:
     def get_project_id(self, project_name):
         pass
 
-    def list_projects(self, num_projects=
+    def list_projects(self, num_projects=99999):
         """
         Retrieves a list of projects with the specified number of projects.
 
ragaai_catalyst/synthetic_data_generation.py CHANGED
@@ -7,7 +7,14 @@ import csv
 import markdown
 import pandas as pd
 import json
-from
+from litellm import completion
+from tqdm import tqdm
+# import internal_api_completion
+# import proxy_call
+from .internal_api_completion import api_completion as internal_api_completion
+from .proxy_call import api_completion as proxy_api_completion
+# from ragaai_catalyst import internal_api_completion
+# from ragaai_catalyst import proxy_call
 import ast
 
 # dotenv.load_dotenv()
@@ -21,55 +28,170 @@ class SyntheticDataGeneration:
         """
         Initialize the SyntheticDataGeneration class with API clients for Groq, Gemini, and OpenAI.
         """
-
+
+    def generate_qna(self, text, question_type="simple", n=5, model_config=dict(), api_key=None, **kwargs):
         """
         Generate questions based on the given text using the specified model and provider.
+        Uses batch processing for larger values of n to maintain response quality.
 
         Args:
             text (str): The input text to generate questions from.
             question_type (str): The type of questions to generate ('simple', 'mcq', or 'complex').
-            model (str): The specific model to use for generation.
-            provider (str): The AI provider to use ('groq', 'gemini', or 'openai').
             n (int): The number of question/answer pairs to generate.
+            model_config (dict): Configuration for the model including provider and model name.
+            api_key (str, optional): The API key for the selected provider.
+            **kwargs: Additional keyword arguments.
 
         Returns:
-            pandas.DataFrame: A DataFrame containing
+            pandas.DataFrame: A DataFrame containing exactly n generated questions and answers.
 
         Raises:
-            ValueError: If an invalid provider is specified.
+            ValueError: If an invalid provider is specified or API key is missing.
         """
+        BATCH_SIZE = 5  # Optimal batch size for maintaining response quality
         provider = model_config.get("provider")
         model = model_config.get("model")
         api_base = model_config.get("api_base")
 
-
+        # Initialize the appropriate client based on provider
+        self._initialize_client(provider, api_key, api_base, internal_llm_proxy=kwargs.get("internal_llm_proxy", None))
+
+        # Initialize progress bar
+        pbar = tqdm(total=n, desc="Generating QA pairs")
+
+        # Initial generation phase
+        num_batches = (n + BATCH_SIZE - 1) // BATCH_SIZE
+        all_responses = []
+
+        FAILURE_CASES = [
+            "Invalid API key provided",
+            "No connection adapters",
+            "Required API Keys are not set",
+            "litellm.BadRequestError",
+            "litellm.AuthenticationError"]
+
+        for _ in range(num_batches):
+            current_batch_size = min(BATCH_SIZE, n - len(all_responses))
+            if current_batch_size <= 0:
+                break
+
+            try:
+                system_message = self._get_system_message(question_type, current_batch_size)
+
+                if "internal_llm_proxy" in kwargs:
+                    batch_df = self._generate_internal_response(text, system_message, model_config, kwargs)
+                else:
+                    batch_df = self._generate_batch_response(text, system_message, provider, model_config, api_key, api_base)
+
+                if not batch_df.empty and len(batch_df) > 0:
+                    all_responses.extend(batch_df.to_dict('records'))
+                    pbar.update(len(batch_df))
+
+            except Exception as e:
+                print(f"Batch generation failed.")
+
+                if any(error in str(e) for error in FAILURE_CASES):
+                    raise Exception(f"{e}")
+
+                else:
+                    print(f"Retrying...")
+                    continue
+
+
+        # Convert to DataFrame and remove duplicates
+        result_df = pd.DataFrame(all_responses)
+        result_df = result_df.drop_duplicates(subset=['Question'])
+
+        # Replenish phase - generate additional questions if needed due to duplicates
+        while (len(result_df) < n) and ((len(result_df) >= 1)):
+            questions_needed = n - len(result_df)
+            try:
+                system_message = self._get_system_message(question_type, questions_needed)
+
+                if "internal_llm_proxy" in kwargs:
+                    additional_df = self._generate_internal_response(text, system_message, model_config, kwargs)
+                else:
+                    additional_df = self._generate_batch_response(text, system_message, provider, model_config, api_key, api_base)
+
+                if not additional_df.empty and len(additional_df) > 0:
+                    # Only add questions that aren't already in result_df
+                    new_questions = additional_df[~additional_df['Question'].isin(result_df['Question'])]
+                    if not new_questions.empty:
+                        result_df = pd.concat([result_df, new_questions], ignore_index=True)
+                        result_df = result_df.drop_duplicates(subset=['Question'])
+                        pbar.update(len(new_questions))
+
+            except Exception as e:
+                print(f"Replenishment generation failed")
+
+                if any(error in str(e) for error in FAILURE_CASES):
+                    raise Exception(f"{e}")
+
+                else:
+                    print("An unexpected error occurred. Retrying...")
+                    continue
+
+        pbar.close()
+
+        # Ensure exactly n rows and reset index starting from 1
+        final_df = result_df.head(n)
+        final_df.index = range(1, len(final_df) + 1)
+
+        return final_df
+
+    def _initialize_client(self, provider, api_key, api_base=None, internal_llm_proxy=None):
+        """Initialize the appropriate client based on provider."""
+        if not provider:
+            raise ValueError("Model configuration must be provided with a valid provider and model.")
+
         if provider == "groq":
             if api_key is None and os.getenv("GROQ_API_KEY") is None:
                 raise ValueError("API key must be provided for Groq.")
             self.groq_client = Groq(api_key=api_key or os.getenv("GROQ_API_KEY"))
-
+
         elif provider == "gemini":
+            if api_key is None and os.getenv("GEMINI_API_KEY") is None and api_base is None and internal_llm_proxy is None:
+                raise ValueError("API key must be provided for Gemini.")
             genai.configure(api_key=api_key or os.getenv("GEMINI_API_KEY"))
-
-            if api_key is None and os.getenv("GEMINI_API_KEY") is None:
-                raise ValueError("API key must be provided for Gemini.")
-            genai.configure(api_key=api_key or os.getenv("GEMINI_API_KEY"))
-            return self._generate_gemini(text, system_message, model)
-        else:
-            messages=[
-                {'role': 'user', 'content': system_message+text}
-            ]
-            a= proxy_call.api_completion(messages=messages ,model=model ,api_base=api_base)
-            b= ast.literal_eval(a[0])
-            return pd.DataFrame(b)
+
         elif provider == "openai":
-            if api_key is None and os.getenv("OPENAI_API_KEY") is None:
+            if api_key is None and os.getenv("OPENAI_API_KEY") is None and internal_llm_proxy is None:
                 raise ValueError("API key must be provided for OpenAI.")
             openai.api_key = api_key or os.getenv("OPENAI_API_KEY")
-
+
         else:
-            raise ValueError("
+            raise ValueError(f"Provider is not recognized.")
+
+    def _generate_batch_response(self, text, system_message, provider, model_config, api_key, api_base):
+        """Generate a batch of responses using the specified provider."""
+        MAX_RETRIES = 3
+
+        for attempt in range(MAX_RETRIES):
+            try:
+                if provider == "gemini" and api_base:
+                    messages = [{'role': 'user', 'content': system_message + text}]
+                    response = proxy_api_completion(messages=messages, model=model_config["model"], api_base=api_base)
+                    # response = proxy_call.api_completion(messages=messages, model=model_config["model"], api_base=api_base)
+                    return pd.DataFrame(ast.literal_eval(response[0]))
+                else:
+                    return self._generate_llm_response(text, system_message, model_config, api_key)
+            except (json.JSONDecodeError, ValueError) as e:
+                if attempt == MAX_RETRIES - 1:
+                    raise Exception(f"Failed to generate valid response after {MAX_RETRIES} attempts: {str(e)}")
+                continue
+
+    def _generate_internal_response(self, text, system_message, model_config, kwargs):
+        """Generate response using internal API."""
+        messages = [{'role': 'user', 'content': system_message + text}]
+        return internal_api_completion(
+            messages=messages,
+            model_config=model_config,
+            kwargs=kwargs
+        )
 
+
+
+
     def _get_system_message(self, question_type, n):
         """
         Get the appropriate system message for the specified question type.
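Taken together, the reworked generate_qna() batches requests in groups of BATCH_SIZE=5, deduplicates on the Question column, and tops the result back up to n in the replenish loop. A minimal usage sketch (model name, key, and document text are placeholders, not taken from this diff; it assumes the class is imported from ragaai_catalyst as in the package README):

from ragaai_catalyst import SyntheticDataGeneration

sdg = SyntheticDataGeneration()
text = "Your source document text goes here..."

# n=12 is split into ceil(12/5) = 3 batches of at most BATCH_SIZE=5 pairs;
# duplicates are dropped and the replenish loop tops the result back up to n.
qa_df = sdg.generate_qna(
    text,
    question_type="simple",
    n=12,
    model_config={"provider": "openai", "model": "gpt-4o-mini"},  # placeholder model
    api_key="sk-...",  # or set OPENAI_API_KEY in the environment
)
print(len(qa_df))  # up to 12 rows (exactly 12 when enough unique pairs are produced), indexed from 1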
@@ -113,64 +235,68 @@ class SyntheticDataGeneration:
         else:
             raise ValueError("Invalid question type")
 
-    def
+    def _generate_llm_response(self, text, system_message, model_config, api_key=None):
         """
-        Generate questions using
+        Generate questions using LiteLLM which supports multiple providers (OpenAI, Groq, Gemini, etc.).
 
         Args:
             text (str): The input text to generate questions from.
             system_message (str): The system message for the AI model.
-
+            model_config (dict): Configuration dictionary containing model details.
+                Required keys:
+                - model: The model identifier (e.g., "gpt-4", "gemini-pro", "mixtral-8x7b-32768")
+                Optional keys:
+                - api_base: Custom API base URL if needed
+                - max_tokens: Maximum tokens in response
+                - temperature: Temperature for response generation
+            api_key (str, optional): The API key for the model provider.
 
         Returns:
             pandas.DataFrame: A DataFrame containing the generated questions and answers.
-        """
-        response = self.groq_client.chat.completions.create(
-            model=model,
-            messages=[
-                {'role': 'system', 'content': system_message},
-                {'role': 'user', 'content': text}
-            ]
-        )
-        return self._parse_response(response, provider="groq")
 
-
+        Raises:
+            Exception: If there's an error in generating the response.
         """
-        Generate questions using the Gemini API.
 
-
-
-
-
-
-
-
-
-
-
-
+        # Prepare the messages in the format expected by LiteLLM
+        messages = [
+            {"role": "system", "content": system_message},
+            {"role": "user", "content": text}
+        ]
+
+        # Set up the completion parameters
+        completion_params = {
+            "model": model_config["model"],
+            "messages": messages,
+            "api_key": api_key
+        }
+
+        # Add optional parameters if they exist in model_config
+        if "api_base" in model_config:
+            completion_params["api_base"] = model_config["api_base"]
+        if "max_tokens" in model_config:
+            completion_params["max_tokens"] = model_config["max_tokens"]
+        if "temperature" in model_config:
+            completion_params["temperature"] = model_config["temperature"]
+
+        # Make the API call using LiteLLM
+        try:
+            response = completion(**completion_params)
+        except Exception as e:
+            if any(error in str(e).lower() for error in ["invalid api key", "incorrect api key", "unauthorized", "authentication"]):
+                raise ValueError(f"Invalid API key provided for {model_config.get('provider', 'the specified')} provider")
+            raise Exception(f"Error calling LLM API: {str(e)}")
 
-
-
-        Generate questions using the OpenAI API.
+        # Extract the content from the response
+        content = response.choices[0].message.content
 
-
-
-
-
+        # Clean the response if needed (remove any prefix before the JSON list)
+        list_start_index = content.find('[')
+        if list_start_index != -1:
+            content = content[list_start_index:]
 
-
-
-        """
-        client = openai.OpenAI(api_key=api_key)
-        response = client.chat.completions.create(
-            model=model,
-            messages=[
-                {"role": "system", "content": system_message},
-                {"role": "user", "content": text}
-            ]
-        )
-        return self._parse_response(response, provider="openai")
+        json_data = json.loads(content)
+        return pd.DataFrame(json_data)
 
     def _parse_response(self, response, provider):
         """
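The parsing at the end of _generate_llm_response() assumes the model returns a JSON array of Question/Answer records, possibly preceded by prose. A small illustration of that cleanup step (the content string is invented):

import json
import pandas as pd

# Made-up model output: prose prefix followed by a JSON array.
content = 'Sure, here are the pairs: [{"Question": "Q1", "Answer": "A1"}, {"Question": "Q2", "Answer": "A2"}]'

# Same cleanup as _generate_llm_response: keep everything from the first '['.
list_start_index = content.find('[')
if list_start_index != -1:
    content = content[list_start_index:]

df = pd.DataFrame(json.loads(content))  # columns: Question, Answer
print(df)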
@@ -218,16 +344,19 @@ class SyntheticDataGeneration:
         if os.path.isfile(input_data):
             # If input_data is a file path
             _, file_extension = os.path.splitext(input_data)
-
-
-
-
-
-
-
-
-
-
+            try:
+                if file_extension.lower() == '.pdf':
+                    return self._read_pdf(input_data)
+                elif file_extension.lower() == '.txt':
+                    return self._read_text(input_data)
+                elif file_extension.lower() == '.md':
+                    return self._read_markdown(input_data)
+                elif file_extension.lower() == '.csv':
+                    return self._read_csv(input_data)
+                else:
+                    raise ValueError(f"Unsupported file type: {file_extension}")
+            except Exception as e:
+                raise ValueError(f"Error reading the file. Upload a valid file. \n{e}")
         else:
             # If input_data is a string of text
             return input_data
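A short usage sketch of the extension dispatch above; the public entry point process_document is assumed from the package's documented API rather than shown in this hunk, and the file path is a placeholder:

from ragaai_catalyst import SyntheticDataGeneration

sdg = SyntheticDataGeneration()

# Assumed entry point (not visible in this hunk): routes .pdf/.txt/.md/.csv
# files through the matching _read_* helper and returns the extracted text.
text = sdg.process_document(input_data="./docs/sample.pdf")

# Plain strings skip the file branch and are returned unchanged.
same_text = sdg.process_document(input_data="Already-extracted text.")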