PyPI - ai-parrot - Versions diffs - 0.8.3__cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.whl - Mend

ai-parrot 0.8.3__cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of ai-parrot might be problematic. Click here for more details.

Files changed (128) hide show

ai_parrot-0.8.3.dist-info/LICENSE +21 -0
ai_parrot-0.8.3.dist-info/METADATA +306 -0
ai_parrot-0.8.3.dist-info/RECORD +128 -0
ai_parrot-0.8.3.dist-info/WHEEL +6 -0
ai_parrot-0.8.3.dist-info/top_level.txt +2 -0
parrot/__init__.py +30 -0
parrot/bots/__init__.py +5 -0
parrot/bots/abstract.py +1115 -0
parrot/bots/agent.py +492 -0
parrot/bots/basic.py +9 -0
parrot/bots/bose.py +17 -0
parrot/bots/chatbot.py +271 -0
parrot/bots/cody.py +17 -0
parrot/bots/copilot.py +117 -0
parrot/bots/data.py +730 -0
parrot/bots/dataframe.py +103 -0
parrot/bots/hrbot.py +15 -0
parrot/bots/interfaces/__init__.py +1 -0
parrot/bots/interfaces/retrievers.py +12 -0
parrot/bots/notebook.py +619 -0
parrot/bots/odoo.py +17 -0
parrot/bots/prompts/__init__.py +41 -0
parrot/bots/prompts/agents.py +91 -0
parrot/bots/prompts/data.py +214 -0
parrot/bots/retrievals/__init__.py +1 -0
parrot/bots/retrievals/constitutional.py +19 -0
parrot/bots/retrievals/multi.py +122 -0
parrot/bots/retrievals/retrieval.py +610 -0
parrot/bots/tools/__init__.py +7 -0
parrot/bots/tools/eda.py +325 -0
parrot/bots/tools/pdf.py +50 -0
parrot/bots/tools/plot.py +48 -0
parrot/bots/troc.py +16 -0
parrot/conf.py +170 -0
parrot/crew/__init__.py +3 -0
parrot/crew/tools/__init__.py +22 -0
parrot/crew/tools/bing.py +13 -0
parrot/crew/tools/config.py +43 -0
parrot/crew/tools/duckgo.py +62 -0
parrot/crew/tools/file.py +24 -0
parrot/crew/tools/google.py +168 -0
parrot/crew/tools/gtrends.py +16 -0
parrot/crew/tools/md2pdf.py +25 -0
parrot/crew/tools/rag.py +42 -0
parrot/crew/tools/search.py +32 -0
parrot/crew/tools/url.py +21 -0
parrot/exceptions.cpython-312-x86_64-linux-gnu.so +0 -0
parrot/handlers/__init__.py +4 -0
parrot/handlers/agents.py +292 -0
parrot/handlers/bots.py +196 -0
parrot/handlers/chat.py +192 -0
parrot/interfaces/__init__.py +6 -0
parrot/interfaces/database.py +27 -0
parrot/interfaces/http.py +805 -0
parrot/interfaces/images/__init__.py +0 -0
parrot/interfaces/images/plugins/__init__.py +18 -0
parrot/interfaces/images/plugins/abstract.py +58 -0
parrot/interfaces/images/plugins/exif.py +709 -0
parrot/interfaces/images/plugins/hash.py +52 -0
parrot/interfaces/images/plugins/vision.py +104 -0
parrot/interfaces/images/plugins/yolo.py +66 -0
parrot/interfaces/images/plugins/zerodetect.py +197 -0
parrot/llms/__init__.py +1 -0
parrot/llms/abstract.py +69 -0
parrot/llms/anthropic.py +58 -0
parrot/llms/gemma.py +15 -0
parrot/llms/google.py +44 -0
parrot/llms/groq.py +67 -0
parrot/llms/hf.py +45 -0
parrot/llms/openai.py +61 -0
parrot/llms/pipes.py +114 -0
parrot/llms/vertex.py +89 -0
parrot/loaders/__init__.py +9 -0
parrot/loaders/abstract.py +628 -0
parrot/loaders/files/__init__.py +0 -0
parrot/loaders/files/abstract.py +39 -0
parrot/loaders/files/text.py +63 -0
parrot/loaders/txt.py +26 -0
parrot/manager.py +333 -0
parrot/models.py +504 -0
parrot/py.typed +0 -0
parrot/stores/__init__.py +11 -0
parrot/stores/abstract.py +248 -0
parrot/stores/chroma.py +188 -0
parrot/stores/duck.py +162 -0
parrot/stores/embeddings/__init__.py +10 -0
parrot/stores/embeddings/abstract.py +46 -0
parrot/stores/embeddings/base.py +52 -0
parrot/stores/embeddings/bge.py +20 -0
parrot/stores/embeddings/fastembed.py +17 -0
parrot/stores/embeddings/google.py +18 -0
parrot/stores/embeddings/huggingface.py +20 -0
parrot/stores/embeddings/ollama.py +14 -0
parrot/stores/embeddings/openai.py +26 -0
parrot/stores/embeddings/transformers.py +21 -0
parrot/stores/embeddings/vertexai.py +17 -0
parrot/stores/empty.py +10 -0
parrot/stores/faiss.py +160 -0
parrot/stores/milvus.py +397 -0
parrot/stores/postgres.py +653 -0
parrot/stores/qdrant.py +170 -0
parrot/tools/__init__.py +23 -0
parrot/tools/abstract.py +68 -0
parrot/tools/asknews.py +33 -0
parrot/tools/basic.py +51 -0
parrot/tools/bby.py +359 -0
parrot/tools/bing.py +13 -0
parrot/tools/docx.py +343 -0
parrot/tools/duck.py +62 -0
parrot/tools/execute.py +56 -0
parrot/tools/gamma.py +28 -0
parrot/tools/google.py +170 -0
parrot/tools/gvoice.py +301 -0
parrot/tools/results.py +278 -0
parrot/tools/stack.py +27 -0
parrot/tools/weather.py +70 -0
parrot/tools/wikipedia.py +58 -0
parrot/tools/zipcode.py +198 -0
parrot/utils/__init__.py +2 -0
parrot/utils/parsers/__init__.py +5 -0
parrot/utils/parsers/toml.cpython-312-x86_64-linux-gnu.so +0 -0
parrot/utils/toml.py +11 -0
parrot/utils/types.cpython-312-x86_64-linux-gnu.so +0 -0
parrot/utils/uv.py +11 -0
parrot/version.py +10 -0
resources/users/__init__.py +5 -0
resources/users/handlers.py +13 -0
resources/users/models.py +205 -0

parrot/bots/prompts/agents.py ADDED Viewed

@@ -0,0 +1,91 @@
+# Base system prompt for a general tool-using agent.
+# Placeholders use `$`-prefixed names: $name, $system_prompt_base, $tools,
+# $list_of_tools, $format_instructions and $today_date.
+# NOTE(review): presumably rendered with string.Template by the caller — confirm.
+AGENT_PROMPT = """
+Your name is $name.
+$system_prompt_base
+**Answer the following questions as best you can. You have access to the following tools:**
+$tools
+Use these tools effectively to provide accurate and comprehensive responses:
+$list_of_tools
+**Instructions:**
+1. Understand the Query: Comprehend the user's request, especially if it pertains to events that may have already happened.
+2. **Event Timing Validation**: For questions about recent events or events that may have happened already (like sporting events, conferences, etc.), if you're not confident that the event has happened, you must **use one of the web search tools** to confirm before making any conclusions.
+3. Determine Confidence: If confident (90%+), provide the answer directly within the Thought process. If not confident, **always use a web search tool**.
+4. Choose Tool: If needed, select the most suitable tool.
+5. Collect Information: Use the tool to gather data.
+6. Analyze Information: Identify patterns, relationships, and insights.
+7. Synthesize Response: Combine the information into a clear response.
+8. Cite Sources: Mention the sources of the information.
+** Your Style: **
+- Maintain a professional and friendly tone.
+- Be clear and concise in your explanations.
+- Use simple language for complex topics to ensure user understanding.
+$format_instructions
+**Important**: Today is $today_date, For any recent events you must **use a web search tool** to verify the outcome or provide accurate up-to-date information before concluding. Always prioritize using tools if you're unsure or if the event is recent.
+- You must never contradict the given date.
+"""
+# System prompt for an agent that answers questions by querying a SQL database.
+# Placeholders use `$`-prefixed names: $name, $dialect, $top_k and $list_of_tools.
+# NOTE(review): presumably rendered with string.Template by the caller — confirm.
+SQL_AGENT_PROMPT = """
+Your name is $name. You are an agent designed to interact with a SQL database.
+Given an input question, create a syntactically correct $dialect query to run, then look at the results of the query and return the answer.
+Use the following format:
+Question: "Question here"
+SQLQuery: "SQL Query to run"
+SQLResult: "Result of the SQLQuery"
+Answer: "Final answer here"
+Unless the user specifies a specific number of examples they wish to obtain, always limit your query to at most $top_k results.
+You can order the results by a relevant column to return the most interesting examples in the database.
+Never query for all the columns from a specific table, only ask for the relevant columns given the question.
+You have access to tools for interacting with the database.
+**Also you has access to the following extra tools:**
+$list_of_tools
+Only use the below tools. Only use the information returned by the below tools to construct your final answer.
+You MUST double check your query before executing it. If you get an error while executing a query, rewrite the query and try again.
+DO NOT make any DML statements (INSERT, UPDATE, DELETE, DROP etc.) to the database.
+To start you should ALWAYS look at the tables in the database to see what you can query.
+Do NOT skip this step.
+Then you should query the schema of the most relevant tables.
+"""
+# Trailing part of the agent prompt. Unlike the `$`-style templates in this
+# module it uses brace placeholders: {input} and {agent_scratchpad}.
+# NOTE(review): presumably filled by the agent framework at run time — confirm.
+AGENT_PROMPT_SUFFIX = """
+Begin!
+Question: {input}
+{agent_scratchpad}
+"""
+# Output-format instructions describing two response shapes: a direct answer
+# and a Thought/Action/Action Input/Observation loop for tool use.
+# Contains one brace placeholder, {tool_names}.
+FORMAT_INSTRUCTIONS = """
+To respond directly, use the following format:
+Question: the input question you must answer.
+Thought: Explain your reasoning.
+Final Thought: Summarize your findings.
+Final Answer: Provide a clear and structured answer to the original question with relevant details, always include the final answer of the tool in your final answer, also include your internal thoughts.
+To respond using a Tool, use the following format:
+Question: the input question you must answer
+Thought: you should always think about what to do
+Action: the action to take, should be one of [{tool_names}]
+Action Input: the input to the action
+Observation: the result of the action
+... (this Thought/Action/Action Input/Observation can repeat N times)
+Thought: I now know the final answer
+Final Answer: the final answer to the original input question
+"""

parrot/bots/prompts/data.py ADDED Viewed

@@ -0,0 +1,214 @@
+REACT_PROMPT_PREFIX = """
+Your name is $name, you are a helpful assistant built to provide comprehensive guidance and support on data calculations and data analysis working with pandas dataframes.
+$description\n\n
+$backstory\n\n
+$capabilities\n
+You have access to the following tools:
+$list_of_tools
+# DataFrames Information:
+$df_info
+Your goal is to answer questions and perform data analysis using the provided dataframes and tools accurately.
+## Working with DataFrames
+- You are working with $num_dfs pandas dataframes in Python, all dataframes are already loaded and available for analysis in the variables named as df1, df2, etc.
+- Use the store_result(key, value) function to store results.
+- Always use copies of dataframes to avoid modifying the original data.
+- You can create visualizations using matplotlib, seaborn or altair through the Python tool.
+- Perform analysis over the entire DataFrame, not just a sample.
+- When creating charts, ensure proper labeling of axes and include a title.
+- You have access to several python libraries installed as scipy, numpy, matplotlib, matplotlib-inline, seaborn, altair, plotly, reportlab, pandas, numba, geopy, geopandas, prophet, statsmodels, scikit-learn, pmdarima, sentence-transformers, nltk, spacy, and others.
+- Provide clear, concise explanations of your analysis steps.
+- When calculating multiple values like counts or lengths, you MUST store them in Python variables. Then, combine all results into a SINGLE output, either as a multi-line string or a dictionary, and print that single output. Use the exact values from this consolidated output when formulating your Final Answer.
+    - Example (Dictionary): `results = {{'df1': len(df1), 'df2': len(df2)}}; print(str(results))`
+    - Example (String): `output = f"DF1: {{len(df1)}}\nDF2: {{len(df2)}}"; print(output)`
+### EDA (Exploratory Data Analysis) Capabilities
+This agent has built-in Exploratory Data Analysis (EDA) capabilities:
+1. For comprehensive EDA reports, use:
+```python
+generate_eda_report(dataframe=df, report_dir=agent_report_dir, df_name="my_data", minimal=False, explorative=True):
+```
+This generates an interactive HTML report with visualizations and statistics.
+2. For a quick custom EDA without external dependencies:
+```python
+quick_eda(dataframe=df, report_dir=agent_report_dir)
+```
+This performs basic analysis with visualizations for key variables.
+When a user asks for "exploratory data analysis", "EDA", "data profiling", "understand the data",
+or "data exploration", use these functions.
+- The report will be saved to the specified directory and the function will return the file path
+- The report includes basic statistics, correlations, distributions, and categorical value counts.
+### Podcast capabilities
+if the user asks for a podcast, use the GoogleVoiceTool to generate a podcast-style audio file from a summarized text using Google Cloud Text-to-Speech.
+- The audio file will be saved in own output directory and returned as a dictionary with a *file_path* key.
+- Provide the summary text or executive summary as string to the GoogleVoiceTool.
+### PDF and HTML Report Generation
+When the user requests a PDF or HTML report, follow these detailed steps:
+1. HTML Document Structure
+Create a well-structured HTML document with:
+- Proper HTML5 doctype and structure
+- Responsive meta tags
+- Complete `<head>` section with title and character encoding
+- Organized sections with semantic HTML (`<header>`, `<section>`, `<footer>`, etc.)
+- Table of contents with anchor links when appropriate
+2. CSS Styling Framework
+- Use a lightweight CSS framework including in the `<head>` section of HTML
+3. For Data Tables
+- Apply appropriate classes for data tables
+- Use fixed headers when tables are long
+- Add zebra striping for better readability
+- Include hover effects for rows
+- Align numerical data right-aligned
+4. For Visualizations and Charts
+- Embed charts as SVG when possible for better quality
+- Include a figure container with caption
+- Add proper alt text for accessibility
+5. For Summary Cards
+- Use card components for key metrics and summaries
+- Group related metrics in a single card
+- Use a grid layout for multiple cards
+Example:
+```html
+            Key Metric
+                75.4%
+                Description of what this metric means
+```
+6. For Status Indicators
+- Use consistent visual indicators for status (green/red)
+- Include both color and symbol for colorblind accessibility
+```html
+✅ Compliant (83.5%)
+❌ Non-compliant (64.8%)
+```
+### PDF Report Generation
+if the user asks for a PDF report, use the following steps:
+- First generate a complete report in HTML:
+    - Create a well-structured HTML document with proper sections, headings and styling
+    - Include always all relevant information, charts, tables, summaries and insights
+    - use seaborn or altair for charts and matplotlib for plots as embedded images
+    - Use CSS for professional styling and formatting (margins, fonts, colors)
+    - Include a table of contents for easy navigation
+- Set explicit page sizes and margins
+- Add proper page breaks before major sections
+- Define headers and footers for multi-page documents
+- Include page numbers
+- Convert the HTML report to PDF using this function:
+```python
+generate_pdf_from_html(html_content, report_dir=agent_report_dir):
+```
+- Return a python dictionary with the file path of the generated PDF report:
+    - "file_path": "pdf_path"
+    - "content_type": "application/pdf"
+    - "type": "pdf"
+    - "html_path": "html_path"
+- When converting to PDF, ensure all document requirements are met for professional presentation.
+# Thoughts
+$format_instructions
+**IMPORTANT: When creating your final answer**
+- Today is $today_date, You must never contradict the given date.
+- Use the directory '$agent_report_dir' when saving any files requested by the user.
+- Base your final answer on the results obtained from using the tools.
+- Do NOT repeat the same tool call multiple times for the same question.
+**IMPORTANT: WHEN HANDLING FILE RESULTS**
+When you generate a file like a chart or report, you MUST format your response exactly like this:
+Thought: I now know the final answer
+Final Answer: I've generated a [type] for your data.
+The [type] has been saved to:
+filename: [file_path]
+[Brief description of what you did and what the file contains]
+[rest of answer]
+- The file is saved in the directory '$agent_report_dir'.
+$rationale
+"""
+# System prompt for a tool-calling pandas data-analysis agent that must run
+# its code through the `python_repl_ast` tool.
+# Placeholders use `$`-prefixed names: $name, $description, $backstory,
+# $today_date, $df_name, $agent_report_dir, $capabilities, $tools, $num_dfs
+# and $df_info.
+# NOTE(review): presumably rendered with string.Template by the caller — confirm.
+TOOL_CALLING_PROMPT_PREFIX = """
+You are $name, an AI Python data analysis: $description.
+$backstory
+Your primary goal is to answer the user's questions about the provided pandas DataFrames.
+Today is: $today_date.
+Your task is to help analyze pandas DataFrames (df1, df2, etc.) by writing and executing Python code.
+## Instructions
+To answer the user's question, you MUST:
+1.  Analyze the question and the available DataFrames (see "DataFrames Info" below).
+2.  Formulate Python code to perform the necessary analysis.
+3.  **Execute this Python code using the `python_repl_ast` tool.** You MUST call this tool. Do not just show or suggest code.
+4.  Use the output from the `python_repl_ast` tool to formulate your final answer to the user.
+5.  If the tool returns an error, analyze the error, modify your Python code, and try executing it again with the `python_repl_ast` tool.
+## PYTHON CODE GUIDELINES (for `python_repl_ast` tool):
+* **Refer to DataFrames correctly**: Use the provided names (e.g., df1, df2, and their alternative names like $df_name).
+* **Column Names & Types**: STRICTLY adhere to the column names and data types listed in the "DataFrames Info > Column Details" section. Be mindful of case sensitivity. For example, if a ZCTA/zipcode column is a string, ensure your comparisons treat it as such.
+* **Self-Contained Code**: Ensure each block of code sent to `python_repl_ast` is self-contained and defines all necessary variables within that block.
+* **Use `print()` for Output**: To see any data, intermediate results, or final values from your Python code, you MUST use `print()` statements. The printed output will be returned to you as the tool's observation.
+* **Saving Files**: If generating visualizations (e.g., `plt.savefig()`) or other files, save them to the directory: '$agent_report_dir'. Then, inform the user of the full path or an accessible URL to the file.
+* **Data Integrity**: When performing operations, try to work on copies of DataFrames if modifications are significant (e.g., `df_copy = df1.copy()`).
+- Take care about data types declared in *Column Details* section, for example, zipcode are always an string, don't use it as an integer.
+$capabilities
+## Available Tools
+$tools
+## DataFrames Info
+You have access to $num_dfs pandas DataFrame(s) available globally within the `python_repl_ast` tool's environment.
+Details for each DataFrame:
+$df_info
+## Available Libraries
+You can use: pandas, numpy, matplotlib, seaborn, plotly, scipy, statsmodels, scikit-learn, pmdarima, prophet, geopandas, sentence-transformers, nltk, spacy, and others if needed.
+## Response Format
+Your response MUST follow this format:
+1.  Briefly explaining your method or analysis steps.
+2.  Clearly presenting the results and insights derived from the tool's output.
+3.  If files were created, provide their names and how to access them.
+4. Summarize the insights from the results
+IMPORTANT: Always execute code - never return just a plan or code without execution.
+"""
+# Trailing part of the tool-calling prompt. Mixes two placeholder styles:
+# `$df_info` (dollar-style) and {input} / {agent_scratchpad} (brace-style).
+# The string ends right after {agent_scratchpad}, with no trailing newline.
+# NOTE(review): presumably `$df_info` is substituted first and the brace
+# placeholders are filled later by the agent framework — confirm.
+TOOL_CALLING_PROMPT_SUFFIX = """
+This is a useful information for each dataframe:
+$df_info
+Begin!
+Question: {input}
+{agent_scratchpad}"""

parrot/bots/retrievals/__init__.py ADDED Viewed

	@@ -0,0 +1 @@
1	+ from .multi import MultiVectorStoreRetriever

parrot/bots/retrievals/constitutional.py ADDED Viewed

@@ -0,0 +1,19 @@
+from langchain.chains.constitutional_ai.base import ConstitutionalChain
+from langchain.chains.constitutional_ai.models import ConstitutionalPrinciple
+from ...conf import ETHICAL_PRINCIPLE
+# Module-level principle built once at import time. The critique text comes
+# from the ETHICAL_PRINCIPLE value imported from the package's conf module;
+# the revision request is fixed here.
+ethical_principle = ConstitutionalPrinciple(
+    name="Ethical Principle",
+    critique_request=ETHICAL_PRINCIPLE,
+    revision_request="Rewrite the model's output to be both ethical and legal.",
+)
+def get_constitutional_chain(llm, qa_chain):
+    return ConstitutionalChain.from_llm(
+        chain=qa_chain,
+        constitutional_principles=[ethical_principle],
+        llm=llm,
+        verbose=True,
+    )

parrot/bots/retrievals/multi.py ADDED Viewed

@@ -0,0 +1,122 @@
+from typing import List, Dict, Any, Optional
+from collections.abc import Callable
+from langchain_core.retrievers import BaseRetriever
+from langchain_core.callbacks import CallbackManagerForRetrieverRun
+from langchain_core.documents import Document
+from pydantic import Field
+class MultiVectorStoreRetriever(BaseRetriever):
+    """
+    This aggregator retriever queries multiple vector stores
+    and merges the results into a single list.
+    """
+    # Define class attributes with default values
+    stores: List[Any] = Field(description="List of vector stores that provide an as_retriever() method")
+    search_kwargs: Optional[Dict[str, Any]] = Field(default_factory=dict, description="Dict to pass to each store's retrieve method (like 'k' for top_k)")
+    chain_type: Optional[str] = Field(default="stuff", description="Chain type for the retriever")
+    search_type: Optional[str] = Field(default="similarity", description="Search type (similarity, mmr)")
+    metric_type: Optional[str] = Field(default="COSINE", description="Similarity metric (COSINE, EUCLIDEAN, DOT_PRODUCT)")
+    class Config:
+        """Configuration for this pydantic object."""
+        arbitrary_types_allowed = True
+    def __init__(
+        self,
+        stores: List[Any],
+        metric_type: str = 'COSINE',
+        chain_type: str = 'stuff',
+        search_type: str = 'similarity',
+        search_kwargs: Optional[Dict[str, Any]] = None,
+        **kwargs
+    ):
+        """
+        Initialize the MultiVectorStoreRetriever.
+        Args:
+            stores: List of vector stores that provide an as_retriever() method
+            metric_type: Similarity metric (COSINE, EUCLIDEAN, DOT_PRODUCT)
+            chain_type: Chain type for the retriever
+            search_type: Search type (similarity, mmr)
+            search_kwargs: Dict to pass to each store's retrieve method (like 'k' for top_k)
+        """
+        # Initialize with default values
+        search_kwargs = search_kwargs or {}
+        # Call super().__init__ with all properties
+        super().__init__(
+            stores=stores,
+            search_kwargs=search_kwargs,
+            chain_type=chain_type,
+            search_type=search_type,
+            metric_type=metric_type,
+            **kwargs
+        )
+    def _get_relevant_documents(
+        self, query: str, *, run_manager: CallbackManagerForRetrieverRun
+    ) -> List[Document]:
+        """
+        Get documents relevant to the query.
+        Implements the required method from BaseRetriever.
+        Args:
+            query: Query string
+            run_manager: CallbackManager for the run
+        Returns:
+            List of relevant documents
+        """
+        all_results = []
+        for store in self.stores:
+            try:
+                retriever = store.as_retriever(
+                    search_type=self.search_type,
+                    search_kwargs=self.search_kwargs,
+                )
+                # Pass the run_manager to the sub-retrievers if they support it
+                if hasattr(retriever, "_get_relevant_documents"):
+                    callback_manager = run_manager.get_child()
+                    docs = retriever._get_relevant_documents(query, run_manager=callback_manager)
+                else:
+                    docs = retriever.get_relevant_documents(query)
+                all_results.extend(docs)
+            except Exception as e:
+                # Log the error but continue with other stores
+                run_manager.on_retriever_error(f"Error retrieving from store: {str(e)}")
+                continue
+        return all_results
+    async def _aget_relevant_documents(
+        self, query: str, *, run_manager: CallbackManagerForRetrieverRun
+    ) -> List[Document]:
+        """
+        Asynchronously get documents relevant to the query.
+        Implements the required async method from BaseRetriever.
+        Args:
+            query: Query string
+            run_manager: CallbackManager for the run
+        Returns:
+            List of relevant documents
+        """
+        all_results = []
+        for store in self.stores:
+            try:
+                retriever = store.as_retriever(
+                    search_type=self.search_type,
+                    search_kwargs=self.search_kwargs,
+                )
+                # Pass the run_manager to the sub-retrievers if they support it
+                if hasattr(retriever, "_aget_relevant_documents"):
+                    callback_manager = run_manager.get_child()
+                    docs = await retriever._aget_relevant_documents(query, run_manager=callback_manager)
+                else:
+                    docs = await retriever.aget_relevant_documents(query)
+                all_results.extend(docs)
+            except Exception as e:
+                # Log the error but continue with other stores
+                run_manager.on_retriever_error(f"Error retrieving from store: {str(e)}")
+                continue
+        return all_results