PyPI - vanna - Versions diffs - 0.7.8__py3-none-any.whl → 2.0.0__py3-none-any.whl - Mend

vanna-0.7.8-py3-none-any.whl → vanna-2.0.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (302)

vanna/__init__.py +167 -395
vanna/agents/__init__.py +7 -0
vanna/capabilities/__init__.py +17 -0
vanna/capabilities/agent_memory/__init__.py +21 -0
vanna/capabilities/agent_memory/base.py +103 -0
vanna/capabilities/agent_memory/models.py +53 -0
vanna/capabilities/file_system/__init__.py +14 -0
vanna/capabilities/file_system/base.py +71 -0
vanna/capabilities/file_system/models.py +25 -0
vanna/capabilities/sql_runner/__init__.py +13 -0
vanna/capabilities/sql_runner/base.py +37 -0
vanna/capabilities/sql_runner/models.py +13 -0
vanna/components/__init__.py +92 -0
vanna/components/base.py +11 -0
vanna/components/rich/__init__.py +83 -0
vanna/components/rich/containers/__init__.py +7 -0
vanna/components/rich/containers/card.py +20 -0
vanna/components/rich/data/__init__.py +9 -0
vanna/components/rich/data/chart.py +17 -0
vanna/components/rich/data/dataframe.py +93 -0
vanna/components/rich/feedback/__init__.py +21 -0
vanna/components/rich/feedback/badge.py +16 -0
vanna/components/rich/feedback/icon_text.py +14 -0
vanna/components/rich/feedback/log_viewer.py +41 -0
vanna/components/rich/feedback/notification.py +19 -0
vanna/components/rich/feedback/progress.py +37 -0
vanna/components/rich/feedback/status_card.py +28 -0
vanna/components/rich/feedback/status_indicator.py +14 -0
vanna/components/rich/interactive/__init__.py +21 -0
vanna/components/rich/interactive/button.py +95 -0
vanna/components/rich/interactive/task_list.py +58 -0
vanna/components/rich/interactive/ui_state.py +93 -0
vanna/components/rich/specialized/__init__.py +7 -0
vanna/components/rich/specialized/artifact.py +20 -0
vanna/components/rich/text.py +16 -0
vanna/components/simple/__init__.py +15 -0
vanna/components/simple/image.py +15 -0
vanna/components/simple/link.py +15 -0
vanna/components/simple/text.py +11 -0
vanna/core/__init__.py +193 -0
vanna/core/_compat.py +19 -0
vanna/core/agent/__init__.py +10 -0
vanna/core/agent/agent.py +1407 -0
vanna/core/agent/config.py +123 -0
vanna/core/audit/__init__.py +28 -0
vanna/core/audit/base.py +299 -0
vanna/core/audit/models.py +131 -0
vanna/core/component_manager.py +329 -0
vanna/core/components.py +53 -0
vanna/core/enhancer/__init__.py +11 -0
vanna/core/enhancer/base.py +94 -0
vanna/core/enhancer/default.py +118 -0
vanna/core/enricher/__init__.py +10 -0
vanna/core/enricher/base.py +59 -0
vanna/core/errors.py +47 -0
vanna/core/evaluation/__init__.py +81 -0
vanna/core/evaluation/base.py +186 -0
vanna/core/evaluation/dataset.py +254 -0
vanna/core/evaluation/evaluators.py +376 -0
vanna/core/evaluation/report.py +289 -0
vanna/core/evaluation/runner.py +313 -0
vanna/core/filter/__init__.py +10 -0
vanna/core/filter/base.py +67 -0
vanna/core/lifecycle/__init__.py +10 -0
vanna/core/lifecycle/base.py +83 -0
vanna/core/llm/__init__.py +16 -0
vanna/core/llm/base.py +40 -0
vanna/core/llm/models.py +61 -0
vanna/core/middleware/__init__.py +10 -0
vanna/core/middleware/base.py +69 -0
vanna/core/observability/__init__.py +11 -0
vanna/core/observability/base.py +88 -0
vanna/core/observability/models.py +47 -0
vanna/core/recovery/__init__.py +11 -0
vanna/core/recovery/base.py +84 -0
vanna/core/recovery/models.py +32 -0
vanna/core/registry.py +278 -0
vanna/core/rich_component.py +156 -0
vanna/core/simple_component.py +27 -0
vanna/core/storage/__init__.py +14 -0
vanna/core/storage/base.py +46 -0
vanna/core/storage/models.py +46 -0
vanna/core/system_prompt/__init__.py +13 -0
vanna/core/system_prompt/base.py +36 -0
vanna/core/system_prompt/default.py +157 -0
vanna/core/tool/__init__.py +18 -0
vanna/core/tool/base.py +70 -0
vanna/core/tool/models.py +84 -0
vanna/core/user/__init__.py +17 -0
vanna/core/user/base.py +29 -0
vanna/core/user/models.py +25 -0
vanna/core/user/request_context.py +70 -0
vanna/core/user/resolver.py +42 -0
vanna/core/validation.py +164 -0
vanna/core/workflow/__init__.py +12 -0
vanna/core/workflow/base.py +254 -0
vanna/core/workflow/default.py +789 -0
vanna/examples/__init__.py +1 -0
vanna/examples/__main__.py +44 -0
vanna/examples/anthropic_quickstart.py +80 -0
vanna/examples/artifact_example.py +293 -0
vanna/examples/claude_sqlite_example.py +236 -0
vanna/examples/coding_agent_example.py +300 -0
vanna/examples/custom_system_prompt_example.py +174 -0
vanna/examples/default_workflow_handler_example.py +208 -0
vanna/examples/email_auth_example.py +340 -0
vanna/examples/evaluation_example.py +269 -0
vanna/examples/extensibility_example.py +262 -0
vanna/examples/minimal_example.py +67 -0
vanna/examples/mock_auth_example.py +227 -0
vanna/examples/mock_custom_tool.py +311 -0
vanna/examples/mock_quickstart.py +79 -0
vanna/examples/mock_quota_example.py +145 -0
vanna/examples/mock_rich_components_demo.py +396 -0
vanna/examples/mock_sqlite_example.py +223 -0
vanna/examples/openai_quickstart.py +83 -0
vanna/examples/primitive_components_demo.py +305 -0
vanna/examples/quota_lifecycle_example.py +139 -0
vanna/examples/visualization_example.py +251 -0
vanna/integrations/__init__.py +17 -0
vanna/integrations/anthropic/__init__.py +9 -0
vanna/integrations/anthropic/llm.py +270 -0
vanna/integrations/azureopenai/__init__.py +9 -0
vanna/integrations/azureopenai/llm.py +329 -0
vanna/integrations/azuresearch/__init__.py +7 -0
vanna/integrations/azuresearch/agent_memory.py +413 -0
vanna/integrations/bigquery/__init__.py +5 -0
vanna/integrations/bigquery/sql_runner.py +81 -0
vanna/integrations/chromadb/__init__.py +104 -0
vanna/integrations/chromadb/agent_memory.py +416 -0
vanna/integrations/clickhouse/__init__.py +5 -0
vanna/integrations/clickhouse/sql_runner.py +82 -0
vanna/integrations/duckdb/__init__.py +5 -0
vanna/integrations/duckdb/sql_runner.py +65 -0
vanna/integrations/faiss/__init__.py +7 -0
vanna/integrations/faiss/agent_memory.py +431 -0
vanna/integrations/google/__init__.py +9 -0
vanna/integrations/google/gemini.py +370 -0
vanna/integrations/hive/__init__.py +5 -0
vanna/integrations/hive/sql_runner.py +87 -0
vanna/integrations/local/__init__.py +17 -0
vanna/integrations/local/agent_memory/__init__.py +7 -0
vanna/integrations/local/agent_memory/in_memory.py +285 -0
vanna/integrations/local/audit.py +59 -0
vanna/integrations/local/file_system.py +242 -0
vanna/integrations/local/file_system_conversation_store.py +255 -0
vanna/integrations/local/storage.py +62 -0
vanna/integrations/marqo/__init__.py +7 -0
vanna/integrations/marqo/agent_memory.py +354 -0
vanna/integrations/milvus/__init__.py +7 -0
vanna/integrations/milvus/agent_memory.py +458 -0
vanna/integrations/mock/__init__.py +9 -0
vanna/integrations/mock/llm.py +65 -0
vanna/integrations/mssql/__init__.py +5 -0
vanna/integrations/mssql/sql_runner.py +66 -0
vanna/integrations/mysql/__init__.py +5 -0
vanna/integrations/mysql/sql_runner.py +92 -0
vanna/integrations/ollama/__init__.py +7 -0
vanna/integrations/ollama/llm.py +252 -0
vanna/integrations/openai/__init__.py +10 -0
vanna/integrations/openai/llm.py +267 -0
vanna/integrations/openai/responses.py +163 -0
vanna/integrations/opensearch/__init__.py +7 -0
vanna/integrations/opensearch/agent_memory.py +411 -0
vanna/integrations/oracle/__init__.py +5 -0
vanna/integrations/oracle/sql_runner.py +75 -0
vanna/integrations/pinecone/__init__.py +7 -0
vanna/integrations/pinecone/agent_memory.py +329 -0
vanna/integrations/plotly/__init__.py +5 -0
vanna/integrations/plotly/chart_generator.py +313 -0
vanna/integrations/postgres/__init__.py +9 -0
vanna/integrations/postgres/sql_runner.py +112 -0
vanna/integrations/premium/agent_memory/__init__.py +7 -0
vanna/integrations/premium/agent_memory/premium.py +186 -0
vanna/integrations/presto/__init__.py +5 -0
vanna/integrations/presto/sql_runner.py +107 -0
vanna/integrations/qdrant/__init__.py +7 -0
vanna/integrations/qdrant/agent_memory.py +461 -0
vanna/integrations/snowflake/__init__.py +5 -0
vanna/integrations/snowflake/sql_runner.py +147 -0
vanna/integrations/sqlite/__init__.py +9 -0
vanna/integrations/sqlite/sql_runner.py +65 -0
vanna/integrations/weaviate/__init__.py +7 -0
vanna/integrations/weaviate/agent_memory.py +428 -0
vanna/{ZhipuAI → legacy/ZhipuAI}/ZhipuAI_embeddings.py +11 -11
vanna/legacy/__init__.py +403 -0
vanna/legacy/adapter.py +463 -0
vanna/{advanced → legacy/advanced}/__init__.py +3 -1
vanna/{anthropic → legacy/anthropic}/anthropic_chat.py +9 -7
vanna/{azuresearch → legacy/azuresearch}/azuresearch_vector.py +79 -41
vanna/{base → legacy/base}/base.py +247 -223
vanna/legacy/bedrock/__init__.py +1 -0
vanna/{bedrock → legacy/bedrock}/bedrock_converse.py +13 -12
vanna/{chromadb → legacy/chromadb}/chromadb_vector.py +3 -1
vanna/legacy/cohere/__init__.py +2 -0
vanna/{cohere → legacy/cohere}/cohere_chat.py +19 -14
vanna/{cohere → legacy/cohere}/cohere_embeddings.py +25 -19
vanna/{deepseek → legacy/deepseek}/deepseek_chat.py +5 -6
vanna/legacy/faiss/__init__.py +1 -0
vanna/{faiss → legacy/faiss}/faiss.py +113 -59
vanna/{flask → legacy/flask}/__init__.py +84 -43
vanna/{flask → legacy/flask}/assets.py +5 -5
vanna/{flask → legacy/flask}/auth.py +5 -4
vanna/{google → legacy/google}/bigquery_vector.py +75 -42
vanna/{google → legacy/google}/gemini_chat.py +7 -3
vanna/{hf → legacy/hf}/hf.py +0 -1
vanna/{milvus → legacy/milvus}/milvus_vector.py +58 -35
vanna/{mock → legacy/mock}/llm.py +0 -1
vanna/legacy/mock/vectordb.py +67 -0
vanna/legacy/ollama/ollama.py +110 -0
vanna/{openai → legacy/openai}/openai_chat.py +2 -6
vanna/legacy/opensearch/opensearch_vector.py +369 -0
vanna/legacy/opensearch/opensearch_vector_semantic.py +200 -0
vanna/legacy/oracle/oracle_vector.py +584 -0
vanna/{pgvector → legacy/pgvector}/pgvector.py +42 -13
vanna/{qdrant → legacy/qdrant}/qdrant.py +2 -6
vanna/legacy/qianfan/Qianfan_Chat.py +170 -0
vanna/legacy/qianfan/Qianfan_embeddings.py +36 -0
vanna/legacy/qianwen/QianwenAI_chat.py +132 -0
vanna/{remote.py → legacy/remote.py} +28 -26
vanna/{utils.py → legacy/utils.py} +6 -11
vanna/{vannadb → legacy/vannadb}/vannadb_vector.py +115 -46
vanna/{vllm → legacy/vllm}/vllm.py +5 -6
vanna/{weaviate → legacy/weaviate}/weaviate_vector.py +59 -40
vanna/{xinference → legacy/xinference}/xinference.py +6 -6
vanna/py.typed +0 -0
vanna/servers/__init__.py +16 -0
vanna/servers/__main__.py +8 -0
vanna/servers/base/__init__.py +18 -0
vanna/servers/base/chat_handler.py +65 -0
vanna/servers/base/models.py +111 -0
vanna/servers/base/rich_chat_handler.py +141 -0
vanna/servers/base/templates.py +331 -0
vanna/servers/cli/__init__.py +7 -0
vanna/servers/cli/server_runner.py +204 -0
vanna/servers/fastapi/__init__.py +7 -0
vanna/servers/fastapi/app.py +163 -0
vanna/servers/fastapi/routes.py +183 -0
vanna/servers/flask/__init__.py +7 -0
vanna/servers/flask/app.py +132 -0
vanna/servers/flask/routes.py +137 -0
vanna/tools/__init__.py +41 -0
vanna/tools/agent_memory.py +322 -0
vanna/tools/file_system.py +879 -0
vanna/tools/python.py +222 -0
vanna/tools/run_sql.py +165 -0
vanna/tools/visualize_data.py +195 -0
vanna/utils/__init__.py +0 -0
vanna/web_components/__init__.py +44 -0
vanna-2.0.0.dist-info/METADATA +485 -0
vanna-2.0.0.dist-info/RECORD +289 -0
vanna-2.0.0.dist-info/entry_points.txt +3 -0
vanna/bedrock/__init__.py +0 -1
vanna/cohere/__init__.py +0 -2
vanna/faiss/__init__.py +0 -1
vanna/mock/vectordb.py +0 -55
vanna/ollama/ollama.py +0 -103
vanna/opensearch/opensearch_vector.py +0 -392
vanna/opensearch/opensearch_vector_semantic.py +0 -175
vanna/oracle/oracle_vector.py +0 -585
vanna/qianfan/Qianfan_Chat.py +0 -165
vanna/qianfan/Qianfan_embeddings.py +0 -36
vanna/qianwen/QianwenAI_chat.py +0 -133
vanna-0.7.8.dist-info/METADATA +0 -408
vanna-0.7.8.dist-info/RECORD +0 -79
/vanna/{ZhipuAI → legacy/ZhipuAI}/ZhipuAI_Chat.py +0 -0
/vanna/{ZhipuAI → legacy/ZhipuAI}/__init__.py +0 -0
/vanna/{anthropic → legacy/anthropic}/__init__.py +0 -0
/vanna/{azuresearch → legacy/azuresearch}/__init__.py +0 -0
/vanna/{base → legacy/base}/__init__.py +0 -0
/vanna/{chromadb → legacy/chromadb}/__init__.py +0 -0
/vanna/{deepseek → legacy/deepseek}/__init__.py +0 -0
/vanna/{exceptions → legacy/exceptions}/__init__.py +0 -0
/vanna/{google → legacy/google}/__init__.py +0 -0
/vanna/{hf → legacy/hf}/__init__.py +0 -0
/vanna/{local.py → legacy/local.py} +0 -0
/vanna/{marqo → legacy/marqo}/__init__.py +0 -0
/vanna/{marqo → legacy/marqo}/marqo.py +0 -0
/vanna/{milvus → legacy/milvus}/__init__.py +0 -0
/vanna/{mistral → legacy/mistral}/__init__.py +0 -0
/vanna/{mistral → legacy/mistral}/mistral.py +0 -0
/vanna/{mock → legacy/mock}/__init__.py +0 -0
/vanna/{mock → legacy/mock}/embedding.py +0 -0
/vanna/{ollama → legacy/ollama}/__init__.py +0 -0
/vanna/{openai → legacy/openai}/__init__.py +0 -0
/vanna/{openai → legacy/openai}/openai_embeddings.py +0 -0
/vanna/{opensearch → legacy/opensearch}/__init__.py +0 -0
/vanna/{oracle → legacy/oracle}/__init__.py +0 -0
/vanna/{pgvector → legacy/pgvector}/__init__.py +0 -0
/vanna/{pinecone → legacy/pinecone}/__init__.py +0 -0
/vanna/{pinecone → legacy/pinecone}/pinecone_vector.py +0 -0
/vanna/{qdrant → legacy/qdrant}/__init__.py +0 -0
/vanna/{qianfan → legacy/qianfan}/__init__.py +0 -0
/vanna/{qianwen → legacy/qianwen}/QianwenAI_embeddings.py +0 -0
/vanna/{qianwen → legacy/qianwen}/__init__.py +0 -0
/vanna/{types → legacy/types}/__init__.py +0 -0
/vanna/{vannadb → legacy/vannadb}/__init__.py +0 -0
/vanna/{vllm → legacy/vllm}/__init__.py +0 -0
/vanna/{weaviate → legacy/weaviate}/__init__.py +0 -0
/vanna/{xinference → legacy/xinference}/__init__.py +0 -0
{vanna-0.7.8.dist-info → vanna-2.0.0.dist-info}/WHEEL +0 -0
{vanna-0.7.8.dist-info → vanna-2.0.0.dist-info}/licenses/LICENSE +0 -0

vanna/{base → legacy/base}/base.py RENAMED Viewed

@@ -136,7 +136,7 @@ class VannaBase(ABC):
         llm_response = self.submit_prompt(prompt, **kwargs)
         self.log(title="LLM Response", message=llm_response)
-        if 'intermediate_sql' in llm_response:
+        if "intermediate_sql" in llm_response:
             if not allow_llm_to_see_data:
                 return "The LLM is not allowed to see the data in your database. Your question requires database introspection to generate the necessary SQL. Please set allow_llm_to_see_data=True to enable this."
@@ -152,7 +152,11 @@ class VannaBase(ABC):
                         question=question,
                         question_sql_list=question_sql_list,
                         ddl_list=ddl_list,
-                        doc_list=doc_list+[f"The following is a pandas DataFrame with the results of the intermediate SQL query {intermediate_sql}: \n" + df.to_markdown()],
+                        doc_list=doc_list
+                        + [
+                            f"The following is a pandas DataFrame with the results of the intermediate SQL query {intermediate_sql}: \n"
+                            + df.to_markdown()
+                        ],
                         **kwargs,
                     )
                     self.log(title="Final SQL Prompt", message=prompt)
@@ -161,7 +165,6 @@ class VannaBase(ABC):
                 except Exception as e:
                     return f"Error running intermediate SQL: {e}"
         return self.extract_sql(llm_response)
     def extract_sql(self, llm_response: str) -> str:
@@ -181,30 +184,52 @@ class VannaBase(ABC):
             str: The extracted SQL query.
         """
-        # If the llm_response contains a CTE (with clause), extract the last sql between WITH and ;
-        sqls = re.findall(r"\bWITH\b .*?;", llm_response, re.DOTALL)
+        import re
+        """
+        Extracts the SQL query from the LLM response, handling various formats including:
+        - WITH clause
+        - SELECT statement
+        - CREATE TABLE AS SELECT
+        - Markdown code blocks
+        """
+        # Match CREATE TABLE ... AS SELECT
+        sqls = re.findall(
+            r"\bCREATE\s+TABLE\b.*?\bAS\b.*?;", llm_response, re.DOTALL | re.IGNORECASE
+        )
         if sqls:
             sql = sqls[-1]
             self.log(title="Extracted SQL", message=f"{sql}")
             return sql
-        # If the llm_response is not markdown formatted, extract last sql by finding select and ; in the response
-        sqls = re.findall(r"SELECT.*?;", llm_response, re.DOTALL)
+        # Match WITH clause (CTEs)
+        sqls = re.findall(r"\bWITH\b .*?;", llm_response, re.DOTALL | re.IGNORECASE)
         if sqls:
             sql = sqls[-1]
             self.log(title="Extracted SQL", message=f"{sql}")
             return sql
-        # If the llm_response contains a markdown code block, with or without the sql tag, extract the last sql from it
-        sqls = re.findall(r"```sql\n(.*)```", llm_response, re.DOTALL)
+        # Match SELECT ... ;
+        sqls = re.findall(r"\bSELECT\b .*?;", llm_response, re.DOTALL | re.IGNORECASE)
         if sqls:
             sql = sqls[-1]
             self.log(title="Extracted SQL", message=f"{sql}")
             return sql
-        sqls = re.findall(r"```(.*)```", llm_response, re.DOTALL)
+        # Match ```sql ... ``` blocks
+        sqls = re.findall(
+            r"```sql\s*\n(.*?)```", llm_response, re.DOTALL | re.IGNORECASE
+        )
         if sqls:
-            sql = sqls[-1]
+            sql = sqls[-1].strip()
+            self.log(title="Extracted SQL", message=f"{sql}")
+            return sql
+        # Match any ``` ... ``` code blocks
+        sqls = re.findall(r"```(.*?)```", llm_response, re.DOTALL | re.IGNORECASE)
+        if sqls:
+            sql = sqls[-1].strip()
             self.log(title="Extracted SQL", message=f"{sql}")
             return sql
@@ -229,7 +254,7 @@ class VannaBase(ABC):
         parsed = sqlparse.parse(sql)
         for statement in parsed:
-            if statement.get_type() == 'SELECT':
+            if statement.get_type() == "SELECT":
                 return True
         return False
@@ -251,12 +276,14 @@ class VannaBase(ABC):
             bool: True if a chart should be generated, False otherwise.
         """
-        if len(df) > 1 and df.select_dtypes(include=['number']).shape[1] > 0:
+        if len(df) > 1 and df.select_dtypes(include=["number"]).shape[1] > 0:
             return True
         return False
-    def generate_rewritten_question(self, last_question: str, new_question: str, **kwargs) -> str:
+    def generate_rewritten_question(
+        self, last_question: str, new_question: str, **kwargs
+    ) -> str:
         """
         **Example:**
         ```python
@@ -277,8 +304,15 @@ class VannaBase(ABC):
             return new_question
         prompt = [
-            self.system_message("Your goal is to combine a sequence of questions into a singular question if they are related. If the second question does not relate to the first question and is fully self-contained, return the second question. Return just the new combined question with no additional explanations. The question should theoretically be answerable with a single SQL statement."),
-            self.user_message("First question: " + last_question + "\nSecond question: " + new_question),
+            self.system_message(
+                "Your goal is to combine a sequence of questions into a singular question if they are related. If the second question does not relate to the first question and is fully self-contained, return the second question. Return just the new combined question with no additional explanations. The question should theoretically be answerable with a single SQL statement."
+            ),
+            self.user_message(
+                "First question: "
+                + last_question
+                + "\nSecond question: "
+                + new_question
+            ),
         ]
         return self.submit_prompt(prompt=prompt, **kwargs)
@@ -309,8 +343,8 @@ class VannaBase(ABC):
                 f"You are a helpful data assistant. The user asked the question: '{question}'\n\nThe SQL query for this question was: {sql}\n\nThe following is a pandas DataFrame with the results of the query: \n{df.head(25).to_markdown()}\n\n"
             ),
             self.user_message(
-                f"Generate a list of {n_questions} followup questions that the user might ask about this data. Respond with a list of questions, one per line. Do not answer with any explanations -- just the questions. Remember that there should be an unambiguous SQL query that can be generated from the question. Prefer questions that are answerable outside of the context of this conversation. Prefer questions that are slight modifications of the SQL query that was generated that allow digging deeper into the data. Each question will be turned into a button that the user can click to generate a new SQL query so don't use 'example' type questions. Each question must have a one-to-one correspondence with an instantiated SQL query." +
-                self._response_language()
+                f"Generate a list of {n_questions} followup questions that the user might ask about this data. Respond with a list of questions, one per line. Do not answer with any explanations -- just the questions. Remember that there should be an unambiguous SQL query that can be generated from the question. Prefer questions that are answerable outside of the context of this conversation. Prefer questions that are slight modifications of the SQL query that was generated that allow digging deeper into the data. Each question will be turned into a button that the user can click to generate a new SQL query so don't use 'example' type questions. Each question must have a one-to-one correspondence with an instantiated SQL query."
+                + self._response_language()
             ),
         ]
@@ -354,8 +388,8 @@ class VannaBase(ABC):
                 f"You are a helpful data assistant. The user asked the question: '{question}'\n\nThe following is a pandas DataFrame with the results of the query: \n{df.to_markdown()}\n\n"
             ),
             self.user_message(
-                "Briefly summarize the data based on the question that was asked. Do not respond with any additional explanation beyond the summary." +
-                self._response_language()
+                "Briefly summarize the data based on the question that was asked. Do not respond with any additional explanation beyond the summary."
+                + self._response_language()
             ),
         ]
@@ -551,7 +585,7 @@ class VannaBase(ABC):
     def get_sql_prompt(
         self,
-        initial_prompt : str,
+        initial_prompt: str,
         question: str,
         question_sql_list: list,
         ddl_list: list,
@@ -583,8 +617,10 @@ class VannaBase(ABC):
         """
         if initial_prompt is None:
-            initial_prompt = f"You are a {self.dialect} expert. " + \
-            "Please help to generate a SQL query to answer the question. Your response should ONLY be based on the given context and follow the response guidelines and format instructions. "
+            initial_prompt = (
+                f"You are a {self.dialect} expert. "
+                + "Please help to generate a SQL query to answer the question. Your response should ONLY be based on the given context and follow the response guidelines and format instructions. "
+            )
         initial_prompt = self.add_ddl_to_prompt(
             initial_prompt, ddl_list, max_tokens=self.max_tokens
@@ -749,7 +785,7 @@ class VannaBase(ABC):
         database: str,
         role: Union[str, None] = None,
         warehouse: Union[str, None] = None,
-        **kwargs
+        **kwargs,
     ):
         try:
             snowflake = __import__("snowflake.connector")
@@ -797,7 +833,7 @@ class VannaBase(ABC):
             account=account,
             database=database,
             client_session_keep_alive=True,
-            **kwargs
+            **kwargs,
         )
         def run_sql_snowflake(sql: str) -> pd.DataFrame:
@@ -823,7 +859,7 @@ class VannaBase(ABC):
         self.run_sql = run_sql_snowflake
         self.run_sql_is_set = True
-    def connect_to_sqlite(self, url: str, check_same_thread: bool = False,  **kwargs):
+    def connect_to_sqlite(self, url: str, check_same_thread: bool = False, **kwargs):
         """
         Connect to a SQLite database. This is just a helper function to set [`vn.run_sql`][vanna.base.base.VannaBase.run_sql]
@@ -848,11 +884,7 @@ class VannaBase(ABC):
             url = path
         # Connect to the database
-        conn = sqlite3.connect(
-            url,
-            check_same_thread=check_same_thread,
-            **kwargs
-        )
+        conn = sqlite3.connect(url, check_same_thread=check_same_thread, **kwargs)
         def run_sql_sqlite(sql: str):
             return pd.read_sql_query(sql, conn)
@@ -868,9 +900,8 @@ class VannaBase(ABC):
         user: str = None,
         password: str = None,
         port: int = None,
-        **kwargs
+        **kwargs,
     ):
         """
         Connect to postgres using the psycopg2 connector. This is just a helper function to set [`vn.run_sql`][vanna.base.base.VannaBase.run_sql]
         **Example:**
@@ -939,15 +970,20 @@ class VannaBase(ABC):
                 user=user,
                 password=password,
                 port=port,
-                **kwargs
+                **kwargs,
             )
         except psycopg2.Error as e:
             raise ValidationError(e)
         def connect_to_db():
-            return psycopg2.connect(host=host, dbname=dbname,
-                        user=user, password=password, port=port, **kwargs)
+            return psycopg2.connect(
+                host=host,
+                dbname=dbname,
+                user=user,
+                password=password,
+                port=port,
+                **kwargs,
+            )
         def run_sql_postgres(sql: str) -> Union[pd.DataFrame, None]:
             conn = None
@@ -980,14 +1016,13 @@ class VannaBase(ABC):
                     raise ValidationError(e)
             except Exception as e:
-                        conn.rollback()
-                        raise e
+                conn.rollback()
+                raise e
         self.dialect = "PostgreSQL"
         self.run_sql_is_set = True
         self.run_sql = run_sql_postgres
     def connect_to_mysql(
         self,
         host: str = None,
@@ -995,9 +1030,8 @@ class VannaBase(ABC):
         user: str = None,
         password: str = None,
         port: int = None,
-        **kwargs
+        **kwargs,
     ):
         try:
             import pymysql.cursors
         except ImportError:
@@ -1046,7 +1080,7 @@ class VannaBase(ABC):
                 database=dbname,
                 port=port,
                 cursorclass=pymysql.cursors.DictCursor,
-                **kwargs
+                **kwargs,
             )
         except pymysql.Error as e:
             raise ValidationError(e)
@@ -1083,9 +1117,8 @@ class VannaBase(ABC):
         user: str = None,
         password: str = None,
         port: int = None,
-        **kwargs
+        **kwargs,
     ):
         try:
             import clickhouse_connect
         except ImportError:
@@ -1133,7 +1166,7 @@ class VannaBase(ABC):
                 username=user,
                 password=password,
                 database=dbname,
-                **kwargs
+                **kwargs,
             )
             print(conn)
         except Exception as e:
@@ -1156,13 +1189,8 @@ class VannaBase(ABC):
         self.run_sql = run_sql_clickhouse
     def connect_to_oracle(
-        self,
-        user: str = None,
-        password: str = None,
-        dsn: str = None,
-        **kwargs
+        self, user: str = None, password: str = None, dsn: str = None, **kwargs
     ):
         """
         Connect to an Oracle db using oracledb package. This is just a helper function to set [`vn.run_sql`][vanna.base.base.VannaBase.run_sql]
         **Example:**
@@ -1182,7 +1210,6 @@ class VannaBase(ABC):
         try:
             import oracledb
         except ImportError:
             raise DependencyError(
                 "You need to install required dependencies to execute this method,"
                 " run command: \npip install oracledb"
@@ -1192,7 +1219,9 @@ class VannaBase(ABC):
             dsn = os.getenv("DSN")
         if not dsn:
-            raise ImproperlyConfigured("Please set your Oracle dsn which should include host:port/sid")
+            raise ImproperlyConfigured(
+                "Please set your Oracle dsn which should include host:port/sid"
+            )
         if not user:
             user = os.getenv("USER")
@@ -1209,12 +1238,7 @@ class VannaBase(ABC):
         conn = None
         try:
-            conn = oracledb.connect(
-                user=user,
-                password=password,
-                dsn=dsn,
-                **kwargs
-            )
+            conn = oracledb.connect(user=user, password=password, dsn=dsn, **kwargs)
         except oracledb.Error as e:
             raise ValidationError(e)
@@ -1222,7 +1246,9 @@ class VannaBase(ABC):
             if conn:
                 try:
                     sql = sql.rstrip()
-                    if sql.endswith(';'): #fix for a known problem with Oracle db where an extra ; will cause an error.
+                    if sql.endswith(
+                        ";"
+                    ):  # fix for a known problem with Oracle db where an extra ; will cause an error.
                         sql = sql[:-1]
                     cs = conn.cursor()
@@ -1247,10 +1273,7 @@ class VannaBase(ABC):
         self.run_sql = run_sql_oracle
     def connect_to_bigquery(
-        self,
-        cred_file_path: str = None,
-        project_id: str = None,
-        **kwargs
+        self, cred_file_path: str = None, project_id: str = None, **kwargs
     ):
         """
         Connect to gcs using the bigquery connector. This is just a helper function to set [`vn.run_sql`][vanna.base.base.VannaBase.run_sql]
@@ -1299,7 +1322,7 @@ class VannaBase(ABC):
         if not cred_file_path:
             try:
                 conn = bigquery.Client(project=project_id)
-            except:
+            except Exception:
                 print("Could not found any google cloud implicit credentials")
         else:
             # Validate file path and pemissions
@@ -1314,11 +1337,9 @@ class VannaBase(ABC):
             try:
                 conn = bigquery.Client(
-                    project=project_id,
-                    credentials=credentials,
-                    **kwargs
+                    project=project_id, credentials=credentials, **kwargs
                 )
-            except:
+            except Exception:
                 raise ImproperlyConfigured(
                     "Could not connect to bigquery please correct credentials"
                 )
@@ -1430,20 +1451,21 @@ class VannaBase(ABC):
         self.dialect = "T-SQL / Microsoft SQL Server"
         self.run_sql = run_sql_mssql
         self.run_sql_is_set = True
     def connect_to_presto(
         self,
         host: str,
-        catalog: str = 'hive',
-        schema: str = 'default',
+        catalog: str = "hive",
+        schema: str = "default",
         user: str = None,
         password: str = None,
         port: int = None,
         combined_pem_path: str = None,
-        protocol: str = 'https',
+        protocol: str = "https",
         requests_kwargs: dict = None,
-        **kwargs
+        **kwargs,
     ):
-      """
+        """
         Connect to a Presto database using the specified parameters.
         Args:
@@ -1463,101 +1485,103 @@ class VannaBase(ABC):
         Returns:
             None
-      """
-      try:
-        from pyhive import presto
-      except ImportError:
-        raise DependencyError(
-          "You need to install required dependencies to execute this method,"
-          " run command: \npip install pyhive"
-        )
+        """
+        try:
+            from pyhive import presto
+        except ImportError:
+            raise DependencyError(
+                "You need to install required dependencies to execute this method,"
+                " run command: \npip install pyhive"
+            )
-      if not host:
-        host = os.getenv("PRESTO_HOST")
-      if not host:
-        raise ImproperlyConfigured("Please set your presto host")
-      if not catalog:
-        catalog = os.getenv("PRESTO_CATALOG")
-      if not catalog:
-        raise ImproperlyConfigured("Please set your presto catalog")
-      if not user:
-        user = os.getenv("PRESTO_USER")
-      if not user:
-        raise ImproperlyConfigured("Please set your presto user")
-      if not password:
-        password = os.getenv("PRESTO_PASSWORD")
-      if not port:
-        port = os.getenv("PRESTO_PORT")
-      if not port:
-        raise ImproperlyConfigured("Please set your presto port")
-      conn = None
-      try:
-        if requests_kwargs is None and combined_pem_path is not None:
-          # use the combined pem file to verify the SSL connection
-          requests_kwargs = {
-            'verify': combined_pem_path,  # 使用转换后得到的 PEM 文件进行 SSL 验证
-          }
-        conn = presto.Connection(host=host,
-                                 username=user,
-                                 password=password,
-                                 catalog=catalog,
-                                 schema=schema,
-                                 port=port,
-                                 protocol=protocol,
-                                 requests_kwargs=requests_kwargs,
-                                 **kwargs)
-      except presto.Error as e:
-        raise ValidationError(e)
-      def run_sql_presto(sql: str) -> Union[pd.DataFrame, None]:
-        if conn:
-          try:
-            sql = sql.rstrip()
-            # fix for a known problem with presto db where an extra ; will cause an error.
-            if sql.endswith(';'):
-                sql = sql[:-1]
-            cs = conn.cursor()
-            cs.execute(sql)
-            results = cs.fetchall()
+        if not host:
+            host = os.getenv("PRESTO_HOST")
-            # Create a pandas dataframe from the results
-            df = pd.DataFrame(
-              results, columns=[desc[0] for desc in cs.description]
-            )
-            return df
+        if not host:
+            raise ImproperlyConfigured("Please set your presto host")
-          except presto.Error as e:
-            print(e)
+        if not catalog:
+            catalog = os.getenv("PRESTO_CATALOG")
+        if not catalog:
+            raise ImproperlyConfigured("Please set your presto catalog")
+        if not user:
+            user = os.getenv("PRESTO_USER")
+        if not user:
+            raise ImproperlyConfigured("Please set your presto user")
+        if not password:
+            password = os.getenv("PRESTO_PASSWORD")
+        if not port:
+            port = os.getenv("PRESTO_PORT")
+        if not port:
+            raise ImproperlyConfigured("Please set your presto port")
+        conn = None
+        try:
+            if requests_kwargs is None and combined_pem_path is not None:
+                # use the combined pem file to verify the SSL connection
+                requests_kwargs = {
+                    "verify": combined_pem_path,  # 使用转换后得到的 PEM 文件进行 SSL 验证
+                }
+            conn = presto.Connection(
+                host=host,
+                username=user,
+                password=password,
+                catalog=catalog,
+                schema=schema,
+                port=port,
+                protocol=protocol,
+                requests_kwargs=requests_kwargs,
+                **kwargs,
+            )
+        except presto.Error as e:
             raise ValidationError(e)
-          except Exception as e:
-            print(e)
-            raise e
+        def run_sql_presto(sql: str) -> Union[pd.DataFrame, None]:
+            if conn:
+                try:
+                    sql = sql.rstrip()
+                    # fix for a known problem with presto db where an extra ; will cause an error.
+                    if sql.endswith(";"):
+                        sql = sql[:-1]
+                    cs = conn.cursor()
+                    cs.execute(sql)
+                    results = cs.fetchall()
+                    # Create a pandas dataframe from the results
+                    df = pd.DataFrame(
+                        results, columns=[desc[0] for desc in cs.description]
+                    )
+                    return df
-      self.run_sql_is_set = True
-      self.run_sql = run_sql_presto
+                except presto.Error as e:
+                    print(e)
+                    raise ValidationError(e)
+                except Exception as e:
+                    print(e)
+                    raise e
+        self.run_sql_is_set = True
+        self.run_sql = run_sql_presto
     def connect_to_hive(
         self,
         host: str = None,
-        dbname: str = 'default',
+        dbname: str = "default",
         user: str = None,
         password: str = None,
         port: int = None,
-        auth: str = 'CUSTOM',
-        **kwargs
+        auth: str = "CUSTOM",
+        **kwargs,
     ):
-      """
+        """
         Connect to a Hive database. This is just a helper function to set [`vn.run_sql`][vanna.base.base.VannaBase.run_sql]
         Connect to a Hive database. This is just a helper function to set [`vn.run_sql`][vanna.base.base.VannaBase.run_sql]
@@ -1571,78 +1595,80 @@ class VannaBase(ABC):
         Returns:
             None
-      """
-      try:
-        from pyhive import hive
-      except ImportError:
-        raise DependencyError(
-          "You need to install required dependencies to execute this method,"
-          " run command: \npip install pyhive"
-        )
-      if not host:
-        host = os.getenv("HIVE_HOST")
+        """
-      if not host:
-        raise ImproperlyConfigured("Please set your hive host")
+        try:
+            from pyhive import hive
+        except ImportError:
+            raise DependencyError(
+                "You need to install required dependencies to execute this method,"
+                " run command: \npip install pyhive"
+            )
-      if not dbname:
-        dbname = os.getenv("HIVE_DATABASE")
+        if not host:
+            host = os.getenv("HIVE_HOST")
-      if not dbname:
-        raise ImproperlyConfigured("Please set your hive database")
+        if not host:
+            raise ImproperlyConfigured("Please set your hive host")
-      if not user:
-        user = os.getenv("HIVE_USER")
+        if not dbname:
+            dbname = os.getenv("HIVE_DATABASE")
-      if not user:
-        raise ImproperlyConfigured("Please set your hive user")
+        if not dbname:
+            raise ImproperlyConfigured("Please set your hive database")
-      if not password:
-        password = os.getenv("HIVE_PASSWORD")
+        if not user:
+            user = os.getenv("HIVE_USER")
-      if not port:
-        port = os.getenv("HIVE_PORT")
+        if not user:
+            raise ImproperlyConfigured("Please set your hive user")
-      if not port:
-        raise ImproperlyConfigured("Please set your hive port")
+        if not password:
+            password = os.getenv("HIVE_PASSWORD")
-      conn = None
+        if not port:
+            port = os.getenv("HIVE_PORT")
-      try:
-        conn = hive.Connection(host=host,
-                               username=user,
-                               password=password,
-                               database=dbname,
-                               port=port,
-                               auth=auth)
-      except hive.Error as e:
-        raise ValidationError(e)
+        if not port:
+            raise ImproperlyConfigured("Please set your hive port")
-      def run_sql_hive(sql: str) -> Union[pd.DataFrame, None]:
-        if conn:
-          try:
-            cs = conn.cursor()
-            cs.execute(sql)
-            results = cs.fetchall()
+        conn = None
-            # Create a pandas dataframe from the results
-            df = pd.DataFrame(
-              results, columns=[desc[0] for desc in cs.description]
+        try:
+            conn = hive.Connection(
+                host=host,
+                username=user,
+                password=password,
+                database=dbname,
+                port=port,
+                auth=auth,
             )
-            return df
-          except hive.Error as e:
-            print(e)
+        except hive.Error as e:
             raise ValidationError(e)
-          except Exception as e:
-            print(e)
-            raise e
+        def run_sql_hive(sql: str) -> Union[pd.DataFrame, None]:
+            if conn:
+                try:
+                    cs = conn.cursor()
+                    cs.execute(sql)
+                    results = cs.fetchall()
-      self.run_sql_is_set = True
-      self.run_sql = run_sql_hive
+                    # Create a pandas dataframe from the results
+                    df = pd.DataFrame(
+                        results, columns=[desc[0] for desc in cs.description]
+                    )
+                    return df
+                except hive.Error as e:
+                    print(e)
+                    raise ValidationError(e)
+                except Exception as e:
+                    print(e)
+                    raise e
+        self.run_sql_is_set = True
+        self.run_sql = run_sql_hive
     def run_sql(self, sql: str, **kwargs) -> pd.DataFrame:
         """
@@ -1700,22 +1726,23 @@ class VannaBase(ABC):
             question = input("Enter a question: ")
         try:
-            sql = self.generate_sql(question=question, allow_llm_to_see_data=allow_llm_to_see_data)
+            sql = self.generate_sql(
+                question=question, allow_llm_to_see_data=allow_llm_to_see_data
+            )
         except Exception as e:
             print(e)
             return None, None, None
         if print_results:
             try:
-                Code = __import__("IPython.display", fromList=["Code"]).Code
+                from IPython.display import Code, display
                 display(Code(sql))
             except Exception as e:
                 print(sql)
         if self.run_sql_is_set is False:
-            print(
-                "If you want to run the SQL query, connect to a database first."
-            )
+            print("If you want to run the SQL query, connect to a database first.")
             if print_results:
                 return None
@@ -1759,6 +1786,7 @@ class VannaBase(ABC):
                             fig.show()
                 except Exception as e:
                     # Print stack trace
+                    traceback.print_stack()
                     traceback.print_exc()
                     print("Couldn't run plotly code: ", e)
                     if print_results:
@@ -1874,12 +1902,8 @@ class VannaBase(ABC):
         table_column = df.columns[
             df.columns.str.lower().str.contains("table_name")
         ].to_list()[0]
-        columns = [database_column,
-                    schema_column,
-                    table_column]
-        candidates = ["column_name",
-                      "data_type",
-                      "comment"]
+        columns = [database_column, schema_column, table_column]
+        candidates = ["column_name", "data_type", "comment"]
         matches = df.columns.str.lower().str.contains("|".join(candidates), regex=True)
         columns += df.columns[matches].to_list()

vanna 0.7.8__py3-none-any.whl → 2.0.0__py3-none-any.whl

vanna 0.7.8py3-none-any.whl → 2.0.0py3-none-any.whl