PyPI - vectara-agentic - Versions diffs - 0.4.6__py3-none-any.whl → 0.4.8__py3-none-any.whl - Mend

vectara-agentic 0.4.6__py3-none-any.whl → 0.4.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of vectara-agentic might be problematic. Click here for more details.

Files changed (17) hide show

tests/test_bedrock.py +101 -0
tests/test_gemini.py +64 -0
tests/test_groq.py +196 -11
tests/test_openai.py +101 -0
tests/test_tools.py +161 -0
vectara_agentic/_version.py +1 -1
vectara_agentic/agent.py +1 -1
vectara_agentic/agent_core/prompts.py +12 -11
vectara_agentic/agent_core/streaming.py +178 -195
vectara_agentic/llm_utils.py +1 -1
vectara_agentic/sub_query_workflow.py +31 -31
vectara_agentic/tools.py +108 -4
{vectara_agentic-0.4.6.dist-info → vectara_agentic-0.4.8.dist-info}/METADATA +32 -31
{vectara_agentic-0.4.6.dist-info → vectara_agentic-0.4.8.dist-info}/RECORD +17 -17
{vectara_agentic-0.4.6.dist-info → vectara_agentic-0.4.8.dist-info}/WHEEL +0 -0
{vectara_agentic-0.4.6.dist-info → vectara_agentic-0.4.8.dist-info}/licenses/LICENSE +0 -0
{vectara_agentic-0.4.6.dist-info → vectara_agentic-0.4.8.dist-info}/top_level.txt +0 -0

tests/test_tools.py CHANGED Viewed

@@ -15,6 +15,8 @@ from vectara_agentic.tools import (
     VectaraToolFactory,
     ToolsFactory,
     ToolType,
+    normalize_url,
+    citation_appears_in_text,
 )
 from vectara_agentic.agent import Agent
 from vectara_agentic.agent_config import AgentConfig
@@ -367,6 +369,165 @@ class TestToolsPackage(unittest.TestCase):
         self.assertIn("Returns:", doc)
         self.assertIn("dict[str, Any]: A dictionary containing the result data.", doc)
+    def test_normalize_url(self):
+        """Test URL normalization function"""
+        # Test space encoding normalization
+        self.assertEqual(
+            normalize_url("http://example.com/file with spaces.pdf"),
+            "http://example.com/file%20with%20spaces.pdf",
+        )
+        # Test that already encoded URLs remain normalized
+        self.assertEqual(
+            normalize_url("http://example.com/file%20with%20spaces.pdf"),
+            "http://example.com/file%20with%20spaces.pdf",
+        )
+        # Test special characters
+        self.assertEqual(
+            normalize_url("http://example.com/path?query=hello world&foo=bar"),
+            "http://example.com/path?query=hello%20world&foo=bar",
+        )
+        # Test empty/None input
+        self.assertEqual(normalize_url(""), "")
+        self.assertEqual(normalize_url(None), None)
+        # Test complex URL with multiple encodable characters
+        result = normalize_url("http://example.com/docs/My Document [v2].pdf#section 1")
+        expected = "http://example.com/docs/My%20Document%20[v2].pdf#section%201"
+        self.assertEqual(result, expected)
+    def test_citation_appears_in_text_exact_match(self):
+        """Test citation matching with exact format"""
+        response_text = "Here's the info [Document Title](http://example.com/doc.pdf) for reference."
+        # Should match exact citation
+        self.assertTrue(
+            citation_appears_in_text(
+                "Document Title", "http://example.com/doc.pdf", response_text
+            )
+        )
+        # Should not match different text with different URL
+        self.assertFalse(
+            citation_appears_in_text(
+                "Wrong Title", "http://different.com/other.pdf", response_text
+            )
+        )
+    def test_citation_appears_in_text_url_encoding(self):
+        """Test citation matching with URL encoding differences"""
+        # Response text with percent-encoded URL
+        response_text_encoded = (
+            "See [My Doc](http://example.com/my%20document.pdf) for details."
+        )
+        # Should match when citation URL has spaces
+        self.assertTrue(
+            citation_appears_in_text(
+                "My Doc", "http://example.com/my document.pdf", response_text_encoded
+            )
+        )
+        # Response text with spaces in URL
+        response_text_spaces = (
+            "See [My Doc](http://example.com/my document.pdf) for details."
+        )
+        # Should match when citation URL is encoded
+        self.assertTrue(
+            citation_appears_in_text(
+                "My Doc", "http://example.com/my%20document.pdf", response_text_spaces
+            )
+        )
+    def test_citation_appears_in_text_url_presence(self):
+        """Test fallback URL presence matching"""
+        # Response text that contains URL but not in exact citation format
+        response_text = (
+            "The document at http://example.com/report.pdf contains the analysis."
+        )
+        # Should match based on URL presence
+        self.assertTrue(
+            citation_appears_in_text(
+                "Report", "http://example.com/report.pdf", response_text
+            )
+        )
+        # Should work with encoded URL in response
+        response_encoded = (
+            "The document at http://example.com/my%20report.pdf contains data."
+        )
+        self.assertTrue(
+            citation_appears_in_text(
+                "Report", "http://example.com/my report.pdf", response_encoded
+            )
+        )
+    def test_citation_appears_in_text_edge_cases(self):
+        """Test edge cases and error conditions"""
+        response_text = "Some text with [citations](http://example.com/doc.pdf) here."
+        # Empty inputs should return False
+        self.assertFalse(
+            citation_appears_in_text("", "http://example.com/doc.pdf", response_text)
+        )
+        self.assertFalse(citation_appears_in_text("Title", "", response_text))
+        self.assertFalse(
+            citation_appears_in_text("Title", "http://example.com/doc.pdf", "")
+        )
+        self.assertFalse(
+            citation_appears_in_text(None, "http://example.com/doc.pdf", response_text)
+        )
+        # Both None should return False
+        self.assertFalse(citation_appears_in_text(None, None, response_text))
+        # Very short filename should not trigger filename matching
+        self.assertFalse(
+            citation_appears_in_text(
+                "Title", "http://example.com/x.y", "Different content"
+            )
+        )
+    def test_citation_appears_in_text_complex_encoding(self):
+        """Test complex URL encoding scenarios"""
+        # Test case with multiple special characters
+        response_text = "Document: [Legal Doc](http://example.com/docs/Contract%20%5B2024%5D%20%26%20Agreement.pdf)"
+        # Should match with unencoded URL
+        self.assertTrue(
+            citation_appears_in_text(
+                "Legal Doc",
+                "http://example.com/docs/Contract [2024] & Agreement.pdf",
+                response_text,
+            )
+        )
+    def test_citation_appears_in_text_url_only(self):
+        """Test citation matching when only URL is available (no text)"""
+        # Test the [(url)] format when only URL is available
+        response_text = "Reference: [(http://example.com/report.pdf)] shows data."
+        # Should match with URL-only citation format
+        self.assertTrue(
+            citation_appears_in_text(
+                None, "http://example.com/report.pdf", response_text
+            )
+        )
+        # Should also work with URL encoding differences
+        response_encoded = (
+            "Reference: [(http://example.com/my%20report.pdf)] shows data."
+        )
+        self.assertTrue(
+            citation_appears_in_text(
+                None, "http://example.com/my report.pdf", response_encoded
+            )
+        )
 if __name__ == "__main__":
     unittest.main()

vectara_agentic/_version.py CHANGED Viewed

@@ -1,4 +1,4 @@
 """
 Define the version of the package.
 """
-__version__ = "0.4.6"
+__version__ = "0.4.8"

vectara_agentic/agent.py CHANGED Viewed

@@ -1096,7 +1096,7 @@ class Agent:
                 model_fields = outputs_model_on_fail_cls.model_fields
                 input_dict = {}
                 for key in model_fields:
-                    value = await workflow_context.get(key, default=_missing)
+                    value = await workflow_context.store.get(key, default=_missing)  # pylint: disable=no-member
                     if value is not _missing:
                         input_dict[key] = value
                 output = outputs_model_on_fail_cls.model_validate(input_dict)

vectara_agentic/agent_core/prompts.py CHANGED Viewed

@@ -23,7 +23,7 @@ GENERAL_INSTRUCTIONS = """
   In rephrasing, aim for alternative queries that may work better for searching for the information.
   For example, you can rephrase "CEO" with "Chief Executive Officer".
   2) Break the question into sub-questions and call this tool or another tool for each sub-question, then combine the answers to provide a complete response.
-  For example if asked "what is the population of France and Germany", you can call the tool twice, once for France and once for Germany.
+  For example if asked "what is the population of France and Germany", you can call the tool twice, once for France and once for Germany,
   and then combine the responses to provide the full answer.
   3) If a tool fails, try other tools that might be appropriate to gain the information you need.
 - If after retrying you can't get the information or answer the question, respond with "I don't know".
@@ -31,22 +31,22 @@ GENERAL_INSTRUCTIONS = """
   Be consistent with the format of numbers and dates across multi turn conversations.
 - Handling citations - IMPORTANT:
   1) Always embed citations inline with the text of your response, using valid URLs provided by tools.
-     Never omit a legitimate citations.
-     Avoid creating a bibliography or a list of sources at the end of your response, and referring the reader to that list.
+     Never omit a legitimate citation.
+     Never repeat the same citation multiple times in a response.
+  2) Avoid creating a bibliography or a list of sources at the end of your response, and referring the reader to that list.
      Instead, embed citations directly in the text where the information is presented.
      For example, "According to the [Nvidia 10-K report](https://www.nvidia.com/doc.pdf#page=8), revenue in 2021 was $10B."
-  2) When including URLs in the citation, only use well-formed, non-empty URLs (beginning with “http://” or “https://”) and ignore any malformed or placeholder links.
-  3) Use descriptive link text for citations whenever possible, falling back to numeric labels only when necessary.
+  3) When including URLs in the citation, only use well-formed, non-empty URLs (beginning with “http://” or “https://”) and ignore any malformed or placeholder links.
+  4) Use descriptive link text for citations whenever possible, falling back to numeric labels only when necessary.
      Preferred: "According to the [Nvidia 10-K report](https://www.nvidia.com/doc.pdf#page=8), revenue in 2021 was $10B."
      Fallback: "According to the Nvidia 10-K report, revenue in 2021 was $10B [1](https://www.nvidia.com/doc.pdf#page=8)."
-  4) If a URL is for a PDF file, and the tool also provided a page number, append "#page=X" to the URL.
+  5) If a URL is for a PDF file, and the tool also provided a page number, append "#page=X" to the URL.
      For example, if the URL is "https://www.xxx.com/doc.pdf" and "page='5'", then the URL used in the citation would be "https://www.xxx.com/doc.pdf#page=5".
      Always include the page number in the URL, whether you use anchor text or a numeric label.
-  5) When citing images, figures, or tables, link directly to the file (or PDF page) just as you would for text.
-  6) Give each discrete fact its own citation (or citations), even if multiple facts come from the same document.
-     Avoid lumping multiple pages into one citation.
-  7) Ensure a space or punctuation precedes and follows every citation.
-     Here's an example where there is no proper spacing, and the citation is shown right after "10-K": "As shown in the [Nvidia 10-K](https://www.nvidia.com), the revenue in 2021 was $10B".
+  6) When citing images, figures, or tables, link directly to the file (or PDF page) just as you would for text.
+  7) Give each discrete fact its own citation (or citations), even if multiple facts come from the same document.
+  8) Ensure a space or punctuation precedes and follows every citation.
+     Here's an example where there is no proper spacing, and the citation is shown right after "10-K": "As shown in the[Nvidia 10-K](https://www.nvidia.com), the revenue in 2021 was $10B".
      Instead use spacing properly: "As shown in the [Nvidia 10-K](https://www.nvidia.com), the revenue in 2021 was $10B".
 - If a tool returns a "Malfunction" error - notify the user that you cannot respond due a tool not operating properly (and the tool name).
 - Your response should never be the input to a tool, only the output.
@@ -58,6 +58,7 @@ GENERAL_INSTRUCTIONS = """
 - Always respond in the language of the question, and in text (no images, videos or code).
 - If you are provided with database tools use them for analytical queries (such as counting, calculating max, min, average, sum, or other statistics).
   For each database, the database tools include: x_list_tables, x_load_data, x_describe_tables, x_load_unique_values, and x_load_sample_data, where 'x' in the database name.
+  Do not call any database tool unless it is included in your list of available tools.
   for example, if the database name is "ev", the tools are: ev_list_tables, ev_load_data, ev_describe_tables, ev_load_unique_values, and ev_load_sample_data.
   Use ANSI SQL-92 syntax for the SQL queries, and do not use any other SQL dialect.
   Before using the x_load_data with a SQL query, always follow these discovery steps:

vectara-agentic 0.4.6__py3-none-any.whl → 0.4.8__py3-none-any.whl

Potentially problematic release.

vectara-agentic 0.4.6__py3-none-any.whl → 0.4.8__py3-none-any.whl