langroid 0.32.2__py3-none-any.whl → 0.33.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (129):
  1. {langroid-0.32.2.dist-info → langroid-0.33.4.dist-info}/METADATA +149 -123
  2. langroid-0.33.4.dist-info/RECORD +7 -0
  3. {langroid-0.32.2.dist-info → langroid-0.33.4.dist-info}/WHEEL +1 -1
  4. langroid-0.33.4.dist-info/entry_points.txt +4 -0
  5. pyproject.toml +317 -212
  6. langroid/__init__.py +0 -106
  7. langroid/agent/__init__.py +0 -41
  8. langroid/agent/base.py +0 -1983
  9. langroid/agent/batch.py +0 -398
  10. langroid/agent/callbacks/__init__.py +0 -0
  11. langroid/agent/callbacks/chainlit.py +0 -598
  12. langroid/agent/chat_agent.py +0 -1899
  13. langroid/agent/chat_document.py +0 -454
  14. langroid/agent/openai_assistant.py +0 -882
  15. langroid/agent/special/__init__.py +0 -59
  16. langroid/agent/special/arangodb/__init__.py +0 -0
  17. langroid/agent/special/arangodb/arangodb_agent.py +0 -656
  18. langroid/agent/special/arangodb/system_messages.py +0 -186
  19. langroid/agent/special/arangodb/tools.py +0 -107
  20. langroid/agent/special/arangodb/utils.py +0 -36
  21. langroid/agent/special/doc_chat_agent.py +0 -1466
  22. langroid/agent/special/lance_doc_chat_agent.py +0 -262
  23. langroid/agent/special/lance_rag/__init__.py +0 -9
  24. langroid/agent/special/lance_rag/critic_agent.py +0 -198
  25. langroid/agent/special/lance_rag/lance_rag_task.py +0 -82
  26. langroid/agent/special/lance_rag/query_planner_agent.py +0 -260
  27. langroid/agent/special/lance_tools.py +0 -61
  28. langroid/agent/special/neo4j/__init__.py +0 -0
  29. langroid/agent/special/neo4j/csv_kg_chat.py +0 -174
  30. langroid/agent/special/neo4j/neo4j_chat_agent.py +0 -433
  31. langroid/agent/special/neo4j/system_messages.py +0 -120
  32. langroid/agent/special/neo4j/tools.py +0 -32
  33. langroid/agent/special/relevance_extractor_agent.py +0 -127
  34. langroid/agent/special/retriever_agent.py +0 -56
  35. langroid/agent/special/sql/__init__.py +0 -17
  36. langroid/agent/special/sql/sql_chat_agent.py +0 -654
  37. langroid/agent/special/sql/utils/__init__.py +0 -21
  38. langroid/agent/special/sql/utils/description_extractors.py +0 -190
  39. langroid/agent/special/sql/utils/populate_metadata.py +0 -85
  40. langroid/agent/special/sql/utils/system_message.py +0 -35
  41. langroid/agent/special/sql/utils/tools.py +0 -64
  42. langroid/agent/special/table_chat_agent.py +0 -263
  43. langroid/agent/task.py +0 -2095
  44. langroid/agent/tool_message.py +0 -393
  45. langroid/agent/tools/__init__.py +0 -38
  46. langroid/agent/tools/duckduckgo_search_tool.py +0 -50
  47. langroid/agent/tools/file_tools.py +0 -234
  48. langroid/agent/tools/google_search_tool.py +0 -39
  49. langroid/agent/tools/metaphor_search_tool.py +0 -67
  50. langroid/agent/tools/orchestration.py +0 -303
  51. langroid/agent/tools/recipient_tool.py +0 -235
  52. langroid/agent/tools/retrieval_tool.py +0 -32
  53. langroid/agent/tools/rewind_tool.py +0 -137
  54. langroid/agent/tools/segment_extract_tool.py +0 -41
  55. langroid/agent/xml_tool_message.py +0 -382
  56. langroid/cachedb/__init__.py +0 -17
  57. langroid/cachedb/base.py +0 -58
  58. langroid/cachedb/momento_cachedb.py +0 -108
  59. langroid/cachedb/redis_cachedb.py +0 -153
  60. langroid/embedding_models/__init__.py +0 -39
  61. langroid/embedding_models/base.py +0 -74
  62. langroid/embedding_models/models.py +0 -461
  63. langroid/embedding_models/protoc/__init__.py +0 -0
  64. langroid/embedding_models/protoc/embeddings.proto +0 -19
  65. langroid/embedding_models/protoc/embeddings_pb2.py +0 -33
  66. langroid/embedding_models/protoc/embeddings_pb2.pyi +0 -50
  67. langroid/embedding_models/protoc/embeddings_pb2_grpc.py +0 -79
  68. langroid/embedding_models/remote_embeds.py +0 -153
  69. langroid/exceptions.py +0 -65
  70. langroid/language_models/__init__.py +0 -53
  71. langroid/language_models/azure_openai.py +0 -153
  72. langroid/language_models/base.py +0 -678
  73. langroid/language_models/config.py +0 -18
  74. langroid/language_models/mock_lm.py +0 -124
  75. langroid/language_models/openai_gpt.py +0 -1964
  76. langroid/language_models/prompt_formatter/__init__.py +0 -16
  77. langroid/language_models/prompt_formatter/base.py +0 -40
  78. langroid/language_models/prompt_formatter/hf_formatter.py +0 -132
  79. langroid/language_models/prompt_formatter/llama2_formatter.py +0 -75
  80. langroid/language_models/utils.py +0 -151
  81. langroid/mytypes.py +0 -84
  82. langroid/parsing/__init__.py +0 -52
  83. langroid/parsing/agent_chats.py +0 -38
  84. langroid/parsing/code_parser.py +0 -121
  85. langroid/parsing/document_parser.py +0 -718
  86. langroid/parsing/para_sentence_split.py +0 -62
  87. langroid/parsing/parse_json.py +0 -155
  88. langroid/parsing/parser.py +0 -313
  89. langroid/parsing/repo_loader.py +0 -790
  90. langroid/parsing/routing.py +0 -36
  91. langroid/parsing/search.py +0 -275
  92. langroid/parsing/spider.py +0 -102
  93. langroid/parsing/table_loader.py +0 -94
  94. langroid/parsing/url_loader.py +0 -111
  95. langroid/parsing/urls.py +0 -273
  96. langroid/parsing/utils.py +0 -373
  97. langroid/parsing/web_search.py +0 -155
  98. langroid/prompts/__init__.py +0 -9
  99. langroid/prompts/dialog.py +0 -17
  100. langroid/prompts/prompts_config.py +0 -5
  101. langroid/prompts/templates.py +0 -141
  102. langroid/pydantic_v1/__init__.py +0 -10
  103. langroid/pydantic_v1/main.py +0 -4
  104. langroid/utils/__init__.py +0 -19
  105. langroid/utils/algorithms/__init__.py +0 -3
  106. langroid/utils/algorithms/graph.py +0 -103
  107. langroid/utils/configuration.py +0 -98
  108. langroid/utils/constants.py +0 -30
  109. langroid/utils/git_utils.py +0 -252
  110. langroid/utils/globals.py +0 -49
  111. langroid/utils/logging.py +0 -135
  112. langroid/utils/object_registry.py +0 -66
  113. langroid/utils/output/__init__.py +0 -20
  114. langroid/utils/output/citations.py +0 -41
  115. langroid/utils/output/printing.py +0 -99
  116. langroid/utils/output/status.py +0 -40
  117. langroid/utils/pandas_utils.py +0 -30
  118. langroid/utils/pydantic_utils.py +0 -602
  119. langroid/utils/system.py +0 -286
  120. langroid/utils/types.py +0 -93
  121. langroid/vector_store/__init__.py +0 -50
  122. langroid/vector_store/base.py +0 -357
  123. langroid/vector_store/chromadb.py +0 -214
  124. langroid/vector_store/lancedb.py +0 -401
  125. langroid/vector_store/meilisearch.py +0 -299
  126. langroid/vector_store/momento.py +0 -278
  127. langroid/vector_store/qdrantdb.py +0 -468
  128. langroid-0.32.2.dist-info/RECORD +0 -128
  129. {langroid-0.32.2.dist-info → langroid-0.33.4.dist-info/licenses}/LICENSE +0 -0
@@ -1,121 +0,0 @@
1
- from functools import reduce
2
- from typing import Callable, List
3
-
4
- import tiktoken
5
- from pygments import lex
6
- from pygments.lexers import get_lexer_by_name
7
- from pygments.token import Token
8
-
9
- from langroid.mytypes import Document
10
- from langroid.pydantic_v1 import BaseSettings
11
-
12
-
13
def chunk_code(
    code: str, language: str, max_tokens: int, len_fn: Callable[[str], int]
) -> List[str]:
    """
    Chunk code into smaller pieces, so that we don't exceed the maximum
    number of tokens allowed by the embedding model.

    The code is lexed with Pygments, and chunk boundaries are placed only
    between lexer tokens, so individual lexical tokens are never split.
    Whitespace tokens are always appended to the current chunk (so a chunk
    may exceed ``max_tokens`` by trailing whitespace), and a single
    non-whitespace token longer than ``max_tokens`` becomes its own
    oversized chunk.

    Args:
        code: string of code
        language: str as a file extension, e.g. "py", "yml"
        max_tokens: max tokens per chunk
        len_fn: function to get the length of a string in token units

    Returns:
        List of code chunks, in original order.
    """
    lexer = get_lexer_by_name(language)

    chunks: List[str] = []
    current_chunk = ""
    for token_type, token_value in lex(code, lexer):
        if token_type in Token.Text.Whitespace:
            # Keep whitespace attached to the preceding code so that
            # indentation and newlines stay with their context.
            current_chunk += token_value
        elif len_fn(current_chunk) + len_fn(token_value) <= max_tokens:
            current_chunk += token_value
        else:
            # Fix: previously an empty string was appended as a chunk when
            # the very first non-whitespace token already exceeded
            # max_tokens; only flush non-empty chunks.
            if current_chunk:
                chunks.append(current_chunk)
            current_chunk = token_value

    if current_chunk:
        chunks.append(current_chunk)

    return chunks
47
-
48
-
49
class CodeParsingConfig(BaseSettings):
    """Settings that control how source-code documents are chunked."""

    # File extensions (without the leading dot) treated as code.
    extensions: List[str] = [
        "py", "java", "c", "cpp", "h", "hpp",
        "yml", "yaml", "toml",
        "cfg",  # e.g. setup.cfg
        "ini", "json", "rst",
        "sh", "bash",
    ]
    # Target chunk size, in tokens.
    chunk_size: int = 500
    # Model whose tokenizer defines the token counts.
    token_encoding_model: str = "text-embedding-ada-002"
    # Presumably the number of similar docs retrieved at query time —
    # not used within this module; verify against callers.
    n_similar_docs: int = 4
70
-
71
-
72
class CodeParser:
    """Splits code ``Document``s into token-bounded chunks.

    Uses a tiktoken tokenizer (chosen via ``config.token_encoding_model``)
    to measure chunk sizes, and :func:`chunk_code` to do the actual
    lexer-aware splitting.
    """

    def __init__(self, config: CodeParsingConfig):
        self.config = config
        self.tokenizer = tiktoken.encoding_for_model(config.token_encoding_model)

    def num_tokens(self, text: str) -> int:
        """
        How many tokens are in the text, according to the tokenizer.
        This needs to be accurate, otherwise we may exceed the maximum
        number of tokens allowed by the model.

        Args:
            text: string to tokenize

        Returns:
            number of tokens in the text
        """
        return len(self.tokenizer.encode(text))

    def split(self, docs: List[Document]) -> List[Document]:
        """
        Split the documents into chunks, according to the config.
        Only documents whose ``metadata.language`` is in
        ``config.extensions`` are split; all other documents are dropped.

        Args:
            docs: list of documents to split

        Returns:
            list of documents, where each document is a chunk; each chunk
            carries the metadata of its original document, so that when we
            retrieve a chunk we immediately know info about the original.
        """
        # NOTE(review): d.metadata is passed by reference, not copied —
        # unless Document's constructor copies it, all chunks of a document
        # share one metadata object; confirm before mutating chunk metadata.
        #
        # A single flat comprehension replaces the previous
        # reduce(lambda x, y: x + y, ...) flattening, which was quadratic
        # in the number of chunks and needed a special case for empty input
        # (reduce raises TypeError on an empty sequence).
        return [
            Document(content=chunk, metadata=d.metadata)
            for d in docs
            if d.metadata.language in self.config.extensions  # type: ignore
            for chunk in chunk_code(
                d.content,
                d.metadata.language,  # type: ignore
                self.config.chunk_size,
                self.num_tokens,
            )
            if chunk.strip() != ""
        ]