PyPI - langchain-githubcopilot-chat - Versions diffs - 0.1.0__py3-none-any.whl - Mend

langchain-githubcopilot-chat 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13) hide show

langchain_githubcopilot_chat/__init__.py +31 -0
langchain_githubcopilot_chat/chat_models.py +923 -0
langchain_githubcopilot_chat/document_loaders.py +73 -0
langchain_githubcopilot_chat/embeddings.py +96 -0
langchain_githubcopilot_chat/py.typed +0 -0
langchain_githubcopilot_chat/retrievers.py +107 -0
langchain_githubcopilot_chat/toolkits.py +72 -0
langchain_githubcopilot_chat/tools.py +94 -0
langchain_githubcopilot_chat/vectorstores.py +439 -0
langchain_githubcopilot_chat-0.1.0.dist-info/LICENSE +21 -0
langchain_githubcopilot_chat-0.1.0.dist-info/METADATA +70 -0
langchain_githubcopilot_chat-0.1.0.dist-info/RECORD +13 -0
langchain_githubcopilot_chat-0.1.0.dist-info/WHEEL +4 -0

langchain_githubcopilot_chat/vectorstores.py ADDED Viewed

@@ -0,0 +1,439 @@
+"""GithubcopilotChat vector stores."""
+from __future__ import annotations
+import uuid
+from typing import (
+    Any,
+    Callable,
+    Iterator,
+    List,
+    Optional,
+    Sequence,
+    Tuple,
+    Type,
+    TypeVar,
+)
+from langchain_core.documents import Document
+from langchain_core.embeddings import Embeddings
+from langchain_core.vectorstores import VectorStore
+from langchain_core.vectorstores.utils import _cosine_similarity as cosine_similarity
+VST = TypeVar("VST", bound=VectorStore)
+class GithubcopilotChatVectorStore(VectorStore):
+    # TODO: Fill in the example-output blocks in the docstring.
+    """GithubcopilotChat vector store integration.
+    Documents, their embedding vectors and their metadata are held in an
+    in-process dictionary keyed by document id; queries are ranked by cosine
+    similarity against the stored vectors.
+    Setup:
+        Install ``langchain-githubcopilot-chat``. The store itself reads no
+        environment variables; the ``Embeddings`` implementation passed to the
+        constructor may require credentials of its own.
+        .. code-block:: bash
+            pip install -U langchain-githubcopilot-chat
+    Key init args:
+        embedding: Embeddings
+            Embedding function used for both documents and queries.
+    Instantiate:
+        .. code-block:: python
+            from langchain_githubcopilot_chat.vectorstores import GithubcopilotChatVectorStore
+            from langchain_openai import OpenAIEmbeddings
+            vector_store = GithubcopilotChatVectorStore(embedding=OpenAIEmbeddings())
+    Add Documents:
+        .. code-block:: python
+            from langchain_core.documents import Document
+            document_1 = Document(page_content="foo", metadata={"baz": "bar"})
+            document_2 = Document(page_content="thud", metadata={"bar": "baz"})
+            document_3 = Document(page_content="i will be deleted :(")
+            documents = [document_1, document_2, document_3]
+            ids = ["1", "2", "3"]
+            vector_store.add_documents(documents=documents, ids=ids)
+    Delete Documents:
+        .. code-block:: python
+            vector_store.delete(ids=["3"])
+    Search:
+        .. code-block:: python
+            results = vector_store.similarity_search(query="thud", k=1)
+            for doc in results:
+                print(f"* {doc.page_content} [{doc.metadata}]")
+        .. code-block:: python
+            # TODO: Example output
+    Search with filter:
+        ``filter`` is a callable that receives a ``Document`` and returns a bool.
+        .. code-block:: python
+            results = vector_store.similarity_search(
+                query="thud",
+                k=1,
+                filter=lambda doc: doc.metadata.get("bar") == "baz",
+            )
+            for doc in results:
+                print(f"* {doc.page_content} [{doc.metadata}]")
+        .. code-block:: python
+            # TODO: Example output
+    Search with score:
+        .. code-block:: python
+            results = vector_store.similarity_search_with_score(query="qux", k=1)
+            for doc, score in results:
+                print(f"* [SIM={score:.3f}] {doc.page_content} [{doc.metadata}]")
+        .. code-block:: python
+            # TODO: Example output
+    Async:
+        .. code-block:: python
+            # add documents
+            # await vector_store.aadd_documents(documents=documents, ids=ids)
+            # delete documents
+            # await vector_store.adelete(ids=["3"])
+            # search
+            # results = await vector_store.asimilarity_search(query="thud", k=1)
+            # search with score
+            results = await vector_store.asimilarity_search_with_score(query="qux", k=1)
+            for doc, score in results:
+                print(f"* [SIM={score:.3f}] {doc.page_content} [{doc.metadata}]")
+        .. code-block:: python
+            # TODO: Example output
+    Use as Retriever:
+        This class does not define the max-marginal-relevance search methods,
+        so the example uses plain similarity search.
+        .. code-block:: python
+            retriever = vector_store.as_retriever(
+                search_type="similarity",
+                search_kwargs={"k": 1},
+            )
+            retriever.invoke("thud")
+        .. code-block:: python
+            # TODO: Example output
+    """  # noqa: E501
+    def __init__(self, embedding: Embeddings) -> None:
+        """Initialize with the given embedding function.
+        Args:
+            embedding: embedding function to use.
+        """
+        self._database: dict[str, dict[str, Any]] = {}
+        self.embedding = embedding
+    @classmethod
+    def from_texts(
+        cls: Type[GithubcopilotChatVectorStore],
+        texts: List[str],
+        embedding: Embeddings,
+        metadatas: Optional[List[dict]] = None,
+        **kwargs: Any,
+    ) -> GithubcopilotChatVectorStore:
+        store = cls(
+            embedding=embedding,
+        )
+        store.add_texts(texts=texts, metadatas=metadatas, **kwargs)
+        return store
+    # optional: add custom async implementations
+    # @classmethod
+    # async def afrom_texts(
+    #     cls: Type[VST],
+    #     texts: List[str],
+    #     embedding: Embeddings,
+    #     metadatas: Optional[List[dict]] = None,
+    #     **kwargs: Any,
+    # ) -> VST:
+    #     return await asyncio.get_running_loop().run_in_executor(
+    #         None, partial(cls.from_texts, **kwargs), texts, embedding, metadatas
+    #     )
+    @property
+    def embeddings(self) -> Embeddings:
+        return self.embedding
+    def add_documents(
+        self,
+        documents: List[Document],
+        ids: Optional[List[str]] = None,
+        **kwargs: Any,
+    ) -> List[str]:
+        """Add documents to the store."""
+        texts = [doc.page_content for doc in documents]
+        vectors = self.embedding.embed_documents(texts)
+        if ids and len(ids) != len(texts):
+            msg = (
+                f"ids must be the same length as texts. "
+                f"Got {len(ids)} ids and {len(texts)} texts."
+            )
+            raise ValueError(msg)
+        id_iterator: Iterator[Optional[str]] = (
+            iter(ids) if ids else iter(doc.id for doc in documents)
+        )
+        ids_ = []
+        for doc, vector in zip(documents, vectors):
+            doc_id = next(id_iterator)
+            doc_id_ = doc_id if doc_id else str(uuid.uuid4())
+            ids_.append(doc_id_)
+            self._database[doc_id_] = {
+                "id": doc_id_,
+                "vector": vector,
+                "text": doc.page_content,
+                "metadata": doc.metadata,
+            }
+        return ids_
+    # optional: add custom async implementations
+    # async def aadd_documents(
+    #     self,
+    #     documents: List[Document],
+    #     ids: Optional[List[str]] = None,
+    #     **kwargs: Any,
+    # ) -> List[str]:
+    #     raise NotImplementedError
+    def delete(self, ids: Optional[List[str]] = None, **kwargs: Any) -> None:
+        if ids:
+            for _id in ids:
+                self._database.pop(_id, None)
+    # optional: add custom async implementations
+    # async def adelete(
+    #     self, ids: Optional[List[str]] = None, **kwargs: Any
+    # ) -> None:
+    #     raise NotImplementedError
+    def get_by_ids(self, ids: Sequence[str], /) -> list[Document]:
+        """Get documents by their ids.
+        Args:
+            ids: The ids of the documents to get.
+        Returns:
+            A list of Document objects.
+        """
+        documents = []
+        for doc_id in ids:
+            doc = self._database.get(doc_id)
+            if doc:
+                documents.append(
+                    Document(
+                        id=doc["id"],
+                        page_content=doc["text"],
+                        metadata=doc["metadata"],
+                    )
+                )
+        return documents
+    # optional: add custom async implementations
+    # async def aget_by_ids(self, ids: Sequence[str], /) -> list[Document]:
+    #     raise NotImplementedError
+    # NOTE: the below helper method implements similarity search for in-memory
+    # storage. It is optional and not a part of the vector store interface.
+    def _similarity_search_with_score_by_vector(
+        self,
+        embedding: List[float],
+        k: int = 4,
+        filter: Optional[Callable[[Document], bool]] = None,
+        **kwargs: Any,
+    ) -> List[tuple[Document, float, List[float]]]:
+        # get all docs with fixed order in list
+        docs = list(self._database.values())
+        if filter is not None:
+            docs = [
+                doc
+                for doc in docs
+                if filter(Document(page_content=doc["text"], metadata=doc["metadata"]))
+            ]
+        if not docs:
+            return []
+        similarity = cosine_similarity([embedding], [doc["vector"] for doc in docs])[0]
+        # get the indices ordered by similarity score
+        top_k_idx = similarity.argsort()[::-1][:k]
+        return [
+            (
+                # Document
+                Document(
+                    id=doc_dict["id"],
+                    page_content=doc_dict["text"],
+                    metadata=doc_dict["metadata"],
+                ),
+                # Score
+                float(similarity[idx].item()),
+                # Embedding vector
+                doc_dict["vector"],
+            )
+            for idx in top_k_idx
+            # Assign using walrus operator to avoid multiple lookups
+            if (doc_dict := docs[idx])
+        ]
+    def similarity_search(
+        self, query: str, k: int = 4, **kwargs: Any
+    ) -> List[Document]:
+        embedding = self.embedding.embed_query(query)
+        return [
+            doc
+            for doc, _, _ in self._similarity_search_with_score_by_vector(
+                embedding=embedding, k=k, **kwargs
+            )
+        ]
+    # optional: add custom async implementations
+    # async def asimilarity_search(
+    #     self, query: str, k: int = 4, **kwargs: Any
+    # ) -> List[Document]:
+    #     # This is a temporary workaround to make the similarity search
+    #     # asynchronous. The proper solution is to make the similarity search
+    #     # asynchronous in the vector store implementations.
+    #     func = partial(self.similarity_search, query, k=k, **kwargs)
+    #     return await asyncio.get_event_loop().run_in_executor(None, func)
+    def similarity_search_with_score(
+        self, query: str, k: int = 4, **kwargs: Any
+    ) -> List[Tuple[Document, float]]:
+        embedding = self.embedding.embed_query(query)
+        return [
+            (doc, similarity)
+            for doc, similarity, _ in self._similarity_search_with_score_by_vector(
+                embedding=embedding, k=k, **kwargs
+            )
+        ]
+    # optional: add custom async implementations
+    # async def asimilarity_search_with_score(
+    #     self, *args: Any, **kwargs: Any
+    # ) -> List[Tuple[Document, float]]:
+    #     # This is a temporary workaround to make the similarity search
+    #     # asynchronous. The proper solution is to make the similarity search
+    #     # asynchronous in the vector store implementations.
+    #     func = partial(self.similarity_search_with_score, *args, **kwargs)
+    #     return await asyncio.get_event_loop().run_in_executor(None, func)
+    ### ADDITIONAL OPTIONAL SEARCH METHODS BELOW ###
+    # def similarity_search_by_vector(
+    #     self, embedding: List[float], k: int = 4, **kwargs: Any
+    # ) -> List[Document]:
+    #     raise NotImplementedError
+    # optional: add custom async implementations
+    # async def asimilarity_search_by_vector(
+    #     self, embedding: List[float], k: int = 4, **kwargs: Any
+    # ) -> List[Document]:
+    #     # This is a temporary workaround to make the similarity search
+    #     # asynchronous. The proper solution is to make the similarity search
+    #     # asynchronous in the vector store implementations.
+    #     func = partial(self.similarity_search_by_vector, embedding, k=k, **kwargs)
+    #     return await asyncio.get_event_loop().run_in_executor(None, func)
+    # def max_marginal_relevance_search(
+    #     self,
+    #     query: str,
+    #     k: int = 4,
+    #     fetch_k: int = 20,
+    #     lambda_mult: float = 0.5,
+    #     **kwargs: Any,
+    # ) -> List[Document]:
+    #     raise NotImplementedError
+    # optional: add custom async implementations
+    # async def amax_marginal_relevance_search(
+    #     self,
+    #     query: str,
+    #     k: int = 4,
+    #     fetch_k: int = 20,
+    #     lambda_mult: float = 0.5,
+    #     **kwargs: Any,
+    # ) -> List[Document]:
+    #     # This is a temporary workaround to make the similarity search
+    #     # asynchronous. The proper solution is to make the similarity search
+    #     # asynchronous in the vector store implementations.
+    #     func = partial(
+    #         self.max_marginal_relevance_search,
+    #         query,
+    #         k=k,
+    #         fetch_k=fetch_k,
+    #         lambda_mult=lambda_mult,
+    #         **kwargs,
+    #     )
+    #     return await asyncio.get_event_loop().run_in_executor(None, func)
+    # def max_marginal_relevance_search_by_vector(
+    #     self,
+    #     embedding: List[float],
+    #     k: int = 4,
+    #     fetch_k: int = 20,
+    #     lambda_mult: float = 0.5,
+    #     **kwargs: Any,
+    # ) -> List[Document]:
+    #     raise NotImplementedError
+    # optional: add custom async implementations
+    # async def amax_marginal_relevance_search_by_vector(
+    #     self,
+    #     embedding: List[float],
+    #     k: int = 4,
+    #     fetch_k: int = 20,
+    #     lambda_mult: float = 0.5,
+    #     **kwargs: Any,
+    # ) -> List[Document]:
+    #     raise NotImplementedError

langchain_githubcopilot_chat-0.1.0.dist-info/LICENSE ADDED Viewed

@@ -0,0 +1,21 @@
+MIT License
+Copyright (c) 2024 LangChain, Inc.
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

langchain_githubcopilot_chat-0.1.0.dist-info/METADATA ADDED Viewed

@@ -0,0 +1,70 @@
+Metadata-Version: 2.1
+Name: langchain-githubcopilot-chat
+Version: 0.1.0
+Summary: An integration package connecting GithubcopilotChat and LangChain
+Home-page: https://github.com/langchain-ai/langchain
+License: MIT
+Author: YIhan Wu
+Author-email: iumm@ibat.ac.cn
+Requires-Python: >=3.9,<4.0
+Classifier: License :: OSI Approved :: MIT License
+Classifier: Programming Language :: Python :: 3
+Classifier: Programming Language :: Python :: 3.9
+Classifier: Programming Language :: Python :: 3.10
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Programming Language :: Python :: 3.13
+Requires-Dist: httpx (>=0.24.0)
+Requires-Dist: langchain-core (>=0.3.15,<0.4.0)
+Project-URL: Repository, https://github.com/langchain-ai/langchain
+Project-URL: Release Notes, https://github.com/langchain-ai/langchain/releases?q=tag%3A%22githubcopilot-chat%3D%3D0%22&expanded=true
+Project-URL: Source Code, https://github.com/langchain-ai/langchain/tree/master/libs/partners/githubcopilot-chat
+Description-Content-Type: text/markdown
+# langchain-githubcopilot-chat
+This package contains the LangChain integration with GithubcopilotChat.
+## Installation
+```bash
+pip install -U langchain-githubcopilot-chat
+```
+Configure credentials by setting the following environment variables:
+* TODO: fill this out
+## Chat Models
+`ChatGithubcopilotChat` class exposes chat models from GithubcopilotChat.
+```python
+from langchain_githubcopilot_chat import ChatGithubcopilotChat
+llm = ChatGithubcopilotChat()
+llm.invoke("Sing a ballad of LangChain.")
+```
+## Embeddings
+`GithubcopilotChatEmbeddings` class exposes embeddings from GithubcopilotChat.
+```python
+from langchain_githubcopilot_chat import GithubcopilotChatEmbeddings
+embeddings = GithubcopilotChatEmbeddings()
+embeddings.embed_query("What is the meaning of life?")
+```
+## LLMs
+`GithubcopilotChatLLM` class exposes LLMs from GithubcopilotChat.
+```python
+from langchain_githubcopilot_chat import GithubcopilotChatLLM
+llm = GithubcopilotChatLLM()
+llm.invoke("The meaning of life is")
+```

langchain_githubcopilot_chat-0.1.0.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,13 @@
+langchain_githubcopilot_chat/__init__.py,sha256=0gzCpfEQave85jhRxL_2jt5FSH3cnc5x-KF74BDDgLk,1162
+langchain_githubcopilot_chat/chat_models.py,sha256=q9-oIM7HbnzBrZiAVVn1bKvez7-HrxJ0CFAbHLqvcCE,33756
+langchain_githubcopilot_chat/document_loaders.py,sha256=40HublhiKiwqx_nA8kfpMgYlvVOoVUx_IJAYJz64nnQ,2257
+langchain_githubcopilot_chat/embeddings.py,sha256=rnkeKHQn92brG0g_9PD0gF8km6pifJ22GheuSswftAQ,2732
+langchain_githubcopilot_chat/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+langchain_githubcopilot_chat/retrievers.py,sha256=ZjLO6AwcxfHmdTxWxKYJ2Xo2TjJWn9CS6zG7m6dRLMw,3104
+langchain_githubcopilot_chat/toolkits.py,sha256=J-NwHAZ-h2iFBpgPuMKrvatSYXXcIhOEptgz_2NefiM,1993
+langchain_githubcopilot_chat/tools.py,sha256=WwxpkhycsmlP1mczjyKT3H4-IuvLODr5aeGjMFIh7N8,2774
+langchain_githubcopilot_chat/vectorstores.py,sha256=Iu10f1mLH8kQEFuRM0h5ZenI18wZ5oUD8LVRWMREvw4,14305
+langchain_githubcopilot_chat-0.1.0.dist-info/LICENSE,sha256=2btS8uNUDWD_UNjw9ba6ZJt_00aUjEw9CGyK-xIHY8c,1072
+langchain_githubcopilot_chat-0.1.0.dist-info/METADATA,sha256=mRCtxGBbbWWvnCkskhLTURRIqWOdydVv7L--klNV_HU,2102
+langchain_githubcopilot_chat-0.1.0.dist-info/WHEEL,sha256=Nq82e9rUAnEjt98J6MlVmMCZb-t9cYE2Ir1kpBmnWfs,88
+langchain_githubcopilot_chat-0.1.0.dist-info/RECORD,,

langchain_githubcopilot_chat-0.1.0.dist-info/WHEEL ADDED Viewed

@@ -0,0 +1,4 @@
+Wheel-Version: 1.0
+Generator: poetry-core 1.9.1
+Root-Is-Purelib: true
+Tag: py3-none-any