PyPI - langchain-githubcopilot-chat - Versions diffs - 0.1.0__tar.gz → 0.1.2__tar.gz - Mend

langchain-githubcopilot-chat 0.1.0tar.gz → 0.1.2tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (14) hide show

{langchain_githubcopilot_chat-0.1.0 → langchain_githubcopilot_chat-0.1.2}/PKG-INFO RENAMED Viewed

@@ -1,21 +1,20 @@
 Metadata-Version: 2.1
 Name: langchain-githubcopilot-chat
-Version: 0.1.0
+Version: 0.1.2
 Summary: An integration package connecting GithubcopilotChat and LangChain
 Home-page: https://github.com/langchain-ai/langchain
 License: MIT
 Author: YIhan Wu
 Author-email: iumm@ibat.ac.cn
-Requires-Python: >=3.9,<4.0
+Requires-Python: >=3.10,<4.0
 Classifier: License :: OSI Approved :: MIT License
 Classifier: Programming Language :: Python :: 3
-Classifier: Programming Language :: Python :: 3.9
 Classifier: Programming Language :: Python :: 3.10
 Classifier: Programming Language :: Python :: 3.11
 Classifier: Programming Language :: Python :: 3.12
 Classifier: Programming Language :: Python :: 3.13
-Requires-Dist: httpx (>=0.24.0)
-Requires-Dist: langchain-core (>=0.3.15,<0.4.0)
+Requires-Dist: httpx (>=0.28.1)
+Requires-Dist: langchain-core (>=1.1.0,<2.0.0)
 Project-URL: Repository, https://github.com/langchain-ai/langchain
 Project-URL: Release Notes, https://github.com/langchain-ai/langchain/releases?q=tag%3A%22githubcopilot-chat%3D%3D0%22&expanded=true
 Project-URL: Source Code, https://github.com/langchain-ai/langchain/tree/master/libs/partners/githubcopilot-chat

{langchain_githubcopilot_chat-0.1.0 → langchain_githubcopilot_chat-0.1.2}/langchain_githubcopilot_chat/chat_models.py RENAMED Viewed

@@ -444,6 +444,11 @@ class ChatGithubCopilot(BaseChatModel):
     max_retries: int = 2
     """Number of automatic retries on transient errors."""
+    # ------------------------------------------------------------------
+    # Pydantic v2 config — allow the ``model`` alias on construction
+    # ------------------------------------------------------------------
+    model_config = {"populate_by_name": True}
     # ------------------------------------------------------------------
     # Validators / setup
     # ------------------------------------------------------------------

langchain_githubcopilot_chat-0.1.2/langchain_githubcopilot_chat/embeddings.py ADDED Viewed

@@ -0,0 +1,321 @@
+"""GitHub Copilot Chat embeddings integration via GitHub Models Embeddings API."""
+from __future__ import annotations
+import os
+from typing import Any, Dict, List, Optional, Union
+import httpx
+from langchain_core.embeddings import Embeddings
+from pydantic import BaseModel, Field, SecretStr, model_validator
+_GITHUB_MODELS_BASE_URL = "https://models.github.ai"  # default for ``base_url``
+_EMBEDDINGS_PATH = "/inference/embeddings"  # path used when ``org`` is not set
+_ORG_EMBEDDINGS_PATH = "/orgs/{org}/inference/embeddings"  # ``{org}`` <- ``org``
+_API_VERSION = "2026-03-10"  # default ``X-GitHub-Api-Version`` header value
+class GithubcopilotChatEmbeddings(BaseModel, Embeddings):
+    """GitHub Copilot Chat embedding model integration via the GitHub Models API.
+    GitHub Models provides access to embedding models (e.g. OpenAI
+    ``text-embedding-3-small``, ``text-embedding-3-large``) through a unified
+    OpenAI-compatible REST API.  This class wraps the ``/inference/embeddings``
+    endpoint so that any embedding model available in the GitHub Models catalog
+    can be used as a drop-in LangChain ``Embeddings`` implementation.
+    Setup:
+        Install ``langchain-githubcopilot-chat`` and set the
+        ``GITHUB_TOKEN`` environment variable (a classic or fine-grained PAT
+        with the ``models: read`` scope, or a GitHub Copilot subscription token).
+        .. code-block:: bash
+            pip install -U langchain-githubcopilot-chat
+            export GITHUB_TOKEN="github_pat_..."
+    Key init args:
+        model: str
+            Model ID in the ``{publisher}/{model_name}`` format, e.g.
+            ``"openai/text-embedding-3-small"``.
+        github_token: Optional[SecretStr]
+            GitHub token.  Falls back to ``GITHUB_TOKEN`` env var.
+        base_url: str
+            Base URL of the GitHub Models API.
+            Defaults to ``"https://models.github.ai"``.
+        org: Optional[str]
+            Organisation login.  When set, requests are attributed to that org.
+        api_version: str
+            GitHub Models REST API version header value.
+            Defaults to ``"2026-03-10"``.
+        dimensions: Optional[int]
+            The number of dimensions for the output embeddings.  Only supported
+            by ``text-embedding-3`` and later models.
+        encoding_format: str
+            The format to return embeddings in.  Either ``"float"`` (default)
+            or ``"base64"``.
+        timeout: Optional[float]
+            HTTP request timeout in seconds.
+        max_retries: int
+            Number of automatic retries on transient errors (default ``2``).
+    Instantiate:
+        .. code-block:: python
+            from langchain_githubcopilot_chat import GithubcopilotChatEmbeddings
+            embed = GithubcopilotChatEmbeddings(
+                model="openai/text-embedding-3-small",
+                # github_token="github_pat_...",  # or set GITHUB_TOKEN env var
+            )
+    Embed single text:
+        .. code-block:: python
+            vector = embed.embed_query("What is the meaning of life?")
+            print(len(vector))   # e.g. 1536
+    Embed multiple texts:
+        .. code-block:: python
+            vectors = embed.embed_documents(
+                ["Document one.", "Document two."]
+            )
+            print(len(vectors), len(vectors[0]))
+    Async:
+        .. code-block:: python
+            vector = await embed.aembed_query("What is the meaning of life?")
+            vectors = await embed.aembed_documents(
+                ["Document one.", "Document two."]
+            )
+    """
+    model_config = {"populate_by_name": True}
+    model_name: str = Field(alias="model")
+    """Embedding model ID in the ``{publisher}/{model_name}`` format.
+    Examples: ``"openai/text-embedding-3-small"``,
+    ``"openai/text-embedding-3-large"``.
+    """
+    github_token: Optional[SecretStr] = Field(default=None)
+    """GitHub token with ``models: read`` scope.
+    If not provided, the value of the ``GITHUB_TOKEN`` environment variable
+    is used.
+    """
+    base_url: str = _GITHUB_MODELS_BASE_URL
+    """Base URL for the GitHub Models REST API."""
+    org: Optional[str] = None
+    """Organisation login for attributed inference requests.
+    When set, requests are sent to
+    ``/orgs/{org}/inference/embeddings`` instead of ``/inference/embeddings``.
+    """
+    api_version: str = _API_VERSION
+    """GitHub Models API version sent as the ``X-GitHub-Api-Version`` header."""
+    dimensions: Optional[int] = None
+    """Number of output embedding dimensions.
+    Only supported by ``text-embedding-3`` and later models.
+    """
+    encoding_format: str = "float"
+    """Format of the returned embeddings.  Either ``"float"`` or ``"base64"``."""
+    timeout: Optional[float] = None
+    """HTTP request timeout in seconds."""
+    max_retries: int = 2
+    """Number of automatic retries on transient errors."""
+    # ------------------------------------------------------------------
+    # Validators / setup
+    # ------------------------------------------------------------------
+    @model_validator(mode="before")
+    @classmethod
+    def _resolve_token(cls, values: Dict[str, Any]) -> Dict[str, Any]:
+        """Resolve the GitHub token from the environment if not supplied."""
+        token = values.get("github_token") or values.get("api_key")
+        if not token:
+            token = os.environ.get("GITHUB_TOKEN")
+            if token:
+                values["github_token"] = token
+        return values
+    # ------------------------------------------------------------------
+    # Internal helpers
+    # ------------------------------------------------------------------
+    @property
+    def _token(self) -> str:
+        """Return the raw GitHub token string."""
+        if self.github_token:
+            return self.github_token.get_secret_value()
+        env_token = os.environ.get("GITHUB_TOKEN", "")
+        if not env_token:
+            raise ValueError(
+                "A GitHub token is required.  Set the GITHUB_TOKEN environment "
+                "variable or pass ``github_token`` when instantiating "
+                "GithubcopilotChatEmbeddings."
+            )
+        return env_token
+    @property
+    def _embeddings_url(self) -> str:
+        """Return the full embeddings endpoint URL."""
+        if self.org:
+            path = _ORG_EMBEDDINGS_PATH.format(org=self.org)
+        else:
+            path = _EMBEDDINGS_PATH
+        return self.base_url.rstrip("/") + path
+    def _build_headers(self) -> Dict[str, str]:
+        return {
+            "Authorization": f"Bearer {self._token}",
+            "Accept": "application/vnd.github+json",
+            "Content-Type": "application/json",
+            "X-GitHub-Api-Version": self.api_version,
+        }
+    def _build_payload(self, input: Union[str, List[str]]) -> Dict[str, Any]:
+        """Assemble the JSON body for the embeddings API."""
+        payload: Dict[str, Any] = {
+            "model": self.model_name,
+            "input": input,
+            "encoding_format": self.encoding_format,
+        }
+        if self.dimensions is not None:
+            payload["dimensions"] = self.dimensions
+        return payload
+    def _do_request(self, payload: Dict[str, Any]) -> Dict[str, Any]:
+        """Perform a synchronous HTTP POST with retries."""
+        headers = self._build_headers()
+        last_exc: Optional[Exception] = None
+        for attempt in range(self.max_retries + 1):
+            try:
+                response = httpx.post(
+                    self._embeddings_url,
+                    headers=headers,
+                    json=payload,
+                    timeout=self.timeout,
+                )
+                response.raise_for_status()
+                return response.json()
+            except (httpx.TimeoutException, httpx.TransportError) as exc:
+                last_exc = exc
+                if attempt == self.max_retries:
+                    raise
+            except httpx.HTTPStatusError as exc:
+                if exc.response.status_code < 500:
+                    raise
+                last_exc = exc
+                if attempt == self.max_retries:
+                    raise
+        raise RuntimeError("Unexpected retry loop exit") from last_exc
+    async def _do_request_async(self, payload: Dict[str, Any]) -> Dict[str, Any]:
+        """Perform an asynchronous HTTP POST with retries."""
+        headers = self._build_headers()
+        last_exc: Optional[Exception] = None
+        async with httpx.AsyncClient(timeout=self.timeout) as client:
+            for attempt in range(self.max_retries + 1):
+                try:
+                    response = await client.post(
+                        self._embeddings_url,
+                        headers=headers,
+                        json=payload,
+                    )
+                    response.raise_for_status()
+                    return response.json()
+                except (httpx.TimeoutException, httpx.TransportError) as exc:
+                    last_exc = exc
+                    if attempt == self.max_retries:
+                        raise
+                except httpx.HTTPStatusError as exc:
+                    if exc.response.status_code < 500:
+                        raise
+                    last_exc = exc
+                    if attempt == self.max_retries:
+                        raise
+        raise RuntimeError("Unexpected retry loop exit") from last_exc
+    @staticmethod
+    def _extract_embeddings(response_data: Dict[str, Any]) -> List[List[float]]:
+        """Extract the list of embedding vectors from an API response."""
+        data = response_data.get("data", [])
+        if not data:
+            raise ValueError(
+                f"GitHub Models Embeddings API returned no data. "
+                f"Response: {response_data}"
+            )
+        # Sort by index to preserve input order (the API may reorder items)
+        sorted_data = sorted(data, key=lambda x: x.get("index", 0))
+        return [item["embedding"] for item in sorted_data]
+    # ------------------------------------------------------------------
+    # LangChain Embeddings interface
+    # ------------------------------------------------------------------
+    def embed_documents(self, texts: List[str]) -> List[List[float]]:
+        """Embed a list of documents using the GitHub Models Embeddings API.
+        Args:
+            texts: The list of texts to embed.
+        Returns:
+            A list of embedding vectors, one per input text.
+        """
+        if not texts:
+            return []
+        payload = self._build_payload(texts)
+        response_data = self._do_request(payload)
+        return self._extract_embeddings(response_data)
+    def embed_query(self, text: str) -> List[float]:
+        """Embed a single query text using the GitHub Models Embeddings API.
+        Args:
+            text: The text to embed.
+        Returns:
+            An embedding vector.
+        """
+        return self.embed_documents([text])[0]
+    async def aembed_documents(self, texts: List[str]) -> List[List[float]]:
+        """Asynchronously embed a list of documents.
+        Args:
+            texts: The list of texts to embed.
+        Returns:
+            A list of embedding vectors, one per input text.
+        """
+        if not texts:
+            return []
+        payload = self._build_payload(texts)
+        response_data = await self._do_request_async(payload)
+        return self._extract_embeddings(response_data)
+    async def aembed_query(self, text: str) -> List[float]:
+        """Asynchronously embed a single query text.
+        Args:
+            text: The text to embed.
+        Returns:
+            An embedding vector.
+        """
+        results = await self.aembed_documents([text])
+        return results[0]

{langchain_githubcopilot_chat-0.1.0 → langchain_githubcopilot_chat-0.1.2}/pyproject.toml RENAMED Viewed

@@ -4,7 +4,7 @@ build-backend = "poetry.core.masonry.api"
 [tool.poetry]
 name = "langchain-githubcopilot-chat"
-version = "0.1.0"
+version = "0.1.2"
 description = "An integration package connecting GithubcopilotChat and LangChain"
 authors = ["YIhan Wu <iumm@ibat.ac.cn>"]
 readme = "README.md"
@@ -19,9 +19,9 @@ disallow_untyped_defs = "True"
 "Release Notes" = "https://github.com/langchain-ai/langchain/releases?q=tag%3A%22githubcopilot-chat%3D%3D0%22&expanded=true"
 [tool.poetry.dependencies]
-python = ">=3.9,<4.0"
-langchain-core = "^0.3.15"
-httpx = ">=0.24.0"
+python = ">=3.10,<4.0"
+langchain-core = ">=1.1.0,<2.0.0"
+httpx = ">=0.28.1"
 [tool.ruff.lint]
 select = ["E", "F", "I", "T201"]
@@ -59,7 +59,7 @@ pytest = "^7.4.3"
 pytest-asyncio = "^0.23.2"
 pytest-socket = "^0.7.0"
 pytest-watcher = "^0.3.4"
-langchain-tests = "^0.3.5"
+langchain-tests = "^1.1.5"
 [tool.poetry.group.codespell.dependencies]
 codespell = "^2.2.6"

langchain_githubcopilot_chat-0.1.0/langchain_githubcopilot_chat/embeddings.py DELETED Viewed

@@ -1,96 +0,0 @@
-from typing import List
-from langchain_core.embeddings import Embeddings
-class GithubcopilotChatEmbeddings(Embeddings):
-    """GithubcopilotChat embedding model integration.
-    # TODO: Replace with relevant packages, env vars.
-    Setup:
-        Install ``langchain-githubcopilot-chat`` and set environment variable
-        ``GITHUBCOPILOTCHAT_API_KEY``.
-        .. code-block:: bash
-            pip install -U langchain-githubcopilot-chat
-            export GITHUBCOPILOTCHAT_API_KEY="your-api-key"
-    # TODO: Populate with relevant params.
-    Key init args — completion params:
-        model: str
-            Name of GithubcopilotChat model to use.
-    See full list of supported init args and their descriptions in the params section.
-    # TODO: Replace with relevant init params.
-    Instantiate:
-        .. code-block:: python
-            from langchain_githubcopilot_chat import GithubcopilotChatEmbeddings
-            embed = GithubcopilotChatEmbeddings(
-                model="...",
-                # api_key="...",
-                # other params...
-            )
-    Embed single text:
-        .. code-block:: python
-            input_text = "The meaning of life is 42"
-            embed.embed_query(input_text)
-        .. code-block:: python
-            # TODO: Example output.
-    # TODO: Delete if token-level streaming isn't supported.
-    Embed multiple text:
-        .. code-block:: python
-             input_texts = ["Document 1...", "Document 2..."]
-            embed.embed_documents(input_texts)
-        .. code-block:: python
-            # TODO: Example output.
-    # TODO: Delete if native async isn't supported.
-    Async:
-        .. code-block:: python
-            await embed.aembed_query(input_text)
-            # multiple:
-            # await embed.aembed_documents(input_texts)
-        .. code-block:: python
-            # TODO: Example output.
-    """
-    def __init__(self, model: str):
-        self.model = model
-    def embed_documents(self, texts: List[str]) -> List[List[float]]:
-        """Embed search docs."""
-        return [[0.5, 0.6, 0.7] for _ in texts]
-    def embed_query(self, text: str) -> List[float]:
-        """Embed query text."""
-        return self.embed_documents([text])[0]
-    # optional: add custom async implementations here
-    # you can also delete these, and the base class will
-    # use the default implementation, which calls the sync
-    # version in an async executor:
-    # async def aembed_documents(self, texts: List[str]) -> List[List[float]]:
-    #     """Asynchronous Embed search docs."""
-    #     ...
-    # async def aembed_query(self, text: str) -> List[float]:
-    #     """Asynchronous Embed query text."""
-    #     ...