langchain-githubcopilot-chat 0.1.0__py3-none-any.whl

@@ -0,0 +1,923 @@
+ """GitHub Copilot Chat model integration via GitHub Models inference API."""
+
+ from __future__ import annotations
+
+ import json
+ import os
+ from typing import (
+     Any,
+     AsyncIterator,
+     Dict,
+     Iterator,
+     List,
+     Optional,
+     Sequence,
+     Tuple,
+     Type,
+     Union,
+ )
+
+ import httpx
+ from langchain_core.callbacks import (
+     AsyncCallbackManagerForLLMRun,
+     CallbackManagerForLLMRun,
+ )
+ from langchain_core.language_models import BaseChatModel
+ from langchain_core.language_models.base import LangSmithParams
+ from langchain_core.messages import (
+     AIMessage,
+     AIMessageChunk,
+     BaseMessage,
+     ChatMessage,
+     HumanMessage,
+     SystemMessage,
+     ToolMessage,
+ )
+ from langchain_core.messages.ai import UsageMetadata
+ from langchain_core.messages.tool import tool_call_chunk as create_tool_call_chunk
+ from langchain_core.output_parsers.openai_tools import (
+     make_invalid_tool_call,
+     parse_tool_call,
+ )
+ from langchain_core.outputs import ChatGeneration, ChatGenerationChunk, ChatResult
+ from langchain_core.tools import BaseTool
+ from langchain_core.utils.function_calling import convert_to_openai_tool
+ from pydantic import Field, SecretStr, model_validator
+
+ # ---------------------------------------------------------------------------
+ # Helpers
+ # ---------------------------------------------------------------------------
+
+ _ROLE_MAP = {
+     "human": "user",
+     "ai": "assistant",
+     "system": "system",
+     "developer": "developer",
+     "tool": "tool",
+ }
+
+ _GITHUB_MODELS_BASE_URL = "https://models.github.ai"
+ _INFERENCE_PATH = "/inference/chat/completions"
+ _ORG_INFERENCE_PATH = "/orgs/{org}/inference/chat/completions"
+ _API_VERSION = "2026-03-10"
+
+
+ def _message_to_dict(message: BaseMessage) -> Dict[str, Any]:
+     """Convert a LangChain message to the GitHub Models API message format."""
+     if isinstance(message, SystemMessage):
+         return {"role": "system", "content": message.content}
+     elif isinstance(message, HumanMessage):
+         # Support multimodal content (list of content blocks)
+         if isinstance(message.content, list):
+             parts = []
+             for block in message.content:
+                 if isinstance(block, dict):
+                     btype = block.get("type", "")
+                     if btype == "text":
+                         parts.append({"type": "text", "text": block["text"]})
+                     elif btype == "image_url":
+                         parts.append(
+                             {
+                                 "type": "image_url",
+                                 "image_url": block.get("image_url", {}),
+                             }
+                         )
+                     else:
+                         parts.append(block)
+                 else:
+                     parts.append({"type": "text", "text": str(block)})
+             return {"role": "user", "content": parts}
+         return {"role": "user", "content": message.content}
+     elif isinstance(message, AIMessage):
+         msg: Dict[str, Any] = {"role": "assistant", "content": message.content or ""}
+         # Attach tool calls if present
+         if message.tool_calls:
+             msg["tool_calls"] = [
+                 {
+                     "id": tc["id"],
+                     "type": "function",
+                     "function": {
+                         "name": tc["name"],
+                         "arguments": json.dumps(tc["args"]),
+                     },
+                 }
+                 for tc in message.tool_calls
+             ]
+         elif message.additional_kwargs.get("tool_calls"):
+             msg["tool_calls"] = message.additional_kwargs["tool_calls"]
+         return msg
+     elif isinstance(message, ToolMessage):
+         return {
+             "role": "tool",
+             "tool_call_id": message.tool_call_id,
+             "content": message.content,
+         }
+     elif isinstance(message, ChatMessage):
+         role = _ROLE_MAP.get(message.role, message.role)
+         return {"role": role, "content": message.content}
+     else:
+         # Fallback: treat as user message
+         return {"role": "user", "content": str(message.content)}
+
+
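+ # Editorial sketch (not part of the released wheel): the mapping performed by
+ # ``_message_to_dict`` on a minimal exchange, using nothing beyond this
+ # module's imports. A ToolMessage keeps its ``tool_call_id`` so the API can
+ # pair a tool result with the call that produced it.
+ def _example_message_mapping() -> List[Dict[str, Any]]:
+     """Illustrative only; never called by this module."""
+     return [
+         _message_to_dict(SystemMessage(content="Be terse.")),
+         # -> {"role": "system", "content": "Be terse."}
+         _message_to_dict(HumanMessage(content="hi")),
+         # -> {"role": "user", "content": "hi"}
+         _message_to_dict(ToolMessage(content="42", tool_call_id="call_1")),
+         # -> {"role": "tool", "tool_call_id": "call_1", "content": "42"}
+     ]
+
+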
+ def _format_tools_for_api(
+     tools: Sequence[Union[Dict[str, Any], BaseTool, Type]],
+ ) -> List[Dict[str, Any]]:
+     """Convert LangChain tools into the OpenAI-compatible format
+     expected by GitHub Models.
+     """
+     formatted = []
+     for tool in tools:
+         if isinstance(tool, dict) and tool.get("type") == "function":
+             formatted.append(tool)
+         else:
+             oai_tool = convert_to_openai_tool(tool)  # type: ignore[arg-type]
+             formatted.append(oai_tool)
+     return formatted
+
+
+ def _parse_tool_calls(
+     raw_tool_calls: List[Dict[str, Any]],
+ ) -> Tuple[List[Dict[str, Any]], List[Dict[str, Any]]]:
+     """Parse raw API tool_calls into LangChain (valid, invalid) tool calls.
+
+     Valid calls are returned in LangChain ``tool_calls`` format. Calls whose
+     arguments fail to parse are returned separately so they can be attached
+     to ``AIMessage.invalid_tool_calls`` rather than being mixed in with the
+     valid ones.
+     """
+     tool_calls: List[Dict[str, Any]] = []
+     invalid_tool_calls: List[Dict[str, Any]] = []
+     for raw in raw_tool_calls:
+         try:
+             parsed = parse_tool_call(raw, return_id=True)
+             if parsed is not None:
+                 tool_calls.append(parsed)
+         except Exception as exc:
+             invalid = make_invalid_tool_call(raw, str(exc))
+             invalid_tool_calls.append(dict(invalid))
+     return tool_calls, invalid_tool_calls
+
+
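+ # Editorial sketch (not part of the released wheel): what
+ # ``_format_tools_for_api`` emits for a Pydantic tool. The exact JSON schema
+ # is produced by ``convert_to_openai_tool``; ``GetWeather`` is an
+ # illustrative name.
+ def _example_tool_format() -> List[Dict[str, Any]]:
+     from pydantic import BaseModel
+
+     class GetWeather(BaseModel):
+         """Get the current weather in a given location."""
+
+         location: str
+
+     return _format_tools_for_api([GetWeather])
+     # -> [{"type": "function",
+     #      "function": {"name": "GetWeather",
+     #                   "description": "Get the current weather in a given location.",
+     #                   "parameters": {"properties": {"location": {...}}, ...}}}]
+
+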
+ # The GitHub Models API only accepts "auto", "required", or "none" as string
+ # tool_choice values. LangChain internally uses "any" (equivalent to
+ # "required"), and forcing a specific tool uses the dict form
+ # {"type": "function", "function": {"name": "..."}}.
+ _TOOL_CHOICE_MAP: Dict[str, str] = {
+     "any": "required",
+ }
+
+
+ def _normalize_tool_choice(
+     tool_choice: Any,
+ ) -> Union[str, Dict[str, Any]]:
+     """Normalise a tool_choice value for the GitHub Models API.
+
+     - ``"any"`` → ``"required"`` (LangChain internal alias)
+     - ``"auto"`` / ``"required"`` / ``"none"`` → passed through unchanged
+     - any other string is treated as a tool name and wrapped as
+       ``{"type": "function", "function": {"name": ...}}``, the form the API
+       accepts for forcing a specific function
+     - dict values are passed through unchanged
+     """
+     if isinstance(tool_choice, str):
+         choice = _TOOL_CHOICE_MAP.get(tool_choice, tool_choice)
+         if choice not in ("auto", "required", "none"):
+             # Bare tool name: wrap it in the dict form the API expects.
+             return {"type": "function", "function": {"name": choice}}
+         return choice
+     # dict form — pass through unchanged
+     return tool_choice
+
+
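+ # Editorial sketch (not part of the released wheel): the three input shapes
+ # that ``_normalize_tool_choice`` handles; ``GetWeather`` is illustrative.
+ def _example_tool_choice_normalization() -> None:
+     assert _normalize_tool_choice("any") == "required"
+     assert _normalize_tool_choice("auto") == "auto"
+     assert _normalize_tool_choice("GetWeather") == {
+         "type": "function",
+         "function": {"name": "GetWeather"},
+     }
+
+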
+ def _build_ai_message(
+     choice: Dict[str, Any], usage: Optional[Dict[str, Any]]
+ ) -> AIMessage:
+     """Build an AIMessage from a single API response choice."""
+     msg = choice.get("message", {})
+     content: Union[str, List] = msg.get("content") or ""
+     finish_reason = choice.get("finish_reason", "")
+
+     additional_kwargs: Dict[str, Any] = {}
+     tool_calls: List[Dict[str, Any]] = []
+     invalid_tool_calls: List[Dict[str, Any]] = []
+     raw_tool_calls = msg.get("tool_calls", [])
+     if raw_tool_calls:
+         additional_kwargs["tool_calls"] = raw_tool_calls
+         tool_calls, invalid_tool_calls = _parse_tool_calls(raw_tool_calls)
+
+     usage_metadata: Optional[UsageMetadata] = None
+     if usage:
+         usage_metadata = UsageMetadata(
+             input_tokens=usage.get("prompt_tokens", 0),
+             output_tokens=usage.get("completion_tokens", 0),
+             total_tokens=usage.get("total_tokens", 0),
+         )
+
+     response_metadata: Dict[str, Any] = {
+         "finish_reason": finish_reason,
+     }
+     if usage:
+         response_metadata["usage"] = usage
+
+     return AIMessage(
+         content=content,
+         additional_kwargs=additional_kwargs,
+         tool_calls=tool_calls,
+         invalid_tool_calls=invalid_tool_calls,
+         response_metadata=response_metadata,
+         usage_metadata=usage_metadata,
+     )
+
+
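+ # Editorial sketch (not part of the released wheel): assembling an AIMessage
+ # from a hand-written response choice, assuming only this module's imports.
+ def _example_build_ai_message() -> AIMessage:
+     choice = {
+         "message": {"role": "assistant", "content": "Hello!"},
+         "finish_reason": "stop",
+     }
+     usage = {"prompt_tokens": 5, "completion_tokens": 2, "total_tokens": 7}
+     msg = _build_ai_message(choice, usage)
+     # msg.content == "Hello!" and msg.usage_metadata["total_tokens"] == 7
+     return msg
+
+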
+ # ---------------------------------------------------------------------------
+ # Main class
+ # ---------------------------------------------------------------------------
+
+
+ class ChatGithubCopilot(BaseChatModel):
+     """GitHub Copilot Chat model integration via the GitHub Models inference API.
+
+     GitHub Models provides access to top AI models (OpenAI GPT-4.1, DeepSeek,
+     Llama, and more) through a unified OpenAI-compatible REST API. This class
+     wraps that API so that every model available in the GitHub Models catalog
+     can be used as a drop-in LangChain ``BaseChatModel``.
+
+     Setup:
+         Install ``langchain-githubcopilot-chat`` and set the
+         ``GITHUB_TOKEN`` environment variable (a classic or fine-grained PAT
+         with the ``models: read`` scope, or a GitHub Copilot subscription
+         token).
+
+         .. code-block:: bash
+
+             pip install -U langchain-githubcopilot-chat
+             export GITHUB_TOKEN="github_pat_..."
+
+     Key init args — completion params:
+         model: str
+             Model ID in the ``{publisher}/{model_name}`` format, e.g.
+             ``"openai/gpt-4.1"`` or ``"meta/llama-3.3-70b-instruct"``.
+         temperature: Optional[float]
+             Sampling temperature in ``[0, 1]``. Higher → more creative.
+         max_tokens: Optional[int]
+             Maximum number of tokens to generate.
+         top_p: Optional[float]
+             Nucleus sampling probability mass in ``[0, 1]``.
+         stop: Optional[List[str]]
+             Stop sequences.
+         frequency_penalty: Optional[float]
+             Frequency penalty in ``[-2, 2]``.
+         presence_penalty: Optional[float]
+             Presence penalty in ``[-2, 2]``.
+         seed: Optional[int]
+             Random seed for deterministic sampling (best-effort).
+
+     Key init args — client params:
+         github_token: Optional[SecretStr]
+             GitHub token. Falls back to ``GITHUB_TOKEN`` env var.
+         base_url: str
+             Base URL of the GitHub Models API.
+             Defaults to ``"https://models.github.ai"``.
+         org: Optional[str]
+             Organisation login. When set, every request is attributed to that
+             org (uses the ``/orgs/{org}/inference/chat/completions`` endpoint).
+         api_version: str
+             GitHub Models REST API version header value.
+             Defaults to ``"2026-03-10"``.
+         timeout: Optional[float]
+             HTTP request timeout in seconds.
+         max_retries: int
+             Number of automatic retries on transient errors (default ``2``).
+
+     Instantiate:
+         .. code-block:: python
+
+             from langchain_githubcopilot_chat import ChatGithubCopilot
+
+             llm = ChatGithubCopilot(
+                 model="openai/gpt-4.1",
+                 temperature=0,
+                 max_tokens=1024,
+                 # github_token="github_pat_...",  # or set GITHUB_TOKEN env var
+             )
+
+     Invoke:
+         .. code-block:: python
+
+             messages = [
+                 ("system", "You are a helpful translator. Translate to French."),
+                 ("human", "I love programming."),
+             ]
+             ai_msg = llm.invoke(messages)
+             print(ai_msg.content)
+             # "J'adore la programmation."
+
+     Stream:
+         .. code-block:: python
+
+             for chunk in llm.stream(messages):
+                 print(chunk.content, end="", flush=True)
+
+     Async:
+         .. code-block:: python
+
+             ai_msg = await llm.ainvoke(messages)
+
+             async for chunk in llm.astream(messages):
+                 print(chunk.content, end="", flush=True)
+
+     Tool calling:
+         .. code-block:: python
+
+             from pydantic import BaseModel, Field
+
+             class GetWeather(BaseModel):
+                 '''Get the current weather in a given location.'''
+                 location: str = Field(
+                     ..., description="City and state, e.g. Paris, France"
+                 )
+
+             llm_with_tools = llm.bind_tools([GetWeather])
+             ai_msg = llm_with_tools.invoke("What is the weather like in Paris?")
+             print(ai_msg.tool_calls)
+             # [{'name': 'GetWeather', 'args': {'location': 'Paris, France'},
+             #   'id': '...'}]
+
+     Structured output:
+         .. code-block:: python
+
+             from typing import Optional
+             from pydantic import BaseModel, Field
+
+             class Joke(BaseModel):
+                 '''Joke to tell user.'''
+                 setup: str = Field(description="The setup of the joke")
+                 punchline: str = Field(description="The punchline to the joke")
+                 rating: Optional[int] = Field(description="Funniness rating 1-10")
+
+             structured_llm = llm.with_structured_output(Joke)
+             structured_llm.invoke("Tell me a joke about cats")
+
+     JSON mode:
+         .. code-block:: python
+
+             json_llm = llm.bind(response_format={"type": "json_object"})
+             ai_msg = json_llm.invoke(
+                 "Return a JSON object with key 'numbers' and a list of 5 random ints."
+             )
+             print(ai_msg.content)
+
+     Image input:
+         .. code-block:: python
+
+             import base64, httpx
+             from langchain_core.messages import HumanMessage
+
+             image_url = "https://upload.wikimedia.org/wikipedia/commons/thumb/d/dd/Gfp-wisconsin-madison-the-nature-boardwalk.jpg/2560px-Gfp-wisconsin-madison-the-nature-boardwalk.jpg"
+             image_data = base64.b64encode(httpx.get(image_url).content).decode("utf-8")
+             message = HumanMessage(
+                 content=[
+                     {"type": "text", "text": "Describe the weather in this image."},
+                     {
+                         "type": "image_url",
+                         "image_url": {"url": f"data:image/jpeg;base64,{image_data}"},
+                     },
+                 ]
+             )
+             ai_msg = llm.invoke([message])
+             print(ai_msg.content)
+
+     Token usage:
+         .. code-block:: python
+
+             ai_msg = llm.invoke(messages)
+             print(ai_msg.usage_metadata)
+             # {'input_tokens': 28, 'output_tokens': 18, 'total_tokens': 46}
+
+     Response metadata:
+         .. code-block:: python
+
+             ai_msg = llm.invoke(messages)
+             print(ai_msg.response_metadata)
+             # {'finish_reason': 'stop', 'usage': {'prompt_tokens': 28, ...}}
+     """
+
+     # ------------------------------------------------------------------
+     # Fields
+     # ------------------------------------------------------------------
+
+     model_name: str = Field(alias="model")
+     """Model ID in the ``{publisher}/{model_name}`` format.
+
+     Examples: ``"openai/gpt-4.1"``, ``"meta/llama-3.3-70b-instruct"``.
+     """
+
+     github_token: Optional[SecretStr] = Field(default=None)
+     """GitHub token with ``models: read`` scope.
+
+     If not provided, the value of the ``GITHUB_TOKEN`` environment variable
+     is used.
+     """
+
+     base_url: str = _GITHUB_MODELS_BASE_URL
+     """Base URL for the GitHub Models REST API."""
+
+     org: Optional[str] = None
+     """Organisation login for attributed inference requests.
+
+     When set, requests are sent to
+     ``/orgs/{org}/inference/chat/completions`` instead of
+     ``/inference/chat/completions``.
+     """
+
+     api_version: str = _API_VERSION
+     """GitHub Models API version sent as the ``X-GitHub-Api-Version`` header."""
+
+     temperature: Optional[float] = None
+     """Sampling temperature in ``[0, 1]``."""
+
+     max_tokens: Optional[int] = None
+     """Maximum number of tokens to generate."""
+
+     top_p: Optional[float] = None
+     """Nucleus sampling probability mass in ``[0, 1]``."""
+
+     stop: Optional[List[str]] = None
+     """Stop sequences that terminate generation."""
+
+     frequency_penalty: Optional[float] = None
+     """Frequency penalty in ``[-2, 2]``."""
+
+     presence_penalty: Optional[float] = None
+     """Presence penalty in ``[-2, 2]``."""
+
+     seed: Optional[int] = None
+     """Random seed for (best-effort) deterministic sampling."""
+
+     timeout: Optional[float] = None
+     """HTTP request timeout in seconds."""
+
+     max_retries: int = 2
+     """Number of automatic retries on transient errors."""
+
+     # ------------------------------------------------------------------
+     # Validators / setup
+     # ------------------------------------------------------------------
+
+     @model_validator(mode="before")
+     @classmethod
+     def _validate_token(cls, values: Dict[str, Any]) -> Dict[str, Any]:
+         """Resolve the GitHub token from the environment if not supplied.
+
+         Priority order:
+             1. Explicitly passed ``github_token``
+             2. Explicitly passed ``api_key`` alias
+             3. ``GITHUB_TOKEN`` environment variable
+         """
+         # Pop the ``api_key`` alias so pydantic does not reject it as an
+         # unknown field.
+         token = values.get("github_token") or values.pop("api_key", None)
+         if not token:
+             token = os.environ.get("GITHUB_TOKEN")
+         if token:
+             values["github_token"] = token
+         return values
+
+     # ------------------------------------------------------------------
+     # Internal helpers
+     # ------------------------------------------------------------------
+
+     @property
+     def _token(self) -> str:
+         """Return the raw GitHub token string."""
+         if self.github_token:
+             return self.github_token.get_secret_value()
+         env_token = os.environ.get("GITHUB_TOKEN", "")
+         if not env_token:
+             raise ValueError(
+                 "A GitHub token is required. Set the GITHUB_TOKEN environment "
+                 "variable or pass ``github_token`` when instantiating "
+                 "ChatGithubCopilot."
+             )
+         return env_token
+
+     @property
+     def _inference_url(self) -> str:
+         """Return the full chat-completions endpoint URL."""
+         if self.org:
+             path = _ORG_INFERENCE_PATH.format(org=self.org)
+         else:
+             path = _INFERENCE_PATH
+         return self.base_url.rstrip("/") + path
+
+     def _build_headers(self) -> Dict[str, str]:
+         return {
+             "Authorization": f"Bearer {self._token}",
+             "Accept": "application/vnd.github+json",
+             "Content-Type": "application/json",
+             "X-GitHub-Api-Version": self.api_version,
+         }
+
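+     # Editorial note (illustration, not part of the released wheel): the
+     # headers above correspond to a request of roughly this shape:
+     #
+     #   curl "$BASE_URL/inference/chat/completions" \
+     #     -H "Authorization: Bearer $GITHUB_TOKEN" \
+     #     -H "Accept: application/vnd.github+json" \
+     #     -H "Content-Type: application/json" \
+     #     -H "X-GitHub-Api-Version: <api_version>" \
+     #     -d '{"model": "openai/gpt-4.1", "messages": [...]}'
+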
+     def _build_payload(
+         self,
+         messages: List[BaseMessage],
+         stop: Optional[List[str]] = None,
+         stream: bool = False,
+         **kwargs: Any,
+     ) -> Dict[str, Any]:
+         """Assemble the JSON body for the inference API."""
+         payload: Dict[str, Any] = {
+             "model": self.model_name,
+             "messages": [_message_to_dict(m) for m in messages],
+             "stream": stream,
+         }
+         if stream:
+             payload["stream_options"] = {"include_usage": True}
+
+         # Optional sampling params (kwargs override instance-level defaults).
+         # Use a sentinel so falsy-but-valid overrides such as ``temperature=0``
+         # or ``seed=0`` are not silently dropped.
+         _missing = object()
+         for field_name, api_key in [
+             ("temperature", "temperature"),
+             ("max_tokens", "max_tokens"),
+             ("top_p", "top_p"),
+             ("frequency_penalty", "frequency_penalty"),
+             ("presence_penalty", "presence_penalty"),
+             ("seed", "seed"),
+         ]:
+             value = kwargs.pop(api_key, _missing)
+             if value is _missing:
+                 value = getattr(self, field_name, None)
+         if value is not None:
+                 payload[api_key] = value
+
+         # Stop sequences
+         effective_stop = stop or self.stop
+         if effective_stop:
+             payload["stop"] = effective_stop
+
+         # Tools / tool_choice
+         tools = kwargs.pop("tools", None)
+         if tools:
+             payload["tools"] = _format_tools_for_api(tools)
+         tool_choice = kwargs.pop("tool_choice", None)
+         if tool_choice:
+             payload["tool_choice"] = _normalize_tool_choice(tool_choice)
+
+         # Response format (JSON mode / structured output)
+         response_format = kwargs.pop("response_format", None)
+         if response_format:
+             payload["response_format"] = response_format
+
+         # Pass through any remaining caller-supplied kwargs
+         payload.update(kwargs)
+         return payload
+
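+     # Editorial sketch (not part of the released wheel): for
+     # ``ChatGithubCopilot(model="openai/gpt-4.1", temperature=0)`` the body
+     # built for a plain ``invoke("hi")`` call looks like:
+     #
+     #     {
+     #         "model": "openai/gpt-4.1",
+     #         "messages": [{"role": "user", "content": "hi"}],
+     #         "stream": False,
+     #         "temperature": 0,
+     #     }
+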
+     def _do_request(self, payload: Dict[str, Any]) -> Dict[str, Any]:
+         """Perform a synchronous (non-streaming) HTTP POST with retries."""
+         headers = self._build_headers()
+         last_exc: Optional[Exception] = None
+         for attempt in range(self.max_retries + 1):
+             try:
+                 response = httpx.post(
+                     self._inference_url,
+                     headers=headers,
+                     json=payload,
+                     timeout=self.timeout,
+                 )
+                 response.raise_for_status()
+                 return response.json()
+             except (httpx.TimeoutException, httpx.TransportError) as exc:
+                 last_exc = exc
+                 if attempt == self.max_retries:
+                     raise
+             except httpx.HTTPStatusError as exc:
+                 # Don't retry on 4xx client errors
+                 if exc.response.status_code < 500:
+                     raise
+                 last_exc = exc
+                 if attempt == self.max_retries:
+                     raise
+         raise RuntimeError("Unexpected retry loop exit") from last_exc
+
+     def _do_stream(self, payload: Dict[str, Any]) -> Iterator[Dict[str, Any]]:
+         """Perform a synchronous streaming HTTP POST and yield parsed SSE chunks."""
+         headers = self._build_headers()
+         with httpx.stream(
+             "POST",
+             self._inference_url,
+             headers=headers,
+             json=payload,
+             timeout=self.timeout,
+         ) as response:
+             response.raise_for_status()
+             for line in response.iter_lines():
+                 line = line.strip()
+                 if not line or line == "data: [DONE]":
+                     continue
+                 if line.startswith("data: "):
+                     line = line[len("data: ") :]
+                 try:
+                     yield json.loads(line)
+                 except json.JSONDecodeError:
+                     continue
+
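+     # Editorial note (illustration, not part of the released wheel): a typical
+     # SSE line from the endpoint, and the dict this helper yields for it:
+     #
+     #   data: {"choices":[{"delta":{"content":"Hel"},"finish_reason":null}]}
+     #
+     #   -> {"choices": [{"delta": {"content": "Hel"}, "finish_reason": None}]}
+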
+     async def _do_request_async(self, payload: Dict[str, Any]) -> Dict[str, Any]:
+         """Perform an asynchronous (non-streaming) HTTP POST with retries."""
+         headers = self._build_headers()
+         last_exc: Optional[Exception] = None
+         async with httpx.AsyncClient(timeout=self.timeout) as client:
+             for attempt in range(self.max_retries + 1):
+                 try:
+                     response = await client.post(
+                         self._inference_url,
+                         headers=headers,
+                         json=payload,
+                     )
+                     response.raise_for_status()
+                     return response.json()
+                 except (httpx.TimeoutException, httpx.TransportError) as exc:
+                     last_exc = exc
+                     if attempt == self.max_retries:
+                         raise
+                 except httpx.HTTPStatusError as exc:
+                     if exc.response.status_code < 500:
+                         raise
+                     last_exc = exc
+                     if attempt == self.max_retries:
+                         raise
+         raise RuntimeError("Unexpected retry loop exit") from last_exc
+
+     async def _do_stream_async(
+         self, payload: Dict[str, Any]
+     ) -> AsyncIterator[Dict[str, Any]]:
+         """Perform an asynchronous streaming HTTP POST and yield parsed SSE chunks."""
+         headers = self._build_headers()
+         async with httpx.AsyncClient(timeout=self.timeout) as client:
+             async with client.stream(
+                 "POST",
+                 self._inference_url,
+                 headers=headers,
+                 json=payload,
+             ) as response:
+                 response.raise_for_status()
+                 async for line in response.aiter_lines():
+                     line = line.strip()
+                     if not line or line == "data: [DONE]":
+                         continue
+                     if line.startswith("data: "):
+                         line = line[len("data: ") :]
+                     try:
+                         yield json.loads(line)
+                     except json.JSONDecodeError:
+                         continue
+
+     # ------------------------------------------------------------------
+     # Stream delta → AIMessageChunk helpers
+     # ------------------------------------------------------------------
+
+     @staticmethod
+     def _chunk_from_delta(
+         delta: Dict[str, Any],
+         finish_reason: Optional[str],
+         usage: Optional[Dict[str, Any]],
+     ) -> AIMessageChunk:
+         """Convert a single SSE delta object into an ``AIMessageChunk``."""
+         content = delta.get("content") or ""
+         additional_kwargs: Dict[str, Any] = {}
+         tool_call_chunks = []
+
+         raw_tool_calls = delta.get("tool_calls") or []
+         for raw_tc in raw_tool_calls:
+             index = raw_tc.get("index", 0)
+             tc_id = raw_tc.get("id")
+
+             func = raw_tc.get("function", {})
+             tool_call_chunks.append(
+                 create_tool_call_chunk(
+                     name=func.get("name"),
+                     args=func.get("arguments"),
+                     id=tc_id,
+                     index=index,
+                 )
+             )
+
+         response_metadata: Dict[str, Any] = {}
+         if finish_reason:
+             response_metadata["finish_reason"] = finish_reason
+
+         usage_metadata: Optional[UsageMetadata] = None
+         if usage:
+             usage_metadata = UsageMetadata(
+                 input_tokens=usage.get("prompt_tokens", 0),
+                 output_tokens=usage.get("completion_tokens", 0),
+                 total_tokens=usage.get("total_tokens", 0),
+             )
+             response_metadata["usage"] = usage
+
+         return AIMessageChunk(
+             content=content,
+             additional_kwargs=additional_kwargs,
+             tool_call_chunks=tool_call_chunks,
+             response_metadata=response_metadata,
+             usage_metadata=usage_metadata,
+         )
+
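+     # Editorial sketch (not part of the released wheel): a streamed tool-call
+     # delta such as
+     #
+     #     {"tool_calls": [{"index": 0, "id": "call_1",
+     #                      "function": {"name": "GetWeather",
+     #                                   "arguments": "{\"loc"}}]}
+     #
+     # becomes an ``AIMessageChunk`` whose ``tool_call_chunks`` carry the
+     # partial ``arguments`` string; LangChain stitches chunks together by
+     # ``index`` when successive chunks are added.
+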
+     # ------------------------------------------------------------------
+     # LangChain BaseChatModel interface
+     # ------------------------------------------------------------------
+
+     @property
+     def _llm_type(self) -> str:
+         return "chat-github-copilot"
+
+     @property
+     def _identifying_params(self) -> Dict[str, Any]:
+         return {
+             "model_name": self.model_name,
+             "temperature": self.temperature,
+             "max_tokens": self.max_tokens,
+         }
+
+     def _get_ls_params(
+         self,
+         stop: Optional[List[str]] = None,
+         **kwargs: Any,
+     ) -> LangSmithParams:
+         params = self._identifying_params
+         return LangSmithParams(
+             ls_provider="github-copilot",
+             ls_model_name=self.model_name,
+             ls_model_type="chat",
+             ls_temperature=params.get("temperature"),
+             ls_max_tokens=params.get("max_tokens"),
+             ls_stop=stop or self.stop or [],
+         )
+
+     def _generate(
+         self,
+         messages: List[BaseMessage],
+         stop: Optional[List[str]] = None,
+         run_manager: Optional[CallbackManagerForLLMRun] = None,
+         **kwargs: Any,
+     ) -> ChatResult:
+         """Call the GitHub Models chat completions API and return a ChatResult."""
+         payload = self._build_payload(messages, stop=stop, stream=False, **kwargs)
+         response_data = self._do_request(payload)
+
+         choices = response_data.get("choices", [])
+         if not choices:
+             raise ValueError(
+                 f"GitHub Models API returned no choices. Response: {response_data}"
+             )
+
+         usage = response_data.get("usage")
+         generations = []
+         for choice in choices:
+             ai_msg = _build_ai_message(choice, usage)
+             generations.append(ChatGeneration(message=ai_msg))
+
+         return ChatResult(generations=generations)
+
+     def _stream(
+         self,
+         messages: List[BaseMessage],
+         stop: Optional[List[str]] = None,
+         run_manager: Optional[CallbackManagerForLLMRun] = None,
+         **kwargs: Any,
+     ) -> Iterator[ChatGenerationChunk]:
+         """Stream token-level chunks from the GitHub Models API."""
+         payload = self._build_payload(messages, stop=stop, stream=True, **kwargs)
+
+         for raw_chunk in self._do_stream(payload):
+             choices = raw_chunk.get("choices", [])
+             # ``usage`` is present in the final chunk when include_usage=True.
+             usage = raw_chunk.get("usage")
+
+             if not choices and usage:
+                 # Final usage-only chunk
+                 chunk = ChatGenerationChunk(
+                     message=AIMessageChunk(
+                         content="",
+                         usage_metadata=UsageMetadata(
+                             input_tokens=usage.get("prompt_tokens", 0),
+                             output_tokens=usage.get("completion_tokens", 0),
+                             total_tokens=usage.get("total_tokens", 0),
+                         ),
+                         response_metadata={"usage": usage},
+                     )
+                 )
+                 if run_manager:
+                     run_manager.on_llm_new_token("", chunk=chunk)
+                 yield chunk
+                 continue
+
+             for choice in choices:
+                 delta = choice.get("delta", {})
+                 finish_reason = choice.get("finish_reason")
+                 ai_chunk = self._chunk_from_delta(delta, finish_reason, usage)
+                 gen_chunk = ChatGenerationChunk(message=ai_chunk)
+
+                 if run_manager and ai_chunk.content:
+                     run_manager.on_llm_new_token(str(ai_chunk.content), chunk=gen_chunk)
+                 yield gen_chunk
+
+     async def _agenerate(
+         self,
+         messages: List[BaseMessage],
+         stop: Optional[List[str]] = None,
+         run_manager: Optional[AsyncCallbackManagerForLLMRun] = None,
+         **kwargs: Any,
+     ) -> ChatResult:
+         """Async version of ``_generate``."""
+         payload = self._build_payload(messages, stop=stop, stream=False, **kwargs)
+         response_data = await self._do_request_async(payload)
+
+         choices = response_data.get("choices", [])
+         if not choices:
+             raise ValueError(
+                 f"GitHub Models API returned no choices. Response: {response_data}"
+             )
+
+         usage = response_data.get("usage")
+         generations = []
+         for choice in choices:
+             ai_msg = _build_ai_message(choice, usage)
+             generations.append(ChatGeneration(message=ai_msg))
+
+         return ChatResult(generations=generations)
+
+     async def _astream(
+         self,
+         messages: List[BaseMessage],
+         stop: Optional[List[str]] = None,
+         run_manager: Optional[AsyncCallbackManagerForLLMRun] = None,
+         **kwargs: Any,
+     ) -> AsyncIterator[ChatGenerationChunk]:
+         """Async streaming version of ``_stream``."""
+         payload = self._build_payload(messages, stop=stop, stream=True, **kwargs)
+
+         async for raw_chunk in self._do_stream_async(payload):
+             choices = raw_chunk.get("choices", [])
+             usage = raw_chunk.get("usage")
+
+             if not choices and usage:
+                 chunk = ChatGenerationChunk(
+                     message=AIMessageChunk(
+                         content="",
+                         usage_metadata=UsageMetadata(
+                             input_tokens=usage.get("prompt_tokens", 0),
+                             output_tokens=usage.get("completion_tokens", 0),
+                             total_tokens=usage.get("total_tokens", 0),
+                         ),
+                         response_metadata={"usage": usage},
+                     )
+                 )
+                 if run_manager:
+                     await run_manager.on_llm_new_token("", chunk=chunk)
+                 yield chunk
+                 continue
+
+             for choice in choices:
+                 delta = choice.get("delta", {})
+                 finish_reason = choice.get("finish_reason")
+                 ai_chunk = self._chunk_from_delta(delta, finish_reason, usage)
+                 gen_chunk = ChatGenerationChunk(message=ai_chunk)
+
+                 if run_manager and ai_chunk.content:
+                     await run_manager.on_llm_new_token(
+                         str(ai_chunk.content), chunk=gen_chunk
+                     )
+                 yield gen_chunk
+
+     # ------------------------------------------------------------------
+     # Tool calling support
+     # ------------------------------------------------------------------
+
+     def bind_tools(
+         self,
+         tools: Sequence[Union[Dict[str, Any], BaseTool, Type, Any]],
+         *,
+         tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
+         **kwargs: Any,
+     ) -> "ChatGithubCopilot":
+         """Bind tools to this model, enabling tool calling.
+
+         Args:
+             tools: A list of tools to bind. Accepts LangChain ``BaseTool``
+                 instances, Pydantic models, or pre-formatted OpenAI tool dicts.
+             tool_choice: Controls tool selection. One of ``"auto"``,
+                 ``"required"``, ``"none"``, the name of a specific tool, or an
+                 OpenAI-style ``{"type": "function", ...}`` dict. Defaults to
+                 ``"auto"`` when tools are provided.
+
+         Returns:
+             A new ``ChatGithubCopilot`` instance with ``tools`` bound.
+
+         Example:
+             .. code-block:: python
+
+                 from pydantic import BaseModel, Field
+
+                 class SearchWeb(BaseModel):
+                     '''Search the web for up-to-date information.'''
+                     query: str = Field(..., description="The search query")
+
+                 llm_with_tools = llm.bind_tools([SearchWeb])
+                 ai_msg = llm_with_tools.invoke("Who won the 2024 Olympics 100m sprint?")
+                 print(ai_msg.tool_calls)
+         """
+         formatted_tools = _format_tools_for_api(tools)
+         tool_choice_param: Optional[Union[str, Dict[str, Any]]] = tool_choice or (
+             "auto" if formatted_tools else None
+         )
+         return self.bind(
+             tools=formatted_tools,
+             tool_choice=tool_choice_param,
+             **kwargs,
+         )  # type: ignore[return-value]
+
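+
+ # Editorial sketch (not part of the released wheel): forcing a specific tool
+ # with the dict-form ``tool_choice`` that the API accepts. ``GetWeather`` is
+ # an illustrative name.
+ def _example_force_tool(llm: ChatGithubCopilot) -> BaseMessage:
+     from pydantic import BaseModel
+
+     class GetWeather(BaseModel):
+         """Get the current weather in a given location."""
+
+         location: str
+
+     forced = llm.bind_tools(
+         [GetWeather],
+         tool_choice={"type": "function", "function": {"name": "GetWeather"}},
+     )
+     return forced.invoke("What is the weather like in Paris?")
+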
+
+ # ---------------------------------------------------------------------------
+ # Backwards-compatible alias (matches the generated stub name)
+ # ---------------------------------------------------------------------------
+
+ ChatGithubcopilotChat = ChatGithubCopilot
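+
+
+ if __name__ == "__main__":
+     # Editorial smoke-test sketch, not part of the released wheel. Requires a
+     # real GITHUB_TOKEN with the ``models: read`` scope; the model ID is taken
+     # from the class docstring.
+     _demo = ChatGithubCopilot(model="openai/gpt-4.1", temperature=0)
+     print(_demo.invoke("Say hello in French.").content)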