PyPI - langgraph-api - Versions diffs - 0.4.29__tar.gz → 0.4.30__tar.gz - Mend

langgraph-api 0.4.29__tar.gz → 0.4.30__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of langgraph-api might be problematic. Click here for more details.

Files changed (132)

{langgraph_api-0.4.29 → langgraph_api-0.4.30}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: langgraph-api
-Version: 0.4.29
+Version: 0.4.30
 Author-email: Nuno Campos <nuno@langchain.dev>, Will Fu-Hinthorn <will@langchain.dev>
 License: Elastic-2.0
 License-File: LICENSE
@@ -17,6 +17,9 @@ Requires-Dist: langgraph-runtime-inmem<0.15.0,>=0.14.0
 Requires-Dist: langgraph-sdk>=0.2.0
 Requires-Dist: langgraph>=0.4.0
 Requires-Dist: langsmith>=0.3.45
+Requires-Dist: opentelemetry-api>=1.37.0
+Requires-Dist: opentelemetry-exporter-otlp-proto-http>=1.37.0
+Requires-Dist: opentelemetry-sdk>=1.37.0
 Requires-Dist: orjson>=3.9.7
 Requires-Dist: protobuf<7.0.0,>=6.32.1
 Requires-Dist: pyjwt>=2.9.0

langgraph_api-0.4.30/langgraph_api/__init__.py ADDED Viewed

@@ -0,0 +1 @@
+__version__ = "0.4.30"

{langgraph_api-0.4.29 → langgraph_api-0.4.30}/langgraph_api/api/meta.py RENAMED Viewed

@@ -1,5 +1,3 @@
-from typing import cast
 import langgraph.version
 import structlog
 from starlette.responses import JSONResponse, PlainTextResponse
@@ -48,7 +46,7 @@ async def meta_metrics(request: ApiRequest):
     # collect stats
     metrics = get_metrics()
-    worker_metrics = cast(dict[str, int], metrics["workers"])
+    worker_metrics = metrics["workers"]
     workers_max = worker_metrics["max"]
     workers_active = worker_metrics["active"]
     workers_available = worker_metrics["available"]

{langgraph_api-0.4.29 → langgraph_api-0.4.30}/langgraph_api/config.py RENAMED Viewed

@@ -374,6 +374,16 @@ API_VARIANT = env("LANGSMITH_LANGGRAPH_API_VARIANT", cast=str, default="")
 # UI
 UI_USE_BUNDLER = env("LANGGRAPH_UI_BUNDLER", cast=bool, default=False)
+SELF_HOSTED_METRICS_ENABLED = env(
+    "SELF_HOSTED_METRICS_ENABLED", cast=bool, default=False
+)
+SELF_HOSTED_METRICS_ENDPOINT = env(
+    "SELF_HOSTED_METRICS_ENDPOINT", cast=str, default=None
+)
+SELF_HOSTED_METRICS_EXPORT_INTERVAL_MS = env(
+    "SELF_HOSTED_METRICS_EXPORT_INTERVAL_MS", cast=int, default=60000
+)
 IS_QUEUE_ENTRYPOINT = False
 IS_EXECUTOR_ENTRYPOINT = False
 ref_sha = None

{langgraph_api-0.4.29 → langgraph_api-0.4.30}/langgraph_api/grpc_ops/generated/core_api_pb2_grpc.py RENAMED Viewed

@@ -6,7 +6,7 @@ import warnings
 from . import core_api_pb2 as core__api__pb2
 from google.protobuf import empty_pb2 as google_dot_protobuf_dot_empty__pb2
-GRPC_GENERATED_VERSION = '1.75.0'
+GRPC_GENERATED_VERSION = '1.75.1'
 GRPC_VERSION = grpc.__version__
 _version_not_supported = False

{langgraph_api-0.4.29 → langgraph_api-0.4.30}/langgraph_api/http_metrics.py RENAMED Viewed

@@ -1,51 +1,23 @@
 from collections import defaultdict
 from typing import Any
-FILTERED_ROUTES = {"/ok", "/info", "/metrics", "/docs", "/openapi.json"}
+from langgraph_api import config
+from langgraph_api.http_metrics_utils import (
+    HTTP_LATENCY_BUCKETS,
+    get_route,
+    should_filter_route,
+)
 MAX_REQUEST_COUNT_ENTRIES = 5000
 MAX_HISTOGRAM_ENTRIES = 1000
-def get_route(route: Any) -> str | None:
-    try:
-        # default lg api routes use the custom APIRoute where scope["route"] is set to a string
-        if isinstance(route, str):
-            return route
-        else:
-            # custom FastAPI routes provided by user_router attach an object to scope["route"]
-            route_path = getattr(route, "path", None)
-            return route_path
-    except Exception:
-        return None
-def should_filter_route(route_path: str) -> bool:
-    # use endswith to honor MOUNT_PREFIX
-    return any(route_path.endswith(suffix) for suffix in FILTERED_ROUTES)
 class HTTPMetricsCollector:
     def __init__(self):
         # Counter: Key: (method, route, status), Value: count
         self._request_counts: dict[tuple[str, str, int], int] = defaultdict(int)
-        self._histogram_buckets = [
-            0.01,
-            0.1,
-            0.5,
-            1,
-            5,
-            15,
-            30,
-            60,
-            120,
-            300,
-            600,
-            1800,
-            3600,
-            float("inf"),
-        ]
+        self._histogram_buckets = HTTP_LATENCY_BUCKETS
         self._histogram_bucket_labels = [
             "+Inf" if value == float("inf") else str(value)
             for value in self._histogram_buckets
@@ -97,6 +69,14 @@ class HTTPMetricsCollector:
         hist_data["sum"] += latency_seconds
         hist_data["count"] += 1
+        try:
+            if config.SELF_HOSTED_METRICS_ENABLED:
+                from langgraph_api.self_hosted_metrics import record_http_request
+                record_http_request(method, route_path, status, latency_seconds)
+        except Exception:
+            pass
     def get_metrics(
         self,
         project_id: str | None,

langgraph_api-0.4.30/langgraph_api/http_metrics_utils.py ADDED Viewed

@@ -0,0 +1,38 @@
+from typing import Any
+FILTERED_ROUTES = {"/ok", "/info", "/metrics", "/docs", "/openapi.json"}
+HTTP_LATENCY_BUCKETS = [
+    0.01,
+    0.1,
+    0.5,
+    1,
+    5,
+    15,
+    30,
+    60,
+    120,
+    300,
+    600,
+    1800,
+    3600,
+    float("inf"),
+]
+def get_route(route: Any) -> str | None:
+    try:
+        # default lg api routes use the custom APIRoute where scope["route"] is set to a string
+        if isinstance(route, str):
+            return route
+        else:
+            # custom FastAPI routes provided by user_router attach an object to scope["route"]
+            route_path = getattr(route, "path", None)
+            return route_path
+    except Exception:
+        return None
+def should_filter_route(route_path: str) -> bool:
+    # use endswith to honor MOUNT_PREFIX
+    return any(route_path.endswith(suffix) for suffix in FILTERED_ROUTES)

{langgraph_api-0.4.29 → langgraph_api-0.4.30}/langgraph_api/queue_entrypoint.py RENAMED Viewed

@@ -18,7 +18,6 @@ import logging.config
 import pathlib
 import signal
 from contextlib import asynccontextmanager
-from typing import cast
 import structlog
@@ -50,7 +49,7 @@ async def health_and_metrics_server():
             metrics_format = "prometheus"
         metrics = get_metrics()
-        worker_metrics = cast(dict[str, int], metrics["workers"])
+        worker_metrics = metrics["workers"]
         workers_max = worker_metrics["max"]
         workers_active = worker_metrics["active"]
         workers_available = worker_metrics["available"]

langgraph_api-0.4.30/langgraph_api/self_hosted_metrics.py ADDED Viewed

@@ -0,0 +1,380 @@
+import os
+import structlog
+from opentelemetry import metrics
+from opentelemetry.exporter.otlp.proto.http.metric_exporter import (
+    OTLPMetricExporter,
+)
+from opentelemetry.metrics import CallbackOptions, Observation
+from opentelemetry.sdk.metrics import MeterProvider
+from opentelemetry.sdk.metrics.export import PeriodicExportingMetricReader
+from opentelemetry.sdk.resources import Resource
+from langgraph_api import asyncio as lg_asyncio
+from langgraph_api import config, metadata
+from langgraph_api.http_metrics_utils import HTTP_LATENCY_BUCKETS
+from langgraph_runtime.database import connect, pool_stats
+from langgraph_runtime.metrics import get_metrics
+from langgraph_runtime.ops import Runs
+logger = structlog.stdlib.get_logger(__name__)
+_meter_provider = None
+_customer_attributes = {}
+_http_request_counter = None
+_http_latency_histogram = None
+def initialize_self_hosted_metrics():
+    global \
+        _meter_provider, \
+        _http_request_counter, \
+        _http_latency_histogram, \
+        _customer_attributes
+    if not config.SELF_HOSTED_METRICS_ENABLED:
+        return
+    if not config.SELF_HOSTED_METRICS_ENDPOINT:
+        raise RuntimeError(
+            "SELF_HOSTED_METRICS_ENABLED is true but no SELF_HOSTED_METRICS_ENDPOINT is configured"
+        )
+    # for now, this is only enabled for fully self-hosted customers
+    # we will need to update the otel collector auth model to support hybrid customers
+    if not config.LANGGRAPH_CLOUD_LICENSE_KEY:
+        logger.warning(
+            "Self-hosted metrics require a license key, and do not work with hybrid deployments yet."
+        )
+        return
+    try:
+        exporter = OTLPMetricExporter(
+            endpoint=config.SELF_HOSTED_METRICS_ENDPOINT,
+            headers={"X-Langchain-License-Key": config.LANGGRAPH_CLOUD_LICENSE_KEY},
+        )
+        # this will periodically export metrics to our beacon lgp otel collector in a separate thread
+        metric_reader = PeriodicExportingMetricReader(
+            exporter=exporter,
+            export_interval_millis=config.SELF_HOSTED_METRICS_EXPORT_INTERVAL_MS,
+        )
+        resource_attributes = {
+            "service.name": "LGP_Self_Hosted",
+        }
+        resource = Resource.create(resource_attributes)
+        if config.LANGGRAPH_CLOUD_LICENSE_KEY:
+            try:
+                from langgraph_license.validation import (
+                    CUSTOMER_ID,  # type: ignore[unresolved-import]
+                    CUSTOMER_NAME,  # type: ignore[unresolved-import]
+                )
+                if CUSTOMER_ID:
+                    _customer_attributes["customer_id"] = CUSTOMER_ID
+                if CUSTOMER_NAME:
+                    _customer_attributes["customer_name"] = CUSTOMER_NAME
+            except ImportError:
+                pass
+            except Exception as e:
+                logger.warning("Failed to get customer info from license", exc_info=e)
+        # resolves to pod name in k8s, or container id in docker
+        instance_id = os.environ.get("HOSTNAME")
+        if instance_id:
+            _customer_attributes["instance_id"] = instance_id
+        _meter_provider = MeterProvider(
+            metric_readers=[metric_reader], resource=resource
+        )
+        metrics.set_meter_provider(_meter_provider)
+        meter = metrics.get_meter("langgraph_api.self_hosted")
+        meter.create_observable_gauge(
+            name="lg_api_num_pending_runs",
+            description="The number of runs currently pending",
+            unit="1",
+            callbacks=[_get_pending_runs_callback],
+        )
+        meter.create_observable_gauge(
+            name="lg_api_num_running_runs",
+            description="The number of runs currently running",
+            unit="1",
+            callbacks=[_get_running_runs_callback],
+        )
+        if config.N_JOBS_PER_WORKER > 0:
+            meter.create_observable_gauge(
+                name="lg_api_workers_max",
+                description="The maximum number of workers available",
+                unit="1",
+                callbacks=[_get_workers_max_callback],
+            )
+            meter.create_observable_gauge(
+                name="lg_api_workers_active",
+                description="The number of currently active workers",
+                unit="1",
+                callbacks=[_get_workers_active_callback],
+            )
+            meter.create_observable_gauge(
+                name="lg_api_workers_available",
+                description="The number of available (idle) workers",
+                unit="1",
+                callbacks=[_get_workers_available_callback],
+            )
+        if not config.IS_QUEUE_ENTRYPOINT and not config.IS_EXECUTOR_ENTRYPOINT:
+            _http_request_counter = meter.create_counter(
+                name="lg_api_http_requests_total",
+                description="Total number of HTTP requests",
+                unit="1",
+            )
+            _http_latency_histogram = meter.create_histogram(
+                name="lg_api_http_requests_latency_seconds",
+                description="HTTP request latency in seconds",
+                unit="s",
+                explicit_bucket_boundaries_advisory=[
+                    b for b in HTTP_LATENCY_BUCKETS if b != float("inf")
+                ],
+            )
+        meter.create_observable_gauge(
+            name="lg_api_pg_pool_max",
+            description="The maximum size of the postgres connection pool",
+            unit="1",
+            callbacks=[_get_pg_pool_max_callback],
+        )
+        meter.create_observable_gauge(
+            name="lg_api_pg_pool_size",
+            description="Number of connections currently managed by the postgres connection pool",
+            unit="1",
+            callbacks=[_get_pg_pool_size_callback],
+        )
+        meter.create_observable_gauge(
+            name="lg_api_pg_pool_available",
+            description="Number of connections currently idle in the postgres connection pool",
+            unit="1",
+            callbacks=[_get_pg_pool_available_callback],
+        )
+        meter.create_observable_gauge(
+            name="lg_api_redis_pool_max",
+            description="The maximum size of the redis connection pool",
+            unit="1",
+            callbacks=[_get_redis_pool_max_callback],
+        )
+        meter.create_observable_gauge(
+            name="lg_api_redis_pool_size",
+            description="Number of connections currently in use in the redis connection pool",
+            unit="1",
+            callbacks=[_get_redis_pool_size_callback],
+        )
+        meter.create_observable_gauge(
+            name="lg_api_redis_pool_available",
+            description="Number of connections currently idle in the redis connection pool",
+            unit="1",
+            callbacks=[_get_redis_pool_available_callback],
+        )
+        logger.info(
+            "Self-hosted metrics initialized successfully",
+            endpoint=config.SELF_HOSTED_METRICS_ENDPOINT,
+            export_interval_ms=config.SELF_HOSTED_METRICS_EXPORT_INTERVAL_MS,
+        )
+    except Exception as e:
+        logger.exception("Failed to initialize self-hosted metrics", exc_info=e)
+def shutdown_self_hosted_metrics():
+    global _meter_provider
+    if _meter_provider:
+        try:
+            logger.info("Shutting down self-hosted metrics")
+            _meter_provider.shutdown(timeout_millis=5000)
+            _meter_provider = None
+        except Exception as e:
+            logger.exception("Failed to shutdown self-hosted metrics", exc_info=e)
+def record_http_request(
+    method: str, route_path: str, status: int, latency_seconds: float
+):
+    if not _meter_provider or not _http_request_counter or not _http_latency_histogram:
+        return
+    attributes = {"method": method, "path": route_path, "status": str(status)}
+    if _customer_attributes:
+        attributes.update(_customer_attributes)
+    _http_request_counter.add(1, attributes)
+    _http_latency_histogram.record(latency_seconds, attributes)
+def _get_queue_stats():
+    async def _fetch_queue_stats():
+        try:
+            async with connect() as conn:
+                return await Runs.stats(conn)
+        except Exception as e:
+            logger.warning("Failed to get queue stats from database", exc_info=e)
+            return {"n_pending": 0, "n_running": 0}
+    try:
+        future = lg_asyncio.run_coroutine_threadsafe(_fetch_queue_stats())
+        return future.result(timeout=5)
+    except Exception as e:
+        logger.warning("Failed to get queue stats", exc_info=e)
+        return {"n_pending": 0, "n_running": 0}
+def _get_pool_stats():
+    # _get_pool() inside the pool_stats fn will not work correctly if called from the daemon thread created by PeriodicExportingMetricReader,
+    # so we submit this as a coro to run in the main event loop
+    async def _fetch_pool_stats():
+        try:
+            return pool_stats(
+                metadata.PROJECT_ID, metadata.HOST_REVISION_ID, format="json"
+            )
+        except Exception as e:
+            logger.warning("Failed to get pool stats", exc_info=e)
+            return {"postgres": {}, "redis": {}}
+    try:
+        future = lg_asyncio.run_coroutine_threadsafe(_fetch_pool_stats())
+        return future.result(timeout=5)
+    except Exception as e:
+        logger.warning("Failed to get pool stats", exc_info=e)
+        return {"postgres": {}, "redis": {}}
+def _get_pending_runs_callback(options: CallbackOptions):
+    try:
+        stats = _get_queue_stats()
+        return [Observation(stats.get("n_pending", 0), attributes=_customer_attributes)]
+    except Exception as e:
+        logger.warning("Failed to get pending runs", exc_info=e)
+        return [Observation(0, attributes=_customer_attributes)]
+def _get_running_runs_callback(options: CallbackOptions):
+    try:
+        stats = _get_queue_stats()
+        return [Observation(stats.get("n_running", 0), attributes=_customer_attributes)]
+    except Exception as e:
+        logger.warning("Failed to get running runs", exc_info=e)
+        return [Observation(0, attributes=_customer_attributes)]
+def _get_workers_max_callback(options: CallbackOptions):
+    try:
+        metrics_data = get_metrics()
+        worker_metrics = metrics_data.get("workers", {})
+        return [
+            Observation(worker_metrics.get("max", 0), attributes=_customer_attributes)
+        ]
+    except Exception as e:
+        logger.warning("Failed to get max workers", exc_info=e)
+        return [Observation(0, attributes=_customer_attributes)]
+def _get_workers_active_callback(options: CallbackOptions):
+    try:
+        metrics_data = get_metrics()
+        worker_metrics = metrics_data.get("workers", {})
+        return [
+            Observation(
+                worker_metrics.get("active", 0), attributes=_customer_attributes
+            )
+        ]
+    except Exception as e:
+        logger.warning("Failed to get active workers", exc_info=e)
+        return [Observation(0, attributes=_customer_attributes)]
+def _get_workers_available_callback(options: CallbackOptions):
+    try:
+        metrics_data = get_metrics()
+        worker_metrics = metrics_data.get("workers", {})
+        return [
+            Observation(
+                worker_metrics.get("available", 0), attributes=_customer_attributes
+            )
+        ]
+    except Exception as e:
+        logger.warning("Failed to get available workers", exc_info=e)
+        return [Observation(0, attributes=_customer_attributes)]
+def _get_pg_pool_max_callback(options: CallbackOptions):
+    try:
+        stats = _get_pool_stats()
+        pg_max = stats.get("postgres", {}).get("pool_max", 0)
+        return [Observation(pg_max, attributes=_customer_attributes)]
+    except Exception as e:
+        logger.warning("Failed to get PG pool max", exc_info=e)
+        return [Observation(0, attributes=_customer_attributes)]
+def _get_pg_pool_size_callback(options: CallbackOptions):
+    try:
+        stats = _get_pool_stats()
+        pg_size = stats.get("postgres", {}).get("pool_size", 0)
+        return [Observation(pg_size, attributes=_customer_attributes)]
+    except Exception as e:
+        logger.warning("Failed to get PG pool size", exc_info=e)
+        return [Observation(0, attributes=_customer_attributes)]
+def _get_pg_pool_available_callback(options: CallbackOptions):
+    try:
+        stats = _get_pool_stats()
+        pg_available = stats.get("postgres", {}).get("pool_available", 0)
+        return [Observation(pg_available, attributes=_customer_attributes)]
+    except Exception as e:
+        logger.warning("Failed to get PG pool available", exc_info=e)
+        return [Observation(0, attributes=_customer_attributes)]
+def _get_redis_pool_max_callback(options: CallbackOptions):
+    try:
+        stats = _get_pool_stats()
+        redis_max = stats.get("redis", {}).get("max_connections", 0)
+        return [Observation(redis_max, attributes=_customer_attributes)]
+    except Exception as e:
+        logger.warning("Failed to get Redis pool max", exc_info=e)
+        return [Observation(0, attributes=_customer_attributes)]
+def _get_redis_pool_size_callback(options: CallbackOptions):
+    try:
+        stats = _get_pool_stats()
+        redis_size = stats.get("redis", {}).get("in_use_connections", 0)
+        return [Observation(redis_size, attributes=_customer_attributes)]
+    except Exception as e:
+        logger.warning("Failed to get Redis pool size", exc_info=e)
+        return [Observation(0, attributes=_customer_attributes)]
+def _get_redis_pool_available_callback(options: CallbackOptions):
+    try:
+        stats = _get_pool_stats()
+        redis_available = stats.get("redis", {}).get("idle_connections", 0)
+        return [Observation(redis_available, attributes=_customer_attributes)]
+    except Exception as e:
+        logger.warning("Failed to get Redis pool available", exc_info=e)
+        return [Observation(0, attributes=_customer_attributes)]

{langgraph_api-0.4.29 → langgraph_api-0.4.30}/langgraph_api/stream.py RENAMED Viewed

@@ -231,6 +231,8 @@ async def astream_state(
     # stream run
     if use_astream_events:
+        if USE_RUNTIME_CONTEXT_API:
+            kwargs["context"] = context
         async with (
             stack,
             aclosing(  # type: ignore[invalid-argument-type]

{langgraph_api-0.4.29 → langgraph_api-0.4.30}/pyproject.toml RENAMED Viewed

@@ -36,6 +36,9 @@ dependencies = [
     "protobuf>=6.32.1,<7.0.0",
     "grpcio>=1.75.0,<2.0.0",
     "grpcio-tools>=1.75.0,<2.0.0",
+    "opentelemetry-api>=1.37.0",
+    "opentelemetry-sdk>=1.37.0",
+    "opentelemetry-exporter-otlp-proto-http>=1.37.0",
 ]
 [project.scripts]

langgraph-api 0.4.29__tar.gz → 0.4.30__tar.gz

Potentially problematic release.

langgraph-api 0.4.29__tar.gz → 0.4.30__tar.gz