npm - graphile-llm - Versions diffs - 0.7.3 → 0.8.0 - Mend

graphile-llm 0.7.3 → 0.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (53)

package/__tests__/graphile-llm.test.js +6 -4
package/chat.d.ts +5 -5
package/chat.js +8 -16
package/config-cache.d.ts +77 -0
package/config-cache.js +148 -0
package/embedder.d.ts +5 -5
package/embedder.js +8 -16
package/env.d.ts +31 -0
package/env.js +52 -0
package/esm/__tests__/graphile-llm.test.js +6 -4
package/esm/chat.d.ts +5 -5
package/esm/chat.js +8 -16
package/esm/config-cache.d.ts +77 -0
package/esm/config-cache.js +143 -0
package/esm/embedder.d.ts +5 -5
package/esm/embedder.js +8 -16
package/esm/env.d.ts +31 -0
package/esm/env.js +49 -0
package/esm/index.d.ts +10 -1
package/esm/index.js +11 -1
package/esm/metering.d.ts +114 -0
package/esm/metering.js +358 -0
package/esm/plugins/agent-discovery-plugin.d.ts +29 -0
package/esm/plugins/agent-discovery-plugin.js +65 -0
package/esm/plugins/llm-module-plugin.d.ts +10 -1
package/esm/plugins/llm-module-plugin.js +11 -3
package/esm/plugins/metering-plugin.d.ts +42 -0
package/esm/plugins/metering-plugin.js +175 -0
package/esm/plugins/text-mutation-plugin.d.ts +4 -0
package/esm/plugins/text-mutation-plugin.js +11 -1
package/esm/plugins/text-search-plugin.d.ts +4 -0
package/esm/plugins/text-search-plugin.js +13 -1
package/esm/preset.d.ts +21 -1
package/esm/preset.js +29 -2
package/esm/types.d.ts +47 -6
package/index.d.ts +10 -1
package/index.js +23 -2
package/metering.d.ts +114 -0
package/metering.js +365 -0
package/package.json +15 -15
package/plugins/agent-discovery-plugin.d.ts +29 -0
package/plugins/agent-discovery-plugin.js +69 -0
package/plugins/llm-module-plugin.d.ts +10 -1
package/plugins/llm-module-plugin.js +11 -3
package/plugins/metering-plugin.d.ts +42 -0
package/plugins/metering-plugin.js +178 -0
package/plugins/text-mutation-plugin.d.ts +4 -0
package/plugins/text-mutation-plugin.js +11 -1
package/plugins/text-search-plugin.d.ts +4 -0
package/plugins/text-search-plugin.js +13 -1
package/preset.d.ts +21 -1
package/preset.js +29 -2
package/types.d.ts +47 -6

package/__tests__/graphile-llm.test.js CHANGED Viewed

@@ -109,11 +109,12 @@ describe('Embedder abstraction', () => {
         afterEach(() => {
             process.env = originalEnv;
         });
-        it('returns null when EMBEDDER_PROVIDER is not set', () => {
+        it('returns default ollama embedder when EMBEDDER_PROVIDER is not set', () => {
             process.env = { ...originalEnv };
             delete process.env.EMBEDDER_PROVIDER;
             const embedder = (0, embedder_1.buildEmbedderFromEnv)();
-            expect(embedder).toBeNull();
+            expect(embedder).not.toBeNull();
+            expect(typeof embedder).toBe('function');
         });
         it('builds embedder from environment variables', () => {
             process.env = {
@@ -420,11 +421,12 @@ describe('Chat completion abstraction', () => {
         afterEach(() => {
             process.env = originalEnv;
         });
-        it('returns null when CHAT_PROVIDER is not set', () => {
+        it('returns default ollama chat completer when CHAT_PROVIDER is not set', () => {
             process.env = { ...originalEnv };
             delete process.env.CHAT_PROVIDER;
             const chat = (0, chat_1.buildChatCompleterFromEnv)();
-            expect(chat).toBeNull();
+            expect(chat).not.toBeNull();
+            expect(typeof chat).toBe('function');
         });
         it('builds chat completer from environment variables', () => {
             process.env = {

package/chat.d.ts CHANGED Viewed

@@ -26,12 +26,12 @@ export declare function buildChatCompleter(config: ChatConfig): ChatFunction | n
  */
 export declare function buildChatCompleterFromModule(data: LlmModuleData): ChatFunction | null;
 /**
- * Resolve a chat completer from environment variables via getEnvOptions().
+ * Resolve a chat completer from environment variables.
  * This is a fallback for development when no llm_module or defaultChatCompleter is configured.
  *
- * Environment variables (parsed by @constructive-io/graphql-env):
- *   CHAT_PROVIDER - Provider name ('ollama')
- *   CHAT_MODEL    - Model identifier (e.g. 'llama3')
- *   CHAT_BASE_URL - Provider base URL
+ * Environment variables (with defaults from env.ts):
+ *   CHAT_PROVIDER  - Provider name (default: 'ollama')
+ *   CHAT_MODEL     - Model identifier (default: 'llama3')
+ *   CHAT_BASE_URL  - Provider base URL (default: 'http://localhost:11434')
  */
 export declare function buildChatCompleterFromEnv(): ChatFunction | null;

package/chat.js CHANGED Viewed

@@ -20,7 +20,7 @@ exports.buildChatCompleter = buildChatCompleter;
 exports.buildChatCompleterFromModule = buildChatCompleterFromModule;
 exports.buildChatCompleterFromEnv = buildChatCompleterFromEnv;
 const ollama_1 = __importDefault(require("@agentic-kit/ollama"));
-const graphql_env_1 = require("@constructive-io/graphql-env");
+const env_1 = require("./env");
 // ─── Built-in Providers ─────────────────────────────────────────────────────
 /**
  * Create an Ollama-based chat completion function.
@@ -82,26 +82,18 @@ function buildChatCompleterFromModule(data) {
         provider: data.chat_provider,
         model: data.chat_model,
         baseUrl: data.chat_base_url,
-        apiKey: data.api_key_ref,
     });
 }
 /**
- * Resolve a chat completer from environment variables via getEnvOptions().
+ * Resolve a chat completer from environment variables.
  * This is a fallback for development when no llm_module or defaultChatCompleter is configured.
  *
- * Environment variables (parsed by @constructive-io/graphql-env):
- *   CHAT_PROVIDER - Provider name ('ollama')
- *   CHAT_MODEL    - Model identifier (e.g. 'llama3')
- *   CHAT_BASE_URL - Provider base URL
+ * Environment variables (with defaults from env.ts):
+ *   CHAT_PROVIDER  - Provider name (default: 'ollama')
+ *   CHAT_MODEL     - Model identifier (default: 'llama3')
+ *   CHAT_BASE_URL  - Provider base URL (default: 'http://localhost:11434')
  */
 function buildChatCompleterFromEnv() {
-    const { llm } = (0, graphql_env_1.getEnvOptions)();
-    const provider = llm?.chat?.provider;
-    if (!provider)
-        return null;
-    return buildChatCompleter({
-        provider,
-        model: llm?.chat?.model,
-        baseUrl: llm?.chat?.baseUrl,
-    });
+    const { chat } = (0, env_1.getLlmEnvOptions)();
+    return buildChatCompleter(chat);
 }

package/config-cache.d.ts ADDED Viewed

@@ -0,0 +1,77 @@
+/**
+ * config-cache — Per-database LLM billing configuration cache
+ *
+ * Caches resolved billing function names per database_id.
+ * Uses an LRU cache with TTL so config changes propagate within a bounded window
+ * without requiring a server restart.
+ *
+ * Resolution flow:
+ *   Billing config from `metaschema_modules_public.billing_module`
+ *   (schema name + function names for record_usage, check_billing_quota)
+ *
+ * All queries run through the Graphile `withPgClient` callback, which gives us
+ * a client connected to the tenant database with proper role settings.
+ *
+ * The LLM module config (provider, model, etc.) is already resolved by the
+ * LlmModulePlugin at schema-build time. This cache handles the runtime-only
+ * billing piece.
+ */
+/**
+ * Generic pg client interface matching what Graphile's withPgClient provides.
+ * Avoids a hard dependency on the `pg` package.
+ */
+export interface PgClient {
+    query(sql: string, values?: unknown[]): Promise<{
+        rows: Record<string, unknown>[];
+    }>;
+}
+/**
+ * Billing function metadata resolved from the billing_module metaschema table.
+ */
+export interface BillingConfig {
+    /** Private schema containing the billing functions */
+    privateSchema: string;
+    /** Name of the record_usage function */
+    recordUsageFunction: string;
+    /** Name of the check_billing_quota function */
+    checkBillingQuotaFunction: string;
+    /** Public schema containing meters table */
+    publicSchema: string;
+}
+/**
+ * Inference log table metadata resolved from the inference_log_module.
+ */
+export interface InferenceLogConfig {
+    /** Schema containing the usage_log_inference table */
+    schema: string;
+    /** Name of the inference log table */
+    tableName: string;
+}
+/**
+ * Per-database cached configuration for the LLM billing integration.
+ */
+export interface LlmBillingCacheEntry {
+    /** Billing function references (null if billing_module not provisioned) */
+    billing: BillingConfig | null;
+    /** Inference log table references (null if inference_log_module not provisioned) */
+    inferenceLog: InferenceLogConfig | null;
+}
+/**
+ * Resolve billing and inference-log config for a database.
+ * Results are cached per database_id with a 5-minute TTL.
+ *
+ * @param pgClient - A client connected to the tenant database (from withPgClient)
+ * @param databaseId - The database UUID
+ */
+export declare function getLlmBillingConfig(pgClient: PgClient, databaseId: string): Promise<LlmBillingCacheEntry>;
+/**
+ * Invalidate the cached config for a specific database (or all).
+ */
+export declare function invalidateLlmBillingConfig(databaseId?: string): void;
+/**
+ * Get cache stats for diagnostics.
+ */
+export declare function getLlmBillingCacheStats(): {
+    size: number;
+    max: number;
+};

package/config-cache.js ADDED Viewed

@@ -0,0 +1,148 @@
+"use strict";
+/**
+ * config-cache — Per-database LLM billing configuration cache
+ *
+ * Caches resolved billing function names per database_id.
+ * Uses an LRU cache with TTL so config changes propagate within a bounded window
+ * without requiring a server restart.
+ *
+ * Resolution flow:
+ *   Billing config from `metaschema_modules_public.billing_module`
+ *   (schema name + function names for record_usage, check_billing_quota)
+ *
+ * All queries run through the Graphile `withPgClient` callback, which gives us
+ * a client connected to the tenant database with proper role settings.
+ *
+ * The LLM module config (provider, model, etc.) is already resolved by the
+ * LlmModulePlugin at schema-build time. This cache handles the runtime-only
+ * billing piece.
+ */
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.getLlmBillingConfig = getLlmBillingConfig;
+exports.invalidateLlmBillingConfig = invalidateLlmBillingConfig;
+exports.getLlmBillingCacheStats = getLlmBillingCacheStats;
+const graphile_cache_1 = require("graphile-cache");
+// ─── SQL Queries ────────────────────────────────────────────────────────────
+/**
+ * Resolve the billing module's public schema, private schema, and
+ * record_usage function name for one database ($1 = database_id).
+ * The query itself does not verify that billing_module exists; the caller
+ * guards against an unprovisioned metaschema_modules_public schema or table.
+ */
+const BILLING_MODULE_SQL = `
+  SELECT
+    s.schema_name AS public_schema,
+    ps.schema_name AS private_schema,
+    bm.record_usage_function
+  FROM metaschema_modules_public.billing_module bm
+  JOIN metaschema_public.schema s ON bm.schema_id = s.id
+  JOIN metaschema_public.schema ps ON bm.private_schema_id = ps.id
+  WHERE bm.database_id = $1
+  LIMIT 1
+`;
+/**
+ * Resolve the inference log module's schema and table name.
+ */
+const INFERENCE_LOG_MODULE_SQL = `
+  SELECT
+    s.schema_name AS schema,
+    ilm.inference_log_table_name AS table_name
+  FROM metaschema_modules_public.inference_log_module ilm
+  JOIN metaschema_public.schema s ON ilm.schema_id = s.id
+  WHERE ilm.database_id = $1
+  LIMIT 1
+`;
+// ─── Cache ──────────────────────────────────────────────────────────────────
+const billingCache = new graphile_cache_1.ModuleConfigCache({
+    name: 'billing-config',
+    ttlMs: 5 * 60 * 1000, // 5 minutes
+    max: 50,
+});
+// ─── Resolution Functions ───────────────────────────────────────────────────
+/**
+ * SQL to check if a schema exists. Used as a guard before querying
+ * metaschema tables that may not be provisioned.
+ */
+const SCHEMA_EXISTS_SQL = `
+  SELECT 1 FROM information_schema.schemata WHERE schema_name = $1 LIMIT 1
+`;
+async function resolveInferenceLogConfig(pgClient, databaseId) {
+    try {
+        const schemaCheck = await pgClient.query(SCHEMA_EXISTS_SQL, ['metaschema_modules_public']);
+        if (schemaCheck.rows.length === 0)
+            return null;
+        const result = await pgClient.query(INFERENCE_LOG_MODULE_SQL, [databaseId]);
+        const row = result.rows[0];
+        if (!row?.schema || !row?.table_name)
+            return null;
+        return {
+            schema: row.schema,
+            tableName: row.table_name,
+        };
+    }
+    catch {
+        return null;
+    }
+}
+async function resolveBillingConfig(pgClient, databaseId) {
+    try {
+        // Guard: check if the metaschema_modules_public schema exists.
+        // If the database doesn't have the billing module provisioned,
+        // this schema (or the billing_module table) won't exist.
+        const schemaCheck = await pgClient.query(SCHEMA_EXISTS_SQL, ['metaschema_modules_public']);
+        if (schemaCheck.rows.length === 0)
+            return null;
+        const result = await pgClient.query(BILLING_MODULE_SQL, [databaseId]);
+        const row = result.rows[0];
+        if (!row?.record_usage_function)
+            return null;
+        return {
+            publicSchema: row.public_schema,
+            privateSchema: row.private_schema,
+            recordUsageFunction: row.record_usage_function,
+            // Not read from billing_module: the check_billing_quota name is fixed (it follows the inflection pattern)
+            checkBillingQuotaFunction: 'check_billing_quota',
+        };
+    }
+    catch {
+        // Schema/table doesn't exist or query failed — billing not available
+        return null;
+    }
+}
+// ─── Public API ─────────────────────────────────────────────────────────────
+/**
+ * Resolve billing and inference-log config for a database.
+ * Results are cached per database_id with a 5-minute TTL.
+ *
+ * @param pgClient - A client connected to the tenant database (from withPgClient)
+ * @param databaseId - The database UUID
+ */
+async function getLlmBillingConfig(pgClient, databaseId) {
+    const cached = billingCache.get(databaseId);
+    if (cached)
+        return cached;
+    const [billing, inferenceLog] = await Promise.all([
+        resolveBillingConfig(pgClient, databaseId),
+        resolveInferenceLogConfig(pgClient, databaseId),
+    ]);
+    const entry = { billing, inferenceLog };
+    billingCache.set(databaseId, entry);
+    return entry;
+}
+/**
+ * Invalidate the cached config for a specific database (or all).
+ */
+function invalidateLlmBillingConfig(databaseId) {
+    if (databaseId) {
+        billingCache.delete(databaseId);
+    }
+    else {
+        billingCache.clear();
+    }
+}
+/**
+ * Get cache stats for diagnostics.
+ */
+function getLlmBillingCacheStats() {
+    return { size: billingCache.size, max: 50 };
+}

package/embedder.d.ts CHANGED Viewed

@@ -24,12 +24,12 @@ export declare function buildEmbedder(config: EmbedderConfig): EmbedderFunction
  */
 export declare function buildEmbedderFromModule(data: LlmModuleData): EmbedderFunction | null;
 /**
- * Resolve an embedder from environment variables via getEnvOptions().
+ * Resolve an embedder from environment variables.
  * This is a fallback for development when no llm_module or defaultEmbedder is configured.
  *
- * Environment variables (parsed by @constructive-io/graphql-env):
- *   EMBEDDER_PROVIDER - Provider name ('ollama')
- *   EMBEDDER_MODEL    - Model identifier
- *   EMBEDDER_BASE_URL - Provider base URL
+ * Environment variables (with defaults from env.ts):
+ *   EMBEDDER_PROVIDER  - Provider name (default: 'ollama')
+ *   EMBEDDER_MODEL     - Model identifier (default: 'nomic-embed-text')
+ *   EMBEDDER_BASE_URL  - Provider base URL (default: 'http://localhost:11434')
  */
 export declare function buildEmbedderFromEnv(): EmbedderFunction | null;

package/embedder.js CHANGED Viewed

@@ -18,7 +18,7 @@ exports.buildEmbedder = buildEmbedder;
 exports.buildEmbedderFromModule = buildEmbedderFromModule;
 exports.buildEmbedderFromEnv = buildEmbedderFromEnv;
 const ollama_1 = __importDefault(require("@agentic-kit/ollama"));
-const graphql_env_1 = require("@constructive-io/graphql-env");
+const env_1 = require("./env");
 // ─── Built-in Providers ─────────────────────────────────────────────────────
 /**
  * Create an Ollama-based embedder function.
@@ -56,26 +56,18 @@ function buildEmbedderFromModule(data) {
         provider: data.embedding_provider,
         model: data.embedding_model,
         baseUrl: data.embedding_base_url,
-        apiKey: data.api_key_ref,
     });
 }
 /**
- * Resolve an embedder from environment variables via getEnvOptions().
+ * Resolve an embedder from environment variables.
  * This is a fallback for development when no llm_module or defaultEmbedder is configured.
  *
- * Environment variables (parsed by @constructive-io/graphql-env):
- *   EMBEDDER_PROVIDER - Provider name ('ollama')
- *   EMBEDDER_MODEL    - Model identifier
- *   EMBEDDER_BASE_URL - Provider base URL
+ * Environment variables (with defaults from env.ts):
+ *   EMBEDDER_PROVIDER  - Provider name (default: 'ollama')
+ *   EMBEDDER_MODEL     - Model identifier (default: 'nomic-embed-text')
+ *   EMBEDDER_BASE_URL  - Provider base URL (default: 'http://localhost:11434')
  */
 function buildEmbedderFromEnv() {
-    const { llm } = (0, graphql_env_1.getEnvOptions)();
-    const provider = llm?.embedder?.provider;
-    if (!provider)
-        return null;
-    return buildEmbedder({
-        provider,
-        model: llm?.embedder?.model,
-        baseUrl: llm?.embedder?.baseUrl,
-    });
+    const { embedding } = (0, env_1.getLlmEnvOptions)();
+    return buildEmbedder(embedding);
 }

package/env.d.ts ADDED Viewed

@@ -0,0 +1,31 @@
+/**
+ * LLM Environment Configuration
+ *
+ * Single source of truth for all LLM-related environment variables and defaults.
+ * Every other module in graphile-llm imports from here — no direct process.env
+ * reads or scattered null coalescing elsewhere.
+ *
+ * Environment variables:
+ *   EMBEDDER_PROVIDER  - Embedding provider name (default: 'ollama')
+ *   EMBEDDER_MODEL     - Embedding model (default: 'nomic-embed-text')
+ *   EMBEDDER_BASE_URL  - Embedding provider URL (default: 'http://localhost:11434')
+ *   CHAT_PROVIDER      - Chat provider name (default: 'ollama')
+ *   CHAT_MODEL         - Chat model (default: 'llama3')
+ *   CHAT_BASE_URL      - Chat provider URL (default: 'http://localhost:11434')
+ */
+export interface LlmProviderConfig {
+    provider: string;
+    model: string;
+    baseUrl: string;
+}
+export interface LlmEnvOptions {
+    embedding: LlmProviderConfig;
+    chat: LlmProviderConfig;
+}
+/**
+ * Resolve LLM configuration from environment variables with sensible defaults.
+ *
+ * Call this once and pass the result around — never read process.env directly
+ * in plugin code.
+ */
+export declare function getLlmEnvOptions(): LlmEnvOptions;

package/env.js ADDED Viewed

@@ -0,0 +1,52 @@
+"use strict";
+/**
+ * LLM Environment Configuration
+ *
+ * Single source of truth for all LLM-related environment variables and defaults.
+ * Every other module in graphile-llm imports from here — no direct process.env
+ * reads or scattered null coalescing elsewhere.
+ *
+ * Environment variables:
+ *   EMBEDDER_PROVIDER  - Embedding provider name (default: 'ollama')
+ *   EMBEDDER_MODEL     - Embedding model (default: 'nomic-embed-text')
+ *   EMBEDDER_BASE_URL  - Embedding provider URL (default: 'http://localhost:11434')
+ *   CHAT_PROVIDER      - Chat provider name (default: 'ollama')
+ *   CHAT_MODEL         - Chat model (default: 'llama3')
+ *   CHAT_BASE_URL      - Chat provider URL (default: 'http://localhost:11434')
+ */
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.getLlmEnvOptions = getLlmEnvOptions;
+// ─── Defaults ───────────────────────────────────────────────────────────────
+const LLM_DEFAULTS = {
+    embedding: {
+        provider: 'ollama',
+        model: 'nomic-embed-text',
+        baseUrl: 'http://localhost:11434',
+    },
+    chat: {
+        provider: 'ollama',
+        model: 'llama3',
+        baseUrl: 'http://localhost:11434',
+    },
+};
+// ─── Resolution ─────────────────────────────────────────────────────────────
+/**
+ * Resolve LLM configuration from environment variables with sensible defaults.
+ *
+ * Call this once and pass the result around — never read process.env directly
+ * in plugin code.
+ */
+function getLlmEnvOptions() {
+    return {
+        embedding: {
+            provider: process.env.EMBEDDER_PROVIDER ?? LLM_DEFAULTS.embedding.provider,
+            model: process.env.EMBEDDER_MODEL ?? LLM_DEFAULTS.embedding.model,
+            baseUrl: process.env.EMBEDDER_BASE_URL ?? LLM_DEFAULTS.embedding.baseUrl,
+        },
+        chat: {
+            provider: process.env.CHAT_PROVIDER ?? LLM_DEFAULTS.chat.provider,
+            model: process.env.CHAT_MODEL ?? LLM_DEFAULTS.chat.model,
+            baseUrl: process.env.CHAT_BASE_URL ?? LLM_DEFAULTS.chat.baseUrl,
+        },
+    };
+}

package/esm/__tests__/graphile-llm.test.js CHANGED Viewed

@@ -71,11 +71,12 @@ describe('Embedder abstraction', () => {
         afterEach(() => {
             process.env = originalEnv;
         });
-        it('returns null when EMBEDDER_PROVIDER is not set', () => {
+        it('returns default ollama embedder when EMBEDDER_PROVIDER is not set', () => {
             process.env = { ...originalEnv };
             delete process.env.EMBEDDER_PROVIDER;
             const embedder = buildEmbedderFromEnv();
-            expect(embedder).toBeNull();
+            expect(embedder).not.toBeNull();
+            expect(typeof embedder).toBe('function');
         });
         it('builds embedder from environment variables', () => {
             process.env = {
@@ -382,11 +383,12 @@ describe('Chat completion abstraction', () => {
         afterEach(() => {
             process.env = originalEnv;
         });
-        it('returns null when CHAT_PROVIDER is not set', () => {
+        it('returns default ollama chat completer when CHAT_PROVIDER is not set', () => {
             process.env = { ...originalEnv };
             delete process.env.CHAT_PROVIDER;
             const chat = buildChatCompleterFromEnv();
-            expect(chat).toBeNull();
+            expect(chat).not.toBeNull();
+            expect(typeof chat).toBe('function');
         });
         it('builds chat completer from environment variables', () => {
             process.env = {

package/esm/chat.d.ts CHANGED Viewed

@@ -26,12 +26,12 @@ export declare function buildChatCompleter(config: ChatConfig): ChatFunction | n
  */
 export declare function buildChatCompleterFromModule(data: LlmModuleData): ChatFunction | null;
 /**
- * Resolve a chat completer from environment variables via getEnvOptions().
+ * Resolve a chat completer from environment variables.
  * This is a fallback for development when no llm_module or defaultChatCompleter is configured.
  *
- * Environment variables (parsed by @constructive-io/graphql-env):
- *   CHAT_PROVIDER - Provider name ('ollama')
- *   CHAT_MODEL    - Model identifier (e.g. 'llama3')
- *   CHAT_BASE_URL - Provider base URL
+ * Environment variables (with defaults from env.ts):
+ *   CHAT_PROVIDER  - Provider name (default: 'ollama')
+ *   CHAT_MODEL     - Model identifier (default: 'llama3')
+ *   CHAT_BASE_URL  - Provider base URL (default: 'http://localhost:11434')
  */
 export declare function buildChatCompleterFromEnv(): ChatFunction | null;

package/esm/chat.js CHANGED Viewed

@@ -12,7 +12,7 @@
  *   3. Environment variables (CHAT_PROVIDER, CHAT_MODEL, CHAT_BASE_URL)
  */
 import OllamaClient from '@agentic-kit/ollama';
-import { getEnvOptions } from '@constructive-io/graphql-env';
+import { getLlmEnvOptions } from './env';
 // ─── Built-in Providers ─────────────────────────────────────────────────────
 /**
  * Create an Ollama-based chat completion function.
@@ -74,26 +74,18 @@ export function buildChatCompleterFromModule(data) {
         provider: data.chat_provider,
         model: data.chat_model,
         baseUrl: data.chat_base_url,
-        apiKey: data.api_key_ref,
     });
 }
 /**
- * Resolve a chat completer from environment variables via getEnvOptions().
+ * Resolve a chat completer from environment variables.
  * This is a fallback for development when no llm_module or defaultChatCompleter is configured.
  *
- * Environment variables (parsed by @constructive-io/graphql-env):
- *   CHAT_PROVIDER - Provider name ('ollama')
- *   CHAT_MODEL    - Model identifier (e.g. 'llama3')
- *   CHAT_BASE_URL - Provider base URL
+ * Environment variables (with defaults from env.ts):
+ *   CHAT_PROVIDER  - Provider name (default: 'ollama')
+ *   CHAT_MODEL     - Model identifier (default: 'llama3')
+ *   CHAT_BASE_URL  - Provider base URL (default: 'http://localhost:11434')
  */
 export function buildChatCompleterFromEnv() {
-    const { llm } = getEnvOptions();
-    const provider = llm?.chat?.provider;
-    if (!provider)
-        return null;
-    return buildChatCompleter({
-        provider,
-        model: llm?.chat?.model,
-        baseUrl: llm?.chat?.baseUrl,
-    });
+    const { chat } = getLlmEnvOptions();
+    return buildChatCompleter(chat);
 }

package/esm/config-cache.d.ts ADDED Viewed

@@ -0,0 +1,77 @@
+/**
+ * config-cache — Per-database LLM billing configuration cache
+ *
+ * Caches resolved billing function names per database_id.
+ * Uses an LRU cache with TTL so config changes propagate within a bounded window
+ * without requiring a server restart.
+ *
+ * Resolution flow:
+ *   Billing config from `metaschema_modules_public.billing_module`
+ *   (schema name + function names for record_usage, check_billing_quota)
+ *
+ * All queries run through the Graphile `withPgClient` callback, which gives us
+ * a client connected to the tenant database with proper role settings.
+ *
+ * The LLM module config (provider, model, etc.) is already resolved by the
+ * LlmModulePlugin at schema-build time. This cache handles the runtime-only
+ * billing piece.
+ */
+/**
+ * Generic pg client interface matching what Graphile's withPgClient provides.
+ * Avoids a hard dependency on the `pg` package.
+ */
+export interface PgClient {
+    query(sql: string, values?: unknown[]): Promise<{
+        rows: Record<string, unknown>[];
+    }>;
+}
+/**
+ * Billing function metadata resolved from the billing_module metaschema table.
+ */
+export interface BillingConfig {
+    /** Private schema containing the billing functions */
+    privateSchema: string;
+    /** Name of the record_usage function */
+    recordUsageFunction: string;
+    /** Name of the check_billing_quota function */
+    checkBillingQuotaFunction: string;
+    /** Public schema containing meters table */
+    publicSchema: string;
+}
+/**
+ * Inference log table metadata resolved from the inference_log_module.
+ */
+export interface InferenceLogConfig {
+    /** Schema containing the usage_log_inference table */
+    schema: string;
+    /** Name of the inference log table */
+    tableName: string;
+}
+/**
+ * Per-database cached configuration for the LLM billing integration.
+ */
+export interface LlmBillingCacheEntry {
+    /** Billing function references (null if billing_module not provisioned) */
+    billing: BillingConfig | null;
+    /** Inference log table references (null if inference_log_module not provisioned) */
+    inferenceLog: InferenceLogConfig | null;
+}
+/**
+ * Resolve billing and inference-log config for a database.
+ * Results are cached per database_id with a 5-minute TTL.
+ *
+ * @param pgClient - A client connected to the tenant database (from withPgClient)
+ * @param databaseId - The database UUID
+ */
+export declare function getLlmBillingConfig(pgClient: PgClient, databaseId: string): Promise<LlmBillingCacheEntry>;
+/**
+ * Invalidate the cached config for a specific database (or all).
+ */
+export declare function invalidateLlmBillingConfig(databaseId?: string): void;
+/**
+ * Get cache stats for diagnostics.
+ */
+export declare function getLlmBillingCacheStats(): {
+    size: number;
+    max: number;
+};