@glueco/plugin-llm-groq 0.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +52 -0
- package/dist/chunk-CNIQDSXF.mjs +207 -0
- package/dist/chunk-CNIQDSXF.mjs.map +1 -0
- package/dist/chunk-MRDVVFUV.mjs +162 -0
- package/dist/chunk-MRDVVFUV.mjs.map +1 -0
- package/dist/client.d.mts +105 -0
- package/dist/client.d.ts +105 -0
- package/dist/client.js +228 -0
- package/dist/client.js.map +1 -0
- package/dist/client.mjs +58 -0
- package/dist/client.mjs.map +1 -0
- package/dist/contracts.d.mts +804 -0
- package/dist/contracts.d.ts +804 -0
- package/dist/contracts.js +198 -0
- package/dist/contracts.js.map +1 -0
- package/dist/contracts.mjs +31 -0
- package/dist/contracts.mjs.map +1 -0
- package/dist/index.d.mts +4 -0
- package/dist/index.d.ts +4 -0
- package/dist/index.js +396 -0
- package/dist/index.js.map +1 -0
- package/dist/index.mjs +37 -0
- package/dist/index.mjs.map +1 -0
- package/dist/proxy.d.mts +5 -0
- package/dist/proxy.d.ts +5 -0
- package/dist/proxy.js +368 -0
- package/dist/proxy.js.map +1 -0
- package/dist/proxy.mjs +10 -0
- package/dist/proxy.mjs.map +1 -0
- package/package.json +76 -0
package/README.md
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
1
|
+
# @glueco/plugin-llm-groq
|
|
2
|
+
|
|
3
|
+
Groq LLM plugin for the Personal Resource Gateway.
|
|
4
|
+
|
|
5
|
+
## Installation
|
|
6
|
+
|
|
7
|
+
```bash
|
|
8
|
+
npm install @glueco/plugin-llm-groq
|
|
9
|
+
```
|
|
10
|
+
|
|
11
|
+
## Usage
|
|
12
|
+
|
|
13
|
+
1. Install the package
|
|
14
|
+
2. Add the plugin to `proxy.plugins.ts` at the repository root:
|
|
15
|
+
|
|
16
|
+
```typescript
|
|
17
|
+
const enabledPlugins = [
|
|
18
|
+
"@glueco/plugin-llm-groq",
|
|
19
|
+
// ... other plugins
|
|
20
|
+
] as const;
|
|
21
|
+
```
|
|
22
|
+
|
|
23
|
+
3. Run `npm run build` or redeploy
|
|
24
|
+
|
|
25
|
+
## Supported Actions
|
|
26
|
+
|
|
27
|
+
- `chat.completions` - OpenAI-compatible chat completions
|
|
28
|
+
|
|
29
|
+
## Supported Models
|
|
30
|
+
|
|
31
|
+
- llama-3.3-70b-versatile
|
|
32
|
+
- llama-3.1-70b-versatile
|
|
33
|
+
- llama-3.1-8b-instant
|
|
34
|
+
- llama3-70b-8192
|
|
35
|
+
- llama3-8b-8192
|
|
36
|
+
- mixtral-8x7b-32768
|
|
37
|
+
- gemma2-9b-it
|
|
38
|
+
|
|
39
|
+
## Enforcement Support
|
|
40
|
+
|
|
41
|
+
This plugin supports the following enforcement knobs:
|
|
42
|
+
|
|
43
|
+
- `model` - Restrict requests to specific models (when no list is configured, the models under "Supported Models" are allowed)
|
|
44
|
+
- `max_tokens` - Limit output tokens (a limit of 4096 applies when none is configured)
|
|
45
|
+
- `streaming` - Enable/disable streaming
|
|
46
|
+
|
|
47
|
+
## Credentials
|
|
48
|
+
|
|
49
|
+
Required credentials in proxy admin:
|
|
50
|
+
|
|
51
|
+
- `apiKey` - Your Groq API key
|
|
52
|
+
- `baseUrl` (optional) - Custom API base URL (defaults to `https://api.groq.com/openai/v1`)
|
|
@@ -0,0 +1,207 @@
|
|
|
1
|
+
import {
|
|
2
|
+
ACTIONS,
|
|
3
|
+
ChatCompletionRequestSchema,
|
|
4
|
+
DEFAULT_GROQ_MODELS,
|
|
5
|
+
ENFORCEMENT_SUPPORT,
|
|
6
|
+
PLUGIN_ID,
|
|
7
|
+
PROVIDER,
|
|
8
|
+
RESOURCE_TYPE,
|
|
9
|
+
VERSION
|
|
10
|
+
} from "./chunk-MRDVVFUV.mjs";
|
|
11
|
+
|
|
12
|
+
// src/proxy.ts
|
|
13
|
+
import { createPluginBase } from "@glueco/shared";
|
|
14
|
+
// Default base URL for Groq API requests. `execute` falls back to it when
// `ctx.config.baseUrl` is not set, and the credential schema advertises it as
// the default value of the optional `baseUrl` field.
var GROQ_API_URL = "https://api.groq.com/openai/v1";
|
|
15
|
+
var GroqApiError = class extends Error {
|
|
16
|
+
constructor(status, body) {
|
|
17
|
+
super(`Groq API error: ${status}`);
|
|
18
|
+
this.status = status;
|
|
19
|
+
this.body = body;
|
|
20
|
+
this.name = "GroqApiError";
|
|
21
|
+
}
|
|
22
|
+
};
|
|
23
|
+
/**
 * Translate a failed Groq API response into the normalized error object
 * returned by the plugin's `mapError`.
 *
 * The message is taken from `error.message` inside the JSON body when that is
 * a non-empty string; otherwise the raw body is used, and if the body is empty
 * a generic `Groq API error: <status>` message is used. A 401 always reports
 * "Invalid API key" regardless of the body.
 *
 * @param error - Object exposing `status` (HTTP status code) and `body`
 *   (raw response body text), e.g. a `GroqApiError`.
 * @returns `{ status, code, message, retryable }`.
 */
function mapGroqError(error) {
  // The body is usually JSON shaped like { error: { message } }, but it can
  // also be plain text, empty, or a JSON scalar such as `null`.
  let parsed;
  try {
    parsed = JSON.parse(error.body);
  } catch {
    // Not JSON: the raw body is used as the message below.
  }
  // Guard against JSON scalars (`null`, numbers, strings): reading `.error`
  // on `null` would throw while we are already handling an error.
  const providerMessage =
    parsed !== null && typeof parsed === "object" ? parsed.error?.message : undefined;
  const message =
    (typeof providerMessage === "string" && providerMessage) ||
    error.body ||
    `Groq API error: ${error.status}`;
  switch (error.status) {
    case 400:
      return { status: 400, code: "BAD_REQUEST", message, retryable: false };
    case 401:
      // Deliberately generic: the upstream text is not forwarded for auth failures.
      return {
        status: 401,
        code: "UNAUTHORIZED",
        message: "Invalid API key",
        retryable: false
      };
    case 403:
      return { status: 403, code: "FORBIDDEN", message, retryable: false };
    case 404:
      return { status: 404, code: "NOT_FOUND", message, retryable: false };
    case 429:
      return { status: 429, code: "RATE_LIMITED", message, retryable: true };
    case 500:
    case 502:
    case 503:
      // Upstream failures are reported with their original status and marked retryable.
      return {
        status: error.status,
        code: "PROVIDER_ERROR",
        message,
        retryable: true
      };
    default:
      return {
        status: error.status,
        code: "UNKNOWN",
        message,
        retryable: false
      };
  }
}
|
|
64
|
+
/**
 * Groq plugin object: the base produced by `createPluginBase` plus the
 * credential schema and the four handlers defined here
 * (`validateAndShape`, `execute`, `extractUsage`, `mapError`).
 */
var groqPlugin = {
  ...createPluginBase({
    id: PLUGIN_ID,
    resourceType: RESOURCE_TYPE,
    provider: PROVIDER,
    version: VERSION,
    name: "Groq LLM",
    actions: [...ACTIONS],
    supports: {
      enforcement: [...ENFORCEMENT_SUPPORT]
    },
    // Client contract metadata for SDK-compatible plugins
    client: {
      namespace: "groq",
      actions: {
        "chat.completions": {
          description: "Generate chat completions using Groq's fast LLM inference"
        }
      }
    }
  }),
  // Credential schema for UI
  credentialSchema: {
    fields: [
      {
        name: "apiKey",
        type: "secret",
        label: "API Key",
        description: "Your Groq API key",
        required: true
      },
      {
        name: "baseUrl",
        type: "url",
        label: "Base URL",
        description: "Custom API base URL (optional)",
        required: false,
        default: GROQ_API_URL
      }
    ]
  },
  /**
   * Validate an incoming request against the schema and the app's
   * constraints, and produce the request body to forward.
   *
   * @param action - Requested action; only "chat.completions" is accepted.
   * @param input - Untrusted request payload.
   * @param constraints - Reads `allowedModels`, `maxOutputTokens` and
   *   `allowStreaming`; missing values fall back to the default model list,
   *   4096 tokens, and streaming allowed.
   * @returns `{ valid: false, error }` on rejection, otherwise
   *   `{ valid: true, shapedInput, enforcement }`.
   */
  validateAndShape(action, input, constraints) {
    if (action !== "chat.completions") {
      return { valid: false, error: `Unsupported action: ${action}` };
    }
    const parsed = ChatCompletionRequestSchema.safeParse(input);
    if (!parsed.success) {
      return {
        valid: false,
        error: `Invalid request: ${parsed.error.errors.map((e) => e.message).join(", ")}`
      };
    }
    const request = parsed.data;
    const requestedTokens = request.max_tokens ?? request.max_completion_tokens;
    const enforcement = {
      model: request.model,
      stream: request.stream ?? false,
      usesTools: Array.isArray(request.tools) && request.tools.length > 0,
      maxOutputTokens: requestedTokens
    };
    const allowedModels = constraints.allowedModels ?? [...DEFAULT_GROQ_MODELS];
    if (!allowedModels.includes(request.model)) {
      return {
        valid: false,
        error: `Model '${request.model}' not allowed. Allowed: ${allowedModels.join(", ")}`
      };
    }
    const maxTokens = constraints.maxOutputTokens ?? 4096;
    // Both `max_tokens` and `max_completion_tokens` are forwarded upstream as
    // sent, so each must respect the limit; checking only one of them would
    // let a request smuggle an oversized value through the other field.
    const largestRequested = Math.max(
      request.max_tokens ?? 0,
      request.max_completion_tokens ?? 0
    );
    if (largestRequested > maxTokens) {
      return {
        valid: false,
        error: `max_tokens (${largestRequested}) exceeds limit (${maxTokens})`
      };
    }
    if (request.stream && constraints.allowStreaming === false) {
      return {
        valid: false,
        error: "Streaming is not allowed for this app"
      };
    }
    // Always send an explicit cap: the requested value, or the limit itself
    // when the caller did not ask for one.
    const shapedRequest = {
      ...request,
      max_tokens: requestedTokens ? Math.min(requestedTokens, maxTokens) : maxTokens
    };
    return { valid: true, shapedInput: shapedRequest, enforcement };
  },
  /**
   * Forward a shaped request to `<baseUrl>/chat/completions`.
   *
   * @param action - Not used by this implementation.
   * @param shapedInput - Request body produced by `validateAndShape`.
   * @param ctx - Reads `ctx.secret` (sent as the Bearer token) and the
   *   optional `ctx.config.baseUrl`.
   * @param options - Optional; `options.signal` is passed to `fetch`.
   * @returns For streaming requests `{ stream, contentType }`; otherwise
   *   `{ response, contentType, usage }`.
   * @throws GroqApiError when the response status is not OK.
   * @throws Error when a streaming response has no body.
   */
  async execute(action, shapedInput, ctx, options) {
    const request = shapedInput;
    // Drop trailing slashes so a configured "https://host/v1/" does not
    // produce "https://host/v1//chat/completions".
    const baseUrl = String(ctx.config?.baseUrl || GROQ_API_URL).replace(/\/+$/, "");
    const response = await fetch(`${baseUrl}/chat/completions`, {
      method: "POST",
      headers: {
        "Content-Type": "application/json",
        Authorization: `Bearer ${ctx.secret}`
      },
      body: JSON.stringify(request),
      signal: options?.signal
    });
    if (!response.ok) {
      const errorBody = await response.text();
      throw new GroqApiError(response.status, errorBody);
    }
    if (request.stream) {
      if (!response.body) {
        // Fail loudly instead of handing a null stream to the caller.
        throw new Error("Groq API returned no response body for a streaming request");
      }
      return {
        stream: response.body,
        contentType: "text/event-stream"
      };
    }
    const json = await response.json();
    return {
      response: json,
      contentType: "application/json",
      usage: this.extractUsage(json)
    };
  },
  /**
   * Pull token counts and the model name out of a completion response.
   *
   * @param response - Parsed JSON response; may lack `usage` or be nullish.
   * @returns `{ inputTokens, outputTokens, totalTokens, model }`, each
   *   `undefined` when the corresponding field is absent.
   */
  extractUsage(response) {
    const usage = response?.usage;
    return {
      inputTokens: usage?.prompt_tokens,
      outputTokens: usage?.completion_tokens,
      totalTokens: usage?.total_tokens,
      model: response?.model
    };
  },
  /**
   * Convert any thrown value into the normalized error object.
   *
   * @param error - A `GroqApiError` is mapped by status via `mapGroqError`;
   *   anything else becomes a non-retryable 500 INTERNAL_ERROR.
   */
  mapError(error) {
    if (error instanceof GroqApiError) {
      return mapGroqError(error);
    }
    return {
      status: 500,
      code: "INTERNAL_ERROR",
      message: error instanceof Error ? error.message : "Unknown error",
      retryable: false
    };
  }
};
|
|
201
|
+
// Alias of `groqPlugin`, exported from this chunk under the name
// `proxy_default` alongside the named `groqPlugin` export.
var proxy_default = groqPlugin;
|
|
202
|
+
|
|
203
|
+
export {
|
|
204
|
+
groqPlugin,
|
|
205
|
+
proxy_default
|
|
206
|
+
};
|
|
207
|
+
//# sourceMappingURL=chunk-CNIQDSXF.mjs.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../src/proxy.ts"],"sourcesContent":["// ============================================\n// GROQ PLUGIN PROXY\n// Server-side plugin implementation for the gateway\n// ============================================\n//\n// This module is imported by the proxy to handle Groq requests.\n// It should NOT be imported by target apps.\n//\n// Import path: @glueco/plugin-llm-groq/proxy\n// ============================================\n\nimport type {\n PluginContract,\n PluginResourceConstraints,\n PluginValidationResult,\n PluginExecuteContext,\n PluginExecuteOptions,\n PluginExecuteResult,\n PluginUsageMetrics,\n PluginMappedError,\n EnforcementFields,\n} from \"@glueco/shared\";\nimport { createPluginBase } from \"@glueco/shared\";\n\nimport {\n ChatCompletionRequestSchema,\n type ChatCompletionRequest,\n PLUGIN_ID,\n RESOURCE_TYPE,\n PROVIDER,\n VERSION,\n DEFAULT_GROQ_MODELS,\n ACTIONS,\n ENFORCEMENT_SUPPORT,\n} from \"./contracts\";\n\n// ============================================\n// CONFIGURATION\n// ============================================\n\nconst GROQ_API_URL = \"https://api.groq.com/openai/v1\";\n\n// ============================================\n// ERROR HANDLING\n// ============================================\n\nclass GroqApiError extends Error {\n constructor(\n public status: number,\n public body: string,\n ) {\n super(`Groq API error: ${status}`);\n this.name = \"GroqApiError\";\n }\n}\n\nfunction mapGroqError(error: GroqApiError): PluginMappedError {\n let parsed: { error?: { message?: string; type?: string; code?: string } } =\n {};\n try {\n parsed = JSON.parse(error.body);\n } catch {\n // Ignore parse errors\n }\n\n const message = parsed.error?.message || error.body;\n\n switch (error.status) {\n case 400:\n return { status: 400, code: \"BAD_REQUEST\", message, retryable: false };\n case 401:\n return {\n status: 401,\n code: \"UNAUTHORIZED\",\n message: \"Invalid API key\",\n retryable: false,\n };\n case 403:\n return { 
status: 403, code: \"FORBIDDEN\", message, retryable: false };\n case 404:\n return { status: 404, code: \"NOT_FOUND\", message, retryable: false };\n case 429:\n return { status: 429, code: \"RATE_LIMITED\", message, retryable: true };\n case 500:\n case 502:\n case 503:\n return {\n status: error.status,\n code: \"PROVIDER_ERROR\",\n message,\n retryable: true,\n };\n default:\n return {\n status: error.status,\n code: \"UNKNOWN\",\n message,\n retryable: false,\n };\n }\n}\n\n// ============================================\n// PLUGIN IMPLEMENTATION\n// ============================================\n\nconst groqPlugin: PluginContract = {\n ...createPluginBase({\n id: PLUGIN_ID,\n resourceType: RESOURCE_TYPE,\n provider: PROVIDER,\n version: VERSION,\n name: \"Groq LLM\",\n actions: [...ACTIONS],\n supports: {\n enforcement: [...ENFORCEMENT_SUPPORT],\n },\n // Client contract metadata for SDK-compatible plugins\n client: {\n namespace: \"groq\",\n actions: {\n \"chat.completions\": {\n description:\n \"Generate chat completions using Groq's fast LLM inference\",\n },\n },\n },\n }),\n\n // Credential schema for UI\n credentialSchema: {\n fields: [\n {\n name: \"apiKey\",\n type: \"secret\",\n label: \"API Key\",\n description: \"Your Groq API key\",\n required: true,\n },\n {\n name: \"baseUrl\",\n type: \"url\",\n label: \"Base URL\",\n description: \"Custom API base URL (optional)\",\n required: false,\n default: GROQ_API_URL,\n },\n ],\n },\n\n validateAndShape(\n action: string,\n input: unknown,\n constraints: PluginResourceConstraints,\n ): PluginValidationResult {\n if (action !== \"chat.completions\") {\n return { valid: false, error: `Unsupported action: ${action}` };\n }\n\n // Parse input - this is the schema-first validation\n const parsed = ChatCompletionRequestSchema.safeParse(input);\n if (!parsed.success) {\n return {\n valid: false,\n error: `Invalid request: ${parsed.error.errors.map((e) => e.message).join(\", \")}`,\n };\n }\n\n const request = 
parsed.data;\n\n // Build enforcement fields from validated request\n // These are extracted DURING validation, not after\n const enforcement: EnforcementFields = {\n model: request.model,\n stream: request.stream ?? false,\n usesTools: Array.isArray(request.tools) && request.tools.length > 0,\n maxOutputTokens: request.max_tokens ?? request.max_completion_tokens,\n };\n\n // Check allowed models\n const allowedModels = constraints.allowedModels ?? [...DEFAULT_GROQ_MODELS];\n if (!allowedModels.includes(request.model)) {\n return {\n valid: false,\n error: `Model '${request.model}' not allowed. Allowed: ${allowedModels.join(\", \")}`,\n };\n }\n\n // Enforce max tokens\n const maxTokens = constraints.maxOutputTokens ?? 4096;\n const requestedTokens = request.max_tokens ?? request.max_completion_tokens;\n\n if (requestedTokens && requestedTokens > maxTokens) {\n return {\n valid: false,\n error: `max_tokens (${requestedTokens}) exceeds limit (${maxTokens})`,\n };\n }\n\n // Check streaming permission\n if (request.stream && constraints.allowStreaming === false) {\n return {\n valid: false,\n error: \"Streaming is not allowed for this app\",\n };\n }\n\n // Shape the request (apply defaults, caps)\n const shapedRequest: ChatCompletionRequest = {\n ...request,\n max_tokens: requestedTokens\n ? 
Math.min(requestedTokens, maxTokens)\n : maxTokens,\n };\n\n return { valid: true, shapedInput: shapedRequest, enforcement };\n },\n\n async execute(\n action: string,\n shapedInput: unknown,\n ctx: PluginExecuteContext,\n options: PluginExecuteOptions,\n ): Promise<PluginExecuteResult> {\n const request = shapedInput as ChatCompletionRequest;\n const baseUrl = (ctx.config?.baseUrl as string) || GROQ_API_URL;\n\n const response = await fetch(`${baseUrl}/chat/completions`, {\n method: \"POST\",\n headers: {\n \"Content-Type\": \"application/json\",\n Authorization: `Bearer ${ctx.secret}`,\n },\n body: JSON.stringify(request),\n signal: options.signal,\n });\n\n if (!response.ok) {\n const errorBody = await response.text();\n throw new GroqApiError(response.status, errorBody);\n }\n\n if (request.stream) {\n // Return streaming response\n return {\n stream: response.body!,\n contentType: \"text/event-stream\",\n };\n } else {\n // Return JSON response\n const json = await response.json();\n return {\n response: json,\n contentType: \"application/json\",\n usage: this.extractUsage(json),\n };\n }\n },\n\n extractUsage(response: unknown): PluginUsageMetrics {\n const res = response as {\n usage?: {\n prompt_tokens?: number;\n completion_tokens?: number;\n total_tokens?: number;\n };\n model?: string;\n };\n\n return {\n inputTokens: res.usage?.prompt_tokens,\n outputTokens: res.usage?.completion_tokens,\n totalTokens: res.usage?.total_tokens,\n model: res.model,\n };\n },\n\n mapError(error: unknown): PluginMappedError {\n if (error instanceof GroqApiError) {\n return mapGroqError(error);\n }\n\n return {\n status: 500,\n code: \"INTERNAL_ERROR\",\n message: error instanceof Error ? 
error.message : \"Unknown error\",\n retryable: false,\n };\n },\n};\n\nexport default groqPlugin;\n\n// Also export named for flexibility\nexport { groqPlugin };\n"],"mappings":";;;;;;;;;;;;AAsBA,SAAS,wBAAwB;AAkBjC,IAAM,eAAe;AAMrB,IAAM,eAAN,cAA2B,MAAM;AAAA,EAC/B,YACS,QACA,MACP;AACA,UAAM,mBAAmB,MAAM,EAAE;AAH1B;AACA;AAGP,SAAK,OAAO;AAAA,EACd;AACF;AAEA,SAAS,aAAa,OAAwC;AAC5D,MAAI,SACF,CAAC;AACH,MAAI;AACF,aAAS,KAAK,MAAM,MAAM,IAAI;AAAA,EAChC,QAAQ;AAAA,EAER;AAEA,QAAM,UAAU,OAAO,OAAO,WAAW,MAAM;AAE/C,UAAQ,MAAM,QAAQ;AAAA,IACpB,KAAK;AACH,aAAO,EAAE,QAAQ,KAAK,MAAM,eAAe,SAAS,WAAW,MAAM;AAAA,IACvE,KAAK;AACH,aAAO;AAAA,QACL,QAAQ;AAAA,QACR,MAAM;AAAA,QACN,SAAS;AAAA,QACT,WAAW;AAAA,MACb;AAAA,IACF,KAAK;AACH,aAAO,EAAE,QAAQ,KAAK,MAAM,aAAa,SAAS,WAAW,MAAM;AAAA,IACrE,KAAK;AACH,aAAO,EAAE,QAAQ,KAAK,MAAM,aAAa,SAAS,WAAW,MAAM;AAAA,IACrE,KAAK;AACH,aAAO,EAAE,QAAQ,KAAK,MAAM,gBAAgB,SAAS,WAAW,KAAK;AAAA,IACvE,KAAK;AAAA,IACL,KAAK;AAAA,IACL,KAAK;AACH,aAAO;AAAA,QACL,QAAQ,MAAM;AAAA,QACd,MAAM;AAAA,QACN;AAAA,QACA,WAAW;AAAA,MACb;AAAA,IACF;AACE,aAAO;AAAA,QACL,QAAQ,MAAM;AAAA,QACd,MAAM;AAAA,QACN;AAAA,QACA,WAAW;AAAA,MACb;AAAA,EACJ;AACF;AAMA,IAAM,aAA6B;AAAA,EACjC,GAAG,iBAAiB;AAAA,IAClB,IAAI;AAAA,IACJ,cAAc;AAAA,IACd,UAAU;AAAA,IACV,SAAS;AAAA,IACT,MAAM;AAAA,IACN,SAAS,CAAC,GAAG,OAAO;AAAA,IACpB,UAAU;AAAA,MACR,aAAa,CAAC,GAAG,mBAAmB;AAAA,IACtC;AAAA;AAAA,IAEA,QAAQ;AAAA,MACN,WAAW;AAAA,MACX,SAAS;AAAA,QACP,oBAAoB;AAAA,UAClB,aACE;AAAA,QACJ;AAAA,MACF;AAAA,IACF;AAAA,EACF,CAAC;AAAA;AAAA,EAGD,kBAAkB;AAAA,IAChB,QAAQ;AAAA,MACN;AAAA,QACE,MAAM;AAAA,QACN,MAAM;AAAA,QACN,OAAO;AAAA,QACP,aAAa;AAAA,QACb,UAAU;AAAA,MACZ;AAAA,MACA;AAAA,QACE,MAAM;AAAA,QACN,MAAM;AAAA,QACN,OAAO;AAAA,QACP,aAAa;AAAA,QACb,UAAU;AAAA,QACV,SAAS;AAAA,MACX;AAAA,IACF;AAAA,EACF;AAAA,EAEA,iBACE,QACA,OACA,aACwB;AACxB,QAAI,WAAW,oBAAoB;AACjC,aAAO,EAAE,OAAO,OAAO,OAAO,uBAAuB,MAAM,GAAG;AAAA,IAChE;AAGA,UAAM,SAAS,4BAA4B,UAAU,KAAK;AAC1D,QAAI,CAAC,OAAO,SAAS;AACnB,aAAO;AAAA,QACL,OAAO;AAAA,QACP,OAAO,oBAAoB,OAAO,MAAM,OAAO,IAAI,CAAC,MAAM,EAAE,OAAO,EAAE,KAAK,IAAI,CAAC;AAAA,MACjF;AAAA,IACF;A
AEA,UAAM,UAAU,OAAO;AAIvB,UAAM,cAAiC;AAAA,MACrC,OAAO,QAAQ;AAAA,MACf,QAAQ,QAAQ,UAAU;AAAA,MAC1B,WAAW,MAAM,QAAQ,QAAQ,KAAK,KAAK,QAAQ,MAAM,SAAS;AAAA,MAClE,iBAAiB,QAAQ,cAAc,QAAQ;AAAA,IACjD;AAGA,UAAM,gBAAgB,YAAY,iBAAiB,CAAC,GAAG,mBAAmB;AAC1E,QAAI,CAAC,cAAc,SAAS,QAAQ,KAAK,GAAG;AAC1C,aAAO;AAAA,QACL,OAAO;AAAA,QACP,OAAO,UAAU,QAAQ,KAAK,2BAA2B,cAAc,KAAK,IAAI,CAAC;AAAA,MACnF;AAAA,IACF;AAGA,UAAM,YAAY,YAAY,mBAAmB;AACjD,UAAM,kBAAkB,QAAQ,cAAc,QAAQ;AAEtD,QAAI,mBAAmB,kBAAkB,WAAW;AAClD,aAAO;AAAA,QACL,OAAO;AAAA,QACP,OAAO,eAAe,eAAe,oBAAoB,SAAS;AAAA,MACpE;AAAA,IACF;AAGA,QAAI,QAAQ,UAAU,YAAY,mBAAmB,OAAO;AAC1D,aAAO;AAAA,QACL,OAAO;AAAA,QACP,OAAO;AAAA,MACT;AAAA,IACF;AAGA,UAAM,gBAAuC;AAAA,MAC3C,GAAG;AAAA,MACH,YAAY,kBACR,KAAK,IAAI,iBAAiB,SAAS,IACnC;AAAA,IACN;AAEA,WAAO,EAAE,OAAO,MAAM,aAAa,eAAe,YAAY;AAAA,EAChE;AAAA,EAEA,MAAM,QACJ,QACA,aACA,KACA,SAC8B;AAC9B,UAAM,UAAU;AAChB,UAAM,UAAW,IAAI,QAAQ,WAAsB;AAEnD,UAAM,WAAW,MAAM,MAAM,GAAG,OAAO,qBAAqB;AAAA,MAC1D,QAAQ;AAAA,MACR,SAAS;AAAA,QACP,gBAAgB;AAAA,QAChB,eAAe,UAAU,IAAI,MAAM;AAAA,MACrC;AAAA,MACA,MAAM,KAAK,UAAU,OAAO;AAAA,MAC5B,QAAQ,QAAQ;AAAA,IAClB,CAAC;AAED,QAAI,CAAC,SAAS,IAAI;AAChB,YAAM,YAAY,MAAM,SAAS,KAAK;AACtC,YAAM,IAAI,aAAa,SAAS,QAAQ,SAAS;AAAA,IACnD;AAEA,QAAI,QAAQ,QAAQ;AAElB,aAAO;AAAA,QACL,QAAQ,SAAS;AAAA,QACjB,aAAa;AAAA,MACf;AAAA,IACF,OAAO;AAEL,YAAM,OAAO,MAAM,SAAS,KAAK;AACjC,aAAO;AAAA,QACL,UAAU;AAAA,QACV,aAAa;AAAA,QACb,OAAO,KAAK,aAAa,IAAI;AAAA,MAC/B;AAAA,IACF;AAAA,EACF;AAAA,EAEA,aAAa,UAAuC;AAClD,UAAM,MAAM;AASZ,WAAO;AAAA,MACL,aAAa,IAAI,OAAO;AAAA,MACxB,cAAc,IAAI,OAAO;AAAA,MACzB,aAAa,IAAI,OAAO;AAAA,MACxB,OAAO,IAAI;AAAA,IACb;AAAA,EACF;AAAA,EAEA,SAAS,OAAmC;AAC1C,QAAI,iBAAiB,cAAc;AACjC,aAAO,aAAa,KAAK;AAAA,IAC3B;AAEA,WAAO;AAAA,MACL,QAAQ;AAAA,MACR,MAAM;AAAA,MACN,SAAS,iBAAiB,QAAQ,MAAM,UAAU;AAAA,MAClD,WAAW;AAAA,IACb;AAAA,EACF;AACF;AAEA,IAAO,gBAAQ;","names":[]}
|
|
@@ -0,0 +1,162 @@
|
|
|
1
|
+
// src/contracts.ts
|
|
2
|
+
import { z } from "zod";
|
|
3
|
+
// Schema for a single chat message in an OpenAI-compatible request.
var ChatMessageSchema = z.object({
  // Who authored the message.
  role: z.enum(["system", "user", "assistant", "tool"]),
  // Plain text, a list of typed content parts, or null.
  content: z
    .union([
      z.string(),
      z.array(
        z.object({
          type: z.string(),
          text: z.string().optional(),
          image_url: z
            .object({
              url: z.string(),
              detail: z.string().optional()
            })
            .optional()
        })
      )
    ])
    .nullable(),
  name: z.string().optional(),
  // Function calls attached to the message; only type "function" is accepted.
  tool_calls: z
    .array(
      z.object({
        id: z.string(),
        type: z.literal("function"),
        function: z.object({
          name: z.string(),
          // Arguments are carried as a string, not as a parsed object.
          arguments: z.string()
        })
      })
    )
    .optional(),
  tool_call_id: z.string().optional()
});
|
|
31
|
+
// Schema for the chat completion request body. Only `model` and `messages`
// are required; every other field is optional.
var ChatCompletionRequestSchema = z.object({
  model: z.string(),
  messages: z.array(ChatMessageSchema),
  // Sampling controls, each bounded to the range shown.
  temperature: z.number().min(0).max(2).optional(),
  top_p: z.number().min(0).max(1).optional(),
  n: z.number().int().min(1).max(10).optional(),
  stream: z.boolean().optional(),
  // A single stop sequence or a list of them.
  stop: z
    .union([z.string(), z.array(z.string())])
    .optional(),
  // Two spellings of the output-token cap; both must be positive integers.
  max_tokens: z.number().int().positive().optional(),
  max_completion_tokens: z.number().int().positive().optional(),
  presence_penalty: z.number().min(-2).max(2).optional(),
  frequency_penalty: z.number().min(-2).max(2).optional(),
  logit_bias: z.record(z.number()).optional(),
  user: z.string().optional(),
  // Function tools the model may call.
  tools: z
    .array(
      z.object({
        type: z.literal("function"),
        function: z.object({
          name: z.string(),
          description: z.string().optional(),
          parameters: z.record(z.unknown()).optional()
        })
      })
    )
    .optional(),
  // Either one of the keywords or a specific function selected by name.
  tool_choice: z
    .union([
      z.literal("none"),
      z.literal("auto"),
      z.literal("required"),
      z.object({
        type: z.literal("function"),
        function: z.object({ name: z.string() })
      })
    ])
    .optional(),
  response_format: z
    .object({
      type: z.enum(["text", "json_object"])
    })
    .optional(),
  seed: z.number().int().optional()
});
|
|
69
|
+
// Schema for one entry of `choices` in a non-streaming completion response.
var ChatCompletionChoiceSchema = z.object({
  index: z.number(),
  // The generated assistant message; `content` may be null.
  message: z.object({
    role: z.literal("assistant"),
    content: z.string().nullable(),
    tool_calls: z
      .array(
        z.object({
          id: z.string(),
          type: z.literal("function"),
          function: z.object({
            name: z.string(),
            // Arguments are carried as a string, not as a parsed object.
            arguments: z.string()
          })
        })
      )
      .optional()
  }),
  // Required key, but its value may be null.
  finish_reason: z.string().nullable()
});
|
|
87
|
+
// Schema for the token accounting object of a completion response.
// All three counters are required numbers.
var UsageSchema = z.object({
  // Tokens counted for the prompt.
  prompt_tokens: z.number(),
  // Tokens counted for the completion.
  completion_tokens: z.number(),
  // Reported total.
  total_tokens: z.number()
});
|
|
92
|
+
// Schema for a complete (non-streaming) chat completion response.
var ChatCompletionResponseSchema = z.object({
  id: z.string(),
  // Fixed discriminator for non-streaming responses.
  object: z.literal("chat.completion"),
  created: z.number(),
  model: z.string(),
  choices: z.array(ChatCompletionChoiceSchema),
  // Token accounting; may be absent.
  usage: UsageSchema.optional()
});
|
|
100
|
+
// Schema for one streamed chunk of a chat completion.
var ChatCompletionChunkSchema = z.object({
  id: z.string(),
  // Fixed discriminator for streamed chunks.
  object: z.literal("chat.completion.chunk"),
  created: z.number(),
  model: z.string(),
  choices: z.array(
    z.object({
      index: z.number(),
      // Incremental update; every field is optional because a chunk carries
      // only what changed.
      delta: z.object({
        role: z.string().optional(),
        // OpenAI-compatible streams may send `content: null` (for example on
        // tool-call deltas), so null is accepted as well as an absent key.
        // This matches the nullable `content` of ChatCompletionChoiceSchema.
        content: z.string().nullable().optional(),
        tool_calls: z
          .array(
            z.object({
              index: z.number(),
              id: z.string().optional(),
              type: z.literal("function").optional(),
              function: z
                .object({
                  name: z.string().optional(),
                  arguments: z.string().optional()
                })
                .optional()
            })
          )
          .optional()
      }),
      // Required key, but its value may be null.
      finish_reason: z.string().nullable()
    })
  )
});
|
|
127
|
+
// Plugin identity constants.
var RESOURCE_TYPE = "llm";
var PROVIDER = "groq";
// Plugin id in "<resourceType>:<provider>" form, i.e. "llm:groq".
var PLUGIN_ID = `${RESOURCE_TYPE}:${PROVIDER}`;
// NOTE(review): the package header in this diff reports version 0.1.0 while
// this constant is "1.0.0" — confirm whether the two are meant to differ.
var VERSION = "1.0.0";

// Models allowed when the caller's constraints do not supply their own list.
var DEFAULT_GROQ_MODELS = ["llama-3.3-70b-versatile", "llama-3.1-70b-versatile", "llama-3.1-8b-instant", "llama3-70b-8192", "llama3-8b-8192", "mixtral-8x7b-32768", "gemma2-9b-it"];

// Actions this plugin handles.
var ACTIONS = ["chat.completions"];

// Enforcement knobs this plugin declares support for.
var ENFORCEMENT_SUPPORT = ["model", "max_tokens", "streaming"];
|
|
146
|
+
|
|
147
|
+
export {
|
|
148
|
+
ChatMessageSchema,
|
|
149
|
+
ChatCompletionRequestSchema,
|
|
150
|
+
ChatCompletionChoiceSchema,
|
|
151
|
+
UsageSchema,
|
|
152
|
+
ChatCompletionResponseSchema,
|
|
153
|
+
ChatCompletionChunkSchema,
|
|
154
|
+
PLUGIN_ID,
|
|
155
|
+
RESOURCE_TYPE,
|
|
156
|
+
PROVIDER,
|
|
157
|
+
VERSION,
|
|
158
|
+
DEFAULT_GROQ_MODELS,
|
|
159
|
+
ACTIONS,
|
|
160
|
+
ENFORCEMENT_SUPPORT
|
|
161
|
+
};
|
|
162
|
+
//# sourceMappingURL=chunk-MRDVVFUV.mjs.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../src/contracts.ts"],"sourcesContent":["// ============================================\n// GROQ PLUGIN CONTRACTS\n// Shared request/response schemas for proxy and client\n// ============================================\n\nimport { z } from \"zod\";\n\n// ============================================\n// REQUEST SCHEMAS (OpenAI-compatible)\n// ============================================\n\nexport const ChatMessageSchema = z.object({\n role: z.enum([\"system\", \"user\", \"assistant\", \"tool\"]),\n content: z\n .union([\n z.string(),\n z.array(\n z.object({\n type: z.string(),\n text: z.string().optional(),\n image_url: z\n .object({\n url: z.string(),\n detail: z.string().optional(),\n })\n .optional(),\n }),\n ),\n ])\n .nullable(),\n name: z.string().optional(),\n tool_calls: z\n .array(\n z.object({\n id: z.string(),\n type: z.literal(\"function\"),\n function: z.object({\n name: z.string(),\n arguments: z.string(),\n }),\n }),\n )\n .optional(),\n tool_call_id: z.string().optional(),\n});\n\nexport type ChatMessage = z.infer<typeof ChatMessageSchema>;\n\nexport const ChatCompletionRequestSchema = z.object({\n model: z.string(),\n messages: z.array(ChatMessageSchema),\n temperature: z.number().min(0).max(2).optional(),\n top_p: z.number().min(0).max(1).optional(),\n n: z.number().int().min(1).max(10).optional(),\n stream: z.boolean().optional(),\n stop: z.union([z.string(), z.array(z.string())]).optional(),\n max_tokens: z.number().int().positive().optional(),\n max_completion_tokens: z.number().int().positive().optional(),\n presence_penalty: z.number().min(-2).max(2).optional(),\n frequency_penalty: z.number().min(-2).max(2).optional(),\n logit_bias: z.record(z.number()).optional(),\n user: z.string().optional(),\n tools: z\n .array(\n z.object({\n type: z.literal(\"function\"),\n function: z.object({\n name: z.string(),\n description: z.string().optional(),\n parameters: z.record(z.unknown()).optional(),\n }),\n }),\n )\n 
.optional(),\n tool_choice: z\n .union([\n z.literal(\"none\"),\n z.literal(\"auto\"),\n z.literal(\"required\"),\n z.object({\n type: z.literal(\"function\"),\n function: z.object({ name: z.string() }),\n }),\n ])\n .optional(),\n response_format: z\n .object({\n type: z.enum([\"text\", \"json_object\"]),\n })\n .optional(),\n seed: z.number().int().optional(),\n});\n\nexport type ChatCompletionRequest = z.infer<typeof ChatCompletionRequestSchema>;\n\n// ============================================\n// RESPONSE SCHEMAS (OpenAI-compatible)\n// ============================================\n\nexport const ChatCompletionChoiceSchema = z.object({\n index: z.number(),\n message: z.object({\n role: z.literal(\"assistant\"),\n content: z.string().nullable(),\n tool_calls: z\n .array(\n z.object({\n id: z.string(),\n type: z.literal(\"function\"),\n function: z.object({\n name: z.string(),\n arguments: z.string(),\n }),\n }),\n )\n .optional(),\n }),\n finish_reason: z.string().nullable(),\n});\n\nexport type ChatCompletionChoice = z.infer<typeof ChatCompletionChoiceSchema>;\n\nexport const UsageSchema = z.object({\n prompt_tokens: z.number(),\n completion_tokens: z.number(),\n total_tokens: z.number(),\n});\n\nexport type Usage = z.infer<typeof UsageSchema>;\n\nexport const ChatCompletionResponseSchema = z.object({\n id: z.string(),\n object: z.literal(\"chat.completion\"),\n created: z.number(),\n model: z.string(),\n choices: z.array(ChatCompletionChoiceSchema),\n usage: UsageSchema.optional(),\n});\n\nexport type ChatCompletionResponse = z.infer<\n typeof ChatCompletionResponseSchema\n>;\n\n// ============================================\n// STREAMING RESPONSE SCHEMAS\n// ============================================\n\nexport const ChatCompletionChunkSchema = z.object({\n id: z.string(),\n object: z.literal(\"chat.completion.chunk\"),\n created: z.number(),\n model: z.string(),\n choices: z.array(\n z.object({\n index: z.number(),\n delta: z.object({\n role: 
z.string().optional(),\n content: z.string().optional(),\n tool_calls: z\n .array(\n z.object({\n index: z.number(),\n id: z.string().optional(),\n type: z.literal(\"function\").optional(),\n function: z\n .object({\n name: z.string().optional(),\n arguments: z.string().optional(),\n })\n .optional(),\n }),\n )\n .optional(),\n }),\n finish_reason: z.string().nullable(),\n }),\n ),\n});\n\nexport type ChatCompletionChunk = z.infer<typeof ChatCompletionChunkSchema>;\n\n// ============================================\n// PLUGIN CONSTANTS\n// ============================================\n\nexport const PLUGIN_ID = \"llm:groq\" as const;\nexport const RESOURCE_TYPE = \"llm\" as const;\nexport const PROVIDER = \"groq\" as const;\nexport const VERSION = \"1.0.0\";\n\n/** Default allowed models */\nexport const DEFAULT_GROQ_MODELS = [\n \"llama-3.3-70b-versatile\",\n \"llama-3.1-70b-versatile\",\n \"llama-3.1-8b-instant\",\n \"llama3-70b-8192\",\n \"llama3-8b-8192\",\n \"mixtral-8x7b-32768\",\n \"gemma2-9b-it\",\n] as const;\n\n/** Supported actions */\nexport const ACTIONS = [\"chat.completions\"] as const;\nexport type GroqAction = (typeof ACTIONS)[number];\n\n/** Enforcement knobs */\nexport const ENFORCEMENT_SUPPORT = [\n \"model\",\n \"max_tokens\",\n \"streaming\",\n] as 
const;\n"],"mappings":";AAKA,SAAS,SAAS;AAMX,IAAM,oBAAoB,EAAE,OAAO;AAAA,EACxC,MAAM,EAAE,KAAK,CAAC,UAAU,QAAQ,aAAa,MAAM,CAAC;AAAA,EACpD,SAAS,EACN,MAAM;AAAA,IACL,EAAE,OAAO;AAAA,IACT,EAAE;AAAA,MACA,EAAE,OAAO;AAAA,QACP,MAAM,EAAE,OAAO;AAAA,QACf,MAAM,EAAE,OAAO,EAAE,SAAS;AAAA,QAC1B,WAAW,EACR,OAAO;AAAA,UACN,KAAK,EAAE,OAAO;AAAA,UACd,QAAQ,EAAE,OAAO,EAAE,SAAS;AAAA,QAC9B,CAAC,EACA,SAAS;AAAA,MACd,CAAC;AAAA,IACH;AAAA,EACF,CAAC,EACA,SAAS;AAAA,EACZ,MAAM,EAAE,OAAO,EAAE,SAAS;AAAA,EAC1B,YAAY,EACT;AAAA,IACC,EAAE,OAAO;AAAA,MACP,IAAI,EAAE,OAAO;AAAA,MACb,MAAM,EAAE,QAAQ,UAAU;AAAA,MAC1B,UAAU,EAAE,OAAO;AAAA,QACjB,MAAM,EAAE,OAAO;AAAA,QACf,WAAW,EAAE,OAAO;AAAA,MACtB,CAAC;AAAA,IACH,CAAC;AAAA,EACH,EACC,SAAS;AAAA,EACZ,cAAc,EAAE,OAAO,EAAE,SAAS;AACpC,CAAC;AAIM,IAAM,8BAA8B,EAAE,OAAO;AAAA,EAClD,OAAO,EAAE,OAAO;AAAA,EAChB,UAAU,EAAE,MAAM,iBAAiB;AAAA,EACnC,aAAa,EAAE,OAAO,EAAE,IAAI,CAAC,EAAE,IAAI,CAAC,EAAE,SAAS;AAAA,EAC/C,OAAO,EAAE,OAAO,EAAE,IAAI,CAAC,EAAE,IAAI,CAAC,EAAE,SAAS;AAAA,EACzC,GAAG,EAAE,OAAO,EAAE,IAAI,EAAE,IAAI,CAAC,EAAE,IAAI,EAAE,EAAE,SAAS;AAAA,EAC5C,QAAQ,EAAE,QAAQ,EAAE,SAAS;AAAA,EAC7B,MAAM,EAAE,MAAM,CAAC,EAAE,OAAO,GAAG,EAAE,MAAM,EAAE,OAAO,CAAC,CAAC,CAAC,EAAE,SAAS;AAAA,EAC1D,YAAY,EAAE,OAAO,EAAE,IAAI,EAAE,SAAS,EAAE,SAAS;AAAA,EACjD,uBAAuB,EAAE,OAAO,EAAE,IAAI,EAAE,SAAS,EAAE,SAAS;AAAA,EAC5D,kBAAkB,EAAE,OAAO,EAAE,IAAI,EAAE,EAAE,IAAI,CAAC,EAAE,SAAS;AAAA,EACrD,mBAAmB,EAAE,OAAO,EAAE,IAAI,EAAE,EAAE,IAAI,CAAC,EAAE,SAAS;AAAA,EACtD,YAAY,EAAE,OAAO,EAAE,OAAO,CAAC,EAAE,SAAS;AAAA,EAC1C,MAAM,EAAE,OAAO,EAAE,SAAS;AAAA,EAC1B,OAAO,EACJ;AAAA,IACC,EAAE,OAAO;AAAA,MACP,MAAM,EAAE,QAAQ,UAAU;AAAA,MAC1B,UAAU,EAAE,OAAO;AAAA,QACjB,MAAM,EAAE,OAAO;AAAA,QACf,aAAa,EAAE,OAAO,EAAE,SAAS;AAAA,QACjC,YAAY,EAAE,OAAO,EAAE,QAAQ,CAAC,EAAE,SAAS;AAAA,MAC7C,CAAC;AAAA,IACH,CAAC;AAAA,EACH,EACC,SAAS;AAAA,EACZ,aAAa,EACV,MAAM;AAAA,IACL,EAAE,QAAQ,MAAM;AAAA,IAChB,EAAE,QAAQ,MAAM;AAAA,IAChB,EAAE,QAAQ,UAAU;AAAA,IACpB,EAAE,OAAO;AAAA,MACP,MAAM,EAAE,QAAQ,UAAU;AAAA,MAC1B,UAAU,EAAE,OAAO,EAAE,MAAM,EAAE,OAAO,EAAE,CAAC;AAAA,IACzC,CAAC;AAAA,EACH,CAAC,EACA,SAAS;AA
AA,EACZ,iBAAiB,EACd,OAAO;AAAA,IACN,MAAM,EAAE,KAAK,CAAC,QAAQ,aAAa,CAAC;AAAA,EACtC,CAAC,EACA,SAAS;AAAA,EACZ,MAAM,EAAE,OAAO,EAAE,IAAI,EAAE,SAAS;AAClC,CAAC;AAQM,IAAM,6BAA6B,EAAE,OAAO;AAAA,EACjD,OAAO,EAAE,OAAO;AAAA,EAChB,SAAS,EAAE,OAAO;AAAA,IAChB,MAAM,EAAE,QAAQ,WAAW;AAAA,IAC3B,SAAS,EAAE,OAAO,EAAE,SAAS;AAAA,IAC7B,YAAY,EACT;AAAA,MACC,EAAE,OAAO;AAAA,QACP,IAAI,EAAE,OAAO;AAAA,QACb,MAAM,EAAE,QAAQ,UAAU;AAAA,QAC1B,UAAU,EAAE,OAAO;AAAA,UACjB,MAAM,EAAE,OAAO;AAAA,UACf,WAAW,EAAE,OAAO;AAAA,QACtB,CAAC;AAAA,MACH,CAAC;AAAA,IACH,EACC,SAAS;AAAA,EACd,CAAC;AAAA,EACD,eAAe,EAAE,OAAO,EAAE,SAAS;AACrC,CAAC;AAIM,IAAM,cAAc,EAAE,OAAO;AAAA,EAClC,eAAe,EAAE,OAAO;AAAA,EACxB,mBAAmB,EAAE,OAAO;AAAA,EAC5B,cAAc,EAAE,OAAO;AACzB,CAAC;AAIM,IAAM,+BAA+B,EAAE,OAAO;AAAA,EACnD,IAAI,EAAE,OAAO;AAAA,EACb,QAAQ,EAAE,QAAQ,iBAAiB;AAAA,EACnC,SAAS,EAAE,OAAO;AAAA,EAClB,OAAO,EAAE,OAAO;AAAA,EAChB,SAAS,EAAE,MAAM,0BAA0B;AAAA,EAC3C,OAAO,YAAY,SAAS;AAC9B,CAAC;AAUM,IAAM,4BAA4B,EAAE,OAAO;AAAA,EAChD,IAAI,EAAE,OAAO;AAAA,EACb,QAAQ,EAAE,QAAQ,uBAAuB;AAAA,EACzC,SAAS,EAAE,OAAO;AAAA,EAClB,OAAO,EAAE,OAAO;AAAA,EAChB,SAAS,EAAE;AAAA,IACT,EAAE,OAAO;AAAA,MACP,OAAO,EAAE,OAAO;AAAA,MAChB,OAAO,EAAE,OAAO;AAAA,QACd,MAAM,EAAE,OAAO,EAAE,SAAS;AAAA,QAC1B,SAAS,EAAE,OAAO,EAAE,SAAS;AAAA,QAC7B,YAAY,EACT;AAAA,UACC,EAAE,OAAO;AAAA,YACP,OAAO,EAAE,OAAO;AAAA,YAChB,IAAI,EAAE,OAAO,EAAE,SAAS;AAAA,YACxB,MAAM,EAAE,QAAQ,UAAU,EAAE,SAAS;AAAA,YACrC,UAAU,EACP,OAAO;AAAA,cACN,MAAM,EAAE,OAAO,EAAE,SAAS;AAAA,cAC1B,WAAW,EAAE,OAAO,EAAE,SAAS;AAAA,YACjC,CAAC,EACA,SAAS;AAAA,UACd,CAAC;AAAA,QACH,EACC,SAAS;AAAA,MACd,CAAC;AAAA,MACD,eAAe,EAAE,OAAO,EAAE,SAAS;AAAA,IACrC,CAAC;AAAA,EACH;AACF,CAAC;AAQM,IAAM,YAAY;AAClB,IAAM,gBAAgB;AACtB,IAAM,WAAW;AACjB,IAAM,UAAU;AAGhB,IAAM,sBAAsB;AAAA,EACjC;AAAA,EACA;AAAA,EACA;AAAA,EACA;AAAA,EACA;AAAA,EACA;AAAA,EACA;AACF;AAGO,IAAM,UAAU,CAAC,kBAAkB;AAInC,IAAM,sBAAsB;AAAA,EACjC;AAAA,EACA;AAAA,EACA;AACF;","names":[]}
|
|
@@ -0,0 +1,105 @@
|
|
|
1
|
+
import { GatewayRequestOptions, GatewayResponse, GatewayStreamResponse, GatewayTransport } from '@glueco/sdk';
|
|
2
|
+
import { ChatCompletionRequest, ChatCompletionResponse } from './contracts.mjs';
|
|
3
|
+
export { ACTIONS, ChatCompletionChoice, ChatCompletionChoiceSchema, ChatCompletionChunk, ChatCompletionChunkSchema, ChatCompletionRequestSchema, ChatCompletionResponseSchema, ChatMessage, ChatMessageSchema, DEFAULT_GROQ_MODELS, ENFORCEMENT_SUPPORT, GroqAction, PLUGIN_ID, PROVIDER, RESOURCE_TYPE, Usage, UsageSchema, VERSION } from './contracts.mjs';
|
|
4
|
+
import 'zod';
|
|
5
|
+
|
|
6
|
+
/**
|
|
7
|
+
* Options for chat completion requests.
|
|
8
|
+
*/
|
|
9
|
+
interface ChatCompletionOptions extends Omit<GatewayRequestOptions, "stream" | "method"> {
|
|
10
|
+
/**
|
|
11
|
+
* Override for custom behavior (advanced usage).
|
|
12
|
+
*/
|
|
13
|
+
raw?: boolean;
|
|
14
|
+
}
|
|
15
|
+
/**
|
|
16
|
+
* Groq client interface.
|
|
17
|
+
* Provides typed methods for all supported actions.
|
|
18
|
+
*/
|
|
19
|
+
interface GroqClient {
|
|
20
|
+
/**
|
|
21
|
+
* Create a chat completion.
|
|
22
|
+
*
|
|
23
|
+
* @param request - Chat completion request (OpenAI-compatible format)
|
|
24
|
+
* @param options - Optional request options
|
|
25
|
+
* @returns Chat completion response
|
|
26
|
+
*
|
|
27
|
+
* @example
|
|
28
|
+
* ```ts
|
|
29
|
+
* const response = await groqClient.chatCompletions({
|
|
30
|
+
* model: "llama-3.3-70b-versatile",
|
|
31
|
+
* messages: [
|
|
32
|
+
* { role: "system", content: "You are a helpful assistant." },
|
|
33
|
+
* { role: "user", content: "What is the capital of France?" }
|
|
34
|
+
* ],
|
|
35
|
+
* temperature: 0.7,
|
|
36
|
+
* max_tokens: 1000
|
|
37
|
+
* });
|
|
38
|
+
*
|
|
39
|
+
* console.log(response.data.choices[0].message.content);
|
|
40
|
+
* ```
|
|
41
|
+
*/
|
|
42
|
+
chatCompletions(request: ChatCompletionRequest, options?: ChatCompletionOptions): Promise<GatewayResponse<ChatCompletionResponse>>;
|
|
43
|
+
/**
|
|
44
|
+
* Create a streaming chat completion.
|
|
45
|
+
*
|
|
46
|
+
* @param request - Chat completion request (stream flag will be set automatically)
|
|
47
|
+
* @param options - Optional request options
|
|
48
|
+
* @returns Streaming response with SSE stream
|
|
49
|
+
*
|
|
50
|
+
* @example
|
|
51
|
+
* ```ts
|
|
52
|
+
* const response = await groqClient.chatCompletionsStream({
|
|
53
|
+
* model: "llama-3.3-70b-versatile",
|
|
54
|
+
* messages: [{ role: "user", content: "Tell me a story" }]
|
|
55
|
+
* });
|
|
56
|
+
*
|
|
57
|
+
* const reader = response.stream.getReader();
|
|
58
|
+
* const decoder = new TextDecoder();
|
|
59
|
+
*
|
|
60
|
+
* while (true) {
|
|
61
|
+
* const { done, value } = await reader.read();
|
|
62
|
+
* if (done) break;
|
|
63
|
+
* const chunk = decoder.decode(value, { stream: true });
|
|
64
|
+
* // Process SSE chunk
|
|
65
|
+
* }
|
|
66
|
+
* ```
|
|
67
|
+
*/
|
|
68
|
+
chatCompletionsStream(request: Omit<ChatCompletionRequest, "stream">, options?: ChatCompletionOptions): Promise<GatewayStreamResponse>;
|
|
69
|
+
/**
|
|
70
|
+
* Get the underlying transport for advanced usage.
|
|
71
|
+
* Useful when you need direct access to the gateway.
|
|
72
|
+
*/
|
|
73
|
+
readonly transport: GatewayTransport;
|
|
74
|
+
}
|
|
75
|
+
/**
|
|
76
|
+
* Create a typed Groq client.
|
|
77
|
+
*
|
|
78
|
+
* @param transport - Gateway transport from SDK
|
|
79
|
+
* @returns Typed Groq client
|
|
80
|
+
*
|
|
81
|
+
* @example
|
|
82
|
+
* ```ts
|
|
83
|
+
* import { groq } from "@glueco/plugin-llm-groq/client";
|
|
84
|
+
* import { GatewayClient } from "@glueco/sdk";
|
|
85
|
+
*
|
|
86
|
+
* // Setup
|
|
87
|
+
* const gatewayClient = new GatewayClient({
|
|
88
|
+
* keyStorage: new FileKeyStorage('./.gateway/keys.json'),
|
|
89
|
+
* configStorage: new FileConfigStorage('./.gateway/config.json'),
|
|
90
|
+
* });
|
|
91
|
+
*
|
|
92
|
+
* // Get transport and create typed client
|
|
93
|
+
* const transport = await gatewayClient.getTransport();
|
|
94
|
+
* const groqClient = groq(transport);
|
|
95
|
+
*
|
|
96
|
+
* // Use with full type safety
|
|
97
|
+
* const response = await groqClient.chatCompletions({
|
|
98
|
+
* model: "llama-3.3-70b-versatile",
|
|
99
|
+
* messages: [{ role: "user", content: "Hello!" }]
|
|
100
|
+
* });
|
|
101
|
+
* ```
|
|
102
|
+
*/
|
|
103
|
+
declare function groq(transport: GatewayTransport): GroqClient;
|
|
104
|
+
|
|
105
|
+
export { type ChatCompletionOptions, ChatCompletionRequest, ChatCompletionResponse, type GroqClient, groq as default, groq };
|
package/dist/client.d.ts
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
1
|
+
import { GatewayRequestOptions, GatewayResponse, GatewayStreamResponse, GatewayTransport } from '@glueco/sdk';
|
|
2
|
+
import { ChatCompletionRequest, ChatCompletionResponse } from './contracts.js';
|
|
3
|
+
export { ACTIONS, ChatCompletionChoice, ChatCompletionChoiceSchema, ChatCompletionChunk, ChatCompletionChunkSchema, ChatCompletionRequestSchema, ChatCompletionResponseSchema, ChatMessage, ChatMessageSchema, DEFAULT_GROQ_MODELS, ENFORCEMENT_SUPPORT, GroqAction, PLUGIN_ID, PROVIDER, RESOURCE_TYPE, Usage, UsageSchema, VERSION } from './contracts.js';
|
|
4
|
+
import 'zod';
|
|
5
|
+
|
|
6
|
+
/**
|
|
7
|
+
* Options for chat completion requests.
|
|
8
|
+
*/
|
|
9
|
+
interface ChatCompletionOptions extends Omit<GatewayRequestOptions, "stream" | "method"> {
|
|
10
|
+
/**
|
|
11
|
+
* Override for custom behavior (advanced usage).
|
|
12
|
+
*/
|
|
13
|
+
raw?: boolean;
|
|
14
|
+
}
|
|
15
|
+
/**
|
|
16
|
+
* Groq client interface.
|
|
17
|
+
* Provides typed methods for all supported actions.
|
|
18
|
+
*/
|
|
19
|
+
interface GroqClient {
|
|
20
|
+
/**
|
|
21
|
+
* Create a chat completion.
|
|
22
|
+
*
|
|
23
|
+
* @param request - Chat completion request (OpenAI-compatible format)
|
|
24
|
+
* @param options - Optional request options
|
|
25
|
+
* @returns Chat completion response
|
|
26
|
+
*
|
|
27
|
+
* @example
|
|
28
|
+
* ```ts
|
|
29
|
+
* const response = await groqClient.chatCompletions({
|
|
30
|
+
* model: "llama-3.3-70b-versatile",
|
|
31
|
+
* messages: [
|
|
32
|
+
* { role: "system", content: "You are a helpful assistant." },
|
|
33
|
+
* { role: "user", content: "What is the capital of France?" }
|
|
34
|
+
* ],
|
|
35
|
+
* temperature: 0.7,
|
|
36
|
+
* max_tokens: 1000
|
|
37
|
+
* });
|
|
38
|
+
*
|
|
39
|
+
* console.log(response.data.choices[0].message.content);
|
|
40
|
+
* ```
|
|
41
|
+
*/
|
|
42
|
+
chatCompletions(request: ChatCompletionRequest, options?: ChatCompletionOptions): Promise<GatewayResponse<ChatCompletionResponse>>;
|
|
43
|
+
/**
|
|
44
|
+
* Create a streaming chat completion.
|
|
45
|
+
*
|
|
46
|
+
* @param request - Chat completion request (stream flag will be set automatically)
|
|
47
|
+
* @param options - Optional request options
|
|
48
|
+
* @returns Streaming response with SSE stream
|
|
49
|
+
*
|
|
50
|
+
* @example
|
|
51
|
+
* ```ts
|
|
52
|
+
* const response = await groqClient.chatCompletionsStream({
|
|
53
|
+
* model: "llama-3.3-70b-versatile",
|
|
54
|
+
* messages: [{ role: "user", content: "Tell me a story" }]
|
|
55
|
+
* });
|
|
56
|
+
*
|
|
57
|
+
* const reader = response.stream.getReader();
|
|
58
|
+
* const decoder = new TextDecoder();
|
|
59
|
+
*
|
|
60
|
+
* while (true) {
|
|
61
|
+
* const { done, value } = await reader.read();
|
|
62
|
+
* if (done) break;
|
|
63
|
+
* const chunk = decoder.decode(value, { stream: true });
|
|
64
|
+
* // Process SSE chunk
|
|
65
|
+
* }
|
|
66
|
+
* ```
|
|
67
|
+
*/
|
|
68
|
+
chatCompletionsStream(request: Omit<ChatCompletionRequest, "stream">, options?: ChatCompletionOptions): Promise<GatewayStreamResponse>;
|
|
69
|
+
/**
|
|
70
|
+
* Get the underlying transport for advanced usage.
|
|
71
|
+
* Useful when you need direct access to the gateway.
|
|
72
|
+
*/
|
|
73
|
+
readonly transport: GatewayTransport;
|
|
74
|
+
}
|
|
75
|
+
/**
|
|
76
|
+
* Create a typed Groq client.
|
|
77
|
+
*
|
|
78
|
+
* @param transport - Gateway transport from SDK
|
|
79
|
+
* @returns Typed Groq client
|
|
80
|
+
*
|
|
81
|
+
* @example
|
|
82
|
+
* ```ts
|
|
83
|
+
* import { groq } from "@glueco/plugin-llm-groq/client";
|
|
84
|
+
* import { GatewayClient } from "@glueco/sdk";
|
|
85
|
+
*
|
|
86
|
+
* // Setup
|
|
87
|
+
* const gatewayClient = new GatewayClient({
|
|
88
|
+
* keyStorage: new FileKeyStorage('./.gateway/keys.json'),
|
|
89
|
+
* configStorage: new FileConfigStorage('./.gateway/config.json'),
|
|
90
|
+
* });
|
|
91
|
+
*
|
|
92
|
+
* // Get transport and create typed client
|
|
93
|
+
* const transport = await gatewayClient.getTransport();
|
|
94
|
+
* const groqClient = groq(transport);
|
|
95
|
+
*
|
|
96
|
+
* // Use with full type safety
|
|
97
|
+
* const response = await groqClient.chatCompletions({
|
|
98
|
+
* model: "llama-3.3-70b-versatile",
|
|
99
|
+
* messages: [{ role: "user", content: "Hello!" }]
|
|
100
|
+
* });
|
|
101
|
+
* ```
|
|
102
|
+
*/
|
|
103
|
+
declare function groq(transport: GatewayTransport): GroqClient;
|
|
104
|
+
|
|
105
|
+
export { type ChatCompletionOptions, ChatCompletionRequest, ChatCompletionResponse, type GroqClient, groq as default, groq };
|