glm-mcp-claude 1.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.mcp.json.example +14 -0
- package/LICENSE +21 -0
- package/README.md +220 -0
- package/agents/glm.md +45 -0
- package/assets/demo-glm-agent-umbrella.png +0 -0
- package/assets/demo-glm-subagent-summary.png +0 -0
- package/docs/AUTOSELECT.md +58 -0
- package/docs/RULES.md +105 -0
- package/docs/research/glm-capabilities.md +241 -0
- package/docs/research/glm-failure-modes-routing.md +287 -0
- package/docs/research/glm-misc-and-integration.md +180 -0
- package/docs/research/glm-peak-usage-and-cost.md +146 -0
- package/docs/research/glm-vs-opus-scenario-matrix.md +85 -0
- package/docs/research/glm-vs-opus-toolcalling.md +134 -0
- package/glm-mcp/.env.example +32 -0
- package/glm-mcp/package-lock.json +1180 -0
- package/glm-mcp/package.json +21 -0
- package/glm-mcp/src/glmAgent.js +227 -0
- package/glm-mcp/src/glmClient.js +136 -0
- package/glm-mcp/src/index.js +306 -0
- package/glm-mcp/src/loadEnv.js +24 -0
- package/glm-mcp/src/router.js +291 -0
- package/glm-mcp/src/smoke.js +42 -0
- package/hooks/glm_subagent_router.mjs +206 -0
- package/install.mjs +132 -0
- package/package.json +47 -0
- package/uninstall.mjs +47 -0
|
@@ -0,0 +1,32 @@
|
|
|
1
|
+
# Copy to .env and fill in. .env is git-ignored.
|
|
2
|
+
|
|
3
|
+
# Your GLM (Zhipu / Z.ai) API key. Used as a Bearer token.
|
|
4
|
+
GLM_API_KEY=your-zai-key-here
|
|
5
|
+
|
|
6
|
+
# Anthropic-compatible endpoint for the GLM coding plan.
|
|
7
|
+
GLM_BASE_URL=https://api.z.ai/api/anthropic
|
|
8
|
+
|
|
9
|
+
# --- optional tuning (sensible defaults baked in) ---
|
|
10
|
+
# GLM_COST_BIAS=1.5 # how hard to favor GLM for cost (~10x cheaper). Higher = more GLM; 0 = ignore price
|
|
11
|
+
# GLM_MAX_CONCURRENT=1 # GLM caps in-flight requests at ~1; keep at 1 unless your tier allows more
|
|
12
|
+
# --- output token cap (OFF by default = generous) ---
|
|
13
|
+
# By default the cap is OFF: every call may use up to GLM_MAX_TOKENS_CEILING output tokens (131072 by default).
|
|
14
|
+
# max_tokens is a ceiling, not a target -- you pay for ACTUAL output, so leaving it off
|
|
15
|
+
# just prevents truncation. Turn the cap ON to control spend.
|
|
16
|
+
# GLM_CAP=off # off (default) | on -- enforce GLM_MAX_TOKENS when on
|
|
17
|
+
# GLM_MAX_TOKENS=32768 # the hard per-call limit applied WHEN GLM_CAP=on
|
|
18
|
+
# GLM_MAX_TOKENS_CEILING=131072 # the generous default used when the cap is OFF
|
|
19
|
+
# GLM_MAX_RETRIES=4
|
|
20
|
+
# GLM_TIMEOUT_MS=300000
|
|
21
|
+
# GLM_AGENT_MAX_ITERS=30 # max tool-loop turns for glm_agent before it stops
|
|
22
|
+
# GLM_AGENT_BASH_TIMEOUT_MS=120000 # per-command timeout for glm_agent's run_bash
|
|
23
|
+
# GLM_OFFPEAK_MODEL=glm-5.2 # model(s) for "auto" off-peak. Can be a COMMA LIST, e.g.
|
|
24
|
+
# # "glm-5.2,glm-5-turbo" -> the router auto-picks (most capable for
|
|
25
|
+
# # hard tasks, cheapest for easy ones).
|
|
26
|
+
# GLM_PEAK_MODEL=glm-5.2 # model(s) for "auto" during peak. glm-5.x carries a ~3x peak-time surcharge,
|
|
27
|
+
# # so when "auto" lands on a glm-5.x model the router routes LESS to GLM
|
|
28
|
+
# # at peak. Include a no-surcharge model (e.g. "glm-5.2,glm-4.7") and
|
|
29
|
+
# # the router will prefer it at peak -> GLM stays fine to use.
|
|
30
|
+
# GLM_CHEAP_MODEL=glm-4.5-air
|
|
31
|
+
# GLM_PEAK_START_CN=14 # peak window start (inclusive), hour of day in China time (UTC+8)
|
|
32
|
+
# GLM_PEAK_END_CN=18 # peak window end (exclusive)
|