@kaitranntt/ccs 3.2.0 → 3.4.0

@@ -0,0 +1,684 @@
+ #!/usr/bin/env node
+ 'use strict';
+
+ const crypto = require('crypto');
+ const fs = require('fs');
+ const path = require('path');
+ const os = require('os');
+ const SSEParser = require('./sse-parser');
+ const DeltaAccumulator = require('./delta-accumulator');
+
+ /**
+  * GlmtTransformer - Converts between Anthropic and OpenAI formats with thinking support
+  *
+  * Features:
+  * - Request: Anthropic → OpenAI (inject reasoning params)
+  * - Response: OpenAI reasoning_content → Anthropic thinking blocks
+  * - Debug mode: Log raw data to ~/.ccs/logs/ (CCS_DEBUG_LOG=1)
+  * - Verbose mode: Console logging with timestamps
+  * - Validation: Self-test transformation results
+  *
+  * Usage:
+  *   const transformer = new GlmtTransformer({ verbose: true, debugLog: true });
+  *   const { openaiRequest, thinkingConfig } = transformer.transformRequest(req);
+  *   const anthropicResponse = transformer.transformResponse(resp, thinkingConfig);
+  *
+  * Control Tags (in user prompt):
+  *   <Thinking:On|Off>        - Enable/disable reasoning
+  *   <Effort:Low|Medium|High> - Control reasoning depth
+  */
+ class GlmtTransformer {
+   constructor(config = {}) {
+     this.defaultThinking = config.defaultThinking ?? true;
+     this.verbose = config.verbose || false;
+     this.debugLog = config.debugLog ?? process.env.CCS_DEBUG_LOG === '1';
+     this.debugLogDir = config.debugLogDir || path.join(os.homedir(), '.ccs', 'logs');
+     this.modelMaxTokens = {
+       'GLM-4.6': 128000,
+       'GLM-4.5': 96000,
+       'GLM-4.5-air': 16000
+     };
+   }
+
+   /**
+    * Transform an Anthropic request to OpenAI format
+    * @param {Object} anthropicRequest - Anthropic Messages API request
+    * @returns {Object} { openaiRequest, thinkingConfig }
+    */
+   transformRequest(anthropicRequest) {
+     // Log original request
+     this._writeDebugLog('request-anthropic', anthropicRequest);
+
+     try {
+       // 1. Extract thinking control from messages
+       const thinkingConfig = this._extractThinkingControl(
+         anthropicRequest.messages || []
+       );
+       this.log(`Extracted thinking control: ${JSON.stringify(thinkingConfig)}`);
+
+       // 2. Map model
+       const glmModel = this._mapModel(anthropicRequest.model);
+
+       // 3. Convert to OpenAI format (stream defaults to false when absent)
+       const openaiRequest = {
+         model: glmModel,
+         messages: this._sanitizeMessages(anthropicRequest.messages || []),
+         max_tokens: this._getMaxTokens(glmModel),
+         stream: anthropicRequest.stream ?? false
+       };
+
+       // 4. Preserve optional parameters
+       if (anthropicRequest.temperature !== undefined) {
+         openaiRequest.temperature = anthropicRequest.temperature;
+       }
+       if (anthropicRequest.top_p !== undefined) {
+         openaiRequest.top_p = anthropicRequest.top_p;
+       }
+
+       // 5. Inject reasoning parameters
+       this._injectReasoningParams(openaiRequest, thinkingConfig);
+
+       // Log transformed request
+       this._writeDebugLog('request-openai', openaiRequest);
+
+       return { openaiRequest, thinkingConfig };
+     } catch (error) {
+       console.error('[glmt-transformer] Request transformation error:', error);
+       // Fall back to the original request with a warning attached
+       return {
+         openaiRequest: anthropicRequest,
+         thinkingConfig: { thinking: false },
+         error: error.message
+       };
+     }
+   }
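+
+   // Illustrative sketch (not from the package source; input is hypothetical):
+   // with the default config, a request carrying an <Effort:High> tag maps
+   // roughly to:
+   //
+   //   transformer.transformRequest({
+   //     model: 'claude-sonnet-4',   // ignored; _mapModel() always picks GLM-4.6
+   //     stream: true,
+   //     messages: [{ role: 'user', content: 'Refactor this <Effort:High>' }]
+   //   })
+   //   // → openaiRequest: { model: 'GLM-4.6', max_tokens: 128000, stream: true,
+   //   //     do_sample: true, reasoning: true, reasoning_effort: 'high', ... }
+   //   // → thinkingConfig: { thinking: true, effort: 'high' }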
+
+   /**
+    * Transform an OpenAI response to Anthropic format
+    * @param {Object} openaiResponse - OpenAI Chat Completions response
+    * @param {Object} thinkingConfig - Config from request transformation
+    * @returns {Object} Anthropic Messages API response
+    */
+   transformResponse(openaiResponse, thinkingConfig = {}) {
+     // Log original response
+     this._writeDebugLog('response-openai', openaiResponse);
+
+     try {
+       const choice = openaiResponse.choices?.[0];
+       if (!choice) {
+         throw new Error('No choices in OpenAI response');
+       }
+
+       const message = choice.message;
+       const content = [];
+
+       // Add a thinking block if reasoning_content exists
+       if (message.reasoning_content) {
+         const length = message.reasoning_content.length;
+         const lineCount = message.reasoning_content.split('\n').length;
+         const preview = message.reasoning_content
+           .substring(0, 100)
+           .replace(/\n/g, ' ')
+           .trim();
+
+         this.log('Detected reasoning_content:');
+         this.log(`  Length: ${length} characters`);
+         this.log(`  Lines: ${lineCount}`);
+         this.log(`  Preview: ${preview}...`);
+
+         content.push({
+           type: 'thinking',
+           thinking: message.reasoning_content,
+           signature: this._generateThinkingSignature(message.reasoning_content)
+         });
+       } else {
+         this.log('No reasoning_content in OpenAI response');
+         this.log('Note: this is expected when thinking was not requested or the model does not emit reasoning');
+       }
+
+       // Add text content
+       if (message.content) {
+         content.push({
+           type: 'text',
+           text: message.content
+         });
+       }
+
+       // Handle tool_calls if present
+       if (message.tool_calls && message.tool_calls.length > 0) {
+         message.tool_calls.forEach(toolCall => {
+           content.push({
+             type: 'tool_use',
+             id: toolCall.id,
+             name: toolCall.function.name,
+             input: JSON.parse(toolCall.function.arguments || '{}')
+           });
+         });
+       }
+
+       const anthropicResponse = {
+         id: openaiResponse.id || 'msg_' + Date.now(),
+         type: 'message',
+         role: 'assistant',
+         content: content,
+         model: openaiResponse.model || 'glm-4.6',
+         stop_reason: this._mapStopReason(choice.finish_reason),
+         // Map OpenAI usage field names to their Anthropic equivalents
+         usage: {
+           input_tokens: openaiResponse.usage?.prompt_tokens ?? 0,
+           output_tokens: openaiResponse.usage?.completion_tokens ?? 0
+         }
+       };
+
+       // Validate transformation in verbose mode
+       if (this.verbose) {
+         const validation = this._validateTransformation(anthropicResponse);
+         this.log(`Transformation validation: ${validation.passed}/${validation.total} checks passed`);
+         if (!validation.valid) {
+           this.log(`Failed checks: ${JSON.stringify(validation.checks, null, 2)}`);
+         }
+       }
+
+       // Log transformed response
+       this._writeDebugLog('response-anthropic', anthropicResponse);
+
+       return anthropicResponse;
+     } catch (error) {
+       console.error('[glmt-transformer] Response transformation error:', error);
+       // Return a minimal valid response
+       return {
+         id: 'msg_error_' + Date.now(),
+         type: 'message',
+         role: 'assistant',
+         content: [{
+           type: 'text',
+           text: '[Transformation Error] ' + error.message
+         }],
+         stop_reason: 'end_turn',
+         usage: { input_tokens: 0, output_tokens: 0 }
+       };
+     }
+   }
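+
+   // Illustrative sketch (hypothetical response): a completion that carries
+   // reasoning_content becomes a thinking block followed by a text block:
+   //
+   //   transformer.transformResponse({
+   //     id: 'chatcmpl-abc',
+   //     model: 'glm-4.6',
+   //     choices: [{
+   //       finish_reason: 'stop',
+   //       message: { reasoning_content: 'Let me check...', content: 'Done.' }
+   //     }],
+   //     usage: { prompt_tokens: 12, completion_tokens: 34 }
+   //   })
+   //   // → { type: 'message', role: 'assistant', stop_reason: 'end_turn',
+   //   //     content: [{ type: 'thinking', ... }, { type: 'text', text: 'Done.' }],
+   //   //     usage: { input_tokens: 12, output_tokens: 34 } }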
+
+   /**
+    * Sanitize messages for OpenAI API compatibility:
+    * remove thinking blocks and other unsupported content types
+    * @param {Array} messages - Messages array
+    * @returns {Array} Sanitized messages
+    * @private
+    */
+   _sanitizeMessages(messages) {
+     return messages.map(msg => {
+       // If content is a string, return as-is
+       if (typeof msg.content === 'string') {
+         return msg;
+       }
+
+       // If content is an array, keep only text blocks
+       // (drops thinking, tool_use, tool_result, etc.)
+       if (Array.isArray(msg.content)) {
+         const sanitizedContent = msg.content.filter(block => block.type === 'text');
+
+         // If we filtered everything out, return an empty string
+         if (sanitizedContent.length === 0) {
+           return {
+             role: msg.role,
+             content: ''
+           };
+         }
+
+         // If only one text block remains, collapse it to a plain string
+         if (sanitizedContent.length === 1) {
+           return {
+             role: msg.role,
+             content: sanitizedContent[0].text
+           };
+         }
+
+         // Return array of text blocks
+         return {
+           role: msg.role,
+           content: sanitizedContent
+         };
+       }
+
+       // Fallback: return message as-is
+       return msg;
+     });
+   }
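+
+   // Illustrative sketch: mixed Anthropic content is reduced to plain text
+   // before being sent upstream, e.g.
+   //
+   //   _sanitizeMessages([{ role: 'assistant', content: [
+   //     { type: 'thinking', thinking: '...' },
+   //     { type: 'text', text: 'Answer' }
+   //   ] }])
+   //   // → [{ role: 'assistant', content: 'Answer' }]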
+
+   /**
+    * Extract thinking control tags from user messages
+    * @param {Array} messages - Messages array
+    * @returns {Object} { thinking: boolean, effort: string }
+    * @private
+    */
+   _extractThinkingControl(messages) {
+     const config = {
+       thinking: this.defaultThinking,
+       effort: 'medium'
+     };
+
+     // Scan user messages for control tags
+     for (const msg of messages) {
+       if (msg.role !== 'user') continue;
+
+       const content = msg.content;
+       if (typeof content !== 'string') continue;
+
+       // Check for <Thinking:On|Off>
+       const thinkingMatch = content.match(/<Thinking:(On|Off)>/i);
+       if (thinkingMatch) {
+         config.thinking = thinkingMatch[1].toLowerCase() === 'on';
+       }
+
+       // Check for <Effort:Low|Medium|High>
+       const effortMatch = content.match(/<Effort:(Low|Medium|High)>/i);
+       if (effortMatch) {
+         config.effort = effortMatch[1].toLowerCase();
+       }
+     }
+
+     return config;
+   }
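+
+   // Illustrative sketch: tags are matched case-insensitively, and the last
+   // user message containing a tag wins, e.g.
+   //
+   //   _extractThinkingControl([
+   //     { role: 'user', content: 'Plan this <thinking:on> <effort:low>' },
+   //     { role: 'user', content: 'Actually, go deep <Effort:High>' }
+   //   ])
+   //   // → { thinking: true, effort: 'high' }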
+
+   /**
+    * Generate a thinking signature for the Claude Code UI
+    * @param {string} thinking - Thinking content
+    * @returns {Object} Signature object
+    * @private
+    */
+   _generateThinkingSignature(thinking) {
+     // Hash the thinking content (first 16 hex chars of SHA-256)
+     const hash = crypto.createHash('sha256')
+       .update(thinking)
+       .digest('hex')
+       .substring(0, 16);
+
+     return {
+       type: 'thinking_signature',
+       hash: hash,
+       length: thinking.length,
+       timestamp: Date.now()
+     };
+   }
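+
+   // Illustrative sketch (values are placeholders):
+   //
+   //   _generateThinkingSignature('Let me check...')
+   //   // → { type: 'thinking_signature',
+   //   //     hash: '<first 16 hex chars of the SHA-256 digest>',
+   //   //     length: 15, timestamp: <Date.now() at call time> }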
+
+   /**
+    * Inject reasoning parameters into an OpenAI request
+    * @param {Object} openaiRequest - OpenAI request to modify
+    * @param {Object} thinkingConfig - Thinking configuration
+    * @returns {Object} Modified request
+    * @private
+    */
+   _injectReasoningParams(openaiRequest, thinkingConfig) {
+     // Always enable sampling so temperature/top_p take effect
+     openaiRequest.do_sample = true;
+
+     // Add thinking-specific parameters if enabled
+     if (thinkingConfig.thinking) {
+       // Z.AI may support these parameters (based on research)
+       openaiRequest.reasoning = true;
+       openaiRequest.reasoning_effort = thinkingConfig.effort;
+     }
+
+     return openaiRequest;
+   }
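+
+   // Illustrative sketch: with thinking enabled the request gains three fields;
+   // with it disabled, only do_sample is added, e.g.
+   //
+   //   _injectReasoningParams({ model: 'GLM-4.6' }, { thinking: true, effort: 'low' })
+   //   // → { model: 'GLM-4.6', do_sample: true, reasoning: true, reasoning_effort: 'low' }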
+
+   /**
+    * Map an Anthropic model to a GLM model
+    * @param {string} anthropicModel - Anthropic model name (currently unused)
+    * @returns {string} GLM model name
+    * @private
+    */
+   _mapModel(anthropicModel) {
+     // Always use GLM-4.6 (latest and most capable), regardless of input
+     return 'GLM-4.6';
+   }
+
+   /**
+    * Get max tokens for a model
+    * @param {string} model - Model name
+    * @returns {number} Max tokens
+    * @private
+    */
+   _getMaxTokens(model) {
+     return this.modelMaxTokens[model] || 128000;
+   }
+
+   /**
+    * Map an OpenAI finish_reason to an Anthropic stop_reason
+    * @param {string} openaiReason - OpenAI finish_reason
+    * @returns {string} Anthropic stop_reason
+    * @private
+    */
+   _mapStopReason(openaiReason) {
+     const mapping = {
+       'stop': 'end_turn',
+       'length': 'max_tokens',
+       'tool_calls': 'tool_use',
+       'content_filter': 'stop_sequence'
+     };
+     return mapping[openaiReason] || 'end_turn';
+   }
+
+   /**
+    * Write a debug log to file
+    * @param {string} type - 'request-anthropic', 'request-openai', 'response-openai', 'response-anthropic'
+    * @param {object} data - Data to log
+    * @private
+    */
+   _writeDebugLog(type, data) {
+     if (!this.debugLog) return;
+
+     try {
+       // Drop milliseconds, then replace colons for a filesystem-safe name,
+       // e.g. 2025-01-01T12-34-56-request-anthropic.json
+       const timestamp = new Date().toISOString().split('.')[0].replace(/:/g, '-');
+       const filename = `${timestamp}-${type}.json`;
+       const filepath = path.join(this.debugLogDir, filename);
+
+       // Ensure directory exists
+       fs.mkdirSync(this.debugLogDir, { recursive: true });
+
+       // Write file (pretty-printed)
+       fs.writeFileSync(filepath, JSON.stringify(data, null, 2) + '\n', 'utf8');
+
+       if (this.verbose) {
+         this.log(`Debug log written: ${filepath}`);
+       }
+     } catch (error) {
+       console.error(`[glmt-transformer] Failed to write debug log: ${error.message}`);
+     }
+   }
+
+   /**
+    * Validate a transformed Anthropic response
+    * @param {object} anthropicResponse - Response to validate
+    * @returns {object} Validation results
+    * @private
+    */
+   _validateTransformation(anthropicResponse) {
+     const checks = {
+       hasContent: Boolean(anthropicResponse.content && anthropicResponse.content.length > 0),
+       hasThinking: anthropicResponse.content?.some(block => block.type === 'thinking') || false,
+       hasText: anthropicResponse.content?.some(block => block.type === 'text') || false,
+       validStructure: anthropicResponse.type === 'message' && anthropicResponse.role === 'assistant',
+       hasUsage: Boolean(anthropicResponse.usage)
+     };
+
+     const passed = Object.values(checks).filter(Boolean).length;
+     const total = Object.keys(checks).length;
+
+     return { checks, passed, total, valid: passed === total };
+   }
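+
+   // Illustrative sketch: a text-only response passes 4 of 5 checks (hasThinking
+   // stays false when no thinking block was produced), so valid is false:
+   //
+   //   _validateTransformation({ type: 'message', role: 'assistant',
+   //     content: [{ type: 'text', text: 'Hi' }],
+   //     usage: { input_tokens: 1, output_tokens: 1 } })
+   //   // → { passed: 4, total: 5, valid: false, checks: { ..., hasThinking: false } }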
+
+   /**
+    * Transform an OpenAI streaming delta into Anthropic events
+    * @param {Object} openaiEvent - Parsed SSE event from Z.AI
+    * @param {DeltaAccumulator} accumulator - State accumulator
+    * @returns {Array<Object>} Array of Anthropic SSE events
+    */
+   transformDelta(openaiEvent, accumulator) {
+     const events = [];
+
+     // Handle [DONE] marker
+     if (openaiEvent.event === 'done') {
+       return this.finalizeDelta(accumulator);
+     }
+
+     const choice = openaiEvent.data?.choices?.[0];
+     if (!choice) return events;
+
+     const delta = choice.delta;
+     if (!delta) return events;
+
+     // Message start
+     if (!accumulator.messageStarted) {
+       if (openaiEvent.data.model) {
+         accumulator.model = openaiEvent.data.model;
+       }
+       events.push(this._createMessageStartEvent(accumulator));
+       accumulator.messageStarted = true;
+     }
+
+     // Role
+     if (delta.role) {
+       accumulator.role = delta.role;
+     }
+
+     // Reasoning content delta (Z.AI streams it incrementally - confirmed in Phase 02)
+     if (delta.reasoning_content) {
+       const currentBlock = accumulator.getCurrentBlock();
+
+       if (!currentBlock || currentBlock.type !== 'thinking') {
+         // Start a thinking block
+         const block = accumulator.startBlock('thinking');
+         events.push(this._createContentBlockStartEvent(block));
+       }
+
+       accumulator.addDelta(delta.reasoning_content);
+       events.push(this._createThinkingDeltaEvent(
+         accumulator.getCurrentBlock(),
+         delta.reasoning_content
+       ));
+     }
+
+     // Text content delta
+     if (delta.content) {
+       const currentBlock = accumulator.getCurrentBlock();
+
+       // Close the thinking block when transitioning from thinking to text
+       if (currentBlock && currentBlock.type === 'thinking' && !currentBlock.stopped) {
+         events.push(this._createSignatureDeltaEvent(currentBlock));
+         events.push(this._createContentBlockStopEvent(currentBlock));
+         accumulator.stopCurrentBlock();
+       }
+
+       if (!accumulator.getCurrentBlock() || accumulator.getCurrentBlock().type !== 'text') {
+         // Start a text block
+         const block = accumulator.startBlock('text');
+         events.push(this._createContentBlockStartEvent(block));
+       }
+
+       accumulator.addDelta(delta.content);
+       events.push(this._createTextDeltaEvent(
+         accumulator.getCurrentBlock(),
+         delta.content
+       ));
+     }
+
+     // Usage update (usually arrives in the final chunk)
+     if (openaiEvent.data.usage) {
+       accumulator.updateUsage(openaiEvent.data.usage);
+     }
+
+     // Finish reason
+     if (choice.finish_reason) {
+       accumulator.finishReason = choice.finish_reason;
+     }
+
+     return events;
+   }
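+
+   // Illustrative sketch (hypothetical chunk; `acc` is a fresh DeltaAccumulator):
+   // the first reasoning delta of a stream yields three events in order -
+   // message_start, content_block_start, and a thinking delta:
+   //
+   //   transformDelta({ data: { model: 'glm-4.6', choices: [{
+   //     delta: { role: 'assistant', reasoning_content: 'Hmm' } }] } }, acc)
+   //   // → [ { event: 'message_start', ... },
+   //   //     { event: 'content_block_start', ... },
+   //   //     { event: 'content_block_delta',
+   //   //       data: { delta: { type: 'thinking_delta', thinking: 'Hmm' }, ... } } ]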
+
+   /**
+    * Finalize streaming and generate closing events
+    * @param {DeltaAccumulator} accumulator - State accumulator
+    * @returns {Array<Object>} Final Anthropic SSE events
+    */
+   finalizeDelta(accumulator) {
+     if (accumulator.finalized) {
+       return []; // Already finalized
+     }
+
+     const events = [];
+
+     // Close the current content block, if any
+     const currentBlock = accumulator.getCurrentBlock();
+     if (currentBlock && !currentBlock.stopped) {
+       if (currentBlock.type === 'thinking') {
+         events.push(this._createSignatureDeltaEvent(currentBlock));
+       }
+       events.push(this._createContentBlockStopEvent(currentBlock));
+       accumulator.stopCurrentBlock();
+     }
+
+     // Message delta (stop reason + usage)
+     events.push({
+       event: 'message_delta',
+       data: {
+         type: 'message_delta',
+         delta: {
+           stop_reason: this._mapStopReason(accumulator.finishReason || 'stop')
+         },
+         usage: {
+           output_tokens: accumulator.outputTokens
+         }
+       }
+     });
+
+     // Message stop
+     events.push({
+       event: 'message_stop',
+       data: {
+         type: 'message_stop'
+       }
+     });
+
+     accumulator.finalized = true;
+     return events;
+   }
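+
+   // Illustrative sketch: on [DONE] after a text block, finalization emits the
+   // closing events in order:
+   //
+   //   finalizeDelta(acc)
+   //   // → [ { event: 'content_block_stop', ... },
+   //   //     { event: 'message_delta', data: { delta: { stop_reason: 'end_turn' },
+   //   //         usage: { output_tokens: ... } } },
+   //   //     { event: 'message_stop', ... } ]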
+
+   /**
+    * Create a message_start event
+    * @private
+    */
+   _createMessageStartEvent(accumulator) {
+     return {
+       event: 'message_start',
+       data: {
+         type: 'message_start',
+         message: {
+           id: accumulator.messageId,
+           type: 'message',
+           role: accumulator.role,
+           content: [],
+           model: accumulator.model || 'glm-4.6',
+           stop_reason: null,
+           usage: {
+             input_tokens: accumulator.inputTokens,
+             output_tokens: 0
+           }
+         }
+       }
+     };
+   }
+
+   /**
+    * Create a content_block_start event
+    * @private
+    */
+   _createContentBlockStartEvent(block) {
+     return {
+       event: 'content_block_start',
+       data: {
+         type: 'content_block_start',
+         index: block.index,
+         content_block: {
+           type: block.type,
+           [block.type]: ''
+         }
+       }
+     };
+   }
+
+   /**
+    * Create a thinking_delta event
+    * @private
+    */
+   _createThinkingDeltaEvent(block, delta) {
+     return {
+       event: 'content_block_delta',
+       data: {
+         type: 'content_block_delta',
+         index: block.index,
+         delta: {
+           type: 'thinking_delta',
+           thinking: delta
+         }
+       }
+     };
+   }
+
+   /**
+    * Create a text_delta event
+    * @private
+    */
+   _createTextDeltaEvent(block, delta) {
+     return {
+       event: 'content_block_delta',
+       data: {
+         type: 'content_block_delta',
+         index: block.index,
+         delta: {
+           type: 'text_delta',
+           text: delta
+         }
+       }
+     };
+   }
+
+   /**
+    * Create a signature_delta event
+    * @private
+    */
+   _createSignatureDeltaEvent(block) {
+     const signature = this._generateThinkingSignature(block.content);
+     return {
+       event: 'signature_delta',
+       data: {
+         type: 'signature_delta',
+         index: block.index,
+         signature: signature
+       }
+     };
+   }
+
+   /**
+    * Create a content_block_stop event
+    * @private
+    */
+   _createContentBlockStopEvent(block) {
+     return {
+       event: 'content_block_stop',
+       data: {
+         type: 'content_block_stop',
+         index: block.index
+       }
+     };
+   }
+
+   /**
+    * Log a message when verbose mode is on
+    * @param {string} message - Message to log
+    * @private
+    */
+   log(message) {
+     if (this.verbose) {
+       const timestamp = new Date().toTimeString().split(' ')[0]; // HH:MM:SS
+       console.error(`[glmt-transformer] [${timestamp}] ${message}`);
+     }
+   }
+ }
+
+ module.exports = GlmtTransformer;
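+
+ // Streaming usage sketch (illustrative; assumes the sibling SSEParser emits
+ // parsed events via an `on('event', ...)` callback - check sse-parser.js for
+ // the actual interface):
+ //
+ //   const transformer = new GlmtTransformer({ verbose: true });
+ //   const accumulator = new DeltaAccumulator();
+ //   parser.on('event', (evt) => {
+ //     for (const e of transformer.transformDelta(evt, accumulator)) {
+ //       res.write(`event: ${e.event}\ndata: ${JSON.stringify(e.data)}\n\n`);
+ //     }
+ //   });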