@kaitranntt/ccs 3.3.0 → 3.4.0

package/README.md CHANGED
@@ -205,16 +205,27 @@ Commands and skills symlinked from `~/.ccs/shared/` - no duplication across prof
  |---------|-----------------|-------------------|
  | **Endpoint** | Anthropic-compatible | OpenAI-compatible |
  | **Thinking** | No | Yes (reasoning_content) |
- | **Streaming** | Yes | No (buffered) |
+ | **Streaming** | Yes | **Yes (v3.4+)** |
+ | **TTFB** | <500ms | <500ms (streaming), 2-10s (buffered) |
  | **Use Case** | Fast responses | Complex reasoning |

+ ### Streaming Support (v3.4)
+
+ **GLMT now supports real-time streaming** with incremental delivery of reasoning content.
+
+ - **Default**: Streaming enabled (TTFB <500ms)
+ - **Disable**: Set `CCS_GLMT_STREAMING=disabled` for buffered mode
+ - **Force**: Set `CCS_GLMT_STREAMING=force` to override client preferences
+
+ **Confirmed working**: Z.AI (tested with 1498 reasoning chunks)
+
  ### How It Works

  1. CCS spawns embedded HTTP proxy on localhost
- 2. Proxy converts Anthropic format → OpenAI format
+ 2. Proxy converts Anthropic format → OpenAI format (streaming or buffered)
  3. Forwards to Z.AI with reasoning parameters
- 4. Converts `reasoning_content` → thinking blocks
- 5. Thinking appears in Claude Code UI
+ 4. Converts `reasoning_content` → thinking blocks (incremental or complete)
+ 5. Thinking appears in Claude Code UI in real time

  ### Control Tags

@@ -235,6 +246,14 @@ nano ~/.ccs/glmt.settings.json
  }
  ```

+ ### Security Limits
+
+ **DoS protection** (v3.4):
+ - SSE buffer: 1MB max per event
+ - Content buffer: 10MB max per block (thinking/text)
+ - Content blocks: 100 max per message
+ - Request timeout: 120s (both streaming and buffered)
+
  ### Debugging

  **Enable verbose logging**:
@@ -249,6 +268,12 @@ ccs glmt --verbose "your prompt"
  # Logs: ~/.ccs/logs/
  ```

+ **Check streaming mode**:
+ ```bash
+ # Disable streaming for debugging
+ CCS_GLMT_STREAMING=disabled ccs glmt "test"
+ ```
+
  **Check reasoning content**:
  ```bash
  cat ~/.ccs/logs/*response-openai.json | jq '.choices[0].message.reasoning_content'
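Taken together, the `CCS_GLMT_STREAMING` settings documented above reduce to three invocations. A minimal sketch (values straight from the README; the prompt text is a placeholder):

```bash
# Default: streaming enabled (TTFB <500ms)
ccs glmt "your prompt"

# Buffered mode, the pre-3.4 behavior (TTFB 2-10s)
CCS_GLMT_STREAMING=disabled ccs glmt "your prompt"

# Force streaming regardless of the client's stream preference
CCS_GLMT_STREAMING=force ccs glmt "your prompt"
```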
package/VERSION CHANGED
@@ -1 +1 @@
- 3.3.0
+ 3.4.0
package/bin/delta-accumulator.js ADDED
@@ -0,0 +1,155 @@
+ #!/usr/bin/env node
+ 'use strict';
+
+ /**
+  * DeltaAccumulator - Maintain state across streaming deltas
+  *
+  * Tracks:
+  * - Message metadata (id, model, role)
+  * - Content blocks (thinking, text)
+  * - Current block index
+  * - Accumulated content
+  *
+  * Usage:
+  *   const acc = new DeltaAccumulator(thinkingConfig);
+  *   const events = transformer.transformDelta(openaiEvent, acc);
+  */
+ class DeltaAccumulator {
+   constructor(thinkingConfig = {}, options = {}) {
+     this.thinkingConfig = thinkingConfig;
+     this.messageId = 'msg_' + Date.now() + '_' + Math.random().toString(36).substring(7);
+     this.model = null;
+     this.role = 'assistant';
+
+     // Content blocks
+     this.contentBlocks = [];
+     this.currentBlockIndex = -1;
+
+     // Buffers
+     this.thinkingBuffer = '';
+     this.textBuffer = '';
+
+     // C-02 Fix: Limits to prevent unbounded accumulation
+     this.maxBlocks = options.maxBlocks || 100;
+     this.maxBufferSize = options.maxBufferSize || 10 * 1024 * 1024; // 10MB
+
+     // State flags
+     this.messageStarted = false;
+     this.finalized = false;
+
+     // Statistics
+     this.inputTokens = 0;
+     this.outputTokens = 0;
+     this.finishReason = null;
+   }
+
+   /**
+    * Get current content block
+    * @returns {Object|null} Current block or null
+    */
+   getCurrentBlock() {
+     if (this.currentBlockIndex >= 0 && this.currentBlockIndex < this.contentBlocks.length) {
+       return this.contentBlocks[this.currentBlockIndex];
+     }
+     return null;
+   }
+
+   /**
+    * Start new content block
+    * @param {string} type - Block type ('thinking' or 'text')
+    * @returns {Object} New block
+    */
+   startBlock(type) {
+     // C-02 Fix: Enforce max blocks limit
+     if (this.contentBlocks.length >= this.maxBlocks) {
+       throw new Error(`Maximum ${this.maxBlocks} content blocks exceeded (DoS protection)`);
+     }
+
+     this.currentBlockIndex++;
+     const block = {
+       index: this.currentBlockIndex,
+       type: type,
+       content: '',
+       started: true,
+       stopped: false
+     };
+     this.contentBlocks.push(block);
+
+     // Reset buffer for new block
+     if (type === 'thinking') {
+       this.thinkingBuffer = '';
+     } else if (type === 'text') {
+       this.textBuffer = '';
+     }
+
+     return block;
+   }
+
+   /**
+    * Add delta to current block
+    * @param {string} delta - Content delta
+    */
+   addDelta(delta) {
+     const block = this.getCurrentBlock();
+     if (block) {
+       if (block.type === 'thinking') {
+         // C-02 Fix: Enforce buffer size limit
+         if (this.thinkingBuffer.length + delta.length > this.maxBufferSize) {
+           throw new Error(`Thinking buffer exceeded ${this.maxBufferSize} bytes (DoS protection)`);
+         }
+         this.thinkingBuffer += delta;
+         block.content = this.thinkingBuffer;
+       } else if (block.type === 'text') {
+         // C-02 Fix: Enforce buffer size limit
+         if (this.textBuffer.length + delta.length > this.maxBufferSize) {
+           throw new Error(`Text buffer exceeded ${this.maxBufferSize} bytes (DoS protection)`);
+         }
+         this.textBuffer += delta;
+         block.content = this.textBuffer;
+       }
+     }
+   }
+
+   /**
+    * Mark current block as stopped
+    */
+   stopCurrentBlock() {
+     const block = this.getCurrentBlock();
+     if (block) {
+       block.stopped = true;
+     }
+   }
+
+   /**
+    * Update usage statistics
+    * @param {Object} usage - Usage object from OpenAI
+    */
+   updateUsage(usage) {
+     if (usage) {
+       this.inputTokens = usage.prompt_tokens || usage.input_tokens || 0;
+       this.outputTokens = usage.completion_tokens || usage.output_tokens || 0;
+     }
+   }
+
+   /**
+    * Get summary of accumulated state
+    * @returns {Object} Summary
+    */
+   getSummary() {
+     return {
+       messageId: this.messageId,
+       model: this.model,
+       role: this.role,
+       blockCount: this.contentBlocks.length,
+       currentIndex: this.currentBlockIndex,
+       messageStarted: this.messageStarted,
+       finalized: this.finalized,
+       usage: {
+         input_tokens: this.inputTokens,
+         output_tokens: this.outputTokens
+       }
+     };
+   }
+ }
+
+ module.exports = DeltaAccumulator;
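For orientation, a minimal sketch of driving `DeltaAccumulator` directly, with the README's "Security Limits" passed as the documented constructor options (the `thinkingConfig` shape is an assumption; the class only stores it):

```js
const DeltaAccumulator = require('./delta-accumulator');

// Limits mirror the README's DoS protections (these are also the class defaults)
const acc = new DeltaAccumulator(
  { thinking: true },                                  // thinkingConfig shape assumed
  { maxBlocks: 100, maxBufferSize: 10 * 1024 * 1024 }  // 100 blocks, 10MB per buffer
);

acc.startBlock('thinking');
acc.addDelta('First, consider the input… ');
acc.stopCurrentBlock();

acc.startBlock('text');
acc.addDelta('Final answer.');
acc.stopCurrentBlock();

console.log(acc.getSummary());
// → { messageId: 'msg_…', blockCount: 2, currentIndex: 1, … }
```

Exceeding either limit makes `startBlock`/`addDelta` throw rather than let the buffers grow without bound.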
package/bin/glmt-proxy.js CHANGED
@@ -4,6 +4,8 @@
  const http = require('http');
  const https = require('https');
  const GlmtTransformer = require('./glmt-transformer');
+ const SSEParser = require('./sse-parser');
+ const DeltaAccumulator = require('./delta-accumulator');

  /**
   * GlmtProxy - Embedded HTTP proxy for GLM thinking support
@@ -12,7 +14,7 @@ const GlmtTransformer = require('./glmt-transformer');
   * - Intercepts Claude CLI → Z.AI calls
   * - Transforms Anthropic format → OpenAI format
   * - Converts reasoning_content → thinking blocks
-  * - Buffered mode only (streaming not supported)
+  * - Supports both streaming and buffered modes
   *
   * Lifecycle:
   * - Spawned by bin/ccs.js when 'glmt' profile detected
@@ -30,11 +32,14 @@ const GlmtTransformer = require('./glmt-transformer');
  class GlmtProxy {
    constructor(config = {}) {
      this.transformer = new GlmtTransformer({ verbose: config.verbose });
-     this.upstreamUrl = 'https://api.z.ai/api/coding/paas/v4/chat/completions';
+     // Use ANTHROPIC_BASE_URL from environment (set by settings.json) or fallback to Z.AI default
+     this.upstreamUrl = process.env.ANTHROPIC_BASE_URL || 'https://api.z.ai/api/coding/paas/v4/chat/completions';
      this.server = null;
      this.port = null;
      this.verbose = config.verbose || false;
      this.timeout = config.timeout || 120000; // 120s default
+     this.streamingEnabled = process.env.CCS_GLMT_STREAMING !== 'disabled';
+     this.forceStreaming = process.env.CCS_GLMT_STREAMING === 'force';
    }

  /**
@@ -52,8 +57,12 @@ class GlmtProxy {
      this.port = this.server.address().port;
      // Signal parent process
      console.log(`PROXY_READY:${this.port}`);
-     // One-time info message (always shown)
-     console.error(`[glmt] Proxy listening on port ${this.port} (buffered mode)`);
+
+     // Info message (only show in verbose mode)
+     if (this.verbose) {
+       const mode = this.streamingEnabled ? 'streaming mode' : 'buffered mode';
+       console.error(`[glmt] Proxy listening on port ${this.port} (${mode})`);
+     }

      // Debug mode notice
      if (this.transformer.debugLog) {
@@ -108,35 +117,14 @@ class GlmtProxy {
        return;
      }

-     // Transform to OpenAI format
-     const { openaiRequest, thinkingConfig } =
-       this.transformer.transformRequest(anthropicRequest);
-
-     this.log(`Transformed request, thinking: ${thinkingConfig.thinking}`);
-
-     // Forward to Z.AI
-     const openaiResponse = await this._forwardToUpstream(
-       openaiRequest,
-       req.headers
-     );
-
-     this.log(`Received response from upstream`);
+     // Branch: streaming or buffered
+     const useStreaming = (anthropicRequest.stream && this.streamingEnabled) || this.forceStreaming;

-     // Transform back to Anthropic format
-     const anthropicResponse = this.transformer.transformResponse(
-       openaiResponse,
-       thinkingConfig
-     );
-
-     // Return to Claude CLI
-     res.writeHead(200, {
-       'Content-Type': 'application/json',
-       'Access-Control-Allow-Origin': '*'
-     });
-     res.end(JSON.stringify(anthropicResponse));
-
-     const duration = Date.now() - startTime;
-     this.log(`Request completed in ${duration}ms`);
+     if (useStreaming) {
+       await this._handleStreamingRequest(req, res, anthropicRequest, startTime);
+     } else {
+       await this._handleBufferedRequest(req, res, anthropicRequest, startTime);
+     }

    } catch (error) {
      console.error('[glmt-proxy] Request error:', error.message);
@@ -153,6 +141,76 @@ class GlmtProxy {
      }
    }

+   /**
+    * Handle buffered (non-streaming) request
+    * @private
+    */
+   async _handleBufferedRequest(req, res, anthropicRequest, startTime) {
+     // Transform to OpenAI format
+     const { openaiRequest, thinkingConfig } =
+       this.transformer.transformRequest(anthropicRequest);
+
+     this.log(`Transformed request, thinking: ${thinkingConfig.thinking}`);
+
+     // Forward to Z.AI
+     const openaiResponse = await this._forwardToUpstream(
+       openaiRequest,
+       req.headers
+     );
+
+     this.log(`Received response from upstream`);
+
+     // Transform back to Anthropic format
+     const anthropicResponse = this.transformer.transformResponse(
+       openaiResponse,
+       thinkingConfig
+     );
+
+     // Return to Claude CLI
+     res.writeHead(200, {
+       'Content-Type': 'application/json',
+       'Access-Control-Allow-Origin': '*'
+     });
+     res.end(JSON.stringify(anthropicResponse));
+
+     const duration = Date.now() - startTime;
+     this.log(`Request completed in ${duration}ms`);
+   }
+
+   /**
+    * Handle streaming request
+    * @private
+    */
+   async _handleStreamingRequest(req, res, anthropicRequest, startTime) {
+     this.log('Using streaming mode');
+
+     // Transform request
+     const { openaiRequest, thinkingConfig } =
+       this.transformer.transformRequest(anthropicRequest);
+
+     // Force streaming
+     openaiRequest.stream = true;
+
+     // Set SSE headers
+     res.writeHead(200, {
+       'Content-Type': 'text/event-stream',
+       'Cache-Control': 'no-cache',
+       'Connection': 'keep-alive',
+       'Access-Control-Allow-Origin': '*'
+     });
+
+     this.log('Starting SSE stream to Claude CLI');
+
+     // Forward and stream
+     await this._forwardAndStreamUpstream(
+       openaiRequest,
+       req.headers,
+       res,
+       thinkingConfig,
+       startTime
+     );
+   }
+
  /**
   * Read request body
   * @param {http.IncomingMessage} req - Request
@@ -194,7 +252,7 @@
      const options = {
        hostname: url.hostname,
        port: url.port || 443,
-       path: '/api/coding/paas/v4/chat/completions', // OpenAI-compatible endpoint
+       path: url.pathname || '/api/coding/paas/v4/chat/completions',
        method: 'POST',
        headers: {
          'Content-Type': 'application/json',
@@ -206,7 +264,7 @@
      };

      // Debug logging
-     this.log(`Forwarding to: ${url.hostname}${options.path}`);
+     this.log(`Forwarding to: ${url.hostname}${url.pathname}`);

      // Set timeout
      const timeoutHandle = setTimeout(() => {
@@ -251,6 +309,108 @@
      });
    }

+   /**
+    * Forward request to Z.AI and stream response
+    * @param {Object} openaiRequest - OpenAI format request
+    * @param {Object} originalHeaders - Original request headers
+    * @param {http.ServerResponse} clientRes - Response to Claude CLI
+    * @param {Object} thinkingConfig - Thinking configuration
+    * @param {number} startTime - Request start time
+    * @returns {Promise<void>}
+    * @private
+    */
+   async _forwardAndStreamUpstream(openaiRequest, originalHeaders, clientRes, thinkingConfig, startTime) {
+     return new Promise((resolve, reject) => {
+       const url = new URL(this.upstreamUrl);
+       const requestBody = JSON.stringify(openaiRequest);
+
+       const options = {
+         hostname: url.hostname,
+         port: url.port || 443,
+         path: url.pathname || '/api/coding/paas/v4/chat/completions',
+         method: 'POST',
+         headers: {
+           'Content-Type': 'application/json',
+           'Content-Length': Buffer.byteLength(requestBody),
+           'Authorization': originalHeaders['authorization'] || '',
+           'User-Agent': 'CCS-GLMT-Proxy/1.0',
+           'Accept': 'text/event-stream'
+         }
+       };
+
+       this.log(`Forwarding streaming request to: ${url.hostname}${url.pathname}`);
+
+       // C-03 Fix: Apply timeout to streaming requests
+       const timeoutHandle = setTimeout(() => {
+         req.destroy();
+         reject(new Error(`Streaming request timeout after ${this.timeout}ms`));
+       }, this.timeout);
+
+       const req = https.request(options, (upstreamRes) => {
+         clearTimeout(timeoutHandle);
+         if (upstreamRes.statusCode !== 200) {
+           let body = '';
+           upstreamRes.on('data', chunk => body += chunk);
+           upstreamRes.on('end', () => {
+             reject(new Error(`Upstream error: ${upstreamRes.statusCode}\n${body}`));
+           });
+           return;
+         }
+
+         const parser = new SSEParser();
+         const accumulator = new DeltaAccumulator(thinkingConfig);
+
+         upstreamRes.on('data', (chunk) => {
+           try {
+             const events = parser.parse(chunk);
+
+             events.forEach(event => {
+               // Transform OpenAI delta → Anthropic events
+               const anthropicEvents = this.transformer.transformDelta(event, accumulator);
+
+               // Forward to Claude CLI
+               anthropicEvents.forEach(evt => {
+                 const eventLine = `event: ${evt.event}\n`;
+                 const dataLine = `data: ${JSON.stringify(evt.data)}\n\n`;
+                 clientRes.write(eventLine + dataLine);
+               });
+             });
+           } catch (error) {
+             this.log(`Error processing chunk: ${error.message}`);
+           }
+         });
+
+         upstreamRes.on('end', () => {
+           const duration = Date.now() - startTime;
+           this.log(`Streaming completed in ${duration}ms`);
+           clientRes.end();
+           resolve();
+         });
+
+         upstreamRes.on('error', (error) => {
+           clearTimeout(timeoutHandle);
+           this.log(`Upstream stream error: ${error.message}`);
+           clientRes.write(`event: error\n`);
+           clientRes.write(`data: ${JSON.stringify({ error: error.message })}\n\n`);
+           clientRes.end();
+           reject(error);
+         });
+       });
+
+       req.on('error', (error) => {
+         clearTimeout(timeoutHandle);
+         this.log(`Request error: ${error.message}`);
+         clientRes.write(`event: error\n`);
+         clientRes.write(`data: ${JSON.stringify({ error: error.message })}\n\n`);
+         clientRes.end();
+         reject(error);
+       });
+
+       req.write(requestBody);
+       req.end();
+     });
+   }
+
  /**
   * Stop proxy server
   */
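One detail worth noting in `_forwardAndStreamUpstream` above: `clearTimeout` fires as soon as upstream response headers arrive, so the 120s guard bounds time-to-first-byte rather than total stream duration. A reduced, self-contained sketch of that pattern (hypothetical helper name; not part of the package):

```js
'use strict';
const https = require('https');

// Rejects if no response headers arrive within `ms`. Once headers arrive,
// the timer is cleared and the stream itself may run indefinitely.
function streamWithHeaderTimeout(options, body, ms, onChunk) {
  return new Promise((resolve, reject) => {
    const timer = setTimeout(() => {
      req.destroy(); // `req` is initialized synchronously below, before the timer can fire
      reject(new Error(`No response headers after ${ms}ms`));
    }, ms);

    const req = https.request(options, (res) => {
      clearTimeout(timer); // headers received: stop the clock
      res.on('data', onChunk);
      res.on('end', resolve);
      res.on('error', reject);
    });

    req.on('error', (err) => { clearTimeout(timer); reject(err); });
    req.write(body);
    req.end();
  });
}

module.exports = streamWithHeaderTimeout;
```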
package/bin/glmt-transformer.js CHANGED
@@ -5,6 +5,8 @@ const crypto = require('crypto');
  const fs = require('fs');
  const path = require('path');
  const os = require('os');
+ const SSEParser = require('./sse-parser');
+ const DeltaAccumulator = require('./delta-accumulator');

  /**
   * GlmtTransformer - Convert between Anthropic and OpenAI formats with thinking support
@@ -73,10 +75,10 @@ class GlmtTransformer {
      openaiRequest.top_p = anthropicRequest.top_p;
    }

-   // 5. Handle streaming (not yet supported)
-   // Silently override to buffered mode
-   if (anthropicRequest.stream) {
-     openaiRequest.stream = false;
+   // 5. Handle streaming
+   // Keep stream parameter from request
+   if (anthropicRequest.stream !== undefined) {
+     openaiRequest.stream = anthropicRequest.stream;
    }

    // 6. Inject reasoning parameters
@@ -421,6 +423,251 @@ class GlmtTransformer {
      return { checks, passed, total, valid: passed === total };
    }

+   /**
+    * Transform OpenAI streaming delta to Anthropic events
+    * @param {Object} openaiEvent - Parsed SSE event from Z.AI
+    * @param {DeltaAccumulator} accumulator - State accumulator
+    * @returns {Array<Object>} Array of Anthropic SSE events
+    */
+   transformDelta(openaiEvent, accumulator) {
+     const events = [];
+
+     // Handle [DONE] marker
+     if (openaiEvent.event === 'done') {
+       return this.finalizeDelta(accumulator);
+     }
+
+     const choice = openaiEvent.data?.choices?.[0];
+     if (!choice) return events;
+
+     const delta = choice.delta;
+     if (!delta) return events;
+
+     // Message start
+     if (!accumulator.messageStarted) {
+       if (openaiEvent.data.model) {
+         accumulator.model = openaiEvent.data.model;
+       }
+       events.push(this._createMessageStartEvent(accumulator));
+       accumulator.messageStarted = true;
+     }
+
+     // Role
+     if (delta.role) {
+       accumulator.role = delta.role;
+     }
+
+     // Reasoning content delta (Z.AI streams incrementally - confirmed in Phase 02)
+     if (delta.reasoning_content) {
+       const currentBlock = accumulator.getCurrentBlock();
+
+       if (!currentBlock || currentBlock.type !== 'thinking') {
+         // Start thinking block
+         const block = accumulator.startBlock('thinking');
+         events.push(this._createContentBlockStartEvent(block));
+       }
+
+       accumulator.addDelta(delta.reasoning_content);
+       events.push(this._createThinkingDeltaEvent(
+         accumulator.getCurrentBlock(),
+         delta.reasoning_content
+       ));
+     }
+
+     // Text content delta
+     if (delta.content) {
+       const currentBlock = accumulator.getCurrentBlock();
+
+       // Close thinking block if transitioning from thinking to text
+       if (currentBlock && currentBlock.type === 'thinking' && !currentBlock.stopped) {
+         events.push(this._createSignatureDeltaEvent(currentBlock));
+         events.push(this._createContentBlockStopEvent(currentBlock));
+         accumulator.stopCurrentBlock();
+       }
+
+       if (!accumulator.getCurrentBlock() || accumulator.getCurrentBlock().type !== 'text') {
+         // Start text block
+         const block = accumulator.startBlock('text');
+         events.push(this._createContentBlockStartEvent(block));
+       }
+
+       accumulator.addDelta(delta.content);
+       events.push(this._createTextDeltaEvent(
+         accumulator.getCurrentBlock(),
+         delta.content
+       ));
+     }
+
+     // Usage update (appears in final chunk usually)
+     if (openaiEvent.data.usage) {
+       accumulator.updateUsage(openaiEvent.data.usage);
+     }
+
+     // Finish reason
+     if (choice.finish_reason) {
+       accumulator.finishReason = choice.finish_reason;
+     }
+
+     return events;
+   }
+
+   /**
+    * Finalize streaming and generate closing events
+    * @param {DeltaAccumulator} accumulator - State accumulator
+    * @returns {Array<Object>} Final Anthropic SSE events
+    */
+   finalizeDelta(accumulator) {
+     if (accumulator.finalized) {
+       return []; // Already finalized
+     }
+
+     const events = [];
+
+     // Close current content block if any
+     const currentBlock = accumulator.getCurrentBlock();
+     if (currentBlock && !currentBlock.stopped) {
+       if (currentBlock.type === 'thinking') {
+         events.push(this._createSignatureDeltaEvent(currentBlock));
+       }
+       events.push(this._createContentBlockStopEvent(currentBlock));
+       accumulator.stopCurrentBlock();
+     }
+
+     // Message delta (stop reason + usage)
+     events.push({
+       event: 'message_delta',
+       data: {
+         type: 'message_delta',
+         delta: {
+           stop_reason: this._mapStopReason(accumulator.finishReason || 'stop')
+         },
+         usage: {
+           output_tokens: accumulator.outputTokens
+         }
+       }
+     });
+
+     // Message stop
+     events.push({
+       event: 'message_stop',
+       data: {
+         type: 'message_stop'
+       }
+     });
+
+     accumulator.finalized = true;
+     return events;
+   }
+
+   /**
+    * Create message_start event
+    * @private
+    */
+   _createMessageStartEvent(accumulator) {
+     return {
+       event: 'message_start',
+       data: {
+         type: 'message_start',
+         message: {
+           id: accumulator.messageId,
+           type: 'message',
+           role: accumulator.role,
+           content: [],
+           model: accumulator.model || 'glm-4.6',
+           stop_reason: null,
+           usage: {
+             input_tokens: accumulator.inputTokens,
+             output_tokens: 0
+           }
+         }
+       }
+     };
+   }
+
+   /**
+    * Create content_block_start event
+    * @private
+    */
+   _createContentBlockStartEvent(block) {
+     return {
+       event: 'content_block_start',
+       data: {
+         type: 'content_block_start',
+         index: block.index,
+         content_block: {
+           type: block.type,
+           [block.type]: ''
+         }
+       }
+     };
+   }
+
+   /**
+    * Create thinking_delta event
+    * @private
+    */
+   _createThinkingDeltaEvent(block, delta) {
+     return {
+       event: 'content_block_delta',
+       data: {
+         type: 'content_block_delta',
+         index: block.index,
+         delta: {
+           type: 'thinking_delta',
+           thinking: delta
+         }
+       }
+     };
+   }
+
+   /**
+    * Create text_delta event
+    * @private
+    */
+   _createTextDeltaEvent(block, delta) {
+     return {
+       event: 'content_block_delta',
+       data: {
+         type: 'content_block_delta',
+         index: block.index,
+         delta: {
+           type: 'text_delta',
+           text: delta
+         }
+       }
+     };
+   }
+
+   /**
+    * Create signature_delta event
+    * @private
+    */
+   _createSignatureDeltaEvent(block) {
+     const signature = this._generateThinkingSignature(block.content);
+     return {
+       event: 'signature_delta',
+       data: {
+         type: 'signature_delta',
+         index: block.index,
+         signature: signature
+       }
+     };
+   }
+
+   /**
+    * Create content_block_stop event
+    * @private
+    */
+   _createContentBlockStopEvent(block) {
+     return {
+       event: 'content_block_stop',
+       data: {
+         type: 'content_block_stop',
+         index: block.index
+       }
+     };
+   }
+
  /**
   * Log message if verbose
   * @param {string} message - Message to log
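To make the delta flow concrete, a minimal sketch that drives `transformDelta` with two fabricated Z.AI chunks followed by the `[DONE]` marker (module paths assume the `bin/` layout above; the chunk payloads are invented for illustration):

```js
const GlmtTransformer = require('./glmt-transformer');
const DeltaAccumulator = require('./delta-accumulator');

const transformer = new GlmtTransformer({ verbose: false });
const acc = new DeltaAccumulator({ thinking: true }); // thinkingConfig shape assumed

const fakeChunks = [
  { event: 'message', data: { model: 'glm-4.6', choices: [{ delta: { role: 'assistant', reasoning_content: 'Let me think…' } }] } },
  { event: 'message', data: { choices: [{ delta: { content: 'Answer.' }, finish_reason: 'stop' }], usage: { completion_tokens: 5 } } },
  { event: 'done', data: null }
];

for (const chunk of fakeChunks) {
  for (const evt of transformer.transformDelta(chunk, acc)) {
    console.log(evt.event);
  }
}
// Expected order: message_start, content_block_start, content_block_delta (thinking),
// signature_delta, content_block_stop, content_block_start, content_block_delta (text),
// content_block_stop, message_delta, message_stop
```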
package/bin/sse-parser.js ADDED
@@ -0,0 +1,96 @@
+ #!/usr/bin/env node
+ 'use strict';
+
+ /**
+  * SSEParser - Parse Server-Sent Events (SSE) stream
+  *
+  * Handles:
+  * - Incomplete events across chunks
+  * - Multiple events in single chunk
+  * - Malformed data (skip gracefully)
+  * - [DONE] marker
+  *
+  * Usage:
+  *   const parser = new SSEParser();
+  *   stream.on('data', chunk => {
+  *     const events = parser.parse(chunk);
+  *     events.forEach(event => { ... });
+  *   });
+  */
+ class SSEParser {
+   constructor(options = {}) {
+     this.buffer = '';
+     this.eventCount = 0;
+     this.maxBufferSize = options.maxBufferSize || 1024 * 1024; // 1MB default
+   }
+
+   /**
+    * Parse chunk and extract SSE events
+    * @param {Buffer|string} chunk - Data chunk from stream
+    * @returns {Array<Object>} Array of parsed events
+    */
+   parse(chunk) {
+     this.buffer += chunk.toString();
+
+     // C-01 Fix: Prevent unbounded buffer growth (DoS protection)
+     if (this.buffer.length > this.maxBufferSize) {
+       throw new Error(`SSE buffer exceeded ${this.maxBufferSize} bytes (DoS protection)`);
+     }
+
+     const lines = this.buffer.split('\n');
+
+     // Keep incomplete line in buffer
+     this.buffer = lines.pop() || '';
+
+     const events = [];
+     let currentEvent = { event: 'message', data: '' };
+
+     for (const line of lines) {
+       if (line.startsWith('event: ')) {
+         currentEvent.event = line.substring(7).trim();
+       } else if (line.startsWith('data: ')) {
+         const data = line.substring(6);
+
+         if (data === '[DONE]') {
+           this.eventCount++;
+           events.push({
+             event: 'done',
+             data: null,
+             index: this.eventCount
+           });
+           currentEvent = { event: 'message', data: '' };
+         } else {
+           try {
+             currentEvent.data = JSON.parse(data);
+             this.eventCount++;
+             currentEvent.index = this.eventCount;
+             events.push(currentEvent);
+             currentEvent = { event: 'message', data: '' };
+           } catch (e) {
+             // H-01 Fix: Log parse errors for debugging
+             if (typeof console !== 'undefined' && console.error) {
+               console.error('[SSEParser] Malformed JSON event:', e.message, 'Data:', data.substring(0, 100));
+             }
+           }
+         }
+       } else if (line.startsWith('id: ')) {
+         currentEvent.id = line.substring(4).trim();
+       } else if (line.startsWith('retry: ')) {
+         currentEvent.retry = parseInt(line.substring(7), 10);
+       }
+       // Empty lines separate events (already handled by JSON parsing)
+     }
+
+     return events;
+   }
+
+   /**
+    * Reset parser state (for reuse)
+    */
+   reset() {
+     this.buffer = '';
+     this.eventCount = 0;
+   }
+ }
+
+ module.exports = SSEParser;
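A minimal sketch of the parser's main job, reassembling an event split across chunk boundaries (the chunk strings are fabricated; `./sse-parser` assumes the `bin/` layout above):

```js
const SSEParser = require('./sse-parser');

const parser = new SSEParser(); // default 1MB buffer cap

// One JSON event split mid-string across two network chunks, then [DONE].
const chunks = [
  'data: {"choices":[{"del',
  'ta":{"content":"hi"}}]}\n\ndata: [DONE]\n\n'
];

for (const chunk of chunks) {
  for (const event of parser.parse(chunk)) {
    console.log(event.event, event.index);
  }
}
// Chunk 1 yields nothing (the incomplete line stays buffered);
// chunk 2 yields 'message' 1, then 'done' 2.
```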
package/lib/ccs CHANGED
@@ -2,7 +2,7 @@
  set -euo pipefail

  # Version (updated by scripts/bump-version.sh)
- CCS_VERSION="3.3.0"
+ CCS_VERSION="3.4.0"
  SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
  readonly CONFIG_FILE="${CCS_CONFIG:-$HOME/.ccs/config.json}"
  readonly PROFILES_JSON="$HOME/.ccs/profiles.json"
package/lib/ccs.ps1 CHANGED
@@ -12,7 +12,7 @@ param(
  $ErrorActionPreference = "Stop"

  # Version (updated by scripts/bump-version.sh)
- $CcsVersion = "3.3.0"
+ $CcsVersion = "3.4.0"
  $ScriptDir = Split-Path -Parent $MyInvocation.MyCommand.Path
  $ConfigFile = if ($env:CCS_CONFIG) { $env:CCS_CONFIG } else { "$env:USERPROFILE\.ccs\config.json" }
  $ProfilesJson = "$env:USERPROFILE\.ccs\profiles.json"
package/package.json CHANGED
@@ -1,6 +1,6 @@
  {
    "name": "@kaitranntt/ccs",
-   "version": "3.3.0",
+   "version": "3.4.0",
    "description": "Claude Code Switch - Instant profile switching between Claude Sonnet 4.5 and GLM 4.6",
    "keywords": [
      "cli",