RubyGems - openclacky - Versions diffs - 1.1.0 → 1.1.2 - Mend

openclacky 1.1.0 → 1.1.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (60) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +37 -0
data/README.md +28 -7
data/lib/clacky/agent/llm_caller.rb +23 -1
data/lib/clacky/agent/session_serializer.rb +6 -1
data/lib/clacky/agent/skill_manager.rb +18 -5
data/lib/clacky/agent.rb +14 -5
data/lib/clacky/anthropic_stream_aggregator.rb +135 -0
data/lib/clacky/bedrock_stream_aggregator.rb +137 -0
data/lib/clacky/brand_config.rb +68 -15
data/lib/clacky/cli.rb +18 -19
data/lib/clacky/client.rb +146 -17
data/lib/clacky/default_skills/onboard/SKILL.md +6 -2
data/lib/clacky/default_skills/onboard/scripts/import_external_skills.rb +50 -6
data/lib/clacky/openai_stream_aggregator.rb +130 -0
data/lib/clacky/server/channel/adapters/weixin/adapter.rb +169 -6
data/lib/clacky/server/channel/channel_ui_controller.rb +6 -0
data/lib/clacky/server/http_server.rb +9 -3
data/lib/clacky/server/web_ui_controller.rb +8 -4
data/lib/clacky/tools/terminal.rb +11 -0
data/lib/clacky/ui2/components/input_area.rb +10 -1
data/lib/clacky/ui2/components/todo_area.rb +22 -2
data/lib/clacky/ui2/layout_manager.rb +70 -14
data/lib/clacky/ui2/progress_handle.rb +86 -15
data/lib/clacky/ui2/ui_controller.rb +47 -7
data/lib/clacky/utils/logger.rb +7 -0
data/lib/clacky/version.rb +1 -1
data/lib/clacky/web/app.css +6 -4
data/lib/clacky/web/i18n.js +21 -6
data/lib/clacky/web/index.html +8 -6
data/lib/clacky/web/sessions.js +171 -58
data/lib/clacky/web/vendor/katex/auto-render.min.js +1 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_AMS-Regular.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_Caligraphic-Bold.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_Caligraphic-Regular.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_Fraktur-Bold.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_Fraktur-Regular.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_Main-Bold.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_Main-BoldItalic.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_Main-Italic.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_Main-Regular.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_Math-BoldItalic.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_Math-Italic.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_SansSerif-Bold.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_SansSerif-Italic.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_SansSerif-Regular.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_Script-Regular.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_Size1-Regular.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_Size2-Regular.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_Size3-Regular.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_Size4-Regular.woff2 +0 -0
data/lib/clacky/web/vendor/katex/fonts/KaTeX_Typewriter-Regular.woff2 +0 -0
data/lib/clacky/web/vendor/katex/katex.min.css +1 -0
data/lib/clacky/web/vendor/katex/katex.min.js +1 -0
data/lib/clacky/web/ws-dispatcher.js +19 -4
data/lib/clacky.rb +3 -0
data/scripts/build/src/install.sh.cc +15 -5
data/scripts/install.ps1 +14 -3
data/scripts/install.sh +15 -5
metadata +28 -2

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: e897a7568d8b457d317c56ff402a76c1907b4a158e0e7382586e2b66115ee0f7
-  data.tar.gz: 5fbeb452695441035d7f7d4f7ba1f0ef63dbb198daebb17600eb6e9f9fb72c46
+  metadata.gz: 47f1d9f1ecb4338e0a19ce771dea37724ebfc70d9e0052dc7403e096a25c415d
+  data.tar.gz: 6887db06529972b393c75c92e17b47da8294abae765ceff7280d71943a160c85
 SHA512:
-  metadata.gz: 64d4764470f2f8bac52e7e8233afbf441336c8a81238def9800cf6735a90798435cc8d43e9056aa4c6e53f51760067e57b5b2670263339590b7f9fd744cc6920
-  data.tar.gz: c27a2313d3595adcb48a66e396c9eec8947550132a74bb5b8535b11d93e639b240bc1dafeab0a7bf9b4af665c2fa6a22630f8b23ab0061b2de4ebbfcae1f3299
+  metadata.gz: b49465d66eb2be634790d10813ac5988aca23f54a4d3c36c9690bd40bf0024ea5f7275b3bc1b89247aaa16cc30dbf1c1439733c51bdfc1f5750e02c7efbc8e80
+  data.tar.gz: f0f4397dd4cca183f199545e7c5db6b4902382c66c237257e8b2a99847e49702881dd8bcf60a78201ee18526ae2b04bd4217bf6def502ccf3ce8a7fb6fb0bdd0

data/CHANGELOG.md CHANGED Viewed

@@ -5,6 +5,43 @@ All notable changes to this project will be documented in this file.
 The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
 and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
+## [1.1.2] - 2026-05-20
+### Added
+- Streaming response with real-time token display in WebUI
+- Stream thinking progress indicator during agent reasoning
+- Time-to-first-token (TTFT) display in WebUI
+- LaTeX rendering support in WebUI
+- Cache hit rate display in WebUI
+### Fixed
+- Reasoning content properly passed as `<think>` tags to WebUI
+- User-set session name no longer overwritten by auto-rename (#136)
+- Server command now supports `--help`/`-h`/`--bind`/`-b` and `-p` alias for `--port` (#135)
+- WSL.exe output encoding and premature WSL1 fallback detection (#130)
+- Hide edit/delete model options when no models are configured (#133)
+- BrowserManager MCP process cleanup on agent exit in CLI mode (#132)
+- Windows-native OpenClaw config detection on WSL during onboarding (#129)
+### More
+- Updated Windows installation docs and added GitHub star history
+## [1.1.1] - 2026-05-17
+### Added
+- **WeChat SendQueue with batching, throttling, and retry.** Messages sent to multiple WeChat official account users are now queued, batched (up to 100 recipients per call), throttled to 1 batch/second, and automatically retried on failure — preventing 45007 rate-limit errors during broadcasts. (#127)
+- **Session ID in TUI session bar.** The terminal UI session bar now displays the session ID alongside the session name, making it easy to identify sessions when cross-referencing with logs or Web UI.
+- **TUI todo clean-up on task completion.** Completed todos are now removed from the terminal display when a task finishes, keeping the TUI uncluttered. (#94)
+### Improved
+- **Brand skills persist across same-brand upgrades.** Brand skills are no longer removed and re-downloaded when the brand stays the same after an upgrade — eliminating unnecessary network calls and keeping skill state stable.
+- **Ruby 2.6 install reliability.** The installer now pre-installs rouge 3.30.0 before `gem install` and retries with a pinned version on Ruby 2.6, avoiding dependency resolution failures on older macOS system Ruby.
+### Fixed
+- **TUI progress bar flicker.** The progress bar in terminal mode no longer flashes when updating rapidly, providing a smoother visual experience.
+- **Xcode command auto-install loop.** The agent no longer gets stuck in a loop trying to auto-install missing Xcode command-line tools.
+- **Brand license warning after 3-day idle.** Fixed a spurious license warning that appeared on startup after the server had been idle for 3 days.
 ## [1.1.0] - 2026-05-15
 ### Added

data/README.md CHANGED Viewed

@@ -18,7 +18,7 @@ Same task, how much do you pay? Under comparable agent workloads, OpenClacky sav
 | Agent | Relative cost | Notes |
 |---|---|---|
-| **OpenClacky** | **~0.8–1.2×** | 16 tools · ~100% cache hit · subagent routing |
+| **OpenClacky** | **~0.8×** | 16 tools · ~100% cache hit · subagent routing |
 | Claude Code | 1.0× (baseline) | World-class harness, closed-source subscription |
 | OpenClaw | ~1.5× | Comparable harness agent |
 | Hermes | ~3× | 52 built-in tools — schema bloat ~3–4× |
@@ -31,11 +31,11 @@ Core agent capability is roughly on par across the field — the real differenti
 | Feature | Claude Code | OpenClaw | Hermes | **OpenClacky** |
 |---|:---:|:---:|:---:|:---:|
-| Token cost | 1.0× | ~1.5× | ~3× | **~0.8–1.2×** |
+| Token cost | 1.0× | ~1.5× | ~3× | **~0.8×** |
 | Open source | ❌ Closed | ✅ Open | ✅ Open | ✅ MIT |
 | BYOK / model freedom | ❌ Anthropic only | ✅ | ✅ | ✅ |
 | Skill self-evolution | ❌ | ❌ | ✅ | ✅ |
-| IM integration (Feishu / WeCom / WeChat) | ❌ | ✅ | ✅ | ✅ |
+| IM integration (Feishu/WeCom/WeChat/Discord/Telegram) | ❌ | ✅ | ✅ | ✅ |
 ## How we get the cost down
@@ -80,18 +80,29 @@ More options: https://www.openclacky.com/
 ### Command line
-**Requirements:** Ruby >= 3.1.0
+One-line install (Mac/Ubuntu):
 ```bash
-gem install openclacky
+/bin/bash -c "$(curl -sSL https://raw.githubusercontent.com/clacky-ai/openclacky/main/scripts/install.sh)"
 ```
-Or one-line install:
+Windows:
 ```bash
-/bin/bash -c "$(curl -sSL https://raw.githubusercontent.com/clacky-ai/openclacky/main/scripts/install.sh)"
+powershell -c "& ([scriptblock]::Create((irm 'https://raw.githubusercontent.com/clacky-ai/openclacky/main/scripts/install.ps1')))"
 ```
+Or using Ruby (3.x/4.x):
+**Requirements:** Ruby >= 3.1.0
+```bash
+gem install openclacky
+```
+See more: https://www.openclacky.com/docs/installation
 ## Quick Start
 ### Terminal (CLI)
@@ -137,6 +148,16 @@ $ openclacky
 > How does the payment module work?
 ```
+## Star History
+<a href="https://www.star-history.com/?repos=clacky-ai%2Fopenclacky&type=date&legend=top-left">
+ <picture>
+   <source media="(prefers-color-scheme: dark)" srcset="https://api.star-history.com/chart?repos=clacky-ai/openclacky&type=date&theme=dark&legend=top-left" />
+   <source media="(prefers-color-scheme: light)" srcset="https://api.star-history.com/chart?repos=clacky-ai/openclacky&type=date&legend=top-left" />
+   <img alt="Star History Chart" src="https://api.star-history.com/chart?repos=clacky-ai/openclacky&type=date&legend=top-left" />
+ </picture>
+</a>
 ## Advanced — Creator Program
 Power users are already turning their workflows into vertical AI experts on OpenClacky — encrypted distribution, license management, self-set pricing. Legal, healthcare, financial planning, and more.

data/lib/clacky/agent/llm_caller.rb CHANGED Viewed

@@ -103,7 +103,8 @@ module Clacky
             model: current_model,
             tools: tools_to_send,
             max_tokens: @config.max_tokens,
-            enable_caching: @config.enable_prompt_caching
+            enable_caching: @config.enable_prompt_caching,
+            on_chunk: build_progress_on_chunk
           )
           # Successful response — if we were probing, confirm primary is healthy.
@@ -748,6 +749,27 @@ module Clacky
           "Upstream response was truncated mid tool-call — asking model to use smaller steps and retrying..."
         )
       end
+      # Build a streaming progress callback for Client#send_messages_with_tools.
+      # Returns nil when no UI is attached, so the client skips the streaming
+      # plumbing entirely. Callback throttles UI updates to avoid flooding the
+      # progress handle on fast streams.
+      private def build_progress_on_chunk
+        # No UI attached: hand back nil instead of a callback.
+        return nil unless @ui
+        # Throttle state lives in these closure locals, so every callback built
+        # by this method keeps its own independent timer.
+        last_emit_at = 0.0
+        # Minimum gap between forwarded updates, in seconds (the monotonic
+        # clock below is read with its default float-seconds unit).
+        min_interval = 0.25
+        ->(input_tokens:, output_tokens:) {
+          now = Process.clock_gettime(Process::CLOCK_MONOTONIC)
+          # `return` inside a lambda only leaves the lambda. The throttle applies
+          # only when output_tokens is positive; updates reporting zero output
+          # tokens are always forwarded to the UI.
+          return if now - last_emit_at < min_interval && output_tokens > 0
+          last_emit_at = now
+          @ui.show_progress(
+            progress_type: "thinking",
+            phase: "active",
+            metadata: { input_tokens: input_tokens, output_tokens: output_tokens }
+          )
+        }
+      end
     end
   end
 end

data/lib/clacky/agent/session_serializer.rb CHANGED Viewed

@@ -471,8 +471,13 @@ module Clacky
         case msg[:role].to_s
         when "assistant"
-          # Text content
+          # Text content — prepend reasoning/thinking content wrapped in <think> tags
+          # so the Web UI renders it as a collapsible thinking block
           text = extract_text_from_content(msg[:content]).to_s.strip
+          reasoning = msg[:reasoning_content]
+          if reasoning && !reasoning.to_s.strip.empty?
+            text = "<think>\n#{reasoning}\n</think>\n#{text}"
+          end
           ui.show_assistant_message(text, files: []) unless text.empty?
           # Tool calls embedded in assistant message

data/lib/clacky/agent/skill_manager.rb CHANGED Viewed

@@ -91,6 +91,20 @@ module Clacky
       # Keeps context tokens bounded regardless of how many skills are installed.
       MAX_CONTEXT_SKILLS = 30
+      # Process-wide deduper for the "skill context limit" warning so that
+      # every newly constructed Agent (sub-agents, retries, web turns…) doesn't
+      # re-emit the same line.
+      @skill_limit_warned_signatures = {}
+      @skill_limit_warn_mutex = Mutex.new
+      # Runs the given block the first time a signature is seen and does
+      # nothing (returns nil) on later calls with the same signature.
+      #
+      # @param signature [Object] hash key identifying the warning to dedupe
+      # @yield invoked with no arguments, at most once per distinct signature
+      # @return [Object, nil] the block's result on first use, nil otherwise
+      def self.warn_skill_limit_once(signature, &block)
+        @skill_limit_warn_mutex.synchronize do
+          # `return` exits the whole method; synchronize still releases the lock.
+          return if @skill_limit_warned_signatures[signature]
+          # The signature is marked before the block runs, so a block that
+          # raises is not retried on a later call.
+          @skill_limit_warned_signatures[signature] = true
+        end
+        # The block is called after the lock has been released.
+        block.call
+      end
       # Generate skill context - loads all auto-invocable skills allowed by the agent profile
       # @return [String] Skill context to add to system prompt
       def build_skill_context
@@ -103,17 +117,16 @@ module Clacky
         auto_invocable = all_skills.select(&:model_invocation_allowed?)
         # Enforce system prompt injection limit to control token usage.
-        # Warn only when the set of dropped skills *changes* — this message
-        # is otherwise emitted once per agent turn (build_skill_context is
-        # called during every system prompt assembly) and floods the log.
+        # Warn at most once per process per dropped-set signature — build_skill_context
+        # runs on every system-prompt assembly and is invoked from many short-lived
+        # Agent instances (sub-agents, web turns…), so per-instance dedup wasn't enough.
         if auto_invocable.size > MAX_CONTEXT_SKILLS
           kept    = auto_invocable.first(MAX_CONTEXT_SKILLS)
           dropped = auto_invocable.drop(MAX_CONTEXT_SKILLS)
           dropped_names = dropped.map(&:identifier)
           signature = dropped_names.sort.join(",")
-          if @skill_limit_warned_signature != signature
-            @skill_limit_warned_signature = signature
+          SkillManager.warn_skill_limit_once(signature) do
             Clacky::Logger.warn(
               "Skill context limit: #{auto_invocable.size} auto-invocable skills found, " \
               "only injecting first #{MAX_CONTEXT_SKILLS} " \

data/lib/clacky/agent.rb CHANGED Viewed

@@ -427,7 +427,7 @@ module Clacky
               tool_calls_count: (response[:tool_calls] || []).size
             )
             if response[:content] && !response[:content].empty?
-              emit_assistant_message(response[:content])
+              emit_assistant_message(response[:content], reasoning_content: response[:reasoning_content])
             end
             # Show token usage after the assistant message so WebUI renders it below the bubble
@@ -448,7 +448,7 @@ module Clacky
           # Show assistant message if there's content before tool calls
           if response[:content] && !response[:content].empty?
-            emit_assistant_message(response[:content])
+            emit_assistant_message(response[:content], reasoning_content: response[:reasoning_content])
           end
           # Show token usage after assistant message (or immediately if no message).
@@ -1532,11 +1532,20 @@ module Clacky
     # and cannot load file:// directly) and must stay scoped to the Web UI
     # controller. IM channel subscribers need the original file:// markdown so
     # parse_file_links can extract paths and deliver images as native attachments.
-    private def emit_assistant_message(content)
-      return if content.nil? || content.empty?
+    private def emit_assistant_message(content, reasoning_content: nil)
+      # Prepend reasoning/thinking content (from thinking-mode providers like
+      # DeepSeek V4, Kimi K2) wrapped in <think> tags so the Web UI renders it
+      # as a collapsible thinking block (see sessions.js _renderMarkdown).
+      if reasoning_content && !reasoning_content.to_s.strip.empty?
+        full_content = "<think>\n#{reasoning_content}\n</think>\n#{content}"
+      else
+        full_content = content
+      end
+      return if full_content.nil? || full_content.to_s.strip.empty?
       parsed = parse_file_links(content)
-      @ui&.show_assistant_message(parsed[:text], files: parsed[:files])
+      @ui&.show_assistant_message(full_content, files: parsed[:files])
     end
     # Track modified files for Time Machine snapshots

data/lib/clacky/anthropic_stream_aggregator.rb ADDED Viewed

@@ -0,0 +1,135 @@
+# frozen_string_literal: true
+require "json"
+module Clacky
+  # Reassembles an Anthropic Messages SSE stream (event: message_start /
+  # content_block_start / content_block_delta / content_block_stop /
+  # message_delta / message_stop / ping) into the same hash shape that
+  # MessageFormat::Anthropic.parse_response expects from a non-streaming
+  # response, while invoking on_chunk(input_tokens:, output_tokens:) as
+  # usage accumulates.
+  #
+  # Wire reference: https://docs.anthropic.com/en/api/messages-streaming
+  class AnthropicStreamAggregator
+    # @param on_chunk [#call, nil] optional progress callback, invoked as
+    #   on_chunk.call(input_tokens:, output_tokens:). When nil, no progress
+    #   is reported.
+    def initialize(on_chunk: nil)
+      @on_chunk = on_chunk
+      # Content-block index => hash accumulating that block's streamed data.
+      @blocks = {}
+      @stop_reason = nil
+      # Usage hashes from message_start / message_delta, merged as they arrive.
+      @usage = {}
+      # Last values passed to on_chunk; used to suppress duplicate callbacks.
+      @last_input_tokens = 0
+      @last_output_tokens = 0
+    end
+    # Feeds one SSE event into the aggregator.
+    #
+    # @param event [String] SSE event name (e.g. "content_block_delta")
+    # @param data_str [String] JSON payload of the event; payloads that fail
+    #   to parse are ignored
+    # Event names not listed in the case below are ignored.
+    def handle(event, data_str)
+      data = parse_or_nil(data_str)
+      return unless data
+      case event
+      when "message_start"
+        msg = data["message"] || {}
+        if (u = msg["usage"])
+          @usage.merge!(u)
+          emit_usage_progress
+        end
+      when "content_block_start"
+        # Without an explicit index, the block is stored under the next free slot.
+        idx = data["index"] || @blocks.size
+        cb = data["content_block"] || {}
+        case cb["type"]
+        when "tool_use"
+          @blocks[idx] = { kind: :tool_use, id: cb["id"], name: cb["name"], input_str: +"" }
+        else
+          # Every other block type (thinking included) starts out as a text block;
+          # the kind may be changed later by the deltas that arrive for it.
+          @blocks[idx] = { kind: :text, text: +"" }
+        end
+      when "content_block_delta"
+        idx = data["index"] || 0
+        delta = data["delta"] || {}
+        # A delta for an index with no preceding start event lazily creates a text block.
+        block = (@blocks[idx] ||= { kind: :text, text: +"" })
+        # Delta types other than the three below are ignored.
+        case delta["type"]
+        when "text_delta"
+          block[:kind] ||= :text
+          block[:text] ||= +""
+          block[:text] << delta["text"].to_s
+        when "input_json_delta"
+          block[:kind] = :tool_use
+          block[:input_str] ||= +""
+          block[:input_str] << delta["partial_json"].to_s
+        when "thinking_delta"
+          # NOTE(review): to_h has no branch for :thinking, so such a block is
+          # emitted as a text block built from block[:text] (empty unless text
+          # deltas also arrived) and the accumulated thinking text only feeds
+          # the progress estimate. Confirm this is intended.
+          block[:kind] = :thinking
+          block[:thinking] ||= +""
+          block[:thinking] << delta["thinking"].to_s
+        end
+        # Runs after every delta, whatever its type.
+        emit_estimate_progress
+      when "content_block_stop"
+        # Nothing to do: blocks are finalised in to_h.
+      when "message_delta"
+        if (d = data["delta"])
+          @stop_reason = d["stop_reason"] if d["stop_reason"]
+        end
+        if (u = data["usage"])
+          @usage.merge!(u)
+          emit_usage_progress
+        end
+      when "message_stop", "ping", "error"
+        # No-op. NOTE(review): "error" events are discarded here; presumably
+        # stream errors are surfaced by the caller — confirm.
+      end
+    end
+    # Builds the canonical non-streaming Anthropic response shape consumed by
+    # MessageFormat::Anthropic.parse_response.
+    #
+    # @return [Hash] with "content" (blocks ordered by index), "stop_reason"
+    #   and "usage" keys
+    def to_h
+      content_blocks = @blocks.keys.sort.map do |idx|
+        b = @blocks[idx]
+        case b[:kind]
+        when :tool_use
+          # Empty input becomes {}; otherwise the concatenated JSON is parsed.
+          # The inline rescue catches any StandardError and falls back to the
+          # raw string.
+          input_value =
+            if b[:input_str].to_s.empty?
+              {}
+            else
+              JSON.parse(b[:input_str]) rescue b[:input_str]
+            end
+          { "type" => "tool_use", "id" => b[:id], "name" => b[:name], "input" => input_value }
+        else
+          # Covers :text and every other kind, including :thinking.
+          { "type" => "text", "text" => b[:text].to_s }
+        end
+      end
+      { "content" => content_blocks, "stop_reason" => @stop_reason, "usage" => @usage }
+    end
+    # Parses a JSON payload, returning nil when it is not valid JSON.
+    # NOTE(review): only JSON::ParserError is rescued; a nil argument would
+    # presumably raise TypeError instead — confirm callers always pass a String.
+    private def parse_or_nil(s)
+      JSON.parse(s)
+    rescue JSON::ParserError
+      nil
+    end
+    # Reports provider-supplied usage to on_chunk. Input is counted as
+    # input_tokens plus cache_read_input_tokens. Skipped when neither value
+    # changed since the last report. Errors raised by the callback are logged
+    # as warnings and not propagated.
+    private def emit_usage_progress
+      return unless @on_chunk
+      input  = @usage["input_tokens"].to_i + @usage["cache_read_input_tokens"].to_i
+      output = @usage["output_tokens"].to_i
+      return if input == @last_input_tokens && output == @last_output_tokens
+      @last_input_tokens = input
+      @last_output_tokens = output
+      @on_chunk.call(input_tokens: input, output_tokens: output)
+    rescue => e
+      Clacky::Logger.warn("[AnthropicStreamAggregator] on_chunk: #{e.class}: #{e.message}")
+    end
+    # Reports an estimated output-token count to on_chunk, paired with the
+    # last known input-token count. Skipped when the estimate equals the last
+    # reported output value. Callback errors are logged and not propagated.
+    private def emit_estimate_progress
+      return unless @on_chunk
+      output = approximate_output_tokens
+      return if output == @last_output_tokens
+      @last_output_tokens = output
+      @on_chunk.call(input_tokens: @last_input_tokens, output_tokens: output)
+    rescue => e
+      Clacky::Logger.warn("[AnthropicStreamAggregator] on_chunk: #{e.class}: #{e.message}")
+    end
+    # Estimates output tokens as the total byte size (not character count) of
+    # all accumulated text, tool input and thinking content, divided by 4 and
+    # rounded up.
+    private def approximate_output_tokens
+      total_chars = @blocks.values.sum do |b|
+        b[:text].to_s.bytesize + b[:input_str].to_s.bytesize + b[:thinking].to_s.bytesize
+      end
+      (total_chars / 4.0).ceil
+    end
+  end
+end

data/lib/clacky/bedrock_stream_aggregator.rb ADDED Viewed

@@ -0,0 +1,137 @@
+# frozen_string_literal: true
+require "json"
+module Clacky
+  # Reassembles a Bedrock Converse event stream into the same hash shape that
+  # MessageFormat::Bedrock.parse_response expects from a non-streaming response,
+  # while invoking on_chunk(input_tokens:, output_tokens:) as usage information
+  # accumulates.
+  #
+  # Bedrock event-stream events handled (passed through as raw event JSON):
+  #
+  #   messageStart      → { role: "assistant" }
+  #   contentBlockStart → { start: {toolUse: {toolUseId, name}} | {}, contentBlockIndex: N }
+  #   contentBlockDelta → { delta: {text: "..."} | {toolUse: {input: "..."}}, contentBlockIndex: N }
+  #   contentBlockStop  → { contentBlockIndex: N }
+  #   messageStop       → { stopReason: "end_turn" | "tool_use" | "max_tokens" | ... }
+  #   metadata          → { usage: {inputTokens, outputTokens, cacheReadInputTokens, cacheWriteInputTokens}, metrics: {...} }
+  #
+  # Tool-use input is streamed as a sequence of partial JSON strings; we
+  # concatenate and let the response parser leave it as a string for downstream
+  # tool dispatch (which calls JSON.parse with a {} fallback).
+  class BedrockStreamAggregator
+    # @param on_chunk [#call, nil] optional progress callback, invoked as
+    #   on_chunk.call(input_tokens:, output_tokens:). When nil, no progress
+    #   is reported.
+    def initialize(on_chunk: nil)
+      @on_chunk = on_chunk
+      # Default role, replaced when a messageStart event carries one.
+      @role = "assistant"
+      # contentBlockIndex => hash accumulating that block's streamed data.
+      @blocks = {}
+      @stop_reason = nil
+      # Usage hashes from metadata events, merged as they arrive.
+      @usage = {}
+      # Last values passed to on_chunk; used to suppress duplicate callbacks.
+      @last_input_tokens = 0
+      @last_output_tokens = 0
+    end
+    # Feeds one event-stream event into the aggregator.
+    #
+    # @param event [String] event name (e.g. "contentBlockDelta")
+    # @param data_str [String] JSON payload of the event; payloads that fail
+    #   to parse are ignored
+    # Event names not listed in the case below are ignored.
+    def handle(event, data_str)
+      data = parse_or_nil(data_str)
+      return unless data
+      case event
+      when "messageStart"
+        @role = data["role"] || @role
+      when "contentBlockStart"
+        # Without an explicit index, the block is stored under the next free slot.
+        idx = data["contentBlockIndex"] || @blocks.size
+        start = data["start"] || {}
+        if (tu = start["toolUse"])
+          @blocks[idx] = { kind: :tool_use, id: tu["toolUseId"], name: tu["name"], input_str: +"" }
+        else
+          # Any start payload without toolUse begins as a text block.
+          @blocks[idx] = { kind: :text, text: +"" }
+        end
+      when "contentBlockDelta"
+        idx = data["contentBlockIndex"] || 0
+        delta = data["delta"] || {}
+        # A delta for an index with no preceding start event lazily creates a text block.
+        block = (@blocks[idx] ||= { kind: :text, text: +"" })
+        if delta["text"]
+          block[:kind] ||= :text
+          block[:text] ||= +""
+          # NOTE(review): appended without .to_s, unlike the toolUse and
+          # reasoningContent branches below — assumes "text" is always a String.
+          block[:text] << delta["text"]
+        elsif (tu = delta["toolUse"])
+          block[:kind] = :tool_use
+          block[:input_str] ||= +""
+          block[:input_str] << tu["input"].to_s
+          # id/name are filled from the delta only if not already set.
+          block[:id]   ||= tu["toolUseId"]
+          block[:name] ||= tu["name"]
+        elsif (rc = delta["reasoningContent"])
+          # NOTE(review): to_h has no branch for :reasoning, so such a block is
+          # emitted as a text block built from block[:text] (empty unless text
+          # deltas also arrived) and the accumulated reasoning text only feeds
+          # the progress estimate. Confirm this is intended.
+          block[:kind] = :reasoning
+          block[:reasoning] ||= +""
+          block[:reasoning] << rc["text"].to_s
+        end
+        # Runs after every delta, whatever its payload.
+        emit_estimate_progress
+      when "contentBlockStop"
+        # Nothing to assemble: blocks are kept as-is and finalised in to_h.
+      when "messageStop"
+        @stop_reason = data["stopReason"] || @stop_reason
+      when "metadata"
+        if (u = data["usage"])
+          @usage.merge!(u)
+          emit_usage_progress(u)
+        end
+      end
+    end
+    # Render the canonical non-streaming Bedrock response hash so the existing
+    # MessageFormat::Bedrock.parse_response can consume it unchanged.
+    #
+    # @return [Hash] with "output" (role plus content blocks ordered by index),
+    #   "stopReason" and "usage" keys
+    def to_h
+      content_blocks = @blocks.keys.sort.map do |idx|
+        b = @blocks[idx]
+        case b[:kind]
+        when :tool_use
+          # Empty input becomes {}. Valid JSON input is parsed into a Ruby
+          # object here; the raw string is kept only when parsing raises (the
+          # inline rescue catches any StandardError).
+          input_value = b[:input_str].to_s.empty? ? {} : (JSON.parse(b[:input_str]) rescue b[:input_str])
+          { "toolUse" => { "toolUseId" => b[:id], "name" => b[:name], "input" => input_value } }
+        else
+          # Covers :text and every other kind, including :reasoning.
+          { "text" => b[:text].to_s }
+        end
+      end
+      {
+        "output"     => { "message" => { "role" => @role, "content" => content_blocks } },
+        "stopReason" => @stop_reason,
+        "usage"      => @usage
+      }
+    end
+    # Parses a JSON payload, returning nil when it is not valid JSON.
+    # NOTE(review): only JSON::ParserError is rescued; a nil argument would
+    # presumably raise TypeError instead — confirm callers always pass a String.
+    private def parse_or_nil(s)
+      JSON.parse(s)
+    rescue JSON::ParserError
+      nil
+    end
+    # Reports provider-supplied usage to on_chunk. Reads the usage hash of the
+    # current event (u), not the merged @usage. Input is counted as
+    # inputTokens plus cacheReadInputTokens. Skipped when neither value
+    # changed since the last report. Errors raised by the callback are logged
+    # as warnings and not propagated.
+    #
+    # @param u [Hash] the "usage" hash from a metadata event
+    private def emit_usage_progress(u)
+      return unless @on_chunk
+      input  = u["inputTokens"].to_i + u["cacheReadInputTokens"].to_i
+      output = u["outputTokens"].to_i
+      return if input == @last_input_tokens && output == @last_output_tokens
+      @last_input_tokens = input
+      @last_output_tokens = output
+      @on_chunk.call(input_tokens: input, output_tokens: output)
+    rescue => e
+      Clacky::Logger.warn("[BedrockStreamAggregator] on_chunk: #{e.class}: #{e.message}")
+    end
+    # Reports an estimated output-token count to on_chunk, paired with the
+    # last known input-token count. Skipped when the estimate equals the last
+    # reported output value. Callback errors are logged and not propagated.
+    private def emit_estimate_progress
+      return unless @on_chunk
+      output = approximate_output_tokens
+      return if output == @last_output_tokens
+      @last_output_tokens = output
+      @on_chunk.call(input_tokens: @last_input_tokens, output_tokens: output)
+    rescue => e
+      Clacky::Logger.warn("[BedrockStreamAggregator] on_chunk: #{e.class}: #{e.message}")
+    end
+    # Estimates output tokens as the total byte size (not character count) of
+    # all accumulated text, tool input and reasoning content, divided by 4 and
+    # rounded up.
+    private def approximate_output_tokens
+      total_chars = @blocks.values.sum do |b|
+        b[:text].to_s.bytesize + b[:input_str].to_s.bytesize + b[:reasoning].to_s.bytesize
+      end
+      (total_chars / 4.0).ceil
+    end
+  end
+end