RubyGems - smart_prompt - Versions diffs - 0.4.4 → 0.5.0 - Mend

smart_prompt 0.4.4 → 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (61) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +10 -10
data/README.cn.md +307 -64
data/README.md +311 -64
data/Rakefile +10 -1
data/config/anthropic_config.yml +151 -0
data/config/image_generation_config.yml +22 -0
data/config/multimodal_config.yml +85 -0
data/config/sensenova_config.yml +63 -0
data/config/zhipu_config.yml +73 -0
data/examples/anthropic_basic_chat.rb +143 -0
data/examples/anthropic_example.rb +232 -0
data/examples/anthropic_multimodal.rb +212 -0
data/examples/anthropic_streaming.rb +312 -0
data/examples/anthropic_tool_calling.rb +393 -0
data/examples/automatic_cleanup_example.rb +109 -0
data/examples/history_management_examples.rb +522 -0
data/examples/image_generation_example.rb +130 -0
data/examples/monitoring_example.rb +121 -0
data/examples/multimodal_example.rb +63 -0
data/examples/relevance_based_strategy_example.rb +87 -0
data/examples/sensenova_example.rb +129 -0
data/examples/stt_example.rb +287 -0
data/examples/tts_example.rb +244 -0
data/examples/video_generation_example.rb +189 -0
data/examples/zhipu_example.rb +151 -0
data/lib/smart_prompt/anthropic_adapter.rb +363 -281
data/lib/smart_prompt/compression_engine.rb +201 -0
data/lib/smart_prompt/context_strategy.rb +22 -0
data/lib/smart_prompt/conversation.rb +81 -191
data/lib/smart_prompt/engine.rb +36 -19
data/lib/smart_prompt/history_manager.rb +596 -0
data/lib/smart_prompt/hybrid_strategy.rb +222 -0
data/lib/smart_prompt/image_generation_adapter.rb +297 -0
data/lib/smart_prompt/lru_cache.rb +133 -0
data/lib/smart_prompt/message.rb +57 -0
data/lib/smart_prompt/multimodal_adapter.rb +277 -0
data/lib/smart_prompt/openai_adapter.rb +1 -25
data/lib/smart_prompt/persistence_layer.rb +197 -0
data/lib/smart_prompt/relevance_based_strategy.rb +221 -0
data/lib/smart_prompt/sensenova_adapter.rb +410 -0
data/lib/smart_prompt/session.rb +140 -0
data/lib/smart_prompt/sliding_window_strategy.rb +100 -0
data/lib/smart_prompt/stt_adapter.rb +381 -0
data/lib/smart_prompt/summary_based_strategy.rb +152 -0
data/lib/smart_prompt/token_counter.rb +74 -0
data/lib/smart_prompt/tts_adapter.rb +403 -0
data/lib/smart_prompt/version.rb +1 -1
data/lib/smart_prompt/video_generation_adapter.rb +330 -0
data/lib/smart_prompt/worker.rb +25 -3
data/lib/smart_prompt/zhipu_adapter.rb +616 -0
data/lib/smart_prompt.rb +22 -2
data/workers/history_management_examples.rb +407 -0
data/workers/image_generation_workers.rb +119 -0
data/workers/multimodal_workers.rb +110 -0
data/workers/sensenova_workers.rb +62 -0
data/workers/stt_workers.rb +195 -0
data/workers/tts_workers.rb +388 -0
data/workers/video_generation_workers.rb +264 -0
data/workers/zhipu_workers.rb +113 -0
metadata +84 -8

data/lib/smart_prompt/video_generation_adapter.rb ADDED Viewed

@@ -0,0 +1,330 @@
+require "openai"
+require "base64"
+require "fileutils"
+require "json"
+require "net/http"
+require "uri"
+module SmartPrompt
+  class VideoGenerationAdapter < LLMAdapter
+    SUPPORTED_IMAGE_FORMATS = %w[jpg jpeg png gif bmp webp]
+    SUPPORTED_VIDEO_FORMATS = %w[mp4 mov avi mkv webm]
+    # Builds the OpenAI-compatible client for the video generation service.
+    #
+    # Reads "api_key" and "url" from @config. An api_key written as
+    # ENV["NAME"] or ENV['NAME'] is replaced by that environment variable's
+    # value; any other value is handed to the client unchanged.
+    #
+    # Raises LLMAPIError when client construction fails with an
+    # OpenAI::ConfigurationError, OpenAI::Error or SocketError, and Error for
+    # any other StandardError.
+    def initialize(config)
+      super
+      api_key = @config["api_key"]
+      # Look the variable up directly instead of eval-ing the config string, so
+      # a configuration value can never execute arbitrary Ruby.
+      if api_key.is_a?(String) && (env_ref = api_key.match(/\AENV\[\s*["']([^"']+)["']\s*\]\z/))
+        api_key = ENV[env_ref[1]]
+      end
+      begin
+        @client = OpenAI::Client.new(
+          access_token: api_key,
+          uri_base: @config["url"],
+          request_timeout: 600, # Longer timeout for video generation
+        )
+      rescue OpenAI::ConfigurationError => e
+        SmartPrompt.logger.error "Failed to initialize VideoGeneration client: #{e.message}"
+        raise LLMAPIError, "Invalid VideoGeneration configuration: #{e.message}"
+      rescue OpenAI::Error => e
+        SmartPrompt.logger.error "Failed to initialize VideoGeneration client: #{e.message}"
+        raise LLMAPIError, "VideoGeneration authentication failed: #{e.message}"
+      rescue SocketError => e
+        SmartPrompt.logger.error "Failed to initialize VideoGeneration client: #{e.message}"
+        raise LLMAPIError, "Network error: Unable to connect to VideoGeneration API"
+      rescue => e
+        SmartPrompt.logger.error "Failed to initialize VideoGeneration client: #{e.message}"
+        raise Error, "Unexpected error initializing VideoGeneration client: #{e.message}"
+      end
+      # Every rescue branch above re-raises, so this line is reached only when
+      # the client was really created (an ensure clause would log on failure too).
+      SmartPrompt.logger.info "Successfully created a VideoGeneration client."
+    end
+    # Text-to-video generation
+    def generate_video(prompt, model: nil, duration: 4, resolution: "720p", fps: 24, seed: nil)
+      SmartPrompt.logger.info "VideoGenerationAdapter: Generating video from text"
+      model_name = model || @config["model"]
+      begin
+        # SiliconFlow uses OpenAI-compatible API format for video generation
+        # Note: This might require custom implementation as OpenAI gem doesn't have video endpoints
+        parameters = {
+          model: model_name,
+          prompt: prompt,
+          duration: duration,
+          resolution: resolution,
+          fps: fps
+        }
+        parameters[:seed] = seed if seed
+        SmartPrompt.logger.info "Video generation parameters: #{parameters}"
+        # Custom implementation for video generation
+        # Since OpenAI gem doesn't support video endpoints, we'll use direct HTTP calls
+        response = submit_video_generation_request(parameters)
+        @last_response = response
+        # Process response
+        if response["data"] && response["data"]["video_url"]
+          video_data = {
+            video_url: response["data"]["video_url"],
+            status: response["data"]["status"],
+            job_id: response["data"]["id"],
+            created_at: response["data"]["created_at"]
+          }
+          SmartPrompt.logger.info "Video generation job submitted successfully"
+          return video_data
+        else
+          SmartPrompt.logger.error "No video data in response"
+          raise LLMAPIError, "No video data in response"
+        end
+      rescue OpenAI::Error => e
+        SmartPrompt.logger.error "Video generation API error: #{e.message}"
+        raise LLMAPIError, "Video generation API error: #{e.message}"
+      rescue JSON::ParserError => e
+        SmartPrompt.logger.error "Failed to parse video generation response"
+        raise LLMAPIError, "Failed to parse video generation response"
+      rescue => e
+        SmartPrompt.logger.error "Unexpected error during video generation: #{e.message}"
+        raise Error, "Unexpected error during video generation: #{e.message}"
+      end
+    end
+    # Image-to-video generation
+    def create_video_from_image(image_file, prompt, model: nil, duration: 4, resolution: "720p", fps: 24, seed: nil)
+      SmartPrompt.logger.info "VideoGenerationAdapter: Creating video from image"
+      model_name = model || @config["model"]
+      begin
+        # Prepare image file
+        unless File.exist?(image_file)
+          raise Error, "Image file not found: #{image_file}"
+        end
+        file_ext = File.extname(image_file).downcase.delete(".")
+        unless SUPPORTED_IMAGE_FORMATS.include?(file_ext)
+          raise Error, "Unsupported image format: #{file_ext}"
+        end
+        # Convert image to base64 for API submission
+        image_data = File.binread(image_file)
+        base64_image = Base64.strict_encode64(image_data)
+        parameters = {
+          model: model_name,
+          image: base64_image,
+          prompt: prompt,
+          duration: duration,
+          resolution: resolution,
+          fps: fps
+        }
+        parameters[:seed] = seed if seed
+        SmartPrompt.logger.info "Image-to-video parameters: #{parameters}"
+        # Custom implementation for image-to-video generation
+        response = submit_image_to_video_request(parameters)
+        @last_response = response
+        if response["data"] && response["data"]["video_url"]
+          video_data = {
+            video_url: response["data"]["video_url"],
+            status: response["data"]["status"],
+            job_id: response["data"]["id"],
+            created_at: response["data"]["created_at"]
+          }
+          SmartPrompt.logger.info "Image-to-video job submitted successfully"
+          return video_data
+        else
+          SmartPrompt.logger.error "No video data in image-to-video response"
+          raise LLMAPIError, "No video data in image-to-video response"
+        end
+      rescue => e
+        SmartPrompt.logger.error "Unexpected error during image-to-video generation: #{e.message}"
+        raise Error, "Unexpected error during image-to-video generation: #{e.message}"
+      end
+    end
+    # Check video generation status
+    def check_video_status(job_id)
+      SmartPrompt.logger.info "VideoGenerationAdapter: Checking video generation status"
+      begin
+        response = check_video_generation_status(job_id)
+        @last_response = response
+        if response["data"]
+          status_data = {
+            job_id: response["data"]["id"],
+            status: response["data"]["status"],
+            video_url: response["data"]["video_url"],
+            progress: response["data"]["progress"],
+            created_at: response["data"]["created_at"],
+            updated_at: response["data"]["updated_at"]
+          }
+          SmartPrompt.logger.info "Video status: #{status_data[:status]}, Progress: #{status_data[:progress]}"
+          return status_data
+        else
+          SmartPrompt.logger.error "No status data in response"
+          raise LLMAPIError, "No status data in response"
+        end
+      rescue => e
+        SmartPrompt.logger.error "Error checking video status: #{e.message}"
+        raise Error, "Error checking video status: #{e.message}"
+      end
+    end
+    # Download video to file.
+    #
+    # Fetches video_url with a GET request and writes the body to output_path,
+    # creating the parent directory when needed. Returns output_path.
+    # Raises Error when the response is not a success or anything else fails.
+    #
+    # The body is streamed to "<output_path>.part" chunk by chunk and renamed
+    # once complete, so a large video is never held in memory and a failed
+    # download does not leave a truncated file at output_path.
+    def download_video(video_url, output_path)
+      SmartPrompt.logger.info "VideoGenerationAdapter: Downloading video"
+      partial_path = "#{output_path}.part"
+      begin
+        uri = URI.parse(video_url)
+        Net::HTTP.start(uri.host, uri.port, use_ssl: uri.scheme == 'https') do |http|
+          # With a block, the response body is not read until read_body is called.
+          http.request(Net::HTTP::Get.new(uri.request_uri)) do |response|
+            unless response.is_a?(Net::HTTPSuccess)
+              SmartPrompt.logger.error "Failed to download video: #{response.code}"
+              raise Error, "Failed to download video: #{response.code}"
+            end
+            # Create directory if it doesn't exist
+            FileUtils.mkdir_p(File.dirname(output_path))
+            File.open(partial_path, "wb") do |file|
+              response.read_body { |chunk| file.write(chunk) }
+            end
+          end
+        end
+        File.rename(partial_path, output_path)
+        SmartPrompt.logger.info "Video downloaded successfully to: #{output_path}"
+        output_path
+      rescue => e
+        SmartPrompt.logger.error "Error downloading video: #{e.message}"
+        raise Error, "Error downloading video: #{e.message}"
+      ensure
+        # No-op after a successful rename; removes the leftover on failure.
+        FileUtils.rm_f(partial_path)
+      end
+    end
+    # Wait for video generation to complete
+    def wait_for_video_completion(job_id, check_interval: 10, timeout: 600)
+      SmartPrompt.logger.info "VideoGenerationAdapter: Waiting for video generation to complete"
+      start_time = Time.now
+      loop do
+        status = check_video_status(job_id)
+        case status[:status]
+        when "completed"
+          SmartPrompt.logger.info "Video generation completed successfully"
+          return status
+        when "failed"
+          SmartPrompt.logger.error "Video generation failed"
+          raise LLMAPIError, "Video generation failed"
+        when "cancelled"
+          SmartPrompt.logger.error "Video generation was cancelled"
+          raise LLMAPIError, "Video generation was cancelled"
+        else
+          # Still processing
+          elapsed_time = Time.now - start_time
+          if elapsed_time > timeout
+            SmartPrompt.logger.error "Video generation timeout after #{timeout} seconds"
+            raise LLMAPIError, "Video generation timeout"
+          end
+          SmartPrompt.logger.info "Video generation in progress: #{status[:progress]}%"
+          sleep(check_interval)
+        end
+      end
+    end
+    private
+    # Custom implementation for video generation API call
+    def submit_video_generation_request(parameters)
+      # Since OpenAI gem doesn't support video endpoints, we implement custom HTTP call
+      uri = URI.parse("#{@config['url']}/videos/generations")
+      http = Net::HTTP.new(uri.host, uri.port)
+      http.use_ssl = (uri.scheme == 'https')
+      http.read_timeout = 600
+      request = Net::HTTP::Post.new(uri.request_uri)
+      request['Content-Type'] = 'application/json'
+      request['Authorization'] = "Bearer #{@config['api_key']}"
+      request.body = parameters.to_json
+      response = http.request(request)
+      if response.is_a?(Net::HTTPSuccess)
+        JSON.parse(response.body)
+      else
+        raise LLMAPIError, "Video generation API error: #{response.code} - #{response.body}"
+      end
+    end
+    # Custom implementation for image-to-video API call
+    def submit_image_to_video_request(parameters)
+      uri = URI.parse("#{@config['url']}/videos/generations")
+      http = Net::HTTP.new(uri.host, uri.port)
+      http.use_ssl = (uri.scheme == 'https')
+      http.read_timeout = 600
+      request = Net::HTTP::Post.new(uri.request_uri)
+      request['Content-Type'] = 'application/json'
+      request['Authorization'] = "Bearer #{@config['api_key']}"
+      request.body = parameters.to_json
+      response = http.request(request)
+      if response.is_a?(Net::HTTPSuccess)
+        JSON.parse(response.body)
+      else
+        raise LLMAPIError, "Image-to-video API error: #{response.code} - #{response.body}"
+      end
+    end
+    # Custom implementation for checking video generation status
+    def check_video_generation_status(job_id)
+      uri = URI.parse("#{@config['url']}/videos/#{job_id}")
+      http = Net::HTTP.new(uri.host, uri.port)
+      http.use_ssl = (uri.scheme == 'https')
+      request = Net::HTTP::Get.new(uri.request_uri)
+      request['Authorization'] = "Bearer #{@config['api_key']}"
+      response = http.request(request)
+      if response.is_a?(Net::HTTPSuccess)
+        JSON.parse(response.body)
+      else
+        raise LLMAPIError, "Status check API error: #{response.code} - #{response.body}"
+      end
+    end
+    # Override send_request to provide a meaningful error for chat operations
+    def send_request(messages, model = nil, temperature = 0.7, tools = nil, proc = nil)
+      SmartPrompt.logger.error "VideoGenerationAdapter does not support chat operations. Use generate_video, create_video_from_image, or check_video_status methods instead."
+      raise NotImplementedError, "VideoGenerationAdapter does not support chat operations"
+    end
+    # Override embeddings method
+    def embeddings(text, model)
+      SmartPrompt.logger.error "VideoGenerationAdapter does not support embeddings operations."
+      raise NotImplementedError, "VideoGenerationAdapter does not support embeddings operations"
+    end
+  end
+end

data/lib/smart_prompt/worker.rb CHANGED Viewed

@@ -11,13 +11,28 @@ module SmartPrompt
     end
     def execute(params = {})
-      @conversation = Conversation.new(@engine, params[:tools]) unless @conversation
+      # Generate default session ID if using history and no session_id provided
+      session_id = params[:session_id] || "default"
+      if params[:with_history] && !session_id && @engine.history_manager
+        session_id = "worker_#{@name}_#{Time.now.to_i}"
+        SmartPrompt.logger.info "Generated default session ID: #{session_id}"
+      end
+      if @conversation.nil? || @conversation.session_id != session_id
+        @conversation = Conversation.new(@engine, params[:tools], session_id)
+      end
       context = WorkerContext.new(@conversation, params, @engine)
       context.instance_eval(&@code)
     end
     def execute_by_stream(params = {}, &proc)
-      @conversation = Conversation.new(@engine, params[:tools])
+      # Generate default session ID if using history and no session_id provided
+      session_id = params[:session_id]
+      if params[:with_history] && !session_id && @engine.history_manager
+        session_id = "worker_#{@name}_#{Time.now.to_i}"
+        SmartPrompt.logger.info "Generated default session ID: #{session_id}"
+      end
+      @conversation = Conversation.new(@engine, params[:tools], session_id)
       context = WorkerContext.new(@conversation, params, @engine, proc)
       context.instance_eval(&@code)
     end
@@ -50,7 +65,7 @@ module SmartPrompt
             @conversation.send_msg_by_stream(params, &@proc)
           end
         elsif method == :sys_msg
-          @conversation.sys_msg(*args, params)
+          @conversation.sys_msg(*args)
         elsif method == :prompt
           @conversation.prompt(*args, with_history: params[:with_history])
         else
@@ -73,6 +88,13 @@ module SmartPrompt
       @proc
     end
+    # Expose the engine so workers can reach a configured adapter directly (e.g.
+    # `engine.llms["..."]`) for methods Conversation doesn't delegate, such as
+    # generate_video / synthesize_to_file / transcribe_audio.
+    def engine
+      @engine
+    end
     def call_worker(worker_name, params = {})
       worker = Worker.new(worker_name, @engine)
       worker.execute(params)