RubyGems - llm_meta_client - Versions diffs - 0.4.0 → 0.5.0 - Mend

llm_meta_client 0.4.0 → 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13) hide show

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: 620e720960f5e05d563885fa2e00900311d6a7b4543fa13f9d3c476515edd40c
-  data.tar.gz: 33981d0657e520260b569873c5547e3279eba4325f88a812d8bf28d18941ac88
+  metadata.gz: 60116965474267f22c077da1849611c0b6c4490a876a98deebfa243d2f9aef49
+  data.tar.gz: 748fdc1631edcb65c7792b1dc13a3ae8d0625422c05d4e4a47732f9c8167a7d9
 SHA512:
-  metadata.gz: a557328075624b4ff7d17eda2ed181e178f5dfda39a23a9f87029141e04b22b78e6f648f81d751f6c92add2f0b54462b28c443bce2d4cf6fcc90f0dee5e1f175
-  data.tar.gz: f5b8ecaeec9af8153d8bbbed4d6056ba5213d267fba01381088d1f53bee80d6f1525d04992b79325476da5ce664976da9ab831844b02828e6b2db9279eb02ef0
+  metadata.gz: c87684a604a914fe6097a1277948d009530f83a07ec7991aa5b6caa92ce8d2eb9568b4a55b648ba2b50f12e06bb9df95e31333bd211a56289cad4c3c3c8ddc33
+  data.tar.gz: 6ba2df271d37e40be53981e40c8c416239318872118019da88bdd35a845607d28e95d9f33e53328442b85f309448e30e6d7b8a874dcbd68996760be61ea97cb3

data/CHANGELOG.md CHANGED Viewed

@@ -5,6 +5,16 @@ All notable changes to this project will be documented in this file.
 The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/),
 and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
+## [0.5.0] - 2026-03-17
+### Added
+- Generation settings support:
+  - `generation_settings` parameter in `ServerQuery` API layer for configuring LLM generation parameters
+  - `generation_settings` threading through `Chat` model
+  - `generation_settings` parameter extraction in `ChatsController`
+  - Generation settings UI components for configuring parameters in chat forms
 ## [0.4.0] - 2026-03-11
 ### Added

data/app/assets/stylesheets/llm_meta_client/generation_settings.css ADDED Viewed

@@ -0,0 +1,90 @@
+/* Generation Settings */
+.generation-settings-field {
+  margin-bottom: 10px;
+}
+.generation-settings-toggle-button {
+  display: flex;
+  align-items: center;
+  gap: 6px;
+  background: none;
+  border: 1px solid #d1d5db;
+  border-radius: 6px;
+  padding: 6px 12px;
+  font-size: 13px;
+  font-weight: 600;
+  color: #374151;
+  cursor: pointer;
+  transition: border-color 0.2s, background-color 0.2s;
+  &:hover {
+    background-color: #f9fafb;
+    border-color: #9ca3af;
+  }
+}
+.generation-settings-panel {
+  margin-top: 8px;
+  border: 1px solid #e5e7eb;
+  border-radius: 8px;
+  background-color: #f9fafb;
+  padding: 12px 16px;
+}
+.generation-setting-item {
+  margin-bottom: 14px;
+  &:last-child {
+    margin-bottom: 0;
+  }
+  label {
+    display: flex;
+    align-items: center;
+    gap: 8px;
+    font-size: 13px;
+    font-weight: 600;
+    color: #374151;
+    margin-bottom: 4px;
+  }
+  input[type="range"] {
+    width: 100%;
+    accent-color: #3b82f6;
+    cursor: pointer;
+  }
+  .max-tokens-input {
+    width: 100%;
+    padding: 6px 10px;
+    border: 1px solid #d1d5db;
+    border-radius: 6px;
+    font-size: 13px;
+    background-color: white;
+    transition: border-color 0.2s;
+    &:focus {
+      outline: none;
+      border-color: #3b82f6;
+      box-shadow: 0 0 0 3px rgba(59, 130, 246, 0.1);
+    }
+    &::placeholder {
+      color: #9ca3af;
+    }
+  }
+}
+.setting-value {
+  font-weight: 700;
+  color: #3b82f6;
+  font-size: 13px;
+}
+.setting-range-labels {
+  display: flex;
+  justify-content: space-between;
+  font-size: 11px;
+  color: #9ca3af;
+  margin-top: 2px;
+}

data/lib/generators/llm_meta_client/scaffold/scaffold_generator.rb CHANGED Viewed

@@ -34,6 +34,7 @@ module LlmMetaClient
         template "app/views/shared/_api_key_field.html.erb"
         template "app/views/shared/_model_field.html.erb"
         template "app/views/shared/_tool_selector_field.html.erb"
+        template "app/views/shared/_generation_settings_field.html.erb"
         template "app/views/layouts/application.html.erb"
         template "app/views/layouts/_header.html.erb"
         template "app/views/layouts/_sidebar.html.erb"
@@ -44,6 +45,7 @@ module LlmMetaClient
         template "app/javascript/controllers/chats_form_controller.js"
         template "app/javascript/controllers/chat_title_edit_controller.js"
         template "app/javascript/controllers/tool_selector_controller.js"
+        template "app/javascript/controllers/generation_settings_controller.js"
         copy_file "app/javascript/popover.js"
       end

data/lib/generators/llm_meta_client/scaffold/templates/app/controllers/chats_controller.rb CHANGED Viewed

@@ -82,7 +82,7 @@ class ChatsController < ApplicationController
       # Send to LLM and get assistant response
       begin
-        @assistant_message = @chat.add_assistant_response(@prompt_execution, jwt_token, tool_ids: tool_ids_param)
+        @assistant_message = @chat.add_assistant_response(@prompt_execution, jwt_token, tool_ids: tool_ids_param, generation_settings: generation_settings_param)
         # Generate chat title from the user's prompt (only if title is not yet set)
         @chat.generate_title(params[:message], jwt_token)
       rescue StandardError => e
@@ -172,7 +172,7 @@ class ChatsController < ApplicationController
       # Send to LLM and get assistant response
       begin
-        @assistant_message = @chat.add_assistant_response(@prompt_execution, jwt_token, tool_ids: tool_ids_param)
+        @assistant_message = @chat.add_assistant_response(@prompt_execution, jwt_token, tool_ids: tool_ids_param, generation_settings: generation_settings_param)
       rescue StandardError => e
         Rails.logger.error "Error in chat response: #{e.class} - #{e.message}\n#{e.backtrace&.join("\n")}"
         @error_message = "An error occurred while getting the response. Please try again."
@@ -191,4 +191,14 @@ class ChatsController < ApplicationController
   def tool_ids_param
     params[:tool_ids].presence || []
   end
+  def generation_settings_param
+    settings = {}
+    settings[:temperature] = params[:temperature].to_f if params[:temperature].present?
+    settings[:top_k] = params[:top_k].to_i if params[:top_k].present?
+    settings[:top_p] = params[:top_p].to_f if params[:top_p].present?
+    settings[:max_tokens] = params[:max_tokens].to_i if params[:max_tokens].present?
+    settings[:repeat_penalty] = params[:repeat_penalty].to_f if params[:repeat_penalty].present?
+    settings
+  end
 end

data/lib/generators/llm_meta_client/scaffold/templates/app/javascript/controllers/generation_settings_controller.js ADDED Viewed

@@ -0,0 +1,51 @@
+import { Controller } from "@hotwired/stimulus"
+// Connects to data-controller="generation-settings"
+export default class extends Controller {
+  static targets = [
+    "toggleButton",
+    "toggleIcon",
+    "panel",
+    "temperatureRange",
+    "temperatureValue",
+    "topKRange",
+    "topKValue",
+    "topPRange",
+    "topPValue",
+    "maxTokensInput",
+    "repeatPenaltyRange",
+    "repeatPenaltyValue",
+  ]
+  connect() {
+    this.expanded = false
+  }
+  toggle() {
+    if (!this.hasPanelTarget) return
+    this.expanded = !this.expanded
+    this.panelTarget.style.display = this.expanded ? "block" : "none"
+    if (this.hasToggleIconTarget) {
+      this.toggleIconTarget.classList.toggle("bi-chevron-down", !this.expanded)
+      this.toggleIconTarget.classList.toggle("bi-chevron-up", this.expanded)
+    }
+  }
+  updateTemperature() {
+    this.temperatureValueTarget.textContent = this.temperatureRangeTarget.value
+  }
+  updateTopK() {
+    this.topKValueTarget.textContent = this.topKRangeTarget.value
+  }
+  updateTopP() {
+    this.topPValueTarget.textContent = this.topPRangeTarget.value
+  }
+  updateRepeatPenalty() {
+    this.repeatPenaltyValueTarget.textContent = this.repeatPenaltyRangeTarget.value
+  }
+}

data/lib/generators/llm_meta_client/scaffold/templates/app/models/chat.rb CHANGED Viewed

@@ -67,8 +67,8 @@ class Chat < ApplicationRecord
   end
   # Add assistant response by sending to LLM
-  def add_assistant_response(prompt_execution, jwt_token, tool_ids: [])
-    response_content = send_to_llm(jwt_token, tool_ids: tool_ids)
+  def add_assistant_response(prompt_execution, jwt_token, tool_ids: [], generation_settings: {})
+    response_content = send_to_llm(jwt_token, tool_ids: tool_ids, generation_settings: generation_settings)
     prompt_execution.update!(
       llm_platform: llm_type(jwt_token),
       response: response_content
@@ -122,7 +122,7 @@ class Chat < ApplicationRecord
   end
   # Send messages to LLM and get response
-  def send_to_llm(jwt_token, tool_ids: [])
+  def send_to_llm(jwt_token, tool_ids: [], generation_settings: {})
     # Get LLM options
     llm_options = LlmMetaClient::ServerResource.available_llm_options(jwt_token)
@@ -149,6 +149,6 @@ class Chat < ApplicationRecord
     summarized_context += "Additional prompt: Responses from the assistant must consist solely of the response body."
     # Send chat request using LlmMetaClient::ServerQuery
-    LlmMetaClient::ServerQuery.new.call(jwt_token, llm_uuid, model, summarized_context, prompt, tool_ids: tool_ids)
+    LlmMetaClient::ServerQuery.new.call(jwt_token, llm_uuid, model, summarized_context, prompt, tool_ids: tool_ids, generation_settings: generation_settings)
   end
 end

data/lib/generators/llm_meta_client/scaffold/templates/app/views/chats/edit.html.erb CHANGED Viewed

@@ -18,6 +18,7 @@
         <%% if user_signed_in? %>
           <%%= render "shared/tool_selector_field", stimulus_controller: "tool-selector" %>
         <%% end %>
+        <%%= render "shared/generation_settings_field", stimulus_controller: "generation-settings" %>
       <%% end %>
       <div class="input-wrapper">
         <%%= f.text_area :message,

data/lib/generators/llm_meta_client/scaffold/templates/app/views/chats/new.html.erb CHANGED Viewed

@@ -18,6 +18,7 @@
         <%% if user_signed_in? %>
           <%%= render "shared/tool_selector_field", stimulus_controller: "tool-selector" %>
         <%% end %>
+        <%%= render "shared/generation_settings_field", stimulus_controller: "generation-settings" %>
       <%% end %>
       <div class="input-wrapper">
         <%%= f.text_area :message,

data/lib/generators/llm_meta_client/scaffold/templates/app/views/shared/_generation_settings_field.html.erb ADDED Viewed

@@ -0,0 +1,87 @@
+<%%
+  stimulus_controller = local_assigns[:stimulus_controller] || "generation-settings"
+%>
+<div class="generation-settings-field" data-controller="<%%= stimulus_controller %>">
+  <div class="generation-settings-toggle">
+    <button type="button"
+            class="generation-settings-toggle-button"
+            data-<%%= stimulus_controller %>-target="toggleButton"
+            data-action="click-><%%= stimulus_controller %>#toggle">
+      <i class="bi bi-sliders"></i>
+      Generation Settings
+      <i class="bi bi-chevron-down toggle-icon" data-<%%= stimulus_controller %>-target="toggleIcon"></i>
+    </button>
+  </div>
+  <div class="generation-settings-panel" data-<%%= stimulus_controller %>-target="panel" style="display: none;">
+    <div class="generation-setting-item">
+      <label for="temperature">
+        Temperature
+        <span class="setting-value" data-<%%= stimulus_controller %>-target="temperatureValue">0.7</span>
+      </label>
+      <input type="range" name="temperature" id="temperature"
+             min="0" max="2" step="0.1" value="0.7"
+             data-<%%= stimulus_controller %>-target="temperatureRange"
+             data-action="input-><%%= stimulus_controller %>#updateTemperature">
+      <div class="setting-range-labels">
+        <span>0 (deterministic)</span>
+        <span>2 (creative)</span>
+      </div>
+    </div>
+    <div class="generation-setting-item">
+      <label for="top_k">
+        Top-K
+        <span class="setting-value" data-<%%= stimulus_controller %>-target="topKValue">40</span>
+      </label>
+      <input type="range" name="top_k" id="top_k"
+             min="1" max="100" step="1" value="40"
+             data-<%%= stimulus_controller %>-target="topKRange"
+             data-action="input-><%%= stimulus_controller %>#updateTopK">
+      <div class="setting-range-labels">
+        <span>1 (focused)</span>
+        <span>100 (diverse)</span>
+      </div>
+    </div>
+    <div class="generation-setting-item">
+      <label for="top_p">
+        Top-P
+        <span class="setting-value" data-<%%= stimulus_controller %>-target="topPValue">0.9</span>
+      </label>
+      <input type="range" name="top_p" id="top_p"
+             min="0" max="1" step="0.05" value="0.9"
+             data-<%%= stimulus_controller %>-target="topPRange"
+             data-action="input-><%%= stimulus_controller %>#updateTopP">
+      <div class="setting-range-labels">
+        <span>0 (narrow)</span>
+        <span>1 (broad)</span>
+      </div>
+    </div>
+    <div class="generation-setting-item">
+      <label for="max_tokens">
+        Max Tokens
+      </label>
+      <input type="number" name="max_tokens" id="max_tokens"
+             min="1" max="128000" step="1" value=""
+             placeholder="Default (model-dependent)"
+             class="max-tokens-input"
+             data-<%%= stimulus_controller %>-target="maxTokensInput">
+    </div>
+    <div class="generation-setting-item">
+      <label for="repeat_penalty">
+        Repeat Penalty
+        <span class="setting-value" data-<%%= stimulus_controller %>-target="repeatPenaltyValue">1.1</span>
+      </label>
+      <input type="range" name="repeat_penalty" id="repeat_penalty"
+             min="1" max="2" step="0.05" value="1.1"
+             data-<%%= stimulus_controller %>-target="repeatPenaltyRange"
+             data-action="input-><%%= stimulus_controller %>#updateRepeatPenalty">
+      <div class="setting-range-labels">
+        <span>1.0 (no penalty)</span>
+        <span>2.0 (strong)</span>
+      </div>
+    </div>
+  </div>
+</div>

data/lib/llm_meta_client/server_query.rb CHANGED Viewed

@@ -1,11 +1,11 @@
 module LlmMetaClient
   class ServerQuery
-    def call(id_token, api_key_uuid, model_id, context, user_content, tool_ids: [])
+    def call(id_token, api_key_uuid, model_id, context, user_content, tool_ids: [], generation_settings: {})
       debug_log "Context: #{context}"
       context_and_user_content = "Context:#{context}, User Prompt: #{user_content}"
       debug_log "Request to LLM: \n===>\n#{context_and_user_content}\n===>"
-      response = request(api_key_uuid, id_token, model_id, context_and_user_content, tool_ids)
+      response = request(api_key_uuid, id_token, model_id, context_and_user_content, tool_ids, generation_settings)
       raise Exceptions::ServerError, "LLM server returned HTTP #{response.code}" unless response.success?
@@ -28,12 +28,13 @@ module LlmMetaClient
       Rails.logger.info(message) if Rails.env.development?
     end
-    def request(api_key_uuid, id_token, model_id, user_content, tool_ids)
+    def request(api_key_uuid, id_token, model_id, user_content, tool_ids, generation_settings)
       headers = { "Content-Type" => "application/json" }
       headers["Authorization"] = "Bearer #{id_token}" if id_token.present?
       body = { prompt: user_content.to_s }
       body[:tool_ids] = tool_ids if tool_ids.present?
+      body[:generation_settings] = generation_settings if generation_settings.present?
       HTTParty.post(
         url(api_key_uuid, model_id),

data/lib/llm_meta_client/version.rb CHANGED Viewed

@@ -1,3 +1,3 @@
 module LlmMetaClient
-  VERSION = "0.4.0"
+  VERSION = "0.5.0"
 end

metadata CHANGED Viewed

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: llm_meta_client
 version: !ruby/object:Gem::Version
-  version: 0.4.0
+  version: 0.5.0
 platform: ruby
 authors:
 - dhq_boiler
@@ -85,6 +85,7 @@ files:
 - README.md
 - Rakefile
 - app/assets/stylesheets/llm_meta_client/application.css
+- app/assets/stylesheets/llm_meta_client/generation_settings.css
 - app/controllers/llm_meta_client/application_controller.rb
 - app/helpers/llm_meta_client/application_helper.rb
 - app/jobs/llm_meta_client/application_job.rb
@@ -106,6 +107,7 @@ files:
 - lib/generators/llm_meta_client/scaffold/templates/app/controllers/prompts_controller.rb
 - lib/generators/llm_meta_client/scaffold/templates/app/javascript/controllers/chat_title_edit_controller.js
 - lib/generators/llm_meta_client/scaffold/templates/app/javascript/controllers/chats_form_controller.js
+- lib/generators/llm_meta_client/scaffold/templates/app/javascript/controllers/generation_settings_controller.js
 - lib/generators/llm_meta_client/scaffold/templates/app/javascript/controllers/llm_selector_controller.js
 - lib/generators/llm_meta_client/scaffold/templates/app/javascript/controllers/tool_selector_controller.js
 - lib/generators/llm_meta_client/scaffold/templates/app/javascript/popover.js
@@ -122,6 +124,7 @@ files:
 - lib/generators/llm_meta_client/scaffold/templates/app/views/layouts/application.html.erb
 - lib/generators/llm_meta_client/scaffold/templates/app/views/shared/_api_key_field.html.erb
 - lib/generators/llm_meta_client/scaffold/templates/app/views/shared/_family_field.html.erb
+- lib/generators/llm_meta_client/scaffold/templates/app/views/shared/_generation_settings_field.html.erb
 - lib/generators/llm_meta_client/scaffold/templates/app/views/shared/_model_field.html.erb
 - lib/generators/llm_meta_client/scaffold/templates/app/views/shared/_tool_selector_field.html.erb
 - lib/generators/llm_meta_client/scaffold/templates/config/initializers/llm_service.rb