RubyGems - lex-llm-ollama - Versions diffs - 0.2.8 → 0.2.9 - Mend

lex-llm-ollama 0.2.8 → 0.2.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5)

checksums.yaml +4 -4
data/CHANGELOG.md +9 -0
data/lib/legion/extensions/llm/ollama/provider.rb +85 -8
data/lib/legion/extensions/llm/ollama/version.rb +1 -1
metadata +1 -1

checksums.yaml CHANGED

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: 20e5e1a5989633a805483200893d6d11c6f0af9b3d9b3204defad0e33e0be5ed
-  data.tar.gz: 8dd17ebb04df4e90b75438f8f4ba86bb289db4ccde25f1b71d36253a9075450c
+  metadata.gz: 90c9bd5b9b740637320d528012401d93d38e1d0b38396c3baa51ad45067547aa
+  data.tar.gz: 1024e115de9bea52c58b3fb20bbbf1fc561bc6299f4bdfea4a95d2c7899618c8
 SHA512:
-  metadata.gz: '0944f1f288b824bcc09b9ca13e9ece5d67553fe4d706e26a7d77b37c1fa71c594eaeb8b0f2f8fd9817259463e9289257019b700a4a02019077f1c889e0b7aa8a'
-  data.tar.gz: 32c4de66b95c05e9b0349a2c1da79f826fd701fd9aa61d25957291076c3e6ca87fa79338fd323e652c1e441342bb54f6a1dc97b03bd5ffafe56c3eb32411eeb1
+  metadata.gz: 7222b463dd74c7ba154d363dabaf451979562831313583ac2e6fc034ddda595c13b3c4b1ae6772906842a92aa83842bb9a37c2c99f198c5a4985c82a3f61174c
+  data.tar.gz: 682b890f4c30d28d0786c6d3f7d03ac1d024fbec025119373346f9bcb87cad22391328b02238007ab9550cf6dd8ef07f565cc69628e26084fc2815a4b2d8e095

data/CHANGELOG.md CHANGED

@@ -1,5 +1,14 @@
 # Changelog
+## 0.2.9 - 2026-05-13
+- Add `fetch_model_detail` — calls POST `/api/show` to retrieve the real context window from Ollama.
+- Add `resolve_context_window` — tries live model detail cache first, falls back to static prefix map.
+- Add `extract_context_window` — parses `num_ctx` from `model_info` hash or `parameters` string in the `/api/show` response.
+- Add `CONTEXT_WINDOWS` static fallback map covering common Ollama model families.
+- Add `rescue Faraday::ConnectionFailed` in `discover_offerings` with a concise warn log instead of an unhandled exception.
+- Add `show_model_url` endpoint helper returning `/api/show`.
 ## 0.2.8 - 2026-05-12
 - Include `Legion::Logging::Helper` directly in Ollama provider, actor, and fleet runner runtime surfaces.

data/lib/legion/extensions/llm/ollama/provider.rb CHANGED

@@ -87,6 +87,16 @@ module Legion
             raise
           end
+          def fetch_model_detail(model_name)
+            raw = show_model(model_name)
+            context_window = extract_context_window(raw)
+            { context_window: context_window }.compact
+          rescue StandardError => e
+            handle_exception(e, level: :warn, handled: true, operation: 'ollama.fetch_model_detail',
+                                model: model_name)
+            nil
+          end
           def pull_model(model, stream: false)
             log.debug { "ollama provider pulling model=#{model} stream=#{stream}" }
             log.info { "pulling model #{model} stream=#{stream}" }
@@ -100,21 +110,49 @@ module Legion
             log.debug do
               "ollama provider discovering offerings live=#{live} cached_model_count=#{Array(@cached_models).size}"
             end
-            models = if live
-                       @cached_models = list_models
-                     else
-                       Array(@cached_models)
-                     end
-            models.map { |model_info| offering_from_model(model_info) }.tap do |offerings|
+            resolve_models(live).map { |model_info| offering_from_model(model_info) }.tap do |offerings|
               log.debug { "ollama provider built offering_count=#{offerings.size} live=#{live}" }
             end
+          rescue Faraday::ConnectionFailed => e
+            log.warn("[ollama] instance=#{provider_instance_id} unreachable: #{e.message}")
+            []
           rescue StandardError => e
-            handle_exception(e, level: :warn, handled: true, operation: 'ollama.discover_offerings')
+            handle_exception(e, level: :warn, handled: true, operation: 'ollama.discover_offerings',
+                                backtrace_limit: 3)
             []
           end
+          CONTEXT_WINDOWS = {
+            'qwen3' => 128_000,
+            'qwen2.5' => 128_000,
+            'llama3' => 128_000,
+            'llama3.1' => 128_000,
+            'llama3.2' => 128_000,
+            'llama3.3' => 128_000,
+            'gemma2' => 8_192,
+            'gemma3' => 128_000,
+            'mistral' => 128_000,
+            'deepseek' => 128_000,
+            'phi3' => 128_000,
+            'phi4' => 16_384,
+            'command-r' => 128_000,
+            'codellama' => 16_384,
+            'nomic-embed' => 8_192,
+            'mxbai-embed' => 512,
+            'snowflake' => 512,
+            'bge' => 512
+          }.freeze
           private
+          def resolve_models(live)
+            if live
+              @cached_models = list_models
+            else
+              Array(@cached_models)
+            end
+          end
           def offering_from_model(model_info)
             Legion::Extensions::Llm::Routing::ModelOffering.new(
               provider_family: :ollama,
@@ -146,7 +184,46 @@ module Legion
           end
           def offering_limits(model_info)
-            { context_window: model_info.context_length }.compact
+            ctx = model_info.context_length || resolve_context_window(model_info.id)
+            ctx ? { context_window: ctx } : {}
+          end
+          def resolve_context_window(model_id)
+            detail = model_detail(model_id)
+            return detail[:context_window] if detail.is_a?(Hash) && detail[:context_window]
+            infer_context_window(model_id)
+          end
+          def infer_context_window(model_id)
+            name = model_id.to_s.split(':').first
+            CONTEXT_WINDOWS.find { |prefix, _| name.start_with?(prefix) }&.last
+          end
+          def extract_context_window(raw)
+            return nil unless raw.is_a?(Hash)
+            from_model_info(raw) || from_parameters_string(raw)
+          end
+          def from_model_info(raw)
+            model_info = raw['model_info'] || raw[:model_info]
+            return unless model_info.is_a?(Hash)
+            num_ctx_from_hash(model_info)&.to_i
+          end
+          def num_ctx_from_hash(model_info)
+            model_info['num_ctx'] || model_info[:num_ctx] ||
+              model_info.find { |k, _| k.to_s.end_with?('.context_length') }&.last
+          end
+          def from_parameters_string(raw)
+            params = raw['parameters'] || raw[:parameters]
+            return unless params.is_a?(String)
+            match = params.match(/num_ctx\s+(\d+)/)
+            match[1].to_i if match
           end
           def offering_metadata(model_info)

data/lib/legion/extensions/llm/ollama/version.rb CHANGED

@@ -4,7 +4,7 @@ module Legion
   module Extensions
     module Llm
       module Ollama
-        VERSION = '0.2.8'
+        VERSION = '0.2.9'
       end
     end
   end

metadata CHANGED

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: lex-llm-ollama
 version: !ruby/object:Gem::Version
-  version: 0.2.8
+  version: 0.2.9
 platform: ruby
 authors:
 - LegionIO