lex-llm-gateway 0.2.10 → 0.2.12
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +10 -0
- data/lib/legion/extensions/llm/gateway/runners/fleet_handler.rb +8 -4
- data/lib/legion/extensions/llm/gateway/runners/inference.rb +38 -4
- data/lib/legion/extensions/llm/gateway/version.rb +1 -1
- data/lib/legion/extensions/llm/gateway.rb +2 -1
- metadata +1 -1
checksums.yaml
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
SHA256:
|
|
3
|
-
metadata.gz:
|
|
4
|
-
data.tar.gz:
|
|
3
|
+
metadata.gz: 23b44bc07cb28fc0e364b119984909f1d8becba720ea547b1255a8512188dec7
|
|
4
|
+
data.tar.gz: a4aae0ecf4e1b053405f74628af518156ae2ffc3d0678b4f920771a9e6a68ee6
|
|
5
5
|
SHA512:
|
|
6
|
-
metadata.gz:
|
|
7
|
-
data.tar.gz:
|
|
6
|
+
metadata.gz: 1cf5d4fe5d3f0728dee2dfa04019f62c7e2fd799527df6a79b069f9aabf4ef7cff44674fa0405406e200705faaa03eff282c60ab9b0ca3db25a5f93fa7bb6c1f
|
|
7
|
+
data.tar.gz: c01a0edb556ccf0346b111b6187f05e4083dde3c52ecbc43707fbb720c40a73501a76a98c85e37389512fb2db0184d631ba98edbecab77b456cd1af1401b882d
|
data/CHANGELOG.md
CHANGED
|
@@ -1,5 +1,15 @@
|
|
|
1
1
|
# Changelog
|
|
2
2
|
|
|
3
|
+
## [0.2.12] - 2026-03-24
|
|
4
|
+
|
|
5
|
+
### Fixed
|
|
6
|
+
- fix `uninitialized constant Legion::Extensions::Llm::Gateway` when `ensure_namespace` pre-creates `Llm` as empty module before gem loads — unconditionally `remove_const(:Llm)` then reassign alias to `LLM`
|
|
7
|
+
|
|
8
|
+
## [0.2.11] - 2026-03-23
|
|
9
|
+
|
|
10
|
+
### Changed
|
|
11
|
+
- Add `caller:` identity to all `Legion::LLM` call sites: 3 pipeline-path calls in `Runners::Inference` (`chat`, `embed`, `structured`) and 4 fleet worker calls in `Runners::FleetHandler` (`call_chat` ×2, `call_structured`, `call_embed`) with `extension: 'lex-llm-gateway'` and `operation: 'inference'`/`'fleet'`
|
|
12
|
+
|
|
3
13
|
## [0.2.10] - 2026-03-23
|
|
4
14
|
|
|
5
15
|
### Added
|
data/lib/legion/extensions/llm/gateway/runners/fleet_handler.rb
CHANGED
|
@@ -48,9 +48,11 @@ module Legion
|
|
|
48
48
|
def call_chat(payload)
|
|
49
49
|
messages = payload[:messages]
|
|
50
50
|
if messages.is_a?(Array) && messages.size > 1
|
|
51
|
-
Legion::LLM.chat(model: payload[:model], messages: messages
|
|
51
|
+
Legion::LLM.chat(model: payload[:model], messages: messages,
|
|
52
|
+
caller: { extension: 'lex-llm-gateway', operation: 'fleet' })
|
|
52
53
|
else
|
|
53
|
-
Legion::LLM.chat(model: payload[:model], message: messages&.dig(0, :content)
|
|
54
|
+
Legion::LLM.chat(model: payload[:model], message: messages&.dig(0, :content),
|
|
55
|
+
caller: { extension: 'lex-llm-gateway', operation: 'fleet' })
|
|
54
56
|
end
|
|
55
57
|
end
|
|
56
58
|
|
|
@@ -58,13 +60,15 @@ module Legion
|
|
|
58
60
|
Legion::LLM.structured(
|
|
59
61
|
model: payload[:model],
|
|
60
62
|
messages: payload[:messages],
|
|
61
|
-
schema: payload[:schema]
|
|
63
|
+
schema: payload[:schema],
|
|
64
|
+
caller: { extension: 'lex-llm-gateway', operation: 'fleet' }
|
|
62
65
|
)
|
|
63
66
|
end
|
|
64
67
|
|
|
65
68
|
def call_embed(payload)
|
|
66
69
|
text = payload[:text] || payload.dig(:messages, 0, :content)
|
|
67
|
-
Legion::LLM.embed(model: payload[:model], text: text
|
|
70
|
+
Legion::LLM.embed(model: payload[:model], text: text,
|
|
71
|
+
caller: { extension: 'lex-llm-gateway', operation: 'fleet' })
|
|
68
72
|
end
|
|
69
73
|
|
|
70
74
|
def build_response(correlation_id, response)
|
data/lib/legion/extensions/llm/gateway/runners/inference.rb
CHANGED
|
@@ -5,10 +5,16 @@ module Legion
|
|
|
5
5
|
module LLM
|
|
6
6
|
module Gateway
|
|
7
7
|
module Runners
|
|
8
|
-
module Inference
|
|
8
|
+
module Inference # rubocop:disable Metrics/ModuleLength
|
|
9
9
|
module_function
|
|
10
10
|
|
|
11
|
-
def chat(model: nil, provider: nil, **opts)
|
|
11
|
+
def chat(model: nil, provider: nil, **opts) # rubocop:disable Metrics/MethodLength
|
|
12
|
+
if pipeline_available?
|
|
13
|
+
log_deprecation(:chat)
|
|
14
|
+
return Legion::LLM.chat(model: model, provider: provider,
|
|
15
|
+
caller: { extension: 'lex-llm-gateway', operation: 'inference' }, **opts)
|
|
16
|
+
end
|
|
17
|
+
|
|
12
18
|
start_ms = ::Process.clock_gettime(::Process::CLOCK_MONOTONIC, :millisecond)
|
|
13
19
|
response = dispatch_chat(model: model, provider: provider, **opts)
|
|
14
20
|
elapsed_ms = ::Process.clock_gettime(::Process::CLOCK_MONOTONIC, :millisecond) - start_ms
|
|
@@ -17,7 +23,13 @@ module Legion
|
|
|
17
23
|
response
|
|
18
24
|
end
|
|
19
25
|
|
|
20
|
-
def embed(text: nil, model: nil, provider: nil, **)
|
|
26
|
+
def embed(text: nil, model: nil, provider: nil, **) # rubocop:disable Metrics/MethodLength
|
|
27
|
+
if pipeline_available?
|
|
28
|
+
log_deprecation(:embed)
|
|
29
|
+
return Legion::LLM.embed(text, model: model, provider: provider,
|
|
30
|
+
caller: { extension: 'lex-llm-gateway', operation: 'inference' }, **)
|
|
31
|
+
end
|
|
32
|
+
|
|
21
33
|
start_ms = ::Process.clock_gettime(::Process::CLOCK_MONOTONIC, :millisecond)
|
|
22
34
|
response = dispatch_embed(text: text, model: model, provider: provider, **)
|
|
23
35
|
elapsed_ms = ::Process.clock_gettime(::Process::CLOCK_MONOTONIC, :millisecond) - start_ms
|
|
@@ -26,7 +38,14 @@ module Legion
|
|
|
26
38
|
response
|
|
27
39
|
end
|
|
28
40
|
|
|
29
|
-
def structured(messages: nil, schema: nil, model: nil, provider: nil, **)
|
|
41
|
+
def structured(messages: nil, schema: nil, model: nil, provider: nil, **) # rubocop:disable Metrics/MethodLength
|
|
42
|
+
if pipeline_available?
|
|
43
|
+
log_deprecation(:structured)
|
|
44
|
+
return Legion::LLM.structured(messages: messages, schema: schema, model: model,
|
|
45
|
+
provider: provider,
|
|
46
|
+
caller: { extension: 'lex-llm-gateway', operation: 'inference' }, **)
|
|
47
|
+
end
|
|
48
|
+
|
|
30
49
|
start_ms = ::Process.clock_gettime(::Process::CLOCK_MONOTONIC, :millisecond)
|
|
31
50
|
response = dispatch_structured(messages: messages, schema: schema, model: model,
|
|
32
51
|
provider: provider, **)
|
|
@@ -36,6 +55,21 @@ module Legion
|
|
|
36
55
|
response
|
|
37
56
|
end
|
|
38
57
|
|
|
58
|
+
def pipeline_available?
|
|
59
|
+
defined?(Legion::LLM::Pipeline::Executor) &&
|
|
60
|
+
defined?(Legion::LLM) &&
|
|
61
|
+
Legion::LLM.respond_to?(:pipeline_enabled?) &&
|
|
62
|
+
Legion::LLM.pipeline_enabled?
|
|
63
|
+
end
|
|
64
|
+
|
|
65
|
+
def log_deprecation(method)
|
|
66
|
+
return unless defined?(Legion::Logging)
|
|
67
|
+
|
|
68
|
+
Legion::Logging.warn(
|
|
69
|
+
"lex-llm-gateway is deprecated for #{method}, use Legion::LLM.#{method} directly"
|
|
70
|
+
)
|
|
71
|
+
end
|
|
72
|
+
|
|
39
73
|
def dispatch_chat(message: nil, messages: nil, model: nil, provider: nil, **opts)
|
|
40
74
|
tier = opts[:tier]
|
|
41
75
|
Legion::Logging.debug "[Gateway::Inference] dispatch_chat tier=#{tier}" if defined?(Legion::Logging)
|