lex-llm-vertex 0.1.0 → 0.1.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +8 -0
- data/README.md +1 -1
- data/lex-llm-vertex.gemspec +1 -1
- data/lib/legion/extensions/llm/vertex/provider.rb +13 -2
- data/lib/legion/extensions/llm/vertex/registry_event_builder.rb +93 -0
- data/lib/legion/extensions/llm/vertex/registry_publisher.rb +100 -0
- data/lib/legion/extensions/llm/vertex/transport/exchanges/llm_registry.rb +24 -0
- data/lib/legion/extensions/llm/vertex/transport/messages/registry_event.rb +42 -0
- data/lib/legion/extensions/llm/vertex/version.rb +1 -1
- data/lib/legion/extensions/llm/vertex.rb +2 -0
- metadata +7 -3
checksums.yaml
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
SHA256:
|
|
3
|
-
metadata.gz:
|
|
4
|
-
data.tar.gz:
|
|
3
|
+
metadata.gz: ec3d331cb0dbdaa46060ab18d4a4a64e080dbabe31792ae89c77fc3c529b9adb
|
|
4
|
+
data.tar.gz: 671c60635f11ae3bb574a5025fade36e5d10611537fac7b2555e4aef4daaca8a
|
|
5
5
|
SHA512:
|
|
6
|
-
metadata.gz:
|
|
7
|
-
data.tar.gz:
|
|
6
|
+
metadata.gz: 8125a85339134d6ab2c6a53d63d948119e35fd677da77ed2ef8b2328f700103f9f6227cc6bb7a58fc2f1b23ddb76fcb832e9c8abcd50d5ec5bafdf757f0eeb71
|
|
7
|
+
data.tar.gz: 53c2c6802901fd9f154571392759679dd901986c2b136d7b3da46fefa7089e1b2f4ddb2063e2a8563d03d31fa77ad689f576a1d737e5914fc98c26da2ac1618e
|
data/CHANGELOG.md
CHANGED
|
@@ -1,5 +1,13 @@
|
|
|
1
1
|
# Changelog
|
|
2
2
|
|
|
3
|
+
## 0.1.2 - 2026-04-28
|
|
4
|
+
|
|
5
|
+
- Publish best-effort `llm.registry` live readiness and live publisher-model availability events using `lex-llm` registry envelopes when transport is already available.
|
|
6
|
+
|
|
7
|
+
## 0.1.1 - 2026-04-28
|
|
8
|
+
|
|
9
|
+
- Require `lex-llm >= 0.1.5` for the shared model offering, alias, readiness, and fleet lane contract used by Vertex routing metadata.
|
|
10
|
+
|
|
3
11
|
## 0.1.0 - 2026-04-28
|
|
4
12
|
|
|
5
13
|
- Initial Legion::Extensions::Llm Vertex AI provider extension scaffold.
|
data/README.md
CHANGED
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
|
|
3
3
|
Google Cloud Vertex AI provider extension for `Legion::Extensions::Llm`.
|
|
4
4
|
|
|
5
|
-
This gem adds a hosted Vertex AI provider surface for Legion LLM routing without depending on the old `legion-llm` gem. It keeps discovery offline by default, preserves full Vertex publisher model resource names for routing, and exposes project/location instance metadata for multi-region provider fleets.
|
|
5
|
+
This gem adds a hosted Vertex AI provider surface for Legion LLM routing without depending on the old `legion-llm` gem. It keeps discovery offline by default, preserves full Vertex publisher model resource names for routing, and exposes project/location instance metadata for multi-region provider fleets. It requires `lex-llm >= 0.1.5` for the shared model offering, alias, readiness, and fleet lane contract.
|
|
6
6
|
|
|
7
7
|
## Install
|
|
8
8
|
|
data/lex-llm-vertex.gemspec
CHANGED
|
@@ -26,5 +26,5 @@ Gem::Specification.new do |spec|
|
|
|
26
26
|
spec.add_dependency 'legion-json', '>= 1.2.1'
|
|
27
27
|
spec.add_dependency 'legion-logging', '>= 1.3.2'
|
|
28
28
|
spec.add_dependency 'legion-settings', '>= 1.3.14'
|
|
29
|
-
spec.add_dependency 'lex-llm', '>= 0.1.
|
|
29
|
+
spec.add_dependency 'lex-llm', '>= 0.1.5'
|
|
30
30
|
end
|
|
@@ -37,6 +37,8 @@ module Legion
|
|
|
37
37
|
MODEL_FAMILIES = STATIC_MODELS.to_h { |entry| [entry.fetch(:model), entry.fetch(:model_family)] }.freeze
|
|
38
38
|
|
|
39
39
|
class << self
|
|
40
|
+
attr_writer :registry_publisher
|
|
41
|
+
|
|
40
42
|
def slug = 'vertex'
|
|
41
43
|
|
|
42
44
|
def configuration_options
|
|
@@ -54,6 +56,10 @@ module Legion
|
|
|
54
56
|
def configuration_requirements = []
|
|
55
57
|
def capabilities = Capabilities
|
|
56
58
|
|
|
59
|
+
def registry_publisher
|
|
60
|
+
@registry_publisher ||= RegistryPublisher.new
|
|
61
|
+
end
|
|
62
|
+
|
|
57
63
|
def resolve_model_id(model_id, config: nil)
|
|
58
64
|
configured_aliases = config.respond_to?(:vertex_model_aliases) ? config.vertex_model_aliases : nil
|
|
59
65
|
aliases = ALIASES.merge((configured_aliases || {}).transform_keys(&:to_s))
|
|
@@ -112,7 +118,9 @@ module Legion
|
|
|
112
118
|
|
|
113
119
|
response = connection.get(models_url)
|
|
114
120
|
models = response.body['publisherModels'] || response.body['models'] || []
|
|
115
|
-
models.map { |model| offering_from_live_model(model) }
|
|
121
|
+
models.map { |model| offering_from_live_model(model) }.tap do |offerings|
|
|
122
|
+
self.class.registry_publisher.publish_offerings_async(offerings, readiness: readiness(live: false))
|
|
123
|
+
end
|
|
116
124
|
end
|
|
117
125
|
|
|
118
126
|
def offering_for(model:, model_family: nil, instance_id: :default, **metadata)
|
|
@@ -151,7 +159,10 @@ module Legion
|
|
|
151
159
|
end
|
|
152
160
|
|
|
153
161
|
def readiness(live: false)
|
|
154
|
-
health(live:).merge(local: false, remote: true, api_base: api_base,
|
|
162
|
+
health(live:).merge(local: false, remote: true, api_base: api_base,
|
|
163
|
+
endpoints: endpoint_manifest).tap do |metadata|
|
|
164
|
+
self.class.registry_publisher.publish_readiness_async(metadata) if live
|
|
165
|
+
end
|
|
155
166
|
end
|
|
156
167
|
|
|
157
168
|
def chat(messages, model:, temperature: nil, max_tokens: nil, tools: {}, tool_prefs: nil, params: {})
|
|
@@ -0,0 +1,93 @@
|
|
|
1
|
+
# frozen_string_literal: true
|
|
2
|
+
|
|
3
|
+
module Legion
  module Extensions
    module Llm
      module Vertex
        # Builds sanitized lex-llm registry envelopes for Vertex provider state.
        #
        # Every envelope is produced by calling a factory method (+available+ or
        # +unavailable+) on +Legion::Extensions::Llm::Routing::RegistryEvent+ with
        # an offering plus +runtime:+, +health:+ and +metadata:+ hashes assembled
        # here. Only whitelisted, normalized fields are copied out of the
        # readiness hash; nothing else from it is forwarded.
        class RegistryEventBuilder
          # Builds the provider-level readiness event.
          #
          # @param readiness [Hash] readiness data read through symbol keys
          #   (+:ready+, +:checked+, +:configured+, +:live+); +error+ / +message+
          #   are read through either symbol or string keys
          # @return [Object] whatever +RegistryEvent.available+ /
          #   +RegistryEvent.unavailable+ returns
          def readiness(readiness)
            registry_event_class.public_send(
              readiness_status(readiness),
              provider_offering(readiness),
              runtime: runtime_metadata,
              health: readiness_health(readiness),
              metadata: readiness_metadata(readiness)
            )
          end

          # Builds an +available+ event for a single model offering.
          #
          # @param offering [Object] offering passed through untouched to the event factory
          # @param readiness [Hash] readiness data; a missing +:ready+ key counts as ready
          # @return [Object] whatever +RegistryEvent.available+ returns
          def offering_available(offering, readiness:)
            registry_event_class.available(
              offering,
              runtime: runtime_metadata,
              health: offering_health(readiness),
              metadata: offering_metadata
            )
          end

          private

          # Strict readiness test: only a literal +true+ counts as ready, so the
          # +ready+ flag, the +status+ and the event type can never disagree.
          def ready?(readiness)
            readiness[:ready] == true
          end

          # Event type / health status derived from the strict readiness flag.
          def readiness_status(readiness)
            ready?(readiness) ? :available : :unavailable
          end

          # Synthetic offering that stands in for the provider itself.
          def provider_offering(readiness)
            {
              provider_family: :vertex,
              provider_instance: provider_instance,
              transport: :http,
              model: 'provider-readiness',
              usage_type: :inference,
              capabilities: [],
              health: readiness_health(readiness),
              metadata: { lex: :llm_vertex, provider_readiness: true }
            }
          end

          # Normalized health hash; +checked+ is true unless explicitly +false+.
          def readiness_health(readiness)
            health = {
              ready: ready?(readiness),
              status: readiness_status(readiness),
              checked: readiness[:checked] != false
            }
            add_readiness_error(health, readiness)
          end

          # Copies error details into +health+ when present and returns +health+.
          # Both symbol and string keys are consulted on +source+.
          def add_readiness_error(health, source)
            error_class = source[:error] || source['error']
            error_message = source[:message] || source['message']
            health[:error_class] = error_class if error_class
            health[:error] = error_message if error_message
            health
          end

          # Health for a model offering: a not-ready provider marks the offering
          # +:degraded+ rather than +:unavailable+.
          def offering_health(readiness)
            ready = readiness.fetch(:ready, true) == true
            { ready:, status: ready ? :available : :degraded, checked: readiness[:checked] != false }
          end

          # Metadata attached to provider readiness events.
          def readiness_metadata(readiness)
            {
              extension: :lex_llm_vertex,
              provider: :vertex,
              configured: readiness[:configured] == true,
              live: readiness[:live] == true
            }
          end

          # Metadata attached to per-offering events.
          def offering_metadata
            { extension: :lex_llm_vertex, provider: :vertex }
          end

          # Runtime section of the envelope.
          def runtime_metadata
            { node: provider_instance }
          end

          # Fixed provider instance identifier used in offerings and runtime data.
          def provider_instance
            :vertex
          end

          # Resolved lazily so this file loads even before lex-llm's routing
          # classes are defined.
          def registry_event_class
            ::Legion::Extensions::Llm::Routing::RegistryEvent
          end
        end
      end
    end
  end
end
|
|
@@ -0,0 +1,100 @@
|
|
|
1
|
+
# frozen_string_literal: true
|
|
2
|
+
|
|
3
|
+
module Legion
  module Extensions
    module Llm
      module Vertex
        # Best-effort publisher for Vertex provider availability events.
        #
        # Events are built by the injected builder and published from a
        # background thread. Publishing is skipped (returning +false+) when the
        # lex-llm registry event class or the transport message classes are not
        # available, or when the transport connection reports no open session.
        # Failures are logged and swallowed; they never propagate to the caller.
        class RegistryPublisher
          APP_ID = 'lex-llm-vertex'

          # @param builder [#readiness, #offering_available] envelope builder
          def initialize(builder: RegistryEventBuilder.new)
            @builder = builder
          end

          # Publishes a provider readiness event in the background.
          #
          # @param readiness [Hash] readiness data handed to the builder
          # @return [Thread, false] the worker thread, or +false+ when publishing is unavailable
          def publish_readiness_async(readiness)
            schedule { publish_event(@builder.readiness(readiness)) }
          end

          # Publishes one availability event per offering in the background.
          #
          # @param offerings [Array, Hash, Object, nil] offerings to announce; a
          #   single Hash offering is treated as one offering, +nil+ as none
          # @param readiness [Hash] readiness data handed to the builder
          # @return [Thread, false] the worker thread, or +false+ when publishing is unavailable
          def publish_offerings_async(offerings, readiness:)
            schedule do
              offering_list(offerings).each do |offering|
                publish_event(@builder.offering_available(offering, readiness:))
              end
            end
          end

          private

          # Normalizes the +offerings+ argument into an array. A lone Hash must
          # be wrapped explicitly: Kernel#Array would otherwise explode it into
          # [key, value] pairs and each pair would be published as an offering.
          def offering_list(offerings)
            offerings.is_a?(Hash) ? [offerings] : Array(offerings)
          end

          # Runs the block on a new thread when publishing is available.
          # Errors raised in the thread, or while starting it, are logged at
          # debug level and never re-raised.
          def schedule(&)
            return false unless publishing_available?

            Thread.new do
              Thread.current.abort_on_exception = false
              yield
            rescue StandardError => e
              log_publish_failure(e, level: :debug)
            end
          rescue StandardError => e
            log_publish_failure(e, level: :debug)
            false
          end

          # Publishes a single event without spooling; returns +false+ when
          # publishing is unavailable or the publish raises.
          def publish_event(event)
            return false unless publishing_available?

            message_class.new(event:, app_id: APP_ID).publish(spool: false)
          rescue StandardError => e
            log_publish_failure(e)
            false
          end

          # True when the registry event and message classes exist and, if the
          # transport connection exposes +session_open?+, a session is open.
          def publishing_available?
            return false unless registry_event_available?
            return false unless transport_message_available?
            return true unless defined?(::Legion::Transport::Connection)
            return true unless ::Legion::Transport::Connection.respond_to?(:session_open?)

            ::Legion::Transport::Connection.session_open?
          rescue StandardError
            false
          end

          def registry_event_available?
            defined?(::Legion::Extensions::Llm::Routing::RegistryEvent)
          end

          # Lazily requires the message class, but only once the transport base
          # classes it inherits from are already loaded.
          def transport_message_available?
            return true if message_class_defined?
            return false unless defined?(::Legion::Transport::Message) && defined?(::Legion::Transport::Exchange)

            require 'legion/extensions/llm/vertex/transport/messages/registry_event'
            message_class_defined?
          rescue LoadError
            false
          end

          def message_class_defined?
            defined?(::Legion::Extensions::Llm::Vertex::Transport::Messages::RegistryEvent)
          end

          def message_class
            ::Legion::Extensions::Llm::Vertex::Transport::Messages::RegistryEvent
          end

          # Logs a publish failure at +level+, falling back to +debug+ when the
          # logger lacks that level. Logging problems are themselves swallowed.
          def log_publish_failure(error, level: :warn)
            message = "[lex-llm-vertex] llm.registry publish failed: #{error.class}: #{error.message}"
            logger = ::Legion::Extensions::Llm.logger if defined?(::Legion::Extensions::Llm)
            if logger.respond_to?(level)
              logger.public_send(level, message)
            elsif logger.respond_to?(:debug)
              logger.debug(message)
            end
          rescue StandardError
            nil
          end
        end
      end
    end
  end
end
|
|
@@ -0,0 +1,24 @@
|
|
|
1
|
+
# frozen_string_literal: true
|
|
2
|
+
|
|
3
|
+
module Legion
  module Extensions
    module Llm
      module Vertex
        module Transport
          module Exchanges
            # Exchange definition used for Vertex provider availability events:
            # named `llm.registry` and declared with the `topic` type.
            class LlmRegistry < ::Legion::Transport::Exchange
              # @return [String] name of the exchange
              def exchange_name = 'llm.registry'

              # @return [String] exchange type
              def default_type = 'topic'
            end
          end
        end
      end
    end
  end
end
|
|
@@ -0,0 +1,42 @@
|
|
|
1
|
+
# frozen_string_literal: true
|
|
2
|
+
|
|
3
|
+
require 'legion/extensions/llm/vertex/transport/exchanges/llm_registry'
|
|
4
|
+
|
|
5
|
+
module Legion
  module Extensions
    module Llm
      module Vertex
        module Transport
          module Messages
            # Transport message that carries a lex-llm RegistryEvent envelope to
            # the llm.registry exchange.
            class RegistryEvent < ::Legion::Transport::Message
              # @param event [#to_h] envelope whose hash form becomes the message options
              # @param options [Hash] extra options; these win over envelope keys on conflict
              def initialize(event:, **options)
                payload = event.to_h.merge(options)
                super(**payload)
              end

              # @return [Class] exchange class this message is published to
              def exchange = Transport::Exchanges::LlmRegistry

              # Uses an explicit +:routing_key+ option when one is set, otherwise
              # derives the key from the (required) +:event_type+ option.
              def routing_key
                explicit_key = @options[:routing_key]
                return explicit_key if explicit_key

                "llm.registry.#{@options.fetch(:event_type)}"
              end

              # @return [String] message type identifier
              def type = 'llm.registry.event'

              # Uses the +:app_id+ option when set, otherwise the publisher's default.
              def app_id
                configured_id = @options[:app_id]
                return configured_id if configured_id

                RegistryPublisher::APP_ID
              end

              # Registry events are published as non-persistent messages.
              def persistent = false # rubocop:disable Naming/PredicateMethod
            end
          end
        end
      end
    end
  end
end
|
|
@@ -2,6 +2,8 @@
|
|
|
2
2
|
|
|
3
3
|
require 'legion/extensions/llm'
|
|
4
4
|
require 'legion/extensions/llm/vertex/provider'
|
|
5
|
+
require 'legion/extensions/llm/vertex/registry_event_builder'
|
|
6
|
+
require 'legion/extensions/llm/vertex/registry_publisher'
|
|
5
7
|
require 'legion/extensions/llm/vertex/version'
|
|
6
8
|
|
|
7
9
|
module Legion
|
metadata
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: lex-llm-vertex
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
version: 0.1.0
|
|
4
|
+
version: 0.1.2
|
|
5
5
|
platform: ruby
|
|
6
6
|
authors:
|
|
7
7
|
- LegionIO
|
|
@@ -57,14 +57,14 @@ dependencies:
|
|
|
57
57
|
requirements:
|
|
58
58
|
- - ">="
|
|
59
59
|
- !ruby/object:Gem::Version
|
|
60
|
-
version: 0.1.
|
|
60
|
+
version: 0.1.5
|
|
61
61
|
type: :runtime
|
|
62
62
|
prerelease: false
|
|
63
63
|
version_requirements: !ruby/object:Gem::Requirement
|
|
64
64
|
requirements:
|
|
65
65
|
- - ">="
|
|
66
66
|
- !ruby/object:Gem::Version
|
|
67
|
-
version: 0.1.
|
|
67
|
+
version: 0.1.5
|
|
68
68
|
description: Google Cloud Vertex AI provider integration for the LegionIO LLM routing
|
|
69
69
|
framework.
|
|
70
70
|
email:
|
|
@@ -85,6 +85,10 @@ files:
|
|
|
85
85
|
- lex-llm-vertex.gemspec
|
|
86
86
|
- lib/legion/extensions/llm/vertex.rb
|
|
87
87
|
- lib/legion/extensions/llm/vertex/provider.rb
|
|
88
|
+
- lib/legion/extensions/llm/vertex/registry_event_builder.rb
|
|
89
|
+
- lib/legion/extensions/llm/vertex/registry_publisher.rb
|
|
90
|
+
- lib/legion/extensions/llm/vertex/transport/exchanges/llm_registry.rb
|
|
91
|
+
- lib/legion/extensions/llm/vertex/transport/messages/registry_event.rb
|
|
88
92
|
- lib/legion/extensions/llm/vertex/version.rb
|
|
89
93
|
homepage: https://github.com/LegionIO/lex-llm-vertex
|
|
90
94
|
licenses:
|