llm.rb 4.0.0 → 4.2.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/LICENSE +2 -2
- data/README.md +226 -192
- data/lib/llm/agent.rb +226 -0
- data/lib/llm/bot.rb +57 -28
- data/lib/llm/error.rb +4 -0
- data/lib/llm/function/tracing.rb +19 -0
- data/lib/llm/function.rb +16 -3
- data/lib/llm/json_adapter.rb +1 -1
- data/lib/llm/message.rb +7 -0
- data/lib/llm/prompt.rb +85 -0
- data/lib/llm/provider.rb +74 -10
- data/lib/llm/providers/anthropic/error_handler.rb +27 -5
- data/lib/llm/providers/anthropic/files.rb +22 -16
- data/lib/llm/providers/anthropic/models.rb +4 -3
- data/lib/llm/providers/anthropic.rb +6 -5
- data/lib/llm/providers/deepseek.rb +3 -3
- data/lib/llm/providers/gemini/error_handler.rb +34 -12
- data/lib/llm/providers/gemini/files.rb +18 -13
- data/lib/llm/providers/gemini/images.rb +4 -3
- data/lib/llm/providers/gemini/models.rb +4 -3
- data/lib/llm/providers/gemini.rb +36 -13
- data/lib/llm/providers/llamacpp.rb +3 -3
- data/lib/llm/providers/ollama/error_handler.rb +28 -6
- data/lib/llm/providers/ollama/models.rb +4 -3
- data/lib/llm/providers/ollama.rb +9 -7
- data/lib/llm/providers/openai/audio.rb +10 -7
- data/lib/llm/providers/openai/error_handler.rb +41 -14
- data/lib/llm/providers/openai/files.rb +19 -14
- data/lib/llm/providers/openai/images.rb +10 -7
- data/lib/llm/providers/openai/models.rb +4 -3
- data/lib/llm/providers/openai/moderations.rb +4 -3
- data/lib/llm/providers/openai/responses.rb +10 -7
- data/lib/llm/providers/openai/vector_stores.rb +34 -23
- data/lib/llm/providers/openai.rb +9 -7
- data/lib/llm/providers/xai.rb +3 -3
- data/lib/llm/providers/zai.rb +2 -2
- data/lib/llm/schema/object.rb +2 -2
- data/lib/llm/schema.rb +16 -2
- data/lib/llm/server_tool.rb +3 -3
- data/lib/llm/session.rb +3 -0
- data/lib/llm/tracer/logger.rb +192 -0
- data/lib/llm/tracer/null.rb +49 -0
- data/lib/llm/tracer/telemetry.rb +255 -0
- data/lib/llm/tracer.rb +134 -0
- data/lib/llm/version.rb +1 -1
- data/lib/llm.rb +5 -3
- data/llm.gemspec +4 -1
- metadata +39 -3
- data/lib/llm/builder.rb +0 -61
|
@@ -10,10 +10,21 @@ class LLM::Ollama
|
|
|
10
10
|
attr_reader :res
|
|
11
11
|
|
|
12
12
|
##
|
|
13
|
+
# @return [Object, nil]
|
|
14
|
+
# The span
|
|
15
|
+
attr_reader :span
|
|
16
|
+
|
|
17
|
+
##
|
|
18
|
+
# @param [LLM::Tracer] tracer
|
|
19
|
+
# The tracer
|
|
20
|
+
# @param [Object, nil] span
|
|
21
|
+
# The span
|
|
13
22
|
# @param [Net::HTTPResponse] res
|
|
14
23
|
# The response from the server
|
|
15
|
-
# @return [LLM::
|
|
16
|
-
def initialize(res)
|
|
24
|
+
# @return [LLM::Ollama::ErrorHandler]
|
|
25
|
+
def initialize(tracer, span, res)
|
|
26
|
+
@tracer = tracer
|
|
27
|
+
@span = span
|
|
17
28
|
@res = res
|
|
18
29
|
end
|
|
19
30
|
|
|
@@ -21,15 +32,26 @@ class LLM::Ollama
|
|
|
21
32
|
# @raise [LLM::Error]
|
|
22
33
|
# Raises a subclass of {LLM::Error LLM::Error}
|
|
23
34
|
def raise_error!
|
|
35
|
+
ex = error
|
|
36
|
+
@tracer.on_request_error(ex:, span:)
|
|
37
|
+
ensure
|
|
38
|
+
raise(ex)
|
|
39
|
+
end
|
|
40
|
+
|
|
41
|
+
private
|
|
42
|
+
|
|
43
|
+
##
|
|
44
|
+
# @return [LLM::Error]
|
|
45
|
+
def error
|
|
24
46
|
case res
|
|
25
47
|
when Net::HTTPServerError
|
|
26
|
-
|
|
48
|
+
LLM::ServerError.new("Server error").tap { _1.response = res }
|
|
27
49
|
when Net::HTTPUnauthorized
|
|
28
|
-
|
|
50
|
+
LLM::UnauthorizedError.new("Authentication error").tap { _1.response = res }
|
|
29
51
|
when Net::HTTPTooManyRequests
|
|
30
|
-
|
|
52
|
+
LLM::RateLimitError.new("Too many requests").tap { _1.response = res }
|
|
31
53
|
else
|
|
32
|
-
|
|
54
|
+
LLM::Error.new("Unexpected response").tap { _1.response = res }
|
|
33
55
|
end
|
|
34
56
|
end
|
|
35
57
|
end
|
|
@@ -43,13 +43,14 @@ class LLM::Ollama
|
|
|
43
43
|
def all(**params)
|
|
44
44
|
query = URI.encode_www_form(params)
|
|
45
45
|
req = Net::HTTP::Get.new("/api/tags?#{query}", headers)
|
|
46
|
-
res = execute(request: req)
|
|
47
|
-
LLM::Response.new(res)
|
|
46
|
+
res, span = execute(request: req, operation: "request")
|
|
47
|
+
res = LLM::Response.new(res)
|
|
48
|
+
finish_trace(operation: "request", res:, span:)
|
|
48
49
|
end
|
|
49
50
|
|
|
50
51
|
private
|
|
51
52
|
|
|
52
|
-
[:headers, :execute].each do |m|
|
|
53
|
+
[:headers, :execute, :finish_trace].each do |m|
|
|
53
54
|
define_method(m) { |*args, **kwargs, &b| @provider.send(m, *args, **kwargs, &b) }
|
|
54
55
|
end
|
|
55
56
|
end
|
data/lib/llm/providers/ollama.rb
CHANGED
|
@@ -12,9 +12,9 @@ module LLM
|
|
|
12
12
|
# require "llm"
|
|
13
13
|
#
|
|
14
14
|
# llm = LLM.ollama(key: nil)
|
|
15
|
-
#
|
|
16
|
-
#
|
|
17
|
-
#
|
|
15
|
+
# ses = LLM::Session.new(llm, model: "llava")
|
|
16
|
+
# ses.talk ["Tell me about this image", ses.local_file("/images/photo.png")]
|
|
17
|
+
# ses.messages.select(&:assistant?).each { print "[#{_1.role}]", _1.content, "\n" }
|
|
18
18
|
class Ollama < Provider
|
|
19
19
|
require_relative "ollama/error_handler"
|
|
20
20
|
require_relative "ollama/request_adapter"
|
|
@@ -43,8 +43,9 @@ module LLM
|
|
|
43
43
|
params = {model:}.merge!(params)
|
|
44
44
|
req = Net::HTTP::Post.new("/v1/embeddings", headers)
|
|
45
45
|
req.body = LLM.json.dump({input:}.merge!(params))
|
|
46
|
-
res
|
|
47
|
-
ResponseAdapter.adapt(res, type: :embedding)
|
|
46
|
+
res, span = execute(request: req, operation: "embeddings", model:)
|
|
47
|
+
res = ResponseAdapter.adapt(res, type: :embedding)
|
|
48
|
+
finish_trace(operation: "embeddings", model:, res:, span:)
|
|
48
49
|
end
|
|
49
50
|
|
|
50
51
|
##
|
|
@@ -60,9 +61,10 @@ module LLM
|
|
|
60
61
|
def complete(prompt, params = {})
|
|
61
62
|
params, stream, tools, role = normalize_complete_params(params)
|
|
62
63
|
req = build_complete_request(prompt, params, role)
|
|
63
|
-
res = execute(request: req, stream: stream)
|
|
64
|
-
ResponseAdapter.adapt(res, type: :completion)
|
|
64
|
+
res, span = execute(request: req, stream: stream, operation: "chat", model: params[:model])
|
|
65
|
+
res = ResponseAdapter.adapt(res, type: :completion)
|
|
65
66
|
.extend(Module.new { define_method(:__tools__) { tools } })
|
|
67
|
+
finish_trace(operation: "chat", model: params[:model], res:, span:)
|
|
66
68
|
end
|
|
67
69
|
|
|
68
70
|
##
|
|
@@ -35,8 +35,9 @@ class LLM::OpenAI
|
|
|
35
35
|
req = Net::HTTP::Post.new("/v1/audio/speech", headers)
|
|
36
36
|
req.body = LLM.json.dump({input:, voice:, model:, response_format:}.merge!(params))
|
|
37
37
|
io = StringIO.new("".b)
|
|
38
|
-
res = execute(request: req) { _1.read_body { |chunk| io << chunk } }
|
|
39
|
-
LLM::Response.new(res).tap { _1.define_singleton_method(:audio) { io } }
|
|
38
|
+
res, span = execute(request: req, operation: "request") { _1.read_body { |chunk| io << chunk } }
|
|
39
|
+
res = LLM::Response.new(res).tap { _1.define_singleton_method(:audio) { io } }
|
|
40
|
+
finish_trace(operation: "request", model:, res:, span:)
|
|
40
41
|
end
|
|
41
42
|
|
|
42
43
|
##
|
|
@@ -56,8 +57,9 @@ class LLM::OpenAI
|
|
|
56
57
|
req = Net::HTTP::Post.new("/v1/audio/transcriptions", headers)
|
|
57
58
|
req["content-type"] = multi.content_type
|
|
58
59
|
set_body_stream(req, multi.body)
|
|
59
|
-
res = execute(request: req)
|
|
60
|
-
LLM::Response.new(res)
|
|
60
|
+
res, span = execute(request: req, operation: "request")
|
|
61
|
+
res = LLM::Response.new(res)
|
|
62
|
+
finish_trace(operation: "request", model:, res:, span:)
|
|
61
63
|
end
|
|
62
64
|
|
|
63
65
|
##
|
|
@@ -78,13 +80,14 @@ class LLM::OpenAI
|
|
|
78
80
|
req = Net::HTTP::Post.new("/v1/audio/translations", headers)
|
|
79
81
|
req["content-type"] = multi.content_type
|
|
80
82
|
set_body_stream(req, multi.body)
|
|
81
|
-
res = execute(request: req)
|
|
82
|
-
LLM::Response.new(res)
|
|
83
|
+
res, span = execute(request: req, operation: "request")
|
|
84
|
+
res = LLM::Response.new(res)
|
|
85
|
+
finish_trace(operation: "request", model:, res:, span:)
|
|
83
86
|
end
|
|
84
87
|
|
|
85
88
|
private
|
|
86
89
|
|
|
87
|
-
[:headers, :execute, :set_body_stream].each do |m|
|
|
90
|
+
[:headers, :execute, :set_body_stream, :finish_trace].each do |m|
|
|
88
91
|
define_method(m) { |*args, **kwargs, &b| @provider.send(m, *args, **kwargs, &b) }
|
|
89
92
|
end
|
|
90
93
|
end
|
|
@@ -10,10 +10,21 @@ class LLM::OpenAI
|
|
|
10
10
|
attr_reader :res
|
|
11
11
|
|
|
12
12
|
##
|
|
13
|
+
# @return [Object, nil]
|
|
14
|
+
# The span
|
|
15
|
+
attr_reader :span
|
|
16
|
+
|
|
17
|
+
##
|
|
18
|
+
# @param [LLM::Tracer] tracer
|
|
19
|
+
# The tracer
|
|
20
|
+
# @param [Object, nil] span
|
|
21
|
+
# The span
|
|
13
22
|
# @param [Net::HTTPResponse] res
|
|
14
23
|
# The response from the server
|
|
15
24
|
# @return [LLM::OpenAI::ErrorHandler]
|
|
16
|
-
def initialize(res)
|
|
25
|
+
def initialize(tracer, span, res)
|
|
26
|
+
@tracer = tracer
|
|
27
|
+
@span = span
|
|
17
28
|
@res = res
|
|
18
29
|
end
|
|
19
30
|
|
|
@@ -21,36 +32,52 @@ class LLM::OpenAI
|
|
|
21
32
|
# @raise [LLM::Error]
|
|
22
33
|
# Raises a subclass of {LLM::Error LLM::Error}
|
|
23
34
|
def raise_error!
|
|
35
|
+
ex = error
|
|
36
|
+
@tracer.on_request_error(ex:, span:)
|
|
37
|
+
ensure
|
|
38
|
+
raise(ex)
|
|
39
|
+
end
|
|
40
|
+
|
|
41
|
+
private
|
|
42
|
+
|
|
43
|
+
##
|
|
44
|
+
# @return [LLM::Object]
|
|
45
|
+
def body
|
|
46
|
+
@body ||= LLM.json.load(res.body)
|
|
47
|
+
end
|
|
48
|
+
|
|
49
|
+
##
|
|
50
|
+
# @return [LLM::Error]
|
|
51
|
+
def error
|
|
24
52
|
case res
|
|
25
53
|
when Net::HTTPServerError
|
|
26
|
-
|
|
54
|
+
LLM::ServerError.new("Server error").tap { _1.response = res }
|
|
27
55
|
when Net::HTTPUnauthorized
|
|
28
|
-
|
|
56
|
+
LLM::UnauthorizedError.new("Authentication error").tap { _1.response = res }
|
|
29
57
|
when Net::HTTPTooManyRequests
|
|
30
|
-
|
|
58
|
+
LLM::RateLimitError.new("Too many requests").tap { _1.response = res }
|
|
31
59
|
else
|
|
32
60
|
error = body["error"] || {}
|
|
33
61
|
case error["type"]
|
|
34
62
|
when "invalid_request_error" then handle_invalid_request(error)
|
|
35
|
-
when "server_error"
|
|
36
|
-
|
|
63
|
+
when "server_error"
|
|
64
|
+
LLM::ServerError.new(error["message"]).tap { _1.response = res }
|
|
65
|
+
else
|
|
66
|
+
LLM::Error.new(error["message"] || "Unexpected response").tap { _1.response = res }
|
|
37
67
|
end
|
|
38
68
|
end
|
|
39
69
|
end
|
|
40
70
|
|
|
41
|
-
|
|
42
|
-
|
|
71
|
+
##
|
|
72
|
+
# @param [Exception] error
|
|
73
|
+
# @return [LLM::Error]
|
|
43
74
|
def handle_invalid_request(error)
|
|
44
75
|
case error["code"]
|
|
45
76
|
when "context_length_exceeded"
|
|
46
|
-
|
|
77
|
+
LLM::ContextWindowError.new(error["message"]).tap { _1.response = res }
|
|
47
78
|
else
|
|
48
|
-
|
|
79
|
+
LLM::InvalidRequestError.new(error["message"]).tap { _1.response = res }
|
|
49
80
|
end
|
|
50
81
|
end
|
|
51
|
-
|
|
52
|
-
def body
|
|
53
|
-
@body ||= LLM.json.load(res.body)
|
|
54
|
-
end
|
|
55
82
|
end
|
|
56
83
|
end
|
|
@@ -13,10 +13,10 @@ class LLM::OpenAI
|
|
|
13
13
|
# require "llm"
|
|
14
14
|
#
|
|
15
15
|
# llm = LLM.openai(key: ENV["KEY"])
|
|
16
|
-
#
|
|
16
|
+
# ses = LLM::Session.new(llm)
|
|
17
17
|
# file = llm.files.create file: "/books/goodread.pdf"
|
|
18
|
-
#
|
|
19
|
-
#
|
|
18
|
+
# ses.talk ["Tell me about this PDF", file]
|
|
19
|
+
# ses.messages.select(&:assistant?).each { print "[#{_1.role}]", _1.content, "\n" }
|
|
20
20
|
class Files
|
|
21
21
|
##
|
|
22
22
|
# Returns a new Files object
|
|
@@ -41,8 +41,9 @@ class LLM::OpenAI
|
|
|
41
41
|
def all(**params)
|
|
42
42
|
query = URI.encode_www_form(params)
|
|
43
43
|
req = Net::HTTP::Get.new("/v1/files?#{query}", headers)
|
|
44
|
-
res = execute(request: req)
|
|
45
|
-
ResponseAdapter.adapt(res, type: :enumerable)
|
|
44
|
+
res, span = execute(request: req, operation: "request")
|
|
45
|
+
res = ResponseAdapter.adapt(res, type: :enumerable)
|
|
46
|
+
finish_trace(operation: "request", res:, span:)
|
|
46
47
|
end
|
|
47
48
|
|
|
48
49
|
##
|
|
@@ -61,8 +62,9 @@ class LLM::OpenAI
|
|
|
61
62
|
req = Net::HTTP::Post.new("/v1/files", headers)
|
|
62
63
|
req["content-type"] = multi.content_type
|
|
63
64
|
set_body_stream(req, multi.body)
|
|
64
|
-
res = execute(request: req)
|
|
65
|
-
ResponseAdapter.adapt(res, type: :file)
|
|
65
|
+
res, span = execute(request: req, operation: "request")
|
|
66
|
+
res = ResponseAdapter.adapt(res, type: :file)
|
|
67
|
+
finish_trace(operation: "request", res:, span:)
|
|
66
68
|
end
|
|
67
69
|
|
|
68
70
|
##
|
|
@@ -80,8 +82,9 @@ class LLM::OpenAI
|
|
|
80
82
|
file_id = file.respond_to?(:id) ? file.id : file
|
|
81
83
|
query = URI.encode_www_form(params)
|
|
82
84
|
req = Net::HTTP::Get.new("/v1/files/#{file_id}?#{query}", headers)
|
|
83
|
-
res = execute(request: req)
|
|
84
|
-
ResponseAdapter.adapt(res, type: :file)
|
|
85
|
+
res, span = execute(request: req, operation: "request")
|
|
86
|
+
res = ResponseAdapter.adapt(res, type: :file)
|
|
87
|
+
finish_trace(operation: "request", res:, span:)
|
|
85
88
|
end
|
|
86
89
|
|
|
87
90
|
##
|
|
@@ -101,8 +104,9 @@ class LLM::OpenAI
|
|
|
101
104
|
file_id = file.respond_to?(:id) ? file.id : file
|
|
102
105
|
req = Net::HTTP::Get.new("/v1/files/#{file_id}/content?#{query}", headers)
|
|
103
106
|
io = StringIO.new("".b)
|
|
104
|
-
res = execute(request: req) { |res| res.read_body { |chunk| io << chunk } }
|
|
105
|
-
LLM::Response.new(res).tap { _1.define_singleton_method(:file) { io } }
|
|
107
|
+
res, span = execute(request: req, operation: "request") { |res| res.read_body { |chunk| io << chunk } }
|
|
108
|
+
res = LLM::Response.new(res).tap { _1.define_singleton_method(:file) { io } }
|
|
109
|
+
finish_trace(operation: "request", res:, span:)
|
|
106
110
|
end
|
|
107
111
|
|
|
108
112
|
##
|
|
@@ -118,13 +122,14 @@ class LLM::OpenAI
|
|
|
118
122
|
def delete(file:)
|
|
119
123
|
file_id = file.respond_to?(:id) ? file.id : file
|
|
120
124
|
req = Net::HTTP::Delete.new("/v1/files/#{file_id}", headers)
|
|
121
|
-
res = execute(request: req)
|
|
122
|
-
LLM::Response.new(res)
|
|
125
|
+
res, span = execute(request: req, operation: "request")
|
|
126
|
+
res = LLM::Response.new(res)
|
|
127
|
+
finish_trace(operation: "request", res:, span:)
|
|
123
128
|
end
|
|
124
129
|
|
|
125
130
|
private
|
|
126
131
|
|
|
127
|
-
[:headers, :execute, :set_body_stream].each do |m|
|
|
132
|
+
[:headers, :execute, :set_body_stream, :finish_trace].each do |m|
|
|
128
133
|
define_method(m) { |*args, **kwargs, &b| @provider.send(m, *args, **kwargs, &b) }
|
|
129
134
|
end
|
|
130
135
|
end
|
|
@@ -50,8 +50,9 @@ class LLM::OpenAI
|
|
|
50
50
|
def create(prompt:, model: "dall-e-3", **params)
|
|
51
51
|
req = Net::HTTP::Post.new("/v1/images/generations", headers)
|
|
52
52
|
req.body = LLM.json.dump({prompt:, n: 1, model:}.merge!(params))
|
|
53
|
-
res = execute(request: req)
|
|
54
|
-
ResponseAdapter.adapt(res, type: :image)
|
|
53
|
+
res, span = execute(request: req, operation: "request")
|
|
54
|
+
res = ResponseAdapter.adapt(res, type: :image)
|
|
55
|
+
finish_trace(operation: "request", model:, res:, span:)
|
|
55
56
|
end
|
|
56
57
|
|
|
57
58
|
##
|
|
@@ -72,8 +73,9 @@ class LLM::OpenAI
|
|
|
72
73
|
req = Net::HTTP::Post.new("/v1/images/variations", headers)
|
|
73
74
|
req["content-type"] = multi.content_type
|
|
74
75
|
set_body_stream(req, multi.body)
|
|
75
|
-
res = execute(request: req)
|
|
76
|
-
ResponseAdapter.adapt(res, type: :image)
|
|
76
|
+
res, span = execute(request: req, operation: "request")
|
|
77
|
+
res = ResponseAdapter.adapt(res, type: :image)
|
|
78
|
+
finish_trace(operation: "request", model:, res:, span:)
|
|
77
79
|
end
|
|
78
80
|
|
|
79
81
|
##
|
|
@@ -95,13 +97,14 @@ class LLM::OpenAI
|
|
|
95
97
|
req = Net::HTTP::Post.new("/v1/images/edits", headers)
|
|
96
98
|
req["content-type"] = multi.content_type
|
|
97
99
|
set_body_stream(req, multi.body)
|
|
98
|
-
res = execute(request: req)
|
|
99
|
-
ResponseAdapter.adapt(res, type: :image)
|
|
100
|
+
res, span = execute(request: req, operation: "request")
|
|
101
|
+
res = ResponseAdapter.adapt(res, type: :image)
|
|
102
|
+
finish_trace(operation: "request", model:, res:, span:)
|
|
100
103
|
end
|
|
101
104
|
|
|
102
105
|
private
|
|
103
106
|
|
|
104
|
-
[:headers, :execute, :set_body_stream].each do |m|
|
|
107
|
+
[:headers, :execute, :set_body_stream, :finish_trace].each do |m|
|
|
105
108
|
define_method(m) { |*args, **kwargs, &b| @provider.send(m, *args, **kwargs, &b) }
|
|
106
109
|
end
|
|
107
110
|
end
|
|
@@ -40,13 +40,14 @@ class LLM::OpenAI
|
|
|
40
40
|
def all(**params)
|
|
41
41
|
query = URI.encode_www_form(params)
|
|
42
42
|
req = Net::HTTP::Get.new("/v1/models?#{query}", headers)
|
|
43
|
-
res = execute(request: req)
|
|
44
|
-
ResponseAdapter.adapt(res, type: :enumerable)
|
|
43
|
+
res, span = execute(request: req, operation: "request")
|
|
44
|
+
res = ResponseAdapter.adapt(res, type: :enumerable)
|
|
45
|
+
finish_trace(operation: "request", res:, span:)
|
|
45
46
|
end
|
|
46
47
|
|
|
47
48
|
private
|
|
48
49
|
|
|
49
|
-
[:headers, :execute, :set_body_stream].each do |m|
|
|
50
|
+
[:headers, :execute, :set_body_stream, :finish_trace].each do |m|
|
|
50
51
|
define_method(m) { |*args, **kwargs, &b| @provider.send(m, *args, **kwargs, &b) }
|
|
51
52
|
end
|
|
52
53
|
end
|
|
@@ -50,13 +50,14 @@ class LLM::OpenAI
|
|
|
50
50
|
req = Net::HTTP::Post.new("/v1/moderations", headers)
|
|
51
51
|
input = RequestAdapter::Moderation.new(input).adapt
|
|
52
52
|
req.body = LLM.json.dump({input:, model:}.merge!(params))
|
|
53
|
-
res = execute(request: req)
|
|
54
|
-
ResponseAdapter.adapt(res, type: :moderations)
|
|
53
|
+
res, span = execute(request: req, operation: "request")
|
|
54
|
+
res = ResponseAdapter.adapt(res, type: :moderations)
|
|
55
|
+
finish_trace(operation: "request", model:, res:, span:)
|
|
55
56
|
end
|
|
56
57
|
|
|
57
58
|
private
|
|
58
59
|
|
|
59
|
-
[:headers, :execute].each do |m|
|
|
60
|
+
[:headers, :execute, :finish_trace].each do |m|
|
|
60
61
|
define_method(m) { |*args, **kwargs, &b| @provider.send(m, *args, **kwargs, &b) }
|
|
61
62
|
end
|
|
62
63
|
end
|
|
@@ -44,9 +44,10 @@ class LLM::OpenAI
|
|
|
44
44
|
messages = [*(params.delete(:input) || []), LLM::Message.new(role, prompt)]
|
|
45
45
|
body = LLM.json.dump({input: [adapt(messages, mode: :response)].flatten}.merge!(params))
|
|
46
46
|
set_body_stream(req, StringIO.new(body))
|
|
47
|
-
res = execute(request: req, stream:, stream_parser:)
|
|
48
|
-
ResponseAdapter.adapt(res, type: :responds)
|
|
47
|
+
res, span = execute(request: req, stream:, stream_parser:, operation: "chat", model: params[:model])
|
|
48
|
+
res = ResponseAdapter.adapt(res, type: :responds)
|
|
49
49
|
.extend(Module.new { define_method(:__tools__) { tools } })
|
|
50
|
+
finish_trace(operation: "chat", model: params[:model], res:, span:)
|
|
50
51
|
end
|
|
51
52
|
|
|
52
53
|
##
|
|
@@ -59,8 +60,9 @@ class LLM::OpenAI
|
|
|
59
60
|
response_id = response.respond_to?(:id) ? response.id : response
|
|
60
61
|
query = URI.encode_www_form(params)
|
|
61
62
|
req = Net::HTTP::Get.new("/v1/responses/#{response_id}?#{query}", headers)
|
|
62
|
-
res = execute(request: req)
|
|
63
|
-
ResponseAdapter.adapt(res, type: :responds)
|
|
63
|
+
res, span = execute(request: req, operation: "request")
|
|
64
|
+
res = ResponseAdapter.adapt(res, type: :responds)
|
|
65
|
+
finish_trace(operation: "request", res:, span:)
|
|
64
66
|
end
|
|
65
67
|
|
|
66
68
|
##
|
|
@@ -72,13 +74,14 @@ class LLM::OpenAI
|
|
|
72
74
|
def delete(response)
|
|
73
75
|
response_id = response.respond_to?(:id) ? response.id : response
|
|
74
76
|
req = Net::HTTP::Delete.new("/v1/responses/#{response_id}", headers)
|
|
75
|
-
res = execute(request: req)
|
|
76
|
-
LLM::Response.new(res)
|
|
77
|
+
res, span = execute(request: req, operation: "request")
|
|
78
|
+
res = LLM::Response.new(res)
|
|
79
|
+
finish_trace(operation: "request", res:, span:)
|
|
77
80
|
end
|
|
78
81
|
|
|
79
82
|
private
|
|
80
83
|
|
|
81
|
-
[:headers, :execute, :set_body_stream, :resolve_tools].each do |m|
|
|
84
|
+
[:headers, :execute, :set_body_stream, :resolve_tools, :finish_trace].each do |m|
|
|
82
85
|
define_method(m) { |*args, **kwargs, &b| @provider.send(m, *args, **kwargs, &b) }
|
|
83
86
|
end
|
|
84
87
|
|
|
@@ -32,8 +32,9 @@ class LLM::OpenAI
|
|
|
32
32
|
def all(**params)
|
|
33
33
|
query = URI.encode_www_form(params)
|
|
34
34
|
req = Net::HTTP::Get.new("/v1/vector_stores?#{query}", headers)
|
|
35
|
-
res = execute(request: req)
|
|
36
|
-
ResponseAdapter.adapt(res, type: :enumerable)
|
|
35
|
+
res, span = execute(request: req, operation: "request")
|
|
36
|
+
res = ResponseAdapter.adapt(res, type: :enumerable)
|
|
37
|
+
finish_trace(operation: "request", res:, span:)
|
|
37
38
|
end
|
|
38
39
|
|
|
39
40
|
##
|
|
@@ -47,8 +48,9 @@ class LLM::OpenAI
|
|
|
47
48
|
def create(name:, file_ids: nil, **params)
|
|
48
49
|
req = Net::HTTP::Post.new("/v1/vector_stores", headers)
|
|
49
50
|
req.body = LLM.json.dump(params.merge({name:, file_ids:}).compact)
|
|
50
|
-
res = execute(request: req)
|
|
51
|
-
LLM::Response.new(res)
|
|
51
|
+
res, span = execute(request: req, operation: "request")
|
|
52
|
+
res = LLM::Response.new(res)
|
|
53
|
+
finish_trace(operation: "request", res:, span:)
|
|
52
54
|
end
|
|
53
55
|
|
|
54
56
|
##
|
|
@@ -69,8 +71,9 @@ class LLM::OpenAI
|
|
|
69
71
|
def get(vector:)
|
|
70
72
|
vector_id = vector.respond_to?(:id) ? vector.id : vector
|
|
71
73
|
req = Net::HTTP::Get.new("/v1/vector_stores/#{vector_id}", headers)
|
|
72
|
-
res = execute(request: req)
|
|
73
|
-
LLM::Response.new(res)
|
|
74
|
+
res, span = execute(request: req, operation: "request")
|
|
75
|
+
res = LLM::Response.new(res)
|
|
76
|
+
finish_trace(operation: "request", res:, span:)
|
|
74
77
|
end
|
|
75
78
|
|
|
76
79
|
##
|
|
@@ -85,8 +88,9 @@ class LLM::OpenAI
|
|
|
85
88
|
vector_id = vector.respond_to?(:id) ? vector.id : vector
|
|
86
89
|
req = Net::HTTP::Post.new("/v1/vector_stores/#{vector_id}", headers)
|
|
87
90
|
req.body = LLM.json.dump(params.merge({name:}).compact)
|
|
88
|
-
res = execute(request: req)
|
|
89
|
-
LLM::Response.new(res)
|
|
91
|
+
res, span = execute(request: req, operation: "request")
|
|
92
|
+
res = LLM::Response.new(res)
|
|
93
|
+
finish_trace(operation: "request", res:, span:)
|
|
90
94
|
end
|
|
91
95
|
|
|
92
96
|
##
|
|
@@ -98,8 +102,9 @@ class LLM::OpenAI
|
|
|
98
102
|
def delete(vector:)
|
|
99
103
|
vector_id = vector.respond_to?(:id) ? vector.id : vector
|
|
100
104
|
req = Net::HTTP::Delete.new("/v1/vector_stores/#{vector_id}", headers)
|
|
101
|
-
res = execute(request: req)
|
|
102
|
-
LLM::Response.new(res)
|
|
105
|
+
res, span = execute(request: req, operation: "request")
|
|
106
|
+
res = LLM::Response.new(res)
|
|
107
|
+
finish_trace(operation: "request", res:, span:)
|
|
103
108
|
end
|
|
104
109
|
|
|
105
110
|
##
|
|
@@ -114,8 +119,9 @@ class LLM::OpenAI
|
|
|
114
119
|
vector_id = vector.respond_to?(:id) ? vector.id : vector
|
|
115
120
|
req = Net::HTTP::Post.new("/v1/vector_stores/#{vector_id}/search", headers)
|
|
116
121
|
req.body = LLM.json.dump(params.merge({query:}).compact)
|
|
117
|
-
res = execute(request: req)
|
|
118
|
-
ResponseAdapter.adapt(res, type: :enumerable)
|
|
122
|
+
res, span = execute(request: req, operation: "retrieval")
|
|
123
|
+
res = ResponseAdapter.adapt(res, type: :enumerable)
|
|
124
|
+
finish_trace(operation: "retrieval", res:, span:)
|
|
119
125
|
end
|
|
120
126
|
|
|
121
127
|
##
|
|
@@ -129,8 +135,9 @@ class LLM::OpenAI
|
|
|
129
135
|
vector_id = vector.respond_to?(:id) ? vector.id : vector
|
|
130
136
|
query = URI.encode_www_form(params)
|
|
131
137
|
req = Net::HTTP::Get.new("/v1/vector_stores/#{vector_id}/files?#{query}", headers)
|
|
132
|
-
res = execute(request: req)
|
|
133
|
-
ResponseAdapter.adapt(res, type: :enumerable)
|
|
138
|
+
res, span = execute(request: req, operation: "request")
|
|
139
|
+
res = ResponseAdapter.adapt(res, type: :enumerable)
|
|
140
|
+
finish_trace(operation: "request", res:, span:)
|
|
134
141
|
end
|
|
135
142
|
|
|
136
143
|
##
|
|
@@ -147,8 +154,9 @@ class LLM::OpenAI
|
|
|
147
154
|
file_id = file.respond_to?(:id) ? file.id : file
|
|
148
155
|
req = Net::HTTP::Post.new("/v1/vector_stores/#{vector_id}/files", headers)
|
|
149
156
|
req.body = LLM.json.dump(params.merge({file_id:, attributes:}).compact)
|
|
150
|
-
res = execute(request: req)
|
|
151
|
-
LLM::Response.new(res)
|
|
157
|
+
res, span = execute(request: req, operation: "request")
|
|
158
|
+
res = LLM::Response.new(res)
|
|
159
|
+
finish_trace(operation: "request", res:, span:)
|
|
152
160
|
end
|
|
153
161
|
alias_method :create_file, :add_file
|
|
154
162
|
|
|
@@ -176,8 +184,9 @@ class LLM::OpenAI
|
|
|
176
184
|
file_id = file.respond_to?(:id) ? file.id : file
|
|
177
185
|
req = Net::HTTP::Post.new("/v1/vector_stores/#{vector_id}/files/#{file_id}", headers)
|
|
178
186
|
req.body = LLM.json.dump(params.merge({attributes:}).compact)
|
|
179
|
-
res = execute(request: req)
|
|
180
|
-
LLM::Response.new(res)
|
|
187
|
+
res, span = execute(request: req, operation: "request")
|
|
188
|
+
res = LLM::Response.new(res)
|
|
189
|
+
finish_trace(operation: "request", res:, span:)
|
|
181
190
|
end
|
|
182
191
|
|
|
183
192
|
##
|
|
@@ -192,8 +201,9 @@ class LLM::OpenAI
|
|
|
192
201
|
file_id = file.respond_to?(:id) ? file.id : file
|
|
193
202
|
query = URI.encode_www_form(params)
|
|
194
203
|
req = Net::HTTP::Get.new("/v1/vector_stores/#{vector_id}/files/#{file_id}?#{query}", headers)
|
|
195
|
-
res = execute(request: req)
|
|
196
|
-
LLM::Response.new(res)
|
|
204
|
+
res, span = execute(request: req, operation: "request")
|
|
205
|
+
res = LLM::Response.new(res)
|
|
206
|
+
finish_trace(operation: "request", res:, span:)
|
|
197
207
|
end
|
|
198
208
|
|
|
199
209
|
##
|
|
@@ -207,8 +217,9 @@ class LLM::OpenAI
|
|
|
207
217
|
vector_id = vector.respond_to?(:id) ? vector.id : vector
|
|
208
218
|
file_id = file.respond_to?(:id) ? file.id : file
|
|
209
219
|
req = Net::HTTP::Delete.new("/v1/vector_stores/#{vector_id}/files/#{file_id}", headers)
|
|
210
|
-
res = execute(request: req)
|
|
211
|
-
LLM::Response.new(res)
|
|
220
|
+
res, span = execute(request: req, operation: "request")
|
|
221
|
+
res = LLM::Response.new(res)
|
|
222
|
+
finish_trace(operation: "request", res:, span:)
|
|
212
223
|
end
|
|
213
224
|
|
|
214
225
|
##
|
|
@@ -237,7 +248,7 @@ class LLM::OpenAI
|
|
|
237
248
|
|
|
238
249
|
private
|
|
239
250
|
|
|
240
|
-
[:headers, :execute, :set_body_stream].each do |m|
|
|
251
|
+
[:headers, :execute, :set_body_stream, :finish_trace].each do |m|
|
|
241
252
|
define_method(m) { |*args, **kwargs, &b| @provider.send(m, *args, **kwargs, &b) }
|
|
242
253
|
end
|
|
243
254
|
end
|
data/lib/llm/providers/openai.rb
CHANGED
|
@@ -10,9 +10,9 @@ module LLM
|
|
|
10
10
|
# require "llm"
|
|
11
11
|
#
|
|
12
12
|
# llm = LLM.openai(key: ENV["KEY"])
|
|
13
|
-
#
|
|
14
|
-
#
|
|
15
|
-
#
|
|
13
|
+
# ses = LLM::Session.new(llm)
|
|
14
|
+
# ses.talk ["Tell me about this photo", ses.local_file("/images/photo.png")]
|
|
15
|
+
# ses.messages.select(&:assistant?).each { print "[#{_1.role}]", _1.content, "\n" }
|
|
16
16
|
class OpenAI < Provider
|
|
17
17
|
require_relative "openai/error_handler"
|
|
18
18
|
require_relative "openai/request_adapter"
|
|
@@ -47,8 +47,9 @@ module LLM
|
|
|
47
47
|
def embed(input, model: "text-embedding-3-small", **params)
|
|
48
48
|
req = Net::HTTP::Post.new("/v1/embeddings", headers)
|
|
49
49
|
req.body = LLM.json.dump({input:, model:}.merge!(params))
|
|
50
|
-
res = execute(request: req)
|
|
51
|
-
ResponseAdapter.adapt(res, type: :embedding)
|
|
50
|
+
res, span = execute(request: req, operation: "embeddings", model:)
|
|
51
|
+
res = ResponseAdapter.adapt(res, type: :embedding)
|
|
52
|
+
finish_trace(operation: "embeddings", model:, res:, span:)
|
|
52
53
|
end
|
|
53
54
|
|
|
54
55
|
##
|
|
@@ -64,9 +65,10 @@ module LLM
|
|
|
64
65
|
def complete(prompt, params = {})
|
|
65
66
|
params, stream, tools, role = normalize_complete_params(params)
|
|
66
67
|
req = build_complete_request(prompt, params, role)
|
|
67
|
-
res = execute(request: req, stream: stream)
|
|
68
|
-
ResponseAdapter.adapt(res, type: :completion)
|
|
68
|
+
res, span = execute(request: req, stream: stream, operation: "chat", model: params[:model])
|
|
69
|
+
res = ResponseAdapter.adapt(res, type: :completion)
|
|
69
70
|
.extend(Module.new { define_method(:__tools__) { tools } })
|
|
71
|
+
finish_trace(operation: "chat", model: params[:model], res:, span:)
|
|
70
72
|
end
|
|
71
73
|
|
|
72
74
|
##
|
data/lib/llm/providers/xai.rb
CHANGED
|
@@ -11,9 +11,9 @@ module LLM
|
|
|
11
11
|
# require "llm"
|
|
12
12
|
#
|
|
13
13
|
# llm = LLM.xai(key: ENV["KEY"])
|
|
14
|
-
#
|
|
15
|
-
#
|
|
16
|
-
#
|
|
14
|
+
# ses = LLM::Session.new(llm)
|
|
15
|
+
# ses.talk ["Tell me about this photo", ses.local_file("/images/photo.png")]
|
|
16
|
+
# ses.messages.select(&:assistant?).each { print "[#{_1.role}]", _1.content, "\n" }
|
|
17
17
|
class XAI < OpenAI
|
|
18
18
|
require_relative "xai/images"
|
|
19
19
|
|
data/lib/llm/providers/zai.rb
CHANGED
|
@@ -11,8 +11,8 @@ module LLM
|
|
|
11
11
|
# require "llm"
|
|
12
12
|
#
|
|
13
13
|
# llm = LLM.zai(key: ENV["KEY"])
|
|
14
|
-
#
|
|
15
|
-
#
|
|
14
|
+
# ses = LLM::Session.new(llm, stream: $stdout)
|
|
15
|
+
# ses.talk "Hello"
|
|
16
16
|
class ZAI < OpenAI
|
|
17
17
|
##
|
|
18
18
|
# @param [String] host A regional host or the default ("api.z.ai")
|
data/lib/llm/schema/object.rb
CHANGED
|
@@ -36,7 +36,7 @@ class LLM::Schema
|
|
|
36
36
|
##
|
|
37
37
|
# @return [Hash]
|
|
38
38
|
def to_h
|
|
39
|
-
super.merge!({type: "object", properties:, required:})
|
|
39
|
+
super.merge!({type: "object", properties:, required: required_items})
|
|
40
40
|
end
|
|
41
41
|
|
|
42
42
|
##
|
|
@@ -64,7 +64,7 @@ class LLM::Schema
|
|
|
64
64
|
|
|
65
65
|
private
|
|
66
66
|
|
|
67
|
-
def required
|
|
67
|
+
def required_items
|
|
68
68
|
@properties.filter_map { _2.required? ? _1 : nil }
|
|
69
69
|
end
|
|
70
70
|
end
|