langchainrb 0.5.0 → 0.5.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
  ---
  SHA256:
- metadata.gz: b0a2fe8026e861c9d97465bce7da08a0b077492d6f7cf8fb42c45dbfdfe6749f
- data.tar.gz: c04099c44a847bd9c05e8594859f92ca1f54d338c463ce59a375c2cb9731b1ad
+ metadata.gz: d36de4206b792714ba9b6773c03272e9638b14caf7140e0bc00c3e767aa5fdef
+ data.tar.gz: 819fab9de55a34e4e6dc865febc19bb9979df55fa8fc6a753774cf1961c40103
  SHA512:
- metadata.gz: dec375b2b7cae377cf31f3f8ed0a6ac9d79215c945e7c0da78ed1fbad3c502ecfcc5ce5318c55a9a634db88fea1f5fbbeed7a0f7dc6ab8096c909e0a3ff02154
- data.tar.gz: 558a0f6ddf90ad044f9e2cc7c6ca678958472748d2e430a3cbb4308290898b9b22a204a94a5b5943f06137f7da5238d038a65b8c79d96f8a3705499d95cfb597
+ metadata.gz: 6e180b41bbca96bd5523c276923f223bbebe470314086c6a909df440890793bcc70dbd66ecf59bf5d0fd52426650cc5d2684c56cc8fc643209cc1679527cbef4
+ data.tar.gz: af5db76c2b22b5c7bdc1170de437921e8464a16566f46a5cad465d69e6da47c97a82f7331a5ea5747840e58acc71463aa8456b03e9bc8851efda7b734e5d23cc
data/CHANGELOG.md CHANGED
@@ -1,5 +1,13 @@
  ## [Unreleased]
 
+ ## [0.5.2] - 2023-06-07
+ - 🗣️ LLMs
+ - Auto-calculate the max_tokens: setting to be passed on to OpenAI
+
+ ## [0.5.1] - 2023-06-06
+ - 🛠️ Tools
+ - Modified Tool usage. Agents now accept Tool instances instead of Tool strings.
+
  ## [0.5.0] - 2023-06-05
  - [BREAKING] LLMs are now passed as objects to Vectorsearch classes instead of `llm: :name, llm_api_key:` previously
  - 📋 Prompts
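Taken together, the 0.5.1 and 0.5.2 entries change the calling convention for agents: tools are now passed as constructed instances, and `max_tokens:` no longer needs to be budgeted by hand. A minimal sketch of the new call pattern, assuming API keys are supplied via environment variables (the question text is illustrative):

```ruby
require "langchain"

# 0.5.1: tools are passed as instances, not strings
search = Langchain::Tool::SerpApi.new(api_key: ENV["SERPAPI_API_KEY"])
calculator = Langchain::Tool::Calculator.new

agent = Langchain::Agent::ChainOfThoughtAgent.new(
  llm: Langchain::LLM::OpenAI.new(api_key: ENV["OPENAI_API_KEY"]),
  tools: [search, calculator]
)

# 0.5.2: max_tokens is derived from the model's token limit automatically,
# so no max_tokens: argument appears anywhere in this flow
agent.run(question: "How many meters are in a mile?")
```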
data/Gemfile.lock CHANGED
@@ -1,7 +1,7 @@
  PATH
    remote: .
    specs:
-     langchainrb (0.5.0)
+     langchainrb (0.5.2)
        colorize (~> 0.8.1)
        tiktoken_ruby (~> 0.0.5)
 
data/README.md CHANGED
@@ -256,7 +256,15 @@ Agents are semi-autonomous bots that can respond to user questions and use avail
  Add `gem "ruby-openai"`, `gem "eqn"`, and `gem "google_search_results"` to your Gemfile
 
  ```ruby
- agent = Langchain::Agent::ChainOfThoughtAgent.new(llm: Langchain::LLM::OpenAI.new(api_key: ENV["OPENAI_API_KEY"]), tools: ['search', 'calculator'])
+ search_tool = Langchain::Tool::SerpApi.new(api_key: ENV["SERPAPI_API_KEY"])
+ calculator = Langchain::Tool::Calculator.new
+
+ openai = Langchain::LLM::OpenAI.new(api_key: ENV["OPENAI_API_KEY"])
+
+ agent = Langchain::Agent::ChainOfThoughtAgent.new(
+   llm: openai,
+   tools: [search_tool, calculator]
+ )
 
  agent.tools
  # => ["search", "calculator"]
@@ -271,11 +279,12 @@ agent.run(question: "How many full soccer fields would be needed to cover the di
  Add `gem "sequel"` to your Gemfile
 
  ```ruby
- agent = Langchain::Agent::SQLQueryAgent.new(llm: Langchain::LLM::OpenAI.new(api_key: ENV["OPENAI_API_KEY"]), db_connection_string: "postgres://user:password@localhost:5432/db_name")
+ database = Langchain::Tool::Database.new(connection_string: "postgres://user:password@localhost:5432/db_name")
 
+ agent = Langchain::Agent::SQLQueryAgent.new(llm: Langchain::LLM::OpenAI.new(api_key: ENV["OPENAI_API_KEY"]), db: database)
  ```
  ```ruby
- agent.ask(question: "How many users have a name with length greater than 5 in the users table?")
+ agent.run(question: "How many users have a name with length greater than 5 in the users table?")
  #=> "14 users have a name with length greater than 5 in the users table."
  ```
 
@@ -1,10 +1,10 @@
  require "langchain"
 
  # Create a prompt with a few shot examples
- prompt = Prompt::FewShotPromptTemplate.new(
+ prompt = Langchain::Prompt::FewShotPromptTemplate.new(
    prefix: "Write antonyms for the following words.",
    suffix: "Input: {adjective}\nOutput:",
-   example_prompt: Prompt::PromptTemplate.new(
+   example_prompt: Langchain::Prompt::PromptTemplate.new(
      input_variables: ["input", "output"],
      template: "Input: {input}\nOutput: {output}"
    ),
@@ -32,5 +32,5 @@ prompt.format(adjective: "good")
  prompt.save(file_path: "spec/fixtures/prompt/few_shot_prompt_template.json")
 
  # Loading a new prompt template using a JSON file
- prompt = Prompt.load_from_path(file_path: "spec/fixtures/prompt/few_shot_prompt_template.json")
+ prompt = Langchain::Prompt.load_from_path(file_path: "spec/fixtures/prompt/few_shot_prompt_template.json")
  prompt.prefix # "Write antonyms for the following words."
@@ -1,15 +1,15 @@
  require "langchain"
 
  # Create a prompt with one input variable
- prompt = Prompt::PromptTemplate.new(template: "Tell me a {adjective} joke.", input_variables: ["adjective"])
+ prompt = Langchain::Prompt::PromptTemplate.new(template: "Tell me a {adjective} joke.", input_variables: ["adjective"])
  prompt.format(adjective: "funny") # "Tell me a funny joke."
 
  # Create a prompt with multiple input variables
- prompt = Prompt::PromptTemplate.new(template: "Tell me a {adjective} joke about {content}.", input_variables: ["adjective", "content"])
+ prompt = Langchain::Prompt::PromptTemplate.new(template: "Tell me a {adjective} joke about {content}.", input_variables: ["adjective", "content"])
  prompt.format(adjective: "funny", content: "chickens") # "Tell me a funny joke about chickens."
 
  # Creating a PromptTemplate using just a prompt and no input_variables
- prompt = Prompt::PromptTemplate.from_template("Tell me a {adjective} joke about {content}.")
+ prompt = Langchain::Prompt::PromptTemplate.from_template("Tell me a {adjective} joke about {content}.")
  prompt.input_variables # ["adjective", "content"]
  prompt.format(adjective: "funny", content: "chickens") # "Tell me a funny joke about chickens."
 
@@ -17,5 +17,9 @@ prompt.format(adjective: "funny", content: "chickens") # "Tell me a funny joke a
  prompt.save(file_path: "spec/fixtures/prompt/prompt_template.json")
 
  # Loading a new prompt template using a JSON file
- prompt = Prompt.load_from_path(file_path: "spec/fixtures/prompt/prompt_template.json")
+ prompt = Langchain::Prompt.load_from_path(file_path: "spec/fixtures/prompt/prompt_template.json")
+ prompt.input_variables # ["adjective", "content"]
+
+ # Loading a new prompt template using a YAML file
+ prompt = Langchain::Prompt.load_from_path(file_path: "spec/fixtures/prompt/prompt_template.yaml")
  prompt.input_variables # ["adjective", "content"]
@@ -4,7 +4,7 @@ require "langchain"
  # or add `gem "chroma-db", "~> 0.3.0"` to your Gemfile
 
  # Instantiate the Chroma client
- chroma = Vectorsearch::Chroma.new(
+ chroma = Langchain::Vectorsearch::Chroma.new(
    url: ENV["CHROMA_URL"],
    index_name: "documents",
    llm: Langchain::LLM::OpenAI.new(api_key: ENV["OPENAI_API_KEY"])
@@ -4,7 +4,7 @@ require "langchain"
  # or add `gem "pinecone"` to your Gemfile
 
  # Instantiate the Pinecone client
- pinecone = Vectorsearch::Pinecone.new(
+ pinecone = Langchain::Vectorsearch::Pinecone.new(
    environment: ENV["PINECONE_ENVIRONMENT"],
    api_key: ENV["PINECONE_API_KEY"],
    index_name: "recipes",
@@ -37,7 +37,7 @@ pinecone.ask(
  )
 
  # Generate an embedding and search by it
- openai = LLM::OpenAI.new(api_key: ENV["OPENAI_API_KEY"])
+ openai = Langchain::LLM::OpenAI.new(api_key: ENV["OPENAI_API_KEY"])
  embedding = openai.embed(text: "veggie")
 
  pinecone.similarity_search_by_vector(
@@ -4,7 +4,7 @@ require "langchain"
  # or add `gem "qdrant-ruby"` to your Gemfile
 
  # Instantiate the Qdrant client
- qdrant = Vectorsearch::Qdrant.new(
+ qdrant = Langchain::Vectorsearch::Qdrant.new(
    url: ENV["QDRANT_URL"],
    api_key: ENV["QDRANT_API_KEY"],
    index_name: "recipes",
@@ -4,7 +4,7 @@ require "langchain"
  # or add `gem "weaviate-ruby"` to your Gemfile
 
  # Instantiate the Weaviate client
- weaviate = Vectorsearch::Weaviate.new(
+ weaviate = Langchain::Vectorsearch::Weaviate.new(
    url: ENV["WEAVIATE_URL"],
    api_key: ENV["WEAVIATE_API_KEY"],
    index_name: "Recipes",
@@ -39,11 +39,8 @@ module Langchain::Agent
 
  loop do
    Langchain.logger.info("[#{self.class.name}]".red + ": Sending the prompt to the #{llm.class} LLM")
-   response = llm.complete(
-     prompt: prompt,
-     stop_sequences: ["Observation:"],
-     max_tokens: 500
-   )
+
+   response = llm.complete(prompt: prompt, stop_sequences: ["Observation:"])
 
    # Append the response to the prompt
    prompt += response
@@ -55,10 +52,11 @@ module Langchain::Agent
    # Find the input to the action in the "Action Input: [action_input]" format
    action_input = response.match(/Action Input: "?(.*)"?/)&.send(:[], -1)
 
-   # Retrieve the Tool::[ToolName] class and call `execute` with action_input as the input
-   tool = Langchain::Tool.const_get(Langchain::Tool::Base::TOOLS[action.strip])
-   Langchain.logger.info("[#{self.class.name}]".red + ": Invoking \"#{tool}\" Tool with \"#{action_input}\"")
+   # Find the Tool and call `execute` with action_input as the input
+   tool = tools.find { |tool| tool.tool_name == action.strip }
+   Langchain.logger.info("[#{self.class.name}]".red + ": Invoking \"#{tool.class}\" Tool with \"#{action_input}\"")
 
+   # Call `execute` with action_input as the input
    result = tool.execute(input: action_input)
 
    # Append the Observation to the prompt
@@ -81,12 +79,16 @@ module Langchain::Agent
  # @param tools [Array] Tools to use
  # @return [String] Prompt
  def create_prompt(question:, tools:)
+   tool_list = tools.map(&:tool_name)
+
    prompt_template.format(
      date: Date.today.strftime("%B %d, %Y"),
      question: question,
-     tool_names: "[#{tools.join(", ")}]",
+     tool_names: "[#{tool_list.join(", ")}]",
      tools: tools.map do |tool|
-       "#{tool}: #{Langchain::Tool.const_get(Langchain::Tool::Base::TOOLS[tool]).const_get(:DESCRIPTION)}"
+       tool_name = tool.tool_name
+       tool_description = tool.class.const_get(:DESCRIPTION)
+       "#{tool_name}: #{tool_description}"
      end.join("\n")
    )
  end
@@ -4,26 +4,30 @@ module Langchain::Agent
  class SQLQueryAgent < Base
    attr_reader :llm, :db, :schema
 
+   #
    # Initializes the Agent
    #
    # @param llm [Object] The LLM client to use
-   # @param db_connection_string [String] Database connection info
-   def initialize(llm:, db_connection_string:)
+   # @param db [Object] Database connection info
+   #
+   def initialize(llm:, db:)
      @llm = llm
-     @db = Langchain::Tool::Database.new(db_connection_string)
+     @db = db
      @schema = @db.schema
    end
 
+   #
    # Ask a question and get an answer
    #
    # @param question [String] Question to ask the LLM/Database
    # @return [String] Answer to the question
-   def ask(question:)
+   #
+   def run(question:)
      prompt = create_prompt_for_sql(question: question)
 
      # Get the SQL string to execute
      Langchain.logger.info("[#{self.class.name}]".red + ": Passing the initial prompt to the #{llm.class} LLM")
-     sql_string = llm.complete(prompt: prompt, max_tokens: 500)
+     sql_string = llm.complete(prompt: prompt)
 
      # Execute the SQL string and collect the results
      Langchain.logger.info("[#{self.class.name}]".red + ": Passing the SQL to the Database: #{sql_string}")
@@ -32,7 +36,7 @@ module Langchain::Agent
      # Pass the results and get the LLM to synthesize the answer to the question
      Langchain.logger.info("[#{self.class.name}]".red + ": Passing the synthesize prompt to the #{llm.class} LLM with results: #{results}")
      prompt2 = create_prompt_for_answer(question: question, sql_query: sql_string, results: results)
-     llm.complete(prompt: prompt2, max_tokens: 500)
+     llm.complete(prompt: prompt2)
    end
 
    private
@@ -35,7 +35,7 @@ module Langchain::LLM
  def embed(text:, **params)
    parameters = {model: DEFAULTS[:embeddings_model_name], input: text}
 
-   Langchain::Utils::TokenLengthValidator.validate!(text, parameters[:model])
+   Langchain::Utils::TokenLengthValidator.validate_max_tokens!(text, parameters[:model])
 
    response = client.embeddings(parameters: parameters.merge(params))
    response.dig("data").first.dig("embedding")
@@ -50,9 +50,8 @@ module Langchain::LLM
  def complete(prompt:, **params)
    parameters = compose_parameters DEFAULTS[:completion_model_name], params
 
-   Langchain::Utils::TokenLengthValidator.validate!(prompt, parameters[:model])
-
    parameters[:prompt] = prompt
+   parameters[:max_tokens] = Langchain::Utils::TokenLengthValidator.validate_max_tokens!(prompt, parameters[:model])
 
    response = client.completions(parameters: parameters)
    response.dig("choices", 0, "text")
@@ -67,9 +66,8 @@ module Langchain::LLM
  def chat(prompt:, **params)
    parameters = compose_parameters DEFAULTS[:chat_completion_model_name], params
 
-   Langchain::Utils::TokenLengthValidator.validate!(prompt, parameters[:model])
-
    parameters[:messages] = [{role: "user", content: prompt}]
+   parameters[:max_tokens] = Langchain::Utils::TokenLengthValidator.validate_max_tokens!(prompt, parameters[:model])
 
    response = client.chat(parameters: parameters)
    response.dig("choices", 0, "message", "content")
@@ -87,12 +85,7 @@ module Langchain::LLM
    )
    prompt = prompt_template.format(text: text)
 
-   complete(
-     prompt: prompt,
-     temperature: DEFAULTS[:temperature],
-     # Most models have a context length of 2048 tokens (except for the newest models, which support 4096).
-     max_tokens: 2048
-   )
+   complete(prompt: prompt, temperature: DEFAULTS[:temperature])
  end
 
  private
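The net effect of these `complete`/`chat`/`summarize` hunks for callers: the hard-coded `max_tokens: 500` and `max_tokens: 2048` budgets are gone, and the validator fills in the remaining context window instead. A sketch of the resulting call-site behavior (prompt text is illustrative):

```ruby
llm = Langchain::LLM::OpenAI.new(api_key: ENV["OPENAI_API_KEY"])

# Pre-0.5.2 callers budgeted tokens themselves:
#   llm.complete(prompt: prompt, max_tokens: 500)
# Now max_tokens is set to (model token limit - prompt token length):
llm.complete(prompt: "Tell me a funny joke.")

# Note: as the hunk reads, parameters[:max_tokens] is assigned after the
# caller's params are merged in, so an explicit max_tokens: passed here
# would be overwritten by the auto-calculated value.
llm.chat(prompt: "Tell me a funny joke.", max_tokens: 10)
```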
@@ -6,47 +6,59 @@ module Langchain::Tool
 
  # How to add additional Tools?
  # 1. Create a new file in lib/tool/your_tool_name.rb
- # 2. Add your tool to the TOOLS hash below
- #    "your_tool_name" => "Tool::YourToolName"
- # 3. Implement `self.execute(input:)` method in your tool class
- # 4. Add your tool to the README.md
+ # 2. Create a class in the file that inherits from Langchain::Tool::Base
+ # 3. Add `NAME=` and `DESCRIPTION=` constants in your Tool class
+ # 4. Implement `execute(input:)` method in your tool class
+ # 5. Add your tool to the README.md
 
- TOOLS = {
-   "calculator" => "Langchain::Tool::Calculator",
-   "search" => "Langchain::Tool::SerpApi",
-   "wikipedia" => "Langchain::Tool::Wikipedia",
-   "database" => "Langchain::Tool::Database"
- }
+ #
+ # Returns the NAME constant of the tool
+ #
+ # @return [String] tool name
+ #
+ def tool_name
+   self.class.const_get(:NAME)
+ end
 
+ #
+ # Sets the DESCRIPTION constant of the tool
+ #
+ # @param value [String] tool description
+ #
  def self.description(value)
    const_set(:DESCRIPTION, value.tr("\n", " ").strip)
  end
 
+ #
  # Instantiates and executes the tool and returns the answer
+ #
  # @param input [String] input to the tool
  # @return [String] answer
+ #
  def self.execute(input:)
    new.execute(input: input)
  end
 
+ #
  # Executes the tool and returns the answer
+ #
  # @param input [String] input to the tool
  # @return [String] answer
+ #
  def execute(input:)
    raise NotImplementedError, "Your tool must implement the `#execute(input:)` method that returns a string"
  end
 
  #
- # Validates the list of strings (tools) are all supported or raises an error
- # @param tools [Array<String>] list of tools to be used
+ # Validates the list of tools or raises an error
+ # @param tools [Array<Langchain::Tool>] list of tools to be used
  #
  # @raise [ArgumentError] If any of the tools are not supported
  #
  def self.validate_tools!(tools:)
-   unrecognized_tools = tools - Langchain::Tool::Base::TOOLS.keys
-
-   if unrecognized_tools.any?
-     raise ArgumentError, "Unrecognized Tools: #{unrecognized_tools}"
+   # Check if the tool count is equal to the unique tool count
+   if tools.count != tools.map(&:tool_name).uniq.count
+     raise ArgumentError, "Either tools are not unique or are conflicting with each other"
    end
  end
  end
  end
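The rewritten how-to comment at the top of this hunk can be followed mechanically. A hypothetical tool written against the new base class — the class, NAME, and behavior below are illustrative, not part of the gem:

```ruby
module Langchain::Tool
  class RandomNumber < Base
    NAME = "random_number"

    description <<~DESC
      Useful for generating a random integer.

      The input to this tool should be the upper bound, e.g. "100".
    DESC

    # @param input [String] the upper bound for the random number
    # @return [String] the generated number, as a string for the agent loop
    def execute(input:)
      rand(1..input.to_i).to_s
    end
  end
end
```

`tool_name` then returns `"random_number"` via the NAME constant, which is what `ChainOfThoughtAgent` matches against the LLM's `Action:` output.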
@@ -8,9 +8,10 @@ module Langchain::Tool
  # Gem requirements:
  #   gem "eqn", "~> 1.6.5"
  #   gem "google_search_results", "~> 2.0.0"
- # ENV requirements: ENV["SERPAPI_API_KEY"]
  #
 
+ NAME = "calculator"
+
  description <<~DESC
    Useful for getting the result of a math expression.
 
@@ -33,8 +34,12 @@ module Langchain::Tool
  rescue Eqn::ParseError, Eqn::NoVariableValueError
    # Sometimes the input is not a pure math expression, e.g: "12F in Celsius"
    # We can use the google answer box to evaluate this expression
-   hash_results = Langchain::Tool::SerpApi.execute_search(input: input)
-   hash_results.dig(:answer_box, :to)
+   # TODO: Figure out a better way to evaluate these language expressions.
+   hash_results = Langchain::Tool::SerpApi
+     .new(api_key: ENV["SERPAPI_API_KEY"])
+     .execute_search(input: input)
+   hash_results.dig(:answer_box, :to) ||
+     hash_results.dig(:answer_box, :result)
  end
  end
  end
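A quick sketch of how the reworked fallback might behave (assuming `SERPAPI_API_KEY` is set; results depend on the eqn gem and Google's answer box):

```ruby
calculator = Langchain::Tool::Calculator.new
calculator.execute(input: "2 ** 10") # evaluated locally by the eqn gem

# A non-arithmetic input such as "12F in Celsius" raises Eqn::ParseError
# internally and falls through to the SerpApi answer box, which is now
# checked for both the :to and :result keys.
calculator.execute(input: "12F in Celsius")
```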
@@ -6,40 +6,55 @@ module Langchain::Tool
  # Gem requirements: gem "sequel", "~> 5.68.0"
  #
 
+ NAME = "database"
+
  description <<~DESC
    Useful for getting the result of a database query.
 
    The input to this tool should be valid SQL.
  DESC
 
+ attr_reader :db
+
+ #
  # Establish a database connection
- # @param db_connection_string [String] Database connection info, e.g. 'postgres://user:password@localhost:5432/db_name'
- def initialize(db_connection_string)
+ #
+ # @param connection_string [String] Database connection info, e.g. 'postgres://user:password@localhost:5432/db_name'
+ # @return [Database] Database object
+ #
+ def initialize(connection_string:)
    depends_on "sequel"
    require "sequel"
    require "sequel/extensions/schema_dumper"
 
-   raise StandardError, "db_connection_string parameter cannot be blank" if db_connection_string.empty?
+   raise StandardError, "connection_string parameter cannot be blank" if connection_string.empty?
 
-   @db = Sequel.connect(db_connection_string)
+   @db = Sequel.connect(connection_string)
    @db.extension :schema_dumper
  end
 
+ #
+ # Returns the database schema
+ #
+ # @return [String] schema
+ #
  def schema
    Langchain.logger.info("[#{self.class.name}]".light_blue + ": Dumping schema")
-   @db.dump_schema_migration(same_db: true, indexes: false) unless @db.adapter_scheme == :mock
+   db.dump_schema_migration(same_db: true, indexes: false) unless db.adapter_scheme == :mock
  end
 
+ #
  # Evaluates a sql expression
+ #
  # @param input [String] sql expression
  # @return [Array] results
+ #
  def execute(input:)
    Langchain.logger.info("[#{self.class.name}]".light_blue + ": Executing \"#{input}\"")
-   begin
-     @db[input].to_a
-   rescue Sequel::DatabaseError => e
-     Langchain.logger.error("[#{self.class.name}]".light_red + ": #{e.message}")
-   end
+
+   db[input].to_a
+ rescue Sequel::DatabaseError => e
+   Langchain.logger.error("[#{self.class.name}]".light_red + ": #{e.message}")
  end
  end
  end
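The keyword-argument constructor now matches the README change earlier in this diff. A usage sketch (the connection string is a placeholder):

```ruby
database = Langchain::Tool::Database.new(
  connection_string: "postgres://user:password@localhost:5432/db_name"
)

database.schema # dumped via Sequel's schema_dumper extension
database.execute(input: "SELECT COUNT(*) FROM users;")

# Note the restructured rescue: Sequel::DatabaseError is now caught at the
# method level and logged, so a bad query no longer needs the inner
# begin/end block and does not abort the agent loop.
```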
@@ -7,7 +7,7 @@ module Langchain::Tool
  #
  # Gem requirements: gem "safe_ruby", "~> 1.0.4"
  #
-
+ NAME = "ruby_code_interpreter"
  description <<~DESC
    A Ruby code interpreter. Use this to execute ruby expressions. Input should be a valid ruby expression. If you want to see the output of the tool, make sure to return a value.
  DESC
@@ -6,8 +6,13 @@ module Langchain::Tool
  # Wrapper around SerpAPI
  #
  # Gem requirements: gem "google_search_results", "~> 2.0.0"
- # ENV requirements: ENV["SERPAPI_API_KEY"] # https://serpapi.com/manage-api-key)
  #
+ # Usage:
+ #   search = Langchain::Tool::SerpApi.new(api_key: "YOUR_API_KEY")
+ #   search.execute(input: "What is the capital of France?")
+ #
+
+ NAME = "search"
 
  description <<~DESC
    A wrapper around Google Search.
@@ -18,39 +23,57 @@ module Langchain::Tool
    Input should be a search query.
  DESC
 
- def initialize
+ attr_reader :api_key
+
+ #
+ # Initializes the SerpAPI tool
+ #
+ # @param api_key [String] SerpAPI API key
+ # @return [Langchain::Tool::SerpApi] SerpAPI tool
+ #
+ def initialize(api_key:)
    depends_on "google_search_results"
    require "google_search_results"
+   @api_key = api_key
  end
 
+ #
  # Executes Google Search and returns hash_results JSON
+ #
  # @param input [String] search query
  # @return [Hash] hash_results JSON
-
+ #
  def self.execute_search(input:)
    new.execute_search(input: input)
  end
 
- # Executes Google Search and returns hash_results JSON
+ #
+ # Executes Google Search and returns the result
+ #
  # @param input [String] search query
  # @return [String] Answer
- # TODO: Glance at all of the fields that langchain Python looks through: https://github.com/hwchase17/langchain/blob/v0.0.166/langchain/utilities/serpapi.py#L128-L156
- # We may need to do the same thing here.
+ #
  def execute(input:)
    Langchain.logger.info("[#{self.class.name}]".light_blue + ": Executing \"#{input}\"")
 
    hash_results = execute_search(input: input)
 
+   # TODO: Glance at all of the fields that langchain Python looks through: https://github.com/hwchase17/langchain/blob/v0.0.166/langchain/utilities/serpapi.py#L128-L156
+   # We may need to do the same thing here.
    hash_results.dig(:answer_box, :answer) ||
      hash_results.dig(:answer_box, :snippet) ||
      hash_results.dig(:organic_results, 0, :snippet)
  end
 
+ #
+ # Executes Google Search and returns hash_results JSON
+ #
+ # @param input [String] search query
+ # @return [Hash] hash_results JSON
+ #
  def execute_search(input:)
-   GoogleSearch.new(
-     q: input,
-     serp_api_key: ENV["SERPAPI_API_KEY"]
-   )
+   GoogleSearch
+     .new(q: input, serp_api_key: api_key)
      .get_hash
  end
  end
@@ -7,7 +7,7 @@ module Langchain::Tool
  #
  # Gem requirements: gem "wikipedia-client", "~> 1.17.0"
  #
-
+ NAME = "wikipedia"
  description <<~DESC
    A wrapper around Wikipedia.
 
@@ -34,23 +34,50 @@ module Langchain
    "ada" => 2049
  }.freeze
 
+ # GOOGLE_PALM_TOKEN_LIMITS = {
+ #   "chat-bison-001" => {
+ #     "inputTokenLimit" => 4096,
+ #     "outputTokenLimit" => 1024
+ #   },
+ #   "text-bison-001" => {
+ #     "inputTokenLimit" => 8196,
+ #     "outputTokenLimit" => 1024
+ #   },
+ #   "embedding-gecko-001" => {
+ #     "inputTokenLimit" => 1024
+ #   }
+ # }.freeze
+
  #
- # Validate the length of the text passed in to OpenAI's API
+ # Calculate the `max_tokens:` parameter to be set: the model's token limit minus the token length of the text
  #
  # @param text [String] The text to validate
  # @param model_name [String] The model name to validate against
- # @return [Boolean] Whether the text is valid or not
+ # @return [Integer] The calculated max_tokens value
  # @raise [TokenLimitExceeded] If the text is too long
  #
- def self.validate!(text, model_name)
-   encoder = Tiktoken.encoding_for_model(model_name)
-   token_length = encoder.encode(text).length
+ def self.validate_max_tokens!(text, model_name)
+   text_token_length = token_length(text, model_name)
+   max_tokens = TOKEN_LIMITS[model_name] - text_token_length
 
-   if token_length > TOKEN_LIMITS[model_name]
-     raise TokenLimitExceeded, "This model's maximum context length is #{TOKEN_LIMITS[model_name]} tokens, but the given text is #{token_length} tokens long."
+   # Raise an error even if the whole prompt is exactly equal to the model's token limit (max_tokens == 0), since no response could be returned
+   if max_tokens <= 0
+     raise TokenLimitExceeded, "This model's maximum context length is #{TOKEN_LIMITS[model_name]} tokens, but the given text is #{text_token_length} tokens long."
    end
 
-   true
+   max_tokens
+ end
+
+ #
+ # Calculate token length for a given text and model name
+ #
+ # @param text [String] The text to validate
+ # @param model_name [String] The model name to validate against
+ # @return [Integer] The token length of the text
+ #
+ def self.token_length(text, model_name)
+   encoder = Tiktoken.encoding_for_model(model_name)
+   encoder.encode(text).length
  end
  end
  end
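A sketch of the renamed validator in isolation; the token counts in the comments are illustrative:

```ruby
prompt = "Write antonyms for the following words."

max_tokens = Langchain::Utils::TokenLengthValidator.validate_max_tokens!(
  prompt, "text-davinci-003"
)
# => the model's TOKEN_LIMITS entry minus the prompt's token length,
#    e.g. 4097 - 8 = 4089

# A prompt at or over the model's limit raises TokenLimitExceeded, since
# max_tokens <= 0 leaves no room for a response.
```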
@@ -1,5 +1,5 @@
  # frozen_string_literal: true
 
  module Langchain
-   VERSION = "0.5.0"
+   VERSION = "0.5.2"
  end
metadata CHANGED
@@ -1,14 +1,14 @@
  --- !ruby/object:Gem::Specification
  name: langchainrb
  version: !ruby/object:Gem::Version
-   version: 0.5.0
+   version: 0.5.2
  platform: ruby
  authors:
  - Andrei Bondarev
  autorequire:
  bindir: exe
  cert_chain: []
- date: 2023-06-05 00:00:00.000000000 Z
+ date: 2023-06-08 00:00:00.000000000 Z
  dependencies:
  - !ruby/object:Gem::Dependency
    name: tiktoken_ruby