RubyGems - langchainrb - Versions diffs - 0.3.13 → 0.3.14 - Mend

langchainrb 0.3.13 → 0.3.14

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18)

checksums.yaml +4 -4
data/CHANGELOG.md +9 -0
data/Gemfile.lock +1 -1
data/README.md +1 -0
data/lib/langchain/data.rb +16 -0
data/lib/langchain/loader.rb +4 -3
data/lib/langchain.rb +1 -0
data/lib/llm/base.rb +5 -0
data/lib/llm/cohere.rb +17 -0
data/lib/llm/google_palm.rb +20 -0
data/lib/llm/hugging_face.rb +4 -0
data/lib/llm/openai.rb +29 -0
data/lib/llm/prompts/summarize_template.json +5 -0
data/lib/llm/replicate.rb +29 -0
data/lib/vectorsearch/base.rb +1 -1
data/lib/vectorsearch/weaviate.rb +13 -36
data/lib/version.rb +1 -1
metadata +4 -2

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: 2ee811b2bac8fadea4d90c4212363a901829a4aac219da0f2a2dcbe7c6f59c5b
-  data.tar.gz: 8fa32e6df4aaf69cb6d29977913c1b8a30d6f65b777b1f90c8a7f504d869ca8f
+  metadata.gz: 33c9436ac8d6a73dc06d30f63c11e4f246b3705aa8934765a53ee59325c3a9cd
+  data.tar.gz: 9cc85603694f9367dd162e25379029a345aa0b5c88cccf303c2af114d43a4010
 SHA512:
-  metadata.gz: cbb7e0c975333248c01082a47f7096fb9d6807c3b7619424eb9348238008d7b4257518287d9358114bf4e3a589349520ebf71ace00bf1fe8906afd27e8b1418a
-  data.tar.gz: 759444abe0b17518c6ef31fed6980f6bc0d3d096606860c4d6fddb8baeda4e0a23fc3909e42eba0f32912a786abec76cac54384533db2787e05d741f0907fa1d
+  metadata.gz: ca5e81638625939d11999a64d44c92fc57c762a934aa8fd5b110c3f5aacc9a736ab5f02da4366e7a1b9b9ec0335dd1eb1683f5b9d90bd97c81914ea0a698dc7c
+  data.tar.gz: aff49ef9451bcbc9a97d181757a5b913737cbfbb4fc3ca49d423cbd2e59a4a71091816e98c2996ff7f8292cb6e0c0d69931a4f3e4e36e2a69fdd7f745640e266

data/CHANGELOG.md CHANGED Viewed

@@ -1,5 +1,14 @@
 ## [Unreleased]
+## [0.3.14] - 2023-05-28
+- 🔍 Vectorsearch
+  - Not relying on Weaviate modules anymore
+  - Adding missing specs for Qdrant and Milvus classes
+- 🚚 Loaders
+  - Add Langchain::Data result object for data loaders
+- 🗣️ LLMs
+  - Add `summarize()` method to the LLMs
 ## [0.3.13] - 2023-05-26
 - 🔍 Vectorsearch
   - Pgvector support

data/Gemfile.lock CHANGED Viewed

@@ -1,7 +1,7 @@
 PATH
   remote: .
   specs:
-    langchainrb (0.3.13)
+    langchainrb (0.3.14)
 GEM
   remote: https://rubygems.org/

data/README.md CHANGED Viewed

@@ -321,6 +321,7 @@ Langchain.logger.level = :info
 [<img style="border-radius:50%" alt="Andrei Bondarev" src="https://avatars.githubusercontent.com/u/541665?v=4" width="80" height="80" class="avatar">](https://github.com/andreibondarev)
 [<img style="border-radius:50%" alt="Rafael Figueiredo" src="https://avatars.githubusercontent.com/u/35845775?v=4" width="80" height="80" class="avatar">](https://github.com/rafaelqfigueiredo)
 [<img style="border-radius:50%" alt="Ricky Chilcott" src="https://avatars.githubusercontent.com/u/445759?v=4" width="80" height="80" class="avatar">](https://github.com/rickychilcott)
+[<img style="border-radius:50%" alt="Alex Chaplinsky" src="https://avatars.githubusercontent.com/u/695947?v=4" width="80" height="80" class="avatar">](https://github.com/alchaplinsky)
 (Criteria for becoming an Honorary Contributor or Core Contributor is pending...)

data/lib/langchain/data.rb ADDED Viewed

@@ -0,0 +1,16 @@
+# frozen_string_literal: true
+module Langchain
+  class Data
+    attr_reader :source
+    def initialize(data, options = {})
+      @source = options[:source]
+      @data = data
+    end
+    def value
+      @data
+    end
+  end
+end

data/lib/langchain/loader.rb CHANGED Viewed

@@ -58,11 +58,12 @@ module Langchain
     end
     def process(&block)
-      data, processor = yield
+      raw_data, kind = yield
-      raise UnknownFormatError unless processor
+      raise UnknownFormatError unless kind
-      Langchain::Processors.const_get(processor).new.parse(data)
+      processor = Langchain::Processors.const_get(kind).new
+      Langchain::Data.new(processor.parse(raw_data), source: @path)
     end
     def find_processor(constant, value)

data/lib/langchain.rb CHANGED Viewed

@@ -17,6 +17,7 @@ module Langchain
   @root = Pathname.new(__dir__)
   autoload :Loader, "langchain/loader"
+  autoload :Data, "langchain/data"
   module Processors
     autoload :Base, "langchain/processors/base"

data/lib/llm/base.rb CHANGED Viewed

@@ -33,6 +33,11 @@ module LLM
       raise NotImplementedError, "#{self.class.name} does not support generating embeddings"
     end
+    # Method supported by an LLM that summarizes a given text
+    def summarize(...)
+      raise NotImplementedError, "#{self.class.name} does not support summarization"
+    end
     # Ensure that the LLM value passed in is supported
     # @param llm [Symbol] The LLM to use
     def self.validate_llm!(llm:)

data/lib/llm/cohere.rb CHANGED Viewed

@@ -16,9 +16,12 @@ module LLM
       @client = ::Cohere::Client.new(api_key: api_key)
     end
+    #
     # Generate an embedding for a given text
+    #
     # @param text [String] The text to generate an embedding for
     # @return [Hash] The embedding
+    #
     def embed(text:)
       response = client.embed(
         texts: [text],
@@ -27,9 +30,12 @@ module LLM
       response.dig("embeddings").first
     end
+    #
     # Generate a completion for a given prompt
+    #
     # @param prompt [String] The prompt to generate a completion for
     # @return [Hash] The completion
+    #
     def complete(prompt:, **params)
       default_params = {
         prompt: prompt,
@@ -51,5 +57,16 @@ module LLM
     def chat(...)
       complete(...)
     end
+    # Generate a summary in English for a given text
+    #
+    # More parameters available to extend this method with: https://github.com/andreibondarev/cohere-ruby/blob/0.9.4/lib/cohere/client.rb#L107-L115
+    #
+    # @param text [String] The text to generate a summary for
+    # @return [String] The summary
+    def summarize(text:)
+      response = client.summarize(text: text)
+      response.dig("summary")
+    end
   end
 end

data/lib/llm/google_palm.rb CHANGED Viewed

@@ -81,5 +81,25 @@ module LLM
       response = client.generate_chat_message(**default_params)
       response.dig("candidates", 0, "content")
     end
+    #
+    # Generate a summarization for a given text
+    #
+    # @param text [String] The text to generate a summarization for
+    # @return [String] The summarization
+    #
+    def summarize(text:)
+      prompt_template = Prompt.load_from_path(
+        file_path: Langchain.root.join("llm/prompts/summarize_template.json")
+      )
+      prompt = prompt_template.format(text: text)
+      complete(
+        prompt: prompt,
+        temperature: DEFAULTS[:temperature],
+        # Most models have a context length of 2048 tokens (except for the newest models, which support 4096).
+        max_tokens: 2048
+      )
+    end
   end
 end

data/lib/llm/hugging_face.rb CHANGED Viewed

@@ -12,6 +12,7 @@ module LLM
     #
     # Initialize the HuggingFace LLM
+    #
     # @param api_key [String] The API key to use
     #
     def initialize(api_key:)
@@ -21,9 +22,12 @@ module LLM
       @client = ::HuggingFace::InferenceApi.new(api_token: api_key)
     end
+    #
     # Generate an embedding for a given text
+    #
     # @param text [String] The text to embed
     # @return [Array] The embedding
+    #
     def embed(text:)
       client.embedding(
         input: text,

data/lib/llm/openai.rb CHANGED Viewed

@@ -18,9 +18,12 @@ module LLM
       @client = ::OpenAI::Client.new(access_token: api_key)
     end
+    #
     # Generate an embedding for a given text
+    #
     # @param text [String] The text to generate an embedding for
     # @return [Array] The embedding
+    #
     def embed(text:)
       response = client.embeddings(
         parameters: {
@@ -31,9 +34,12 @@ module LLM
       response.dig("data").first.dig("embedding")
     end
+    #
     # Generate a completion for a given prompt
+    #
     # @param prompt [String] The prompt to generate a completion for
     # @return [String] The completion
+    #
     def complete(prompt:, **params)
       default_params = {
         model: DEFAULTS[:completion_model_name],
@@ -51,9 +57,12 @@ module LLM
       response.dig("choices", 0, "text")
     end
+    #
     # Generate a chat completion for a given prompt
+    #
     # @param prompt [String] The prompt to generate a chat completion for
     # @return [String] The chat completion
+    #
     def chat(prompt:, **params)
       default_params = {
         model: DEFAULTS[:chat_completion_model_name],
@@ -71,5 +80,25 @@ module LLM
       response = client.chat(parameters: default_params)
       response.dig("choices", 0, "message", "content")
     end
+    #
+    # Generate a summary for a given text
+    #
+    # @param text [String] The text to generate a summary for
+    # @return [String] The summary
+    #
+    def summarize(text:)
+      prompt_template = Prompt.load_from_path(
+        file_path: Langchain.root.join("llm/prompts/summarize_template.json")
+      )
+      prompt = prompt_template.format(text: text)
+      complete(
+        prompt: prompt,
+        temperature: DEFAULTS[:temperature],
+        # Most models have a context length of 2048 tokens (except for the newest models, which support 4096).
+        max_tokens: 2048
+      )
+    end
   end
 end

data/lib/llm/prompts/summarize_template.json ADDED Viewed

@@ -0,0 +1,5 @@
+{
+  "_type": "prompt",
+  "input_variables": ["text"],
+  "template": "Write a concise summary of the following:\n\n{text}\n\nCONCISE SUMMARY:"
+}

data/lib/llm/replicate.rb CHANGED Viewed

@@ -23,8 +23,11 @@ module LLM
       dimension: 384
     }.freeze
+    #
     # Initialize the Replicate LLM
+    #
     # @param api_key [String] The API key to use
+    #
     def initialize(api_key:)
       depends_on "replicate-ruby"
       require "replicate"
@@ -36,9 +39,12 @@ module LLM
       @client = ::Replicate.client
     end
+    #
     # Generate an embedding for a given text
+    #
     # @param text [String] The text to generate an embedding for
     # @return [Hash] The embedding
+    #
     def embed(text:)
       response = embeddings_model.predict(input: text)
@@ -50,9 +56,12 @@ module LLM
       response.output
     end
+    #
     # Generate a completion for a given prompt
+    #
     # @param prompt [String] The prompt to generate a completion for
     # @return [Hash] The completion
+    #
     def complete(prompt:, **params)
       response = completion_model.predict(prompt: prompt)
@@ -73,6 +82,26 @@ module LLM
       complete(...)
     end
+    #
+    # Generate a summary for a given text
+    #
+    # @param text [String] The text to generate a summary for
+    # @return [String] The summary
+    #
+    def summarize(text:)
+      prompt_template = Prompt.load_from_path(
+        file_path: Langchain.root.join("llm/prompts/summarize_template.json")
+      )
+      prompt = prompt_template.format(text: text)
+      complete(
+        prompt: prompt,
+        temperature: DEFAULTS[:temperature],
+        # Most models have a context length of 2048 tokens (except for the newest models, which support 4096).
+        max_tokens: 2048
+      )
+    end
     alias_method :generate_embedding, :embed
     private

data/lib/vectorsearch/base.rb CHANGED Viewed

@@ -74,7 +74,7 @@ module Vectorsearch
       texts = Array(path || paths)
         .flatten
-        .map { |path| Langchain::Loader.new(path)&.load }
+        .map { |path| Langchain::Loader.new(path)&.load&.value }
         .compact
       add_texts(texts: texts)

data/lib/vectorsearch/weaviate.rb CHANGED Viewed

@@ -14,9 +14,7 @@ module Vectorsearch
       @client = ::Weaviate::Client.new(
         url: url,
-        api_key: api_key,
-        model_service: llm,
-        model_service_api_key: llm_api_key
+        api_key: api_key
       )
       @index_name = index_name
@@ -30,7 +28,8 @@ module Vectorsearch
       objects = Array(texts).map do |text|
         {
           class: index_name,
-          properties: {content: text}
+          properties: {content: text},
+          vector: llm_client.embed(text: text)
         }
       end
@@ -43,11 +42,7 @@ module Vectorsearch
     def create_default_schema
       client.schema.create(
         class_name: index_name,
-        vectorizer: "text2vec-#{llm}",
-        # TODO: Figure out a way to optionally enable it
-        # "module_config": {
-        #   "qna-openai": {}
-        # },
+        vectorizer: "none",
         properties: [
           # TODO: Allow passing in your own IDs
           {
@@ -63,14 +58,9 @@ module Vectorsearch
     # @param k [Integer|String] The number of results to return
     # @return [Hash] The search results
     def similarity_search(query:, k: 4)
-      near_text = "{ concepts: [\"#{query}\"] }"
+      embedding = llm_client.embed(text: query)
-      client.query.get(
-        class_name: index_name,
-        near_text: near_text,
-        limit: k.to_s,
-        fields: "content _additional { id }"
-      )
+      similarity_search_by_vector(embedding: embedding, k: k)
     end
     # Return documents similar to the vector
@@ -92,29 +82,16 @@ module Vectorsearch
     # @param question [String] The question to ask
     # @return [Hash] The answer
     def ask(question:)
-      # Weaviate currently supports the `ask:` parameter only for the OpenAI LLM (with `qna-openai` module enabled).
-      # The Cohere support is on the way: https://github.com/weaviate/weaviate/pull/2600
-      if llm == :openai
-        ask_object = "{ question: \"#{question}\" }"
-        client.query.get(
-          class_name: index_name,
-          ask: ask_object,
-          limit: "1",
-          fields: "_additional { answer { result } }"
-        )
-      elsif llm == :cohere
-        search_results = similarity_search(query: question)
+      search_results = similarity_search(query: question)
-        context = search_results.map do |result|
-          result.dig("content").to_s
-        end
-        context = context.join("\n---\n")
+      context = search_results.map do |result|
+        result.dig("content").to_s
+      end
+      context = context.join("\n---\n")
-        prompt = generate_prompt(question: question, context: context)
+      prompt = generate_prompt(question: question, context: context)
-        llm_client.chat(prompt: prompt)
-      end
+      llm_client.chat(prompt: prompt)
     end
   end
 end

data/lib/version.rb CHANGED Viewed

@@ -1,5 +1,5 @@
 # frozen_string_literal: true
 module Langchain
-  VERSION = "0.3.13"
+  VERSION = "0.3.14"
 end

metadata CHANGED Viewed

@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: langchainrb
 version: !ruby/object:Gem::Version
-  version: 0.3.13
+  version: 0.3.14
 platform: ruby
 authors:
 - Andrei Bondarev
 autorequire:
 bindir: exe
 cert_chain: []
-date: 2023-05-26 00:00:00.000000000 Z
+date: 2023-05-28 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: dotenv-rails
@@ -316,6 +316,7 @@ files:
 - lib/agent/chain_of_thought_agent/chain_of_thought_agent_prompt.json
 - lib/dependency_helper.rb
 - lib/langchain.rb
+- lib/langchain/data.rb
 - lib/langchain/loader.rb
 - lib/langchain/processors/base.rb
 - lib/langchain/processors/csv.rb
@@ -331,6 +332,7 @@ files:
 - lib/llm/google_palm.rb
 - lib/llm/hugging_face.rb
 - lib/llm/openai.rb
+- lib/llm/prompts/summarize_template.json
 - lib/llm/replicate.rb
 - lib/prompt/base.rb
 - lib/prompt/few_shot_prompt_template.rb