RubyGems - ollama-ruby - Versions diffs - 0.3.2 → 0.5.0 - Mend

ollama-ruby 0.3.2 → 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (26)

checksums.yaml +4 -4
data/CHANGES.md +131 -0
data/README.md +21 -16
data/Rakefile +6 -1
data/bin/ollama_chat +303 -168
data/bin/ollama_cli +11 -9
data/lib/ollama/documents/cache/common.rb +17 -0
data/lib/ollama/documents/{memory_cache.rb → cache/memory_cache.rb} +8 -10
data/lib/ollama/documents/cache/redis_backed_memory_cache.rb +38 -0
data/lib/ollama/documents/{redis_cache.rb → cache/redis_cache.rb} +18 -11
data/lib/ollama/documents/splitters/character.rb +8 -6
data/lib/ollama/documents/splitters/semantic.rb +1 -1
data/lib/ollama/documents.rb +25 -19
data/lib/ollama/utils/colorize_texts.rb +21 -1
data/lib/ollama/utils/fetcher.rb +43 -10
data/lib/ollama/utils/file_argument.rb +20 -4
data/lib/ollama/utils/tags.rb +1 -0
data/lib/ollama/version.rb +1 -1
data/lib/ollama.rb +1 -0
data/ollama-ruby.gemspec +11 -7
data/spec/ollama/documents/memory_cache_spec.rb +16 -16
data/spec/ollama/documents/redis_backed_memory_cache_spec.rb +106 -0
data/spec/ollama/documents/redis_cache_spec.rb +36 -16
data/spec/ollama/documents/splitters/character_spec.rb +28 -14
data/spec/ollama/utils/fetcher_spec.rb +42 -1
metadata +70 -8

data/bin/ollama_chat CHANGED

@@ -5,6 +5,8 @@ include Ollama
 require 'term/ansicolor'
 include Term::ANSIColor
 require 'tins'
+require 'tins/xt/full'
+require 'tins/xt/hash_union'
 include Tins::GO
 require 'reline'
 require 'reverse_markdown'
@@ -14,6 +16,7 @@ require 'uri'
 require 'nokogiri'
 require 'rss'
 require 'pdf/reader'
+require 'csv'
 class OllamaChatConfig
   include ComplexConfig
@@ -22,16 +25,23 @@ class OllamaChatConfig
   DEFAULT_CONFIG = <<~EOT
     ---
     url: <%= ENV['OLLAMA_URL'] || 'http://%s' % ENV.fetch('OLLAMA_HOST') %>
+    proxy: null # http://localhost:8080
     model:
       name: <%= ENV.fetch('OLLAMA_CHAT_MODEL', 'llama3.1') %>
       options:
         num_ctx: 8192
     prompts:
       system: <%= ENV.fetch('OLLAMA_CHAT_SYSTEM', 'null') %>
+      embed: "This source was now embedded: %{source}"
       summarize: |
-        Generate an abstract summary of the content in this document:
+        Generate an abstract summary of the content in this document using
+        %{words} words:
-        %s
+        %{source_content}
+      web: |
+        Answer the the query %{query} using these sources and summaries:
+        %{results}
     voice: Samantha
     markdown: true
     embedding:
@@ -41,16 +51,20 @@ class OllamaChatConfig
         options: {}
         # Retrieval prompt template:
         prompt: 'Represent this sentence for searching relevant passages: %s'
-      collection: <%= ENV.fetch('OLLAMA_CHAT_COLLECTION', 'ollama_chat') %>
+      collection: <%= ENV['OLLAMA_CHAT_COLLECTION'] %>
       found_texts_size: 4096
       found_texts_count: null
       splitter:
         name: RecursiveCharacter
         chunk_size: 1024
-    cache: Ollama::Documents::RedisCache
+    cache: Ollama::Documents::Cache::RedisBackedMemoryCache
     redis:
-      url: <%= ENV.fetch('REDIS_URL', 'null') %>
+      documents:
+        url: <%= ENV.fetch('REDIS_URL', 'null') %>
+      expiring:
+        url: <%= ENV.fetch('REDIS_EXPIRING_URL', 'null') %>
     debug: <%= ENV['OLLAMA_CHAT_DEBUG'].to_i == 1 ? true : false %>
+    ssl_no_verify: []
   EOT
   def initialize(filename = nil)
@@ -111,8 +125,8 @@ class FollowChat
       end
       content = response.message&.content
       @messages.last.content << content
-      if @markdown and @messages.last.content.present?
-        markdown_content = Utils::ANSIMarkdown.parse(@messages.last.content)
+      if @markdown and content = @messages.last.content.full?
+        markdown_content = Utils::ANSIMarkdown.parse(content)
         @output.print clear_screen, move_home, @user, ?\n, markdown_content
       else
         @output.print content
@@ -130,11 +144,11 @@ class FollowChat
     prompt_eval_duration = response.prompt_eval_duration / 1e9
     stats_text = {
       eval_duration:        Tins::Duration.new(eval_duration),
-      eval_count:           response.eval_count,
-      eval_rate:            bold { "%.2f c/s" % (response.eval_count / eval_duration) } + color(111),
+      eval_count:           response.eval_count.to_i,
+      eval_rate:            bold { "%.2f c/s" % (response.eval_count.to_i / eval_duration) } + color(111),
       prompt_eval_duration: Tins::Duration.new(prompt_eval_duration),
-      prompt_eval_count:    response.prompt_eval_count,
-      prompt_eval_rate:     bold { "%.2f c/s" % (response.prompt_eval_count / prompt_eval_duration) } + color(111),
+      prompt_eval_count:    response.prompt_eval_count.to_i,
+      prompt_eval_rate:     bold { "%.2f c/s" % (response.prompt_eval_count.to_i / prompt_eval_duration) } + color(111),
       total_duration:       Tins::Duration.new(response.total_duration / 1e9),
       load_duration:        Tins::Duration.new(response.load_duration / 1e9),
     }.map { _1 * '=' } * ' '
@@ -149,7 +163,7 @@ def search_web(query, n = nil)
   n < 1 and n = 1
   query = URI.encode_uri_component(query)
   url = "https://www.duckduckgo.com/html/?q=#{query}"
-  Ollama::Utils::Fetcher.new.get(url) do |tmp|
+  Ollama::Utils::Fetcher.new(debug: $config.debug).get(url) do |tmp|
     result = []
     doc = Nokogiri::HTML(tmp)
     doc.css('.results_links').each do |link|
@@ -216,32 +230,25 @@ def save_conversation(filename, messages)
 end
 def message_type(images)
-  if images.present?
-    ?📸
-  else
-    ?📨
-  end
+  images.present? ? ?📸 : ?📨
 end
-def list_conversation(messages, markdown)
-  messages.each do |m|
+def list_conversation(messages, last = nil)
+  last = (last || messages.size).clamp(0, messages.size)
+  messages[-last..-1].to_a.each do |m|
     role_color = case m.role
                  when 'user' then 172
                  when 'assistant' then 111
                  when 'system' then 213
                  else 210
                  end
-    content = if markdown && m.content.present?
-                Utils::ANSIMarkdown.parse(m.content)
-              else
-                m.content
-              end
+    content = m.content.full? { $markdown ? Utils::ANSIMarkdown.parse(_1) : _1 }
     message_text = message_type(m.images) + " "
     message_text += bold { color(role_color) { m.role } }
     message_text += ":\n#{content}"
-    if m.images.present?
-      message_text += "\nImages: " + italic { m.images.map(&:path) * ', ' }
-    end
+    m.images.full? { |images|
+      message_text += "\nImages: " + italic { images.map(&:path) * ', ' }
+    }
     puts message_text
   end
 end
@@ -257,37 +264,37 @@ end
 def parse_rss(source_io)
   feed = RSS::Parser.parse(source_io, false, false)
-  title = <<~end
+  title = <<~EOT
     # #{feed&.channel&.title}
-  end
+  EOT
   feed.items.inject(title) do |text, item|
-    text << <<~end
+    text << <<~EOT
       ## [#{item&.title}](#{item&.link})
       updated on #{item&.pubDate}
       #{reverse_markdown(item&.description)}
-    end
+    EOT
   end
 end
 def parse_atom(source_io)
   feed = RSS::Parser.parse(source_io, false, false)
-  title = <<~end
+  title = <<~EOT
     # #{feed.title.content}
-  end
+  EOT
   feed.items.inject(title) do |text, item|
-    text << <<~end
+    text << <<~EOT
       ## [#{item&.title&.content}](#{item&.link&.href})
       updated on #{item&.updated&.content}
       #{reverse_markdown(item&.content&.content)}
-    end
+    EOT
   end
 end
@@ -302,6 +309,16 @@ def parse_source(source_io)
     end
     source_io.rewind
     source_io.read
+  when 'text/csv'
+    result = +''
+    CSV.table(File.new(source_io), col_sep: ?,).each do |row|
+      next if row.fields.select(&:present?).size == 0
+      result << row.map { |pair|
+        pair.compact.map { _1.to_s.strip } * ': ' if pair.last.present?
+      }.select(&:present?).map { _1.prepend('  ') } * ?\n
+      result << "\n\n"
+    end
+    result
   when %r(\Atext/)
     source_io.read
   when 'application/rss+xml'
@@ -312,47 +329,53 @@ def parse_source(source_io)
     source_io.read
   when 'application/pdf'
     reader = PDF::Reader.new(source_io)
-    result = +''
-    reader.pages.each do |page|
-      result << page.text
-    end
-    result
+    reader.pages.inject(+'') { |result, page| result << page.text }
   else
-    STDERR.puts "Cannot import #{source_io&.content_type} document."
+    STDERR.puts "Cannot embed #{source_io&.content_type} document."
     return
   end
 end
-def import_document(source_io, source)
-  unless $config.embedding.enabled
-    STDOUT.puts "Embedding disabled, I won't import any documents, try: /summarize"
-    return
-  end
-  puts "Importing #{italic { source_io&.content_type }} document #{source.to_s.inspect}."
+def embed_source(source_io, source)
+  embedding_enabled? or return parse_source(source_io)
+  puts "Embedding #{italic { source_io&.content_type }} document #{source.to_s.inspect}."
   text = parse_source(source_io) or return
   text.downcase!
   splitter_config = $config.embedding.splitter
-  inputs = case splitter_config.name
-           when 'Character'
-             Ollama::Documents::Splitters::Character.new(
-               chunk_size: splitter_config.chunk_size,
-             ).split(text)
-           when 'RecursiveCharacter'
-             Ollama::Documents::Splitters::RecursiveCharacter.new(
-               chunk_size: splitter_config.chunk_size,
-             ).split(text)
-           when 'Semantic'
-             Ollama::Documents::Splitters::Semantic.new(
-               ollama:, model: $config.embedding.model.name,
-               chunk_size: splitter_config.chunk_size,
-             ).split(
-               text,
-               breakpoint: splitter_config.breakpoint.to_sym,
-               percentage: splitter_config.percentage?,
-               percentile: splitter_config.percentile?,
-             )
-           end
-  $documents.add(inputs, source: source.to_s)
+  inputs = nil
+  case splitter_config.name
+  when 'Character'
+    splitter = Ollama::Documents::Splitters::Character.new(
+      chunk_size: splitter_config.chunk_size,
+    )
+    inputs = splitter.split(text)
+  when 'RecursiveCharacter'
+    splitter = Ollama::Documents::Splitters::RecursiveCharacter.new(
+      chunk_size: splitter_config.chunk_size,
+    )
+    inputs = splitter.split(text)
+  when 'Semantic'
+    splitter = Ollama::Documents::Splitters::Semantic.new(
+      ollama:, model: $config.embedding.model.name,
+      chunk_size: splitter_config.chunk_size,
+    )
+    inputs = splitter.split(
+      text,
+      breakpoint: splitter_config.breakpoint.to_sym,
+      percentage: splitter_config.percentage?,
+      percentile: splitter_config.percentile?,
+    )
+    inputs = splitter.split(text)
+  end
+  inputs or return
+  source = source.to_s
+  if source.start_with?(?!)
+    source = Ollama::Utils::Width.truncate(
+      source[1..-1].gsub(/\W+/, ?_),
+      length: 10
+    )
+  end
+  $documents.add(inputs, source: source)
 end
 def add_image(images, source_io, source)
@@ -361,10 +384,27 @@ def add_image(images, source_io, source)
   (images << image).uniq!
 end
+def http_options(url)
+  options = {}
+  if ssl_no_verify = $config.ssl_no_verify?
+    hostname = URI.parse(url).hostname
+    options |= { ssl_verify_peer: !ssl_no_verify.include?(hostname) }
+  end
+  if proxy = $config.proxy?
+    options |= { proxy: }
+  end
+  options
+end
 def fetch_source(source, &block)
   case source
+  when %r(\A!(.*))
+    command = $1
+    Utils::Fetcher.execute(command) do |tmp|
+      block.(tmp)
+    end
   when %r(\Ahttps?://\S+)
-    Utils::Fetcher.get(source) do |tmp|
+    Utils::Fetcher.get(source, debug: $config.debug, http_options: http_options(source)) do |tmp|
       block.(tmp)
     end
   when %r(\Afile://(?:(?:[.-]|[[:alnum:]])*)(/\S*)|([~.]?/\S*))
@@ -380,16 +420,45 @@ rescue => e
   STDERR.puts "Cannot add source #{source.to_s.inspect}: #{e}\n#{e.backtrace * ?\n}"
 end
-def summarize(source)
+def import(source)
+  puts "Now importing #{source.to_s.inspect}."
+  fetch_source(source) do |source_io|
+    content = parse_source(source_io)
+    content.present? or return
+    source_io.rewind
+    content
+  end
+end
+def summarize(source, words: nil)
+  words = words.to_i
+  words < 1 and words = 100
   puts "Now summarizing #{source.to_s.inspect}."
   source_content =
     fetch_source(source) do |source_io|
-      content = parse_source(source_io) or return
+      content = parse_source(source_io)
+      content.present? or return
       source_io.rewind
-      import_document(source_io, source)
       content
     end
-  $config.prompts.summarize % source_content
+  $config.prompts.summarize % { source_content:, words: }
+end
+def embed(source)
+  if embedding_enabled?
+    puts "Now embedding #{source.to_s.inspect}."
+    fetch_source(source) do |source_io|
+      content = parse_source(source_io)
+      content.present? or return
+      source_io.rewind
+      embed_source(source_io, source)
+      content
+    end
+    $config.prompts.embed % { source: }
+  else
+    puts "Embedding is off, so I will just give a small summary of this source."
+    summarize(source)
+  end
 end
 def parse_content(content, images)
@@ -407,7 +476,7 @@ def parse_content(content, images)
         when 'image'
           add_image(images, source_io, source)
         when 'text', 'application'
-          import_document(source_io, source)
+          embed_source(source_io, source)
         else
           STDERR.puts(
             "Cannot fetch #{source.to_s.inspect} with content type "\
@@ -434,62 +503,112 @@ end
 def choose_collection(default_collection)
   collections = [ default_collection ] + $documents.collections
-  collections = collections.uniq.sort
-  $documents.collection = collection =
-    Ollama::Utils::Chooser.choose(collections) || default_collection
+  collections = collections.compact.map(&:to_s).uniq.sort
+  collections.unshift('[NEW]')
+  collection = Ollama::Utils::Chooser.choose(collections) || default_collection
+  if collection == '[NEW]'
+      print "Enter name of the new collection: "
+      collection = STDIN.gets.chomp
+  end
+  $documents.collection = collection
 ensure
   puts "Changing to collection #{bold{collection}}."
   collection_stats
 end
 def collection_stats
-  puts <<~end
+  puts <<~EOT
     Collection
       Name: #{bold{$documents.collection}}
+      Embedding model: #{bold{$embedding_model}}
       #Embeddings: #{$documents.size}
       Tags: #{$documents.tags}
-  end
+  EOT
 end
 def configure_cache
-  Object.const_get($config.cache)
+  if $opts[?M]
+    Ollama::Documents::MemoryCache
+  else
+    Object.const_get($config.cache)
+  end
 rescue => e
   STDERR.puts "Caught #{e.class}: #{e} => Falling back to MemoryCache."
   Ollama::Documents::MemoryCache
 end
-def set_markdown(value)
-  if value
+def toggle_markdown
+  $markdown = !$markdown
+  show_markdown
+end
+def show_markdown
+  if $markdown
     puts "Using ANSI markdown to output content."
-    true
   else
     puts "Using plaintext for outputting content."
-    false
   end
+  $markdown
 end
-def display_chat_help
-  puts <<~end
-    /paste                                   to paste content
-    /markdown                                toggle markdown output
-    /list                                    list the messages of the conversation
-    /clear                                   clear the conversation messages
-    /clobber                                 clear conversation messages and collection
-    /pop [n]                                 pop the last n exchanges, defaults to 1
-    /model                                   change the model
-    /regenerate                              the last answer message
-    /collection clear [tag]|stats|change|new clear or show stats of current collection
-    /summarize source                        summarize the URL/file source's content
-    /web [n] query                           query web search & return n or 1 results
-    /save filename                           store conversation messages
-    /load filename                           load conversation messages
-    /quit                                    to quit
-    /help                                    to view this help
+def set_embedding(embedding)
+  $embedding_enabled = embedding
+  show_embedding
+end
+def show_embedding
+  puts "Embedding is #{embedding_enabled? ? "on" : "off"}."
+  $embedding_enabled
+end
+def embedding_enabled?
+  $embedding_enabled && !$embedding_paused
+end
+def toggle_embedding_paused
+  $embedding_paused = !$embedding_paused
+  show_embedding
+end
+def info
+  puts "Current model is #{bold{$model}}."
+  collection_stats
+  if show_embedding
+    puts "Text splitter is #{bold{$config.embedding.splitter.name}}."
   end
+  puts "Documents database cache is #{$documents.nil? ? 'n/a' : $documents.cache.class}"
+  show_markdown
+end
+def clear_messages(messages)
+  messages.delete_if { _1.role != 'system' }
+end
+def display_chat_help
+  puts <<~EOT
+    /paste                          to paste content
+    /markdown                       toggle markdown output
+    /list [n]                       list the last n / all conversation exchanges
+    /clear                          clear the whole conversation
+    /clobber                        clear the conversation and collection
+    /pop [n]                        pop the last n exchanges, defaults to 1
+    /model                          change the model
+    /regenerate                     the last answer message
+    /collection clear [tag]|change  clear or show stats of current collection
+    /import source                  import the source's content
+    /summarize [n] source           summarize the source's content in n words
+    /embedding                      toggle embedding paused or not
+    /embed source                   embed the source's content
+    /web [n] query                  query web search & return n or 1 results
+    /save filename                  store conversation messages
+    /load filename                  load conversation messages
+    /quit                           to quit
+    /help                           to view this help
+  EOT
 end
 def usage
-  puts <<~end
+  puts <<~EOT
     #{File.basename($0)} [OPTIONS]
       -f CONFIG      config file to read
@@ -498,11 +617,13 @@ def usage
       -s SYSTEM      the system prompt to use as a file, OLLAMA_CHAT_SYSTEM
       -c CHAT        a saved chat conversation to load
       -C COLLECTION  name of the collection used in this conversation
-      -D DOCUMENT    load document and add to collection (multiple)
+      -D DOCUMENT    load document and add to embeddings collection (multiple)
+      -M             use (empty) MemoryCache for this chat session
+      -E             disable embeddings for this chat session
       -v             use voice output
       -h             this help
-  end
+  EOT
   exit 0
 end
@@ -510,38 +631,44 @@ def ollama
   $ollama
 end
-opts = go 'f:u:m:s:c:C:D:vh'
+$opts = go 'f:u:m:s:c:C:D:MEvh'
-config = OllamaChatConfig.new(opts[?f])
+config = OllamaChatConfig.new($opts[?f])
 $config = config.config
-opts[?h] and usage
+$opts[?h] and usage
 puts "Configuration read from #{config.filename.inspect} is:", $config
-base_url = opts[?u] || $config.url
+base_url = $opts[?u] || $config.url
 $ollama      = Client.new(base_url:, debug: $config.debug)
-model        = choose_model(opts[?m], $config.model.name)
+$model       = choose_model($opts[?m], $config.model.name)
 options      = Options[$config.model.options]
-model_system = pull_model_unless_present(model, options)
+model_system = pull_model_unless_present($model, options)
 messages     = []
+set_embedding($config.embedding.enabled && !$opts[?E])
-if $config.embedding.enabled
-  embedding_model         = $config.embedding.model.name
+if voice = ($config.voice if $opts[?v])
+  puts "Using voice #{bold{voice}} to speak."
+end
+$markdown = $config.markdown
+if embedding_enabled?
+  $embedding_model         = $config.embedding.model.name
   embedding_model_options = Options[$config.embedding.model.options]
-  pull_model_unless_present(embedding_model, embedding_model_options)
-  collection = opts[?C] || $config.embedding.collection
+  pull_model_unless_present($embedding_model, embedding_model_options)
+  collection = $opts[?C] || $config.embedding.collection
   $documents = Documents.new(
     ollama:,
-    model:         $config.embedding.model.name,
+    model:         $embedding_model,
     model_options: $config.embedding.model.options,
     collection:,
     cache:         configure_cache,
-    redis_url:     $config.redis.url?,
+    redis_url:     $config.redis.documents.url?,
   )
-  document_list = opts[?D].to_a
+  document_list = $opts[?D].to_a
   if document_list.any?(&:empty?)
     puts "Clearing collection #{bold{collection}}."
     $documents.clear
@@ -559,28 +686,26 @@ if $config.embedding.enabled
     document_list.each_slice(25) do |docs|
       docs.each do |doc|
         fetch_source(doc) do |doc_io|
-          import_document(doc_io, doc)
+          embed_source(doc_io, doc)
         end
       end
     end
   end
   collection_stats
 else
-  $documents = Documents.new(ollama:, model:)
-end
-if voice = ($config.voice if opts[?v])
-  puts "Using voice #{bold{voice}} to speak."
+  $documents = Tins::NULL
 end
-markdown = set_markdown($config.markdown)
-if opts[?c]
-  messages.concat load_conversation(opts[?c])
+if $opts[?c]
+  messages.concat load_conversation($opts[?c])
 else
   if system = Ollama::Utils::FileArgument.
-      get_file_argument(opts[?s], default: $config.prompts.system? || model_system)
+      get_file_argument($opts[?s], default: $config.prompts.system? || model_system)
     messages << Message.new(role: 'system', content: system)
-    puts "Configured system prompt is:\n#{italic { system }}"
+    puts <<~EOT
+      Configured system prompt is:
+      #{italic{Ollama::Utils::Width.wrap(system, percentage: 90)}}
+    EOT
   end
 end
@@ -596,25 +721,25 @@ loop do
   when %r(^/paste$)
     puts bold { "Paste your content and then press C-d!" }
     content = STDIN.read
-  when %r(^/quit$)
-    puts "Goodbye."
-    exit 0
   when %r(^/markdown$)
-    markdown = set_markdown(!markdown)
+    $markdown = toggle_markdown
     next
-  when %r(^/list$)
-    list_conversation(messages, markdown)
+  when %r(^/list(?:\s+(\d*))?$)
+    last = if $1
+             2 * $1.to_i
+           end
+    list_conversation(messages, last)
     next
   when %r(^/clear$)
-    messages.clear
+    clear_messages(messages)
     puts "Cleared messages."
     next
   when %r(^/clobber$)
-    messages.clear
+    clear_messages(messages)
     $documents.clear
     puts "Cleared messages and collection."
     next
-  when %r(^/collection\s+(clear|stats|change|new)(?:\s+(.+))?$)
+  when %r(^/collection\s+(clear|change)(?:\s+(.+))?$)
     command, arg = $1, $2
     case command
     when 'clear'
@@ -626,24 +751,26 @@ loop do
         $documents.clear
         puts "Cleared collection #{bold{collection}}."
       end
-    when 'stats'
-      collection_stats
     when 'change'
       choose_collection(collection)
-    when 'new'
-      print "Enter name of the new collection: "
-      $documents.collection = collection = STDIN.gets.chomp
-      collection_stats
     end
     next
-  when %r(^/pop?(?:\s+(\d*))?$)
-    n = $1.to_i.clamp(1, Float::INFINITY)
-    r =  messages.pop(2 * n)
-    m = r.size / 2
-    puts "Popped the last #{m} exchanges."
+  when %r(/info)
+    info
+    next
+  when %r(^/pop(?:\s+(\d*))?$)
+    if messages.size > 1
+      n = $1.to_i.clamp(1, Float::INFINITY)
+      r =  messages.pop(2 * n)
+      m = r.size / 2
+      puts "Popped the last #{m} exchanges."
+    else
+      puts "No more exchanges you can pop."
+    end
+    list_conversation(messages, 2)
     next
   when %r(^/model$)
-    model = choose_model('', model)
+    $model = choose_model('', $model)
     next
   when %r(^/regenerate$)
     if content = messages[-2]&.content
@@ -655,23 +782,29 @@ loop do
     end
     parse_content = false
     content
-  when %r(^/summarize\s+(.+))
+  when %r(^/import\s+(.+))
+    parse_content = false
+    content       = import($1) or next
+  when %r(^/summarize\s+(?:(\d+)\s+)?(.+))
     parse_content = false
-    content       = summarize($1) or next
+    content       = summarize($2, words: $1) or next
+  when %r(^/embedding$)
+    toggle_embedding_paused
+    next
+  when %r(^/embed\s+(.+))
+    parse_content = false
+    content       = embed($1) or next
   when %r(^/web\s+(?:(\d+)\s+)?(.+))
     parse_content   = false
     urls            = search_web($2, $1.to_i)
     urls.each do |url|
-      fetch_source(url) do |url_io|
-        import_document(url_io, url)
-      end
+      fetch_source(url) { |url_io| embed_source(url_io, url) }
     end
     urls_summarized = urls.map { summarize(_1) }
-    content = <<~end
-      Answer the the query #{$2.inspect} using these sources and summaries:
-      #{urls.zip(urls_summarized).map { |u, s| "%s as \n:%s" % [ u, s ] } * "\n\n"}
-    end
+    query   = $2.inspect
+    results = urls.zip(urls_summarized).
+      map { |u, s| "%s as \n:%s" % [ u, s ] } * "\n\n"
+    content = $config.prompts.web % { query:, results: }
   when %r(^/save\s+(.+)$)
     save_conversation($1, messages)
     puts "Saved conversation to #$1."
@@ -680,6 +813,9 @@ loop do
     messages = load_conversation($1)
     puts "Loaded conversation from #$1."
     next
+  when %r(^/quit$)
+    puts "Goodbye."
+    exit 0
   when %r(^/)
     display_chat_help
     next
@@ -697,7 +833,7 @@ loop do
                     [ content, Utils::Tags.new ]
                   end
-  if $config.embedding.enabled && content
+  if embedding_enabled? && content
     records = $documents.find_where(
       content.downcase,
       tags:,
@@ -705,19 +841,18 @@ loop do
       text_size:  $config.embedding.found_texts_size?,
       text_count: $config.embedding.found_texts_count?,
     )
-    found_texts = records.map(&:text)
-    unless found_texts.empty?
-      content += "\nConsider these chunks for your answer:\n"\
-        "#{found_texts.join("\n\n---\n\n")}"
+    unless records.empty?
+      content += "\nConsider these chunks for your answer:\n\n"\
+        "#{records.map { [ _1.text, _1.tags_set ] * ?\n }.join("\n\n---\n\n")}"
     end
   end
   messages << Message.new(role: 'user', content:, images:)
-  handler = FollowChat.new(messages:, markdown:, voice:)
-  ollama.chat(model:, messages:, options:, stream: true, &handler)
+  handler = FollowChat.new(messages:, markdown: $markdown, voice:)
+  ollama.chat(model: $model, messages:, options:, stream: true, &handler)
-  if records
-    puts records.map { |record|
+  if embedding_enabled? && !records.empty?
+    puts "", records.map { |record|
       link = if record.source =~ %r(\Ahttps?://)
                record.source
              else