ragdoll-cli 0.1.11 → 0.1.12

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 89c5200b031e287b125fb93d7025ea666ad3456bdc209fbc68a0dc70b673a410
4
- data.tar.gz: 5bfa7dabb52f7b990b5935736ec1710a3b0f4cace386903bb9491bcf4f88720a
3
+ metadata.gz: 95d02e9e2a6f2ed5278406deae5fb36a8b55aaa1fa9228e3ca4bc8ad602daaf8
4
+ data.tar.gz: 34e38890fb8829a213057bb4f3142ce81c620e1e2463b70b8b3d2d0692beae5a
5
5
  SHA512:
6
- metadata.gz: f3eb42ababba85311e9d6bb3db1b5cf4f63f00e46a4a07ea8e9ec21841a9b4cdea44d36619b168a9298d08393d250917f66c14fa82c72b3866937833b3a44bae
7
- data.tar.gz: 2a5085c3c38a9147f2bf26fb8a4ad2814bccdb05dfa3d5d76f5cb7ec21319d82d969758eece5b066f01b50100efa85ae9a9abfa20badca70d9144b5bd52c7906
6
+ metadata.gz: 5767875a5559078f341466140788711c61b45f9cd52bc77fd0844b43574a84c9462367abbe29c88d9c997df86f6e6996f116fbe2c4bb5201321f13d8ccac6eb5
7
+ data.tar.gz: 68d51ae3e7061e95a9a2f74f55d269afdc3af9bb377edd6edb5758eae7a49938a4f3032cb3c358a4e82d367b1a28ff26882183b6f7714fa4cf04eb556a988c8f
data/README.md CHANGED
@@ -1,7 +1,7 @@
1
- <div align="center" style="background-color: yellow; color: black; padding: 20px; margin: 20px 0; border: 2px solid black; font-size: 48px; font-weight: bold;">
2
- ⚠️ CAUTION ⚠️<br />
3
- Software Under Development by a Crazy Man
4
- </div>
1
+ > [!CAUTION]
2
+ > **Software Under Development by a Crazy Man**
3
+ >
4
+ > Evolved from multi-modal to unified text-based RAG architecture.
5
5
  <br />
6
6
  <div align="center">
7
7
  <table>
@@ -12,7 +12,7 @@
12
12
  </a>
13
13
  </td>
14
14
  <td width="50%" valign="top">
15
- <p>Multi-modal RAG (Retrieval-Augmented Generation) is an architecture that integrates multiple data types (such as text, images, and audio) to enhance AI response generation. It combines retrieval-based methods, which fetch relevant information from a knowledge base, with generative large language models (LLMs) that create coherent and contextually appropriate outputs. This approach allows for more comprehensive and engaging user interactions, such as chatbots that respond with both text and images or educational tools that incorporate visual aids into learning materials. By leveraging various modalities, multi-modal RAG systems improve context understanding and user experience.</p>
15
+ <p>Unified Text-Based RAG converts all media types—images, audio, documents—into comprehensive text representations before vectorization. This approach enables powerful cross-modal search where you can find images through AI-generated descriptions, audio through transcripts, and all content through a single, unified text-based search index. The system combines intelligent text conversion with retrieval-based methods and generative large language models for enhanced AI response generation.</p>
16
16
  </td>
17
17
  </tr>
18
18
  </table>
@@ -20,7 +20,7 @@
20
20
 
21
21
  # Ragdoll::CLI
22
22
 
23
- Standalone command-line interface for the Ragdoll RAG (Retrieval-Augmented Generation) system. Provides document import, search, and management capabilities through a simple CLI.
23
+ Standalone command-line interface for the Ragdoll unified text-based RAG system. Converts all media types to searchable text and provides powerful cross-modal search capabilities through a simple CLI.
24
24
 
25
25
  ## Installation
26
26
 
@@ -10,6 +10,11 @@ module Ragdoll
10
10
 
11
11
  puts "Searching for: #{query}"
12
12
  puts "Search type: #{options[:search_type] || 'semantic'}"
13
+
14
+ # Show deprecation warning for content_type
15
+ if options[:content_type]
16
+ puts "⚠️ DEPRECATED: --content_type option is deprecated. Unified text-based system converts all media to searchable text."
17
+ end
13
18
 
14
19
  # Show hybrid search weights if applicable
15
20
  if options[:search_type] == 'hybrid'
@@ -22,7 +22,9 @@ module Ragdoll
22
22
 
23
23
  default_config = {
24
24
  'llm_provider' => 'openai',
25
- 'embedding_model' => 'text-embedding-3-small',
25
+ 'embedding_model' => 'text-embedding-3-large',
26
+ 'embedding_provider' => 'openai',
27
+ 'use_unified_content' => true,
26
28
  'chunk_size' => 1000,
27
29
  'chunk_overlap' => 200,
28
30
  'search_similarity_threshold' => 0.7,
@@ -72,7 +74,13 @@ module Ragdoll
72
74
  ragdoll_config.llm_provider = config['llm_provider']&.to_sym || :openai
73
75
  end
74
76
  if ragdoll_config.respond_to?(:embedding_model=)
75
- ragdoll_config.embedding_model = config['embedding_model'] || 'text-embedding-3-small'
77
+ ragdoll_config.embedding_model = config['embedding_model'] || 'text-embedding-3-large'
78
+ end
79
+ if ragdoll_config.respond_to?(:embedding_provider=)
80
+ ragdoll_config.embedding_provider = config['embedding_provider']&.to_sym || :openai
81
+ end
82
+ if ragdoll_config.respond_to?(:use_unified_content=)
83
+ ragdoll_config.use_unified_content = config['use_unified_content'] != false
76
84
  end
77
85
 
78
86
  # Processing settings
@@ -3,6 +3,6 @@
3
3
 
4
4
  module Ragdoll
5
5
  module CLI
6
- VERSION = "0.1.11"
6
+ VERSION = "0.1.12"
7
7
  end
8
8
  end
data/lib/ragdoll/cli.rb CHANGED
@@ -42,7 +42,7 @@ module Ragdoll
42
42
  method_option :threshold, type: :numeric,
43
43
  desc: 'Similarity threshold (0.0-1.0, lower = more results)'
44
44
  method_option :content_type, type: :string, aliases: '-c',
45
- desc: 'Filter by content type (text, image, audio)'
45
+ desc: 'DEPRECATED: Content type filtering (unified text-based system converts all media to text)'
46
46
  method_option :classification, type: :string, aliases: '-C',
47
47
  desc: 'Filter by classification'
48
48
  method_option :keywords, type: :string, aliases: '-k',
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: ragdoll-cli
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.1.11
4
+ version: 0.1.12
5
5
  platform: ruby
6
6
  authors:
7
7
  - Dewayne VanHoozer
@@ -15,14 +15,14 @@ dependencies:
15
15
  requirements:
16
16
  - - ">="
17
17
  - !ruby/object:Gem::Version
18
- version: 0.1.10
18
+ version: 0.1.12
19
19
  type: :runtime
20
20
  prerelease: false
21
21
  version_requirements: !ruby/object:Gem::Requirement
22
22
  requirements:
23
23
  - - ">="
24
24
  - !ruby/object:Gem::Version
25
- version: 0.1.10
25
+ version: 0.1.12
26
26
  - !ruby/object:Gem::Dependency
27
27
  name: ruby-progressbar
28
28
  requirement: !ruby/object:Gem::Requirement
@@ -177,8 +177,9 @@ dependencies:
177
177
  - - ">="
178
178
  - !ruby/object:Gem::Version
179
179
  version: '0'
180
- description: Command-line interface for Ragdoll RAG system with semantic, full-text,
181
- and hybrid search capabilities. Under development. Contributors welcome.
180
+ description: Command-line interface for Ragdoll's unified text-based RAG system. Converts
181
+ all media types (images, audio, documents) to searchable text for powerful cross-modal
182
+ search capabilities. Under development. Contributors welcome.
182
183
  email:
183
184
  - dvanhoozer@gmail.com
184
185
  executables:
@@ -227,7 +228,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
227
228
  - !ruby/object:Gem::Version
228
229
  version: '0'
229
230
  requirements: []
230
- rubygems_version: 3.7.1
231
+ rubygems_version: 3.7.2
231
232
  specification_version: 4
232
- summary: Multi-Modal Retrieval Augmented Generation for the CLI
233
+ summary: Unified Text-Based RAG CLI for Cross-Modal Search
233
234
  test_files: []