lsh 0.0.2 → 0.0.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/lib/lsh/index.rb +4 -5
 - data/lib/lsh/math_util_gsl.rb +10 -9
 - data/lib/lsh/math_util_jblas.rb +10 -6
 - metadata +25 -29
 
    
        data/lib/lsh/index.rb
    CHANGED
    
    | 
         @@ -21,7 +21,6 @@ module LSH 
     | 
|
| 
       21 
21 
     | 
    
         
             
                attr_reader :projections, :buckets
         
     | 
| 
       22 
22 
     | 
    
         | 
| 
       23 
23 
     | 
    
         
             
                def initialize(dim, k, w = Float::INFINITY, l = 150)
         
     | 
| 
       24 
     | 
    
         
            -
                  @math = MathUtil.new
         
     | 
| 
       25 
24 
     | 
    
         
             
                  @window = w
         
     | 
| 
       26 
25 
     | 
    
         
             
                  @dim = dim
         
     | 
| 
       27 
26 
     | 
    
         
             
                  @number_of_random_vectors = k
         
     | 
| 
         @@ -88,7 +87,7 @@ module LSH 
     | 
|
| 
       88 
87 
     | 
    
         
             
                        hash << 0
         
     | 
| 
       89 
88 
     | 
    
         
             
                      end
         
     | 
| 
       90 
89 
     | 
    
         
             
                    else
         
     | 
| 
       91 
     | 
    
         
            -
                      b = bias ?  
     | 
| 
      
 90 
     | 
    
         
            +
                      b = bias ? MathUtil.random_uniform : 0.0
         
     | 
| 
       92 
91 
     | 
    
         
             
                      hash << (b + dot_product / @window).floor
         
     | 
| 
       93 
92 
     | 
    
         
             
                    end
         
     | 
| 
       94 
93 
     | 
    
         
             
                  end
         
     | 
| 
         @@ -126,15 +125,15 @@ module LSH 
     | 
|
| 
       126 
125 
     | 
    
         | 
| 
       127 
126 
     | 
    
         
             
                def random_vector_unit(dim)
         
     | 
| 
       128 
127 
     | 
    
         
             
                  r = random_vector(dim)
         
     | 
| 
       129 
     | 
    
         
            -
                  r /=  
     | 
| 
      
 128 
     | 
    
         
            +
                  r /= MathUtil.norm(r)
         
     | 
| 
       130 
129 
     | 
    
         
             
                end
         
     | 
| 
       131 
130 
     | 
    
         | 
| 
       132 
131 
     | 
    
         
             
                def random_vector(dim)
         
     | 
| 
       133 
     | 
    
         
            -
                   
     | 
| 
      
 132 
     | 
    
         
            +
                  MathUtil.random_gaussian_vector(dim)
         
     | 
| 
       134 
133 
     | 
    
         
             
                end
         
     | 
| 
       135 
134 
     | 
    
         | 
| 
       136 
135 
     | 
    
         
             
                def similarity(v1, v2)
         
     | 
| 
       137 
     | 
    
         
            -
                   
     | 
| 
      
 136 
     | 
    
         
            +
                  MathUtil.dot(v1, v2)
         
     | 
| 
       138 
137 
     | 
    
         
             
                end
         
     | 
| 
       139 
138 
     | 
    
         | 
| 
       140 
139 
     | 
    
         
             
              end
         
     | 
    
        data/lib/lsh/math_util_gsl.rb
    CHANGED
    
    | 
         @@ -20,24 +20,25 @@ module LSH 
     | 
|
| 
       20 
20 
     | 
    
         | 
| 
       21 
21 
     | 
    
         
             
              class MathUtil
         
     | 
| 
       22 
22 
     | 
    
         | 
| 
       23 
     | 
    
         
            -
                 
     | 
| 
       24 
     | 
    
         
            -
             
     | 
| 
       25 
     | 
    
         
            -
             
     | 
| 
      
 23 
     | 
    
         
            +
                @@gsl_random = GSL::Rng.alloc
         
     | 
| 
      
 24 
     | 
    
         
            +
             
     | 
| 
      
 25 
     | 
    
         
            +
                def self.random_uniform
         
     | 
| 
      
 26 
     | 
    
         
            +
                  @@gsl_random.uniform
         
     | 
| 
       26 
27 
     | 
    
         
             
                end
         
     | 
| 
       27 
28 
     | 
    
         | 
| 
       28 
     | 
    
         
            -
                def  
     | 
| 
       29 
     | 
    
         
            -
                   
     | 
| 
      
 29 
     | 
    
         
            +
                def self.random_gaussian_vector(dim)
         
     | 
| 
      
 30 
     | 
    
         
            +
                  @@gsl_random.gaussian(1, dim)
         
     | 
| 
       30 
31 
     | 
    
         
             
                end
         
     | 
| 
       31 
32 
     | 
    
         | 
| 
       32 
     | 
    
         
            -
                def  
     | 
| 
       33 
     | 
    
         
            -
                   
     | 
| 
      
 33 
     | 
    
         
            +
                def self.random_gaussian_matrix(k, l)
         
     | 
| 
      
 34 
     | 
    
         
            +
                  GSL::Matrix.randn(k, l)
         
     | 
| 
       34 
35 
     | 
    
         
             
                end
         
     | 
| 
       35 
36 
     | 
    
         | 
| 
       36 
     | 
    
         
            -
                def dot(v1, v2)
         
     | 
| 
      
 37 
     | 
    
         
            +
                def self.dot(v1, v2)
         
     | 
| 
       37 
38 
     | 
    
         
             
                  v1 * v2.col
         
     | 
| 
       38 
39 
     | 
    
         
             
                end
         
     | 
| 
       39 
40 
     | 
    
         | 
| 
       40 
     | 
    
         
            -
                def norm(v)
         
     | 
| 
      
 41 
     | 
    
         
            +
                def self.norm(v)
         
     | 
| 
       41 
42 
     | 
    
         
             
                  v.norm
         
     | 
| 
       42 
43 
     | 
    
         
             
                end
         
     | 
| 
       43 
44 
     | 
    
         | 
    
        data/lib/lsh/math_util_jblas.rb
    CHANGED
    
    | 
         @@ -20,19 +20,23 @@ module LSH 
     | 
|
| 
       20 
20 
     | 
    
         | 
| 
       21 
21 
     | 
    
         
             
              class MathUtil
         
     | 
| 
       22 
22 
     | 
    
         | 
| 
       23 
     | 
    
         
            -
                def random_uniform
         
     | 
| 
      
 23 
     | 
    
         
            +
                def self.random_uniform
         
     | 
| 
       24 
24 
     | 
    
         
             
                  JBLAS.rand[0,0]
         
     | 
| 
       25 
25 
     | 
    
         
             
                end
         
     | 
| 
       26 
26 
     | 
    
         | 
| 
       27 
     | 
    
         
            -
                def random_gaussian_vector(dim)
         
     | 
| 
       28 
     | 
    
         
            -
                  JBLAS.randn( 
     | 
| 
      
 27 
     | 
    
         
            +
                def self.random_gaussian_vector(dim)
         
     | 
| 
      
 28 
     | 
    
         
            +
                  JBLAS.randn(1, dim)
         
     | 
| 
       29 
29 
     | 
    
         
             
                end
         
     | 
| 
       30 
30 
     | 
    
         | 
| 
       31 
     | 
    
         
            -
                def  
     | 
| 
       32 
     | 
    
         
            -
                  ( 
     | 
| 
      
 31 
     | 
    
         
            +
                def self.random_gaussian_matrix(k, l)
         
     | 
| 
      
 32 
     | 
    
         
            +
                  JBLAS.randn(k, l)
         
     | 
| 
       33 
33 
     | 
    
         
             
                end
         
     | 
| 
       34 
34 
     | 
    
         | 
| 
       35 
     | 
    
         
            -
                def  
     | 
| 
      
 35 
     | 
    
         
            +
                def self.dot(v1, v2)
         
     | 
| 
      
 36 
     | 
    
         
            +
                  (v1 * v2.t)[0,0]
         
     | 
| 
      
 37 
     | 
    
         
            +
                end
         
     | 
| 
      
 38 
     | 
    
         
            +
             
     | 
| 
      
 39 
     | 
    
         
            +
                def self.norm(v)
         
     | 
| 
       36 
40 
     | 
    
         
             
                  v.norm2
         
     | 
| 
       37 
41 
     | 
    
         
             
                end
         
     | 
| 
       38 
42 
     | 
    
         | 
    
        metadata
    CHANGED
    
    | 
         @@ -1,34 +1,32 @@ 
     | 
|
| 
       1 
1 
     | 
    
         
             
            --- !ruby/object:Gem::Specification
         
     | 
| 
       2 
2 
     | 
    
         
             
            name: lsh
         
     | 
| 
       3 
3 
     | 
    
         
             
            version: !ruby/object:Gem::Version
         
     | 
| 
       4 
     | 
    
         
            -
               
     | 
| 
       5 
     | 
    
         
            -
               
     | 
| 
      
 4 
     | 
    
         
            +
              version: 0.0.3
         
     | 
| 
      
 5 
     | 
    
         
            +
              prerelease: 
         
     | 
| 
       6 
6 
     | 
    
         
             
            platform: ruby
         
     | 
| 
       7 
7 
     | 
    
         
             
            authors:
         
     | 
| 
       8 
8 
     | 
    
         
             
            - Yves Raimond
         
     | 
| 
       9 
     | 
    
         
            -
            autorequire:
         
     | 
| 
      
 9 
     | 
    
         
            +
            autorequire: 
         
     | 
| 
       10 
10 
     | 
    
         
             
            bindir: bin
         
     | 
| 
       11 
11 
     | 
    
         
             
            cert_chain: []
         
     | 
| 
       12 
     | 
    
         
            -
            date: 2012-12- 
     | 
| 
      
 12 
     | 
    
         
            +
            date: 2012-12-17 00:00:00.000000000 Z
         
     | 
| 
       13 
13 
     | 
    
         
             
            dependencies:
         
     | 
| 
       14 
14 
     | 
    
         
             
            - !ruby/object:Gem::Dependency
         
     | 
| 
       15 
     | 
    
         
            -
              name:  
     | 
| 
       16 
     | 
    
         
            -
               
     | 
| 
      
 15 
     | 
    
         
            +
              name: gsl
         
     | 
| 
      
 16 
     | 
    
         
            +
              requirement: !ruby/object:Gem::Requirement
         
     | 
| 
      
 17 
     | 
    
         
            +
                none: false
         
     | 
| 
       17 
18 
     | 
    
         
             
                requirements:
         
     | 
| 
       18 
     | 
    
         
            -
                - -  
     | 
| 
      
 19 
     | 
    
         
            +
                - - ! '>='
         
     | 
| 
       19 
20 
     | 
    
         
             
                  - !ruby/object:Gem::Version
         
     | 
| 
       20 
     | 
    
         
            -
                    version:  
     | 
| 
       21 
     | 
    
         
            -
             
     | 
| 
      
 21 
     | 
    
         
            +
                    version: '0'
         
     | 
| 
      
 22 
     | 
    
         
            +
              type: :runtime
         
     | 
| 
      
 23 
     | 
    
         
            +
              prerelease: false
         
     | 
| 
      
 24 
     | 
    
         
            +
              version_requirements: !ruby/object:Gem::Requirement
         
     | 
| 
       22 
25 
     | 
    
         
             
                none: false
         
     | 
| 
       23 
     | 
    
         
            -
              requirement: !ruby/object:Gem::Requirement
         
     | 
| 
       24 
26 
     | 
    
         
             
                requirements:
         
     | 
| 
       25 
     | 
    
         
            -
                - -  
     | 
| 
      
 27 
     | 
    
         
            +
                - - ! '>='
         
     | 
| 
       26 
28 
     | 
    
         
             
                  - !ruby/object:Gem::Version
         
     | 
| 
       27 
     | 
    
         
            -
                    version:  
     | 
| 
       28 
     | 
    
         
            -
                      MA==
         
     | 
| 
       29 
     | 
    
         
            -
                none: false
         
     | 
| 
       30 
     | 
    
         
            -
              prerelease: false
         
     | 
| 
       31 
     | 
    
         
            -
              type: :runtime
         
     | 
| 
      
 29 
     | 
    
         
            +
                    version: '0'
         
     | 
| 
       32 
30 
     | 
    
         
             
            description: An implementation of LSH in Ruby, using JBLAS for JRuby and GSL for MRI
         
     | 
| 
       33 
31 
     | 
    
         
             
            email: yves.raimond@bbc.co.uk
         
     | 
| 
       34 
32 
     | 
    
         
             
            executables: []
         
     | 
| 
         @@ -39,30 +37,28 @@ files: 
     | 
|
| 
       39 
37 
     | 
    
         
             
            - lib/lsh/index.rb
         
     | 
| 
       40 
38 
     | 
    
         
             
            - lib/lsh/math_util_gsl.rb
         
     | 
| 
       41 
39 
     | 
    
         
             
            - lib/lsh/math_util_jblas.rb
         
     | 
| 
       42 
     | 
    
         
            -
            homepage:
         
     | 
| 
      
 40 
     | 
    
         
            +
            homepage: 
         
     | 
| 
       43 
41 
     | 
    
         
             
            licenses: []
         
     | 
| 
       44 
     | 
    
         
            -
            post_install_message:
         
     | 
| 
      
 42 
     | 
    
         
            +
            post_install_message: 
         
     | 
| 
       45 
43 
     | 
    
         
             
            rdoc_options: []
         
     | 
| 
       46 
44 
     | 
    
         
             
            require_paths:
         
     | 
| 
       47 
45 
     | 
    
         
             
            - lib
         
     | 
| 
       48 
46 
     | 
    
         
             
            required_ruby_version: !ruby/object:Gem::Requirement
         
     | 
| 
      
 47 
     | 
    
         
            +
              none: false
         
     | 
| 
       49 
48 
     | 
    
         
             
              requirements:
         
     | 
| 
       50 
     | 
    
         
            -
              - -  
     | 
| 
      
 49 
     | 
    
         
            +
              - - ! '>='
         
     | 
| 
       51 
50 
     | 
    
         
             
                - !ruby/object:Gem::Version
         
     | 
| 
       52 
     | 
    
         
            -
                  version:  
     | 
| 
       53 
     | 
    
         
            -
                    MA==
         
     | 
| 
       54 
     | 
    
         
            -
              none: false
         
     | 
| 
      
 51 
     | 
    
         
            +
                  version: '0'
         
     | 
| 
       55 
52 
     | 
    
         
             
            required_rubygems_version: !ruby/object:Gem::Requirement
         
     | 
| 
      
 53 
     | 
    
         
            +
              none: false
         
     | 
| 
       56 
54 
     | 
    
         
             
              requirements:
         
     | 
| 
       57 
     | 
    
         
            -
              - -  
     | 
| 
      
 55 
     | 
    
         
            +
              - - ! '>='
         
     | 
| 
       58 
56 
     | 
    
         
             
                - !ruby/object:Gem::Version
         
     | 
| 
       59 
     | 
    
         
            -
                  version:  
     | 
| 
       60 
     | 
    
         
            -
                    MA==
         
     | 
| 
       61 
     | 
    
         
            -
              none: false
         
     | 
| 
      
 57 
     | 
    
         
            +
                  version: '0'
         
     | 
| 
       62 
58 
     | 
    
         
             
            requirements: []
         
     | 
| 
       63 
     | 
    
         
            -
            rubyforge_project:
         
     | 
| 
       64 
     | 
    
         
            -
            rubygems_version: 1.8. 
     | 
| 
       65 
     | 
    
         
            -
            signing_key:
         
     | 
| 
      
 59 
     | 
    
         
            +
            rubyforge_project: 
         
     | 
| 
      
 60 
     | 
    
         
            +
            rubygems_version: 1.8.23
         
     | 
| 
      
 61 
     | 
    
         
            +
            signing_key: 
         
     | 
| 
       66 
62 
     | 
    
         
             
            specification_version: 3
         
     | 
| 
       67 
63 
     | 
    
         
             
            summary: Locality Sensitive Hashing gem
         
     | 
| 
       68 
64 
     | 
    
         
             
            test_files: []
         
     |