serp_scraper 1.0.0 → 1.0.4
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
 - data/.gitignore +0 -0
 - data/EXAMPLES.md +0 -0
 - data/README.md +0 -0
 - data/lib/engines/google.rb +10 -3
 - data/lib/serp_response.rb +0 -0
 - data/lib/serp_scraper.rb +0 -0
 - data/serp_scraper.gemspec +3 -3
 - metadata +5 -17
 
    
        checksums.yaml
    CHANGED
    
    | 
         @@ -1,7 +1,7 @@ 
     | 
|
| 
       1 
1 
     | 
    
         
             
            ---
         
     | 
| 
       2 
2 
     | 
    
         
             
            SHA1:
         
     | 
| 
       3 
     | 
    
         
            -
              metadata.gz:  
     | 
| 
       4 
     | 
    
         
            -
              data.tar.gz:  
     | 
| 
      
 3 
     | 
    
         
            +
              metadata.gz: 37e155ad5c882faa1b543fc3f875b417ed2f903a
         
     | 
| 
      
 4 
     | 
    
         
            +
              data.tar.gz: 18089df07af8acfc609da7552d2282eae2ff05d3
         
     | 
| 
       5 
5 
     | 
    
         
             
            SHA512:
         
     | 
| 
       6 
     | 
    
         
            -
              metadata.gz:  
     | 
| 
       7 
     | 
    
         
            -
              data.tar.gz:  
     | 
| 
      
 6 
     | 
    
         
            +
              metadata.gz: 6736db5b2e411387cf6401b888b0e20b723483801e05fd80aab0a7823c65740f9a047b019b51f45c92b45dfa91c3004a94a215e750f039123b6246028e884934
         
     | 
| 
      
 7 
     | 
    
         
            +
              data.tar.gz: 0123239f14dc80688a682a362e27f3739731a71b53a8ff836a56f655df04766040e1adfcb7df2f95c5d121d2e1e6b45856954a50287bf4dcdc6cb48a407932cb
         
     | 
    
        data/.gitignore
    CHANGED
    
    | 
         
            File without changes
         
     | 
    
        data/EXAMPLES.md
    CHANGED
    
    | 
         
            File without changes
         
     | 
    
        data/README.md
    CHANGED
    
    | 
         
            File without changes
         
     | 
    
        data/lib/engines/google.rb
    CHANGED
    
    | 
         @@ -89,8 +89,10 @@ class SerpScraper::Google 
     | 
|
| 
       89 
89 
     | 
    
         
             
                doc     = Nokogiri::HTML(html)
         
     | 
| 
       90 
90 
     | 
    
         
             
                results = Array.new
         
     | 
| 
       91 
91 
     | 
    
         | 
| 
       92 
     | 
    
         
            -
                rows = doc.css('h3.r > a')
         
     | 
| 
       93 
     | 
    
         
            -
             
     | 
| 
      
 92 
     | 
    
         
            +
                rows = doc.css('div.rc h3.r > a')
         
     | 
| 
      
 93 
     | 
    
         
            +
             
     | 
| 
      
 94 
     | 
    
         
            +
                position = 1
         
     | 
| 
      
 95 
     | 
    
         
            +
                rows.each do |row|
         
     | 
| 
       94 
96 
     | 
    
         
             
                  begin
         
     | 
| 
       95 
97 
     | 
    
         
             
                    href = Addressable::URI.parse(row["href"])
         
     | 
| 
       96 
98 
     | 
    
         | 
| 
         @@ -99,14 +101,19 @@ class SerpScraper::Google 
     | 
|
| 
       99 
101 
     | 
    
         | 
| 
       100 
102 
     | 
    
         
             
                    url = Addressable::URI.parse(external_url)
         
     | 
| 
       101 
103 
     | 
    
         | 
| 
      
 104 
     | 
    
         
            +
                    next unless url.host # Only add valid URL's (ignore images, news etc)
         
     | 
| 
      
 105 
     | 
    
         
            +
             
     | 
| 
       102 
106 
     | 
    
         
             
                    results.push({
         
     | 
| 
       103 
     | 
    
         
            -
                      position:  
     | 
| 
      
 107 
     | 
    
         
            +
                      position: position,
         
     | 
| 
       104 
108 
     | 
    
         
             
                      title: row.content,
         
     | 
| 
       105 
109 
     | 
    
         
             
                      scheme: url.scheme,
         
     | 
| 
       106 
110 
     | 
    
         
             
                      domain: url.host,
         
     | 
| 
       107 
111 
     | 
    
         
             
                      url: url.request_uri,
         
     | 
| 
       108 
112 
     | 
    
         
             
                      full_url: url.to_s
         
     | 
| 
       109 
113 
     | 
    
         
             
                    })
         
     | 
| 
      
 114 
     | 
    
         
            +
             
     | 
| 
      
 115 
     | 
    
         
            +
                    position += 1
         
     | 
| 
      
 116 
     | 
    
         
            +
             
     | 
| 
       110 
117 
     | 
    
         
             
                  rescue
         
     | 
| 
       111 
118 
     | 
    
         
             
                    next
         
     | 
| 
       112 
119 
     | 
    
         
             
                  end
         
     | 
    
        data/lib/serp_response.rb
    CHANGED
    
    | 
         
            File without changes
         
     | 
    
        data/lib/serp_scraper.rb
    CHANGED
    
    | 
         
            File without changes
         
     | 
    
        data/serp_scraper.gemspec
    CHANGED
    
    | 
         @@ -1,6 +1,6 @@ 
     | 
|
| 
       1 
1 
     | 
    
         
             
            Gem::Specification.new do |s|
         
     | 
| 
       2 
2 
     | 
    
         
             
              s.name        = 'serp_scraper'
         
     | 
| 
       3 
     | 
    
         
            -
              s.version     = '1.0.0'
     | 
| 
      
 3 
     | 
    
         
            +
              s.version     = '1.0.4'
         
     | 
| 
       4 
4 
     | 
    
         
             
              s.date        = '2017-05-26'
         
     | 
| 
       5 
5 
     | 
    
         | 
| 
       6 
6 
     | 
    
         
             
              s.homepage    = 'https://github.com/kjellberg'
         
     | 
| 
         @@ -15,8 +15,8 @@ Gem::Specification.new do |s| 
     | 
|
| 
       15 
15 
     | 
    
         
             
              s.require_paths = ["lib"]
         
     | 
| 
       16 
16 
     | 
    
         
             
              s.files       = `git ls-files`.split($/)
         
     | 
| 
       17 
17 
     | 
    
         | 
| 
       18 
     | 
    
         
            -
              s.add_runtime_dependency 'mechanize', '~> 2.7', '>= 2.7.5'
     | 
| 
      
 18 
     | 
    
         
            +
              s.add_runtime_dependency 'mechanize', '~> 2.7.0'
         
     | 
| 
       19 
19 
     | 
    
         
             
              s.add_runtime_dependency 'addressable', '~> 2.5'
         
     | 
| 
       20 
     | 
    
         
            -
              s.add_runtime_dependency 'nokogiri', '~>  
     | 
| 
      
 20 
     | 
    
         
            +
              s.add_runtime_dependency 'nokogiri', '~> 1.6'
         
     | 
| 
       21 
21 
     | 
    
         
             
              s.add_runtime_dependency 'deathbycaptcha', '~> 5.0.0'
         
     | 
| 
       22 
22 
     | 
    
         
             
            end
         
     | 
    
        metadata
    CHANGED
    
    | 
         @@ -1,7 +1,7 @@ 
     | 
|
| 
       1 
1 
     | 
    
         
             
            --- !ruby/object:Gem::Specification
         
     | 
| 
       2 
2 
     | 
    
         
             
            name: serp_scraper
         
     | 
| 
       3 
3 
     | 
    
         
             
            version: !ruby/object:Gem::Version
         
     | 
| 
       4 
     | 
    
         
            -
              version: 1.0.0
     | 
| 
      
 4 
     | 
    
         
            +
              version: 1.0.4
         
     | 
| 
       5 
5 
     | 
    
         
             
            platform: ruby
         
     | 
| 
       6 
6 
     | 
    
         
             
            authors:
         
     | 
| 
       7 
7 
     | 
    
         
             
            - Rasmus Kjellberg
         
     | 
| 
         @@ -16,20 +16,14 @@ dependencies: 
     | 
|
| 
       16 
16 
     | 
    
         
             
                requirements:
         
     | 
| 
       17 
17 
     | 
    
         
             
                - - "~>"
         
     | 
| 
       18 
18 
     | 
    
         
             
                  - !ruby/object:Gem::Version
         
     | 
| 
       19 
     | 
    
         
            -
                    version:  
     | 
| 
       20 
     | 
    
         
            -
                - - ">="
         
     | 
| 
       21 
     | 
    
         
            -
                  - !ruby/object:Gem::Version
         
     | 
| 
       22 
     | 
    
         
            -
                    version: 2.7.5
         
     | 
| 
      
 19 
     | 
    
         
            +
                    version: 2.7.0
         
     | 
| 
       23 
20 
     | 
    
         
             
              type: :runtime
         
     | 
| 
       24 
21 
     | 
    
         
             
              prerelease: false
         
     | 
| 
       25 
22 
     | 
    
         
             
              version_requirements: !ruby/object:Gem::Requirement
         
     | 
| 
       26 
23 
     | 
    
         
             
                requirements:
         
     | 
| 
       27 
24 
     | 
    
         
             
                - - "~>"
         
     | 
| 
       28 
25 
     | 
    
         
             
                  - !ruby/object:Gem::Version
         
     | 
| 
       29 
     | 
    
         
            -
                    version:  
     | 
| 
       30 
     | 
    
         
            -
                - - ">="
         
     | 
| 
       31 
     | 
    
         
            -
                  - !ruby/object:Gem::Version
         
     | 
| 
       32 
     | 
    
         
            -
                    version: 2.7.5
         
     | 
| 
      
 26 
     | 
    
         
            +
                    version: 2.7.0
         
     | 
| 
       33 
27 
     | 
    
         
             
            - !ruby/object:Gem::Dependency
         
     | 
| 
       34 
28 
     | 
    
         
             
              name: addressable
         
     | 
| 
       35 
29 
     | 
    
         
             
              requirement: !ruby/object:Gem::Requirement
         
     | 
| 
         @@ -50,20 +44,14 @@ dependencies: 
     | 
|
| 
       50 
44 
     | 
    
         
             
                requirements:
         
     | 
| 
       51 
45 
     | 
    
         
             
                - - "~>"
         
     | 
| 
       52 
46 
     | 
    
         
             
                  - !ruby/object:Gem::Version
         
     | 
| 
       53 
     | 
    
         
            -
                    version: ' 
     | 
| 
       54 
     | 
    
         
            -
                - - ">="
         
     | 
| 
       55 
     | 
    
         
            -
                  - !ruby/object:Gem::Version
         
     | 
| 
       56 
     | 
    
         
            -
                    version: 2.9.4
         
     | 
| 
      
 47 
     | 
    
         
            +
                    version: '1.6'
         
     | 
| 
       57 
48 
     | 
    
         
             
              type: :runtime
         
     | 
| 
       58 
49 
     | 
    
         
             
              prerelease: false
         
     | 
| 
       59 
50 
     | 
    
         
             
              version_requirements: !ruby/object:Gem::Requirement
         
     | 
| 
       60 
51 
     | 
    
         
             
                requirements:
         
     | 
| 
       61 
52 
     | 
    
         
             
                - - "~>"
         
     | 
| 
       62 
53 
     | 
    
         
             
                  - !ruby/object:Gem::Version
         
     | 
| 
       63 
     | 
    
         
            -
                    version: ' 
     | 
| 
       64 
     | 
    
         
            -
                - - ">="
         
     | 
| 
       65 
     | 
    
         
            -
                  - !ruby/object:Gem::Version
         
     | 
| 
       66 
     | 
    
         
            -
                    version: 2.9.4
         
     | 
| 
      
 54 
     | 
    
         
            +
                    version: '1.6'
         
     | 
| 
       67 
55 
     | 
    
         
             
            - !ruby/object:Gem::Dependency
         
     | 
| 
       68 
56 
     | 
    
         
             
              name: deathbycaptcha
         
     | 
| 
       69 
57 
     | 
    
         
             
              requirement: !ruby/object:Gem::Requirement
         
     |