RubyGems - esearchy - Versions diffs - 0.2.1 → 0.2.2 - Mend

esearchy 0.2.1 → 0.2.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13) hide show

data/bin/esearchy +6 -7
data/lib/esearchy/OtherEngines/amazonwishlist.rb +18 -0
data/lib/esearchy/SocialEngines/classmates.rb +1 -0
data/lib/esearchy/SocialEngines/googleprofiles.rb +1 -0
data/lib/esearchy/SocialEngines/jigsaw.rb +1 -0
data/lib/esearchy/SocialEngines/linkedin.rb +2 -1
data/lib/esearchy/SocialEngines/naymz.rb +1 -0
data/lib/esearchy/SocialEngines/plaxo.rb +1 -0
data/lib/esearchy/SocialEngines/spoke.rb +1 -0
data/lib/esearchy/SocialEngines/ziggs.rb +1 -0
data/lib/esearchy/compare.rb +18 -0
data/lib/esearchy/genericengine.rb +3 -3
metadata +10 -8

data/bin/esearchy CHANGED Viewed

@@ -192,7 +192,7 @@ class Output
   private
   def save_csv(data) # Writes a header line plus one comma-joined line per element of data to the path held in @output.
     out = File.new(@output, "w") # NOTE(review): the handle is never explicitly closed within this method
-    out << "EMAILS/PERSON, TYPE, SITE, CLASS, MATCH\n"
+    out << "ENTITY, TYPE, SITE, CLASS, MATCH\n"
     data.each { |r| out << "#{r[0].to_s},#{r[1]},#{r[2]},#{r[3]}\n"} # NOTE(review): header names five columns but only r[0]..r[3] are written (no MATCH value); fields are interpolated without CSV quoting
   end
@@ -203,7 +203,7 @@ class Output
     Prawn::Document.generate(@output) do
       table data,
         :position => :center,
-        :headers => ["Email/Person", "Type", "Site", "Class", "Match"],
+        :headers => ["Entity", "Type", "Site", "Class", "Match"],
         :header_color => "0046f9",
         :row_colors => :pdf_writer, #["ffffff","ffff00"],
         :font_size => 10,
@@ -221,14 +221,14 @@ class Output
     @db = SQLite3::Database.new(@output)
     @db.execute("CREATE TABLE IF NOT EXISTS results (
       id integer primary key asc,
-      object text,
+      entity text,
       type char,
       site text,
       class text,
       match char);")
     data.each do |r|
-      @db.execute("INSERT INTO results (object,type,site,class,match)
+      @db.execute("INSERT INTO results (entity,type,site,class,match)
                    VALUES (\"#{r[0].to_s}\",\"#{r[1]}\",\"#{r[2]}\",\"#{r[3]}\",\"#{r[4]}\");")
     end
     #@db.commit
@@ -380,8 +380,8 @@ opts.each do |opt, arg|
       #END OF HELP
       exit(0)
     when '--enable-all' then
-      @people_engines = [:LinkedIn, :Naymz, :Classmates, :GoogleProfiles,
-                         :Spoke, :JigSaw, :Ziggs, :Plaxo]
+      @people_engines = [:LinkedIn, :Naymz,  :Classmates, :GoogleProfiles,
+                         :Spoke,    :JigSaw, :Ziggs,      :Plaxo]
       @email_engines = [:Google, :Bing, :Yahoo, :Altavista, :PGP, :Spider ,:Usenet, :GoogleGroups ]
     when '--enable-people' then
       @people_engines = [:LinkedIn, :Naymz, :Classmates, :GoogleProfiles,
@@ -504,7 +504,6 @@ puts "- if you want to use GoogleProfiles, LinkedIn, Classmates or Naymz,"
 puts "  you will need to use the --company (-c) <company_name> option"
 puts "- If you want to spider a website you need to use the --website (-w) <URL> option"
 unless File.exist?(ENV['HOME'] + "/.esearchyrc")
   configure(@params[:maxhits],@yahoo_key,@bing_key)
 else

data/lib/esearchy/OtherEngines/amazonwishlist.rb ADDED Viewed

@@ -0,0 +1,18 @@
+module ESearchy
+  module OtherEngines
+    class AmazonWishList < ESearchy::GenericEngine # Stub engine: search and parse are defined with empty bodies, so both return nil.
+      ENGINE = "" # Placeholder; per the original note, none of these constants are really needed here.
+      PORT  = 0 # presumably a placeholder as well (see note on ENGINE)
+      NUM = 0 # presumably a placeholder as well (see note on ENGINE)
+      TYPE = 1 # NOTE(review): the meaning of the value 1 is not visible here -- confirm against GenericEngine
+      def search # empty body: does nothing and returns nil
+      end
+      def parse( html ) # empty body: html is accepted but not used
+      end
+    end
+  end
+end

data/lib/esearchy/SocialEngines/classmates.rb CHANGED Viewed

@@ -24,6 +24,7 @@ module ESearchy
       def crawl_people(html)
         html.scan(/<a href="([0-9A-Za-z:\\\/?&=@+%.;"'()_-]+)" class=l[\sonmousedown="return clk(this.href,'','','res','\d','')"]*>([\w\s]*) \|/).each do |profile|
           pf = profile[0].to_s
+          pf = pf.scan(/\/url\?q=([0-9A-Za-z:\\\/?=@+%.;"'()_-]+)&amp/).to_s if pf.match(/\/url\?q=/)
           p = profile[1].split(" ")
           @people << [ p, pf ]
           @results << [p, "P", pf,  self.class.to_s.upcase, "N"]

data/lib/esearchy/SocialEngines/googleprofiles.rb CHANGED Viewed

@@ -27,6 +27,7 @@ module ESearchy
       def crawl_people(text)
         text.scan(/<a href="([0-9A-Za-z:\\\/?&=@+%.;"'()_-]+)" class=l[\sonmousedown="return clk(this.href,'','','res','\d','')"]*>([\w\s]*) -/).each do |profile|
           pf = profile[0].to_s
+          pf = pf.scan(/\/url\?q=([0-9A-Za-z:\\\/?=@+%.;"'()_-]+)&amp/).to_s if pf.match(/\/url\?q=/)
           p = profile[1].split(" ")
           @people << [ p, pf ]
           @results << [p, "P",profile, self.class.to_s.upcase, "N"]

data/lib/esearchy/SocialEngines/jigsaw.rb CHANGED Viewed

@@ -27,6 +27,7 @@ module ESearchy
       def crawl_people(text)
         text.scan(/<a href="(http\:\/\/www.jigsaw.com\/scid[0-9A-Za-z\/?&=@+%.;'_-]+\.xhtml)" class=l[\sonmousedown="return clk(this.href,'','','res','\d','')"]*>([\w\s]*),/).each do |profile|
           pf = profile[0].to_s
+          pf = pf.scan(/\/url\?q=([0-9A-Za-z:\\\/?=@+%.;"'()_-]+)&amp/).to_s if pf.match(/\/url\?q=/)
           p = profile[1].split(" ")
           @people << [ p, pf ]
           @results << [p, "P", pf, self.class.to_s.upcase, "N"]

data/lib/esearchy/SocialEngines/linkedin.rb CHANGED Viewed

@@ -7,7 +7,7 @@ module ESearchy
       TYPE = 2
       def search
-        @querypath = "/cse?q=site%3Awww.linkedin.com/in+%22at+" +
+        @querypath = "/cse?q=site%3Awww.linkedin.com/pub+in+%22at+" +
                      CGI.escape(@company) + "%22&hl=en&cof=&num=100&filter=0&safe=off&start=" or
                      raise ESearchyMissingCompany, "Mssing website url Object.company=(value)"
         super
@@ -26,6 +26,7 @@ module ESearchy
       def crawl_people(text)
         text.scan(/<a href="([0-9A-Za-z:\\\/?&=@+%.;"'()_-]+)" class=l[\sonmousedown="return clk(this.href,'','','res','\d','')"]*>([\w\s]*) -/).each do |profile|
           pf = profile[0].to_s
+          pf = pf.scan(/\/url\?q=([0-9A-Za-z:\\\/?=@+%.;"'()_-]+)&amp/).to_s if pf.match(/\/url\?q=/)
           p = profile[1].split(" ")
           @people << [ p, pf ]
           @results << [p, "P", pf, self.class.to_s.upcase, "N"]

data/lib/esearchy/SocialEngines/naymz.rb CHANGED Viewed

@@ -25,6 +25,7 @@ module ESearchy
       def crawl_people(html)
         html.scan(/<a href="([0-9A-Za-z:\\\/?&=@+%.;"'()_-]+)" class=l[\sonmousedown="return clk(this.href,'','','res','\d','')"]*>([\w\s]*) -/).each do |profile|
           pf = profile[0].to_s
+          pf = pf.scan(/\/url\?q=([0-9A-Za-z:\\\/?=@+%.;"'()_-]+)&amp/).to_s if pf.match(/\/url\?q=/)
           p = profile[1].split(" ").delete_if do
             |x| x =~ /mr.|mr|ms.|ms|phd.|dr.|dr|phd|phd./i
           end

data/lib/esearchy/SocialEngines/plaxo.rb CHANGED Viewed

@@ -27,6 +27,7 @@ module ESearchy
       def crawl_people(text)
         text.scan(/<a href="([0-9A-Za-z:\\\/?&=@+%.;"'()_-]+)" class=l[\sonmousedown="return clk(this.href,'','','res','\d','')"]*>([\w\s]*)&#39;/).each do |profile|
           pf = profile[0].to_s
+          pf = pf.scan(/\/url\?q=([0-9A-Za-z:\\\/?=@+%.;"'()_-]+)&amp/).to_s if pf.match(/\/url\?q=/)
           p = profile[1].split(" ")
           @people << [ p, pf ]
           @results << [p, "P", pf, self.class.to_s.upcase, "N"]

data/lib/esearchy/SocialEngines/spoke.rb CHANGED Viewed

@@ -26,6 +26,7 @@ module ESearchy
       def crawl_people(text)
         text.scan(/<a href="([0-9A-Za-z:\\\/?&=@+%.;"'()_-]+)" class=l[\sonmousedown="return clk(this.href,'','','res','\d','')"]*>([\w\s]*),/).each do |profile|
           pf = profile[0].to_s
+          pf = pf.scan(/\/url\?q=([0-9A-Za-z:\\\/?=@+%.;"'()_-]+)&amp/).to_s if pf.match(/\/url\?q=/)
           p = profile[1].split(" ")
           @people << [ p, pf ]
           @results << [p, "P", pf, self.class.to_s.upcase, "N"]

data/lib/esearchy/SocialEngines/ziggs.rb CHANGED Viewed

@@ -27,6 +27,7 @@ module ESearchy
       def crawl_people(text)
         text.scan(/<a href="([0-9A-Za-z:\\\/?&=@+%.;"'()_-]+)" class=l[\sonmousedown="return clk(this.href,'','','res','\d','')"]*>([\w\s]*) -/).each do |profile|
           pf = profile[0].to_s
+          pf = pf.scan(/\/url\?q=([0-9A-Za-z:\\\/?=@+%.;"'()_-]+)&amp/).to_s if pf.match(/\/url\?q=/)
           p = profile[1].split(" ")
           @people << [ p, pf ]
           @results << [p, "P", pf, self.class.to_s.upcase, "N"]

data/lib/esearchy/compare.rb ADDED Viewed

@@ -0,0 +1,18 @@
+#module ESearchy
+#  class Compare
+#    def distance(s1,s2)
+#      return 100 if s1.strip.downcase == s2.strip.downcase
+#      b_s1 = s1.unpack("B*")[0]
+#      b_s2 = s2.unpack("B*")[0]
+#      b_s1.size > b_s2.size ? (b1 = b_s1; b2 = b_s2;) : (b1 = b_s2; b2 = b_s1;)
+#      p b1
+#      p b2
+#      dist = 100
+#      dist -= b1.size - b2.size
+#      b1[0,b2.size].each_with_index do |chr,idx|
+#        dist -= 1 if chr != b2[idx]
+#      end
+#      return dist
+#    end
+#  end
+#end

data/lib/esearchy/genericengine.rb CHANGED Viewed

@@ -54,8 +54,8 @@ module ESearchy
             block.call(response)
           when Net::HTTPRedirection
             get(URI.parse(response['location']).host,
-                URI.parse(response['location']).port,
-                querystring, headers, limit - 1, block)
+                URI.parse(response['location']).port.to_i,
+                querystring, headers, limit - 1, &block)
           else
             return response.error!
           end
@@ -65,7 +65,7 @@ module ESearchy
       rescue Net::HTTPServerException
         D "Error: Something went wrong with the HTTP request"
       rescue
-        D "Error: Something went wrong :("
+        D "Error: Something went wrong :( + #{$!}"
       end
     end

metadata CHANGED Viewed

@@ -1,13 +1,13 @@
 --- !ruby/object:Gem::Specification
 name: esearchy
 version: !ruby/object:Gem::Version
-  hash: 21
+  hash: 19
   prerelease: false
   segments:
   - 0
   - 2
-  - 1
-  version: 0.2.1
+  - 2
+  version: 0.2.2
 platform: ruby
 authors:
 - Matias P. Brutti
@@ -15,7 +15,7 @@ autorequire:
 bindir: bin
 cert_chain: []
-date: 2010-06-19 00:00:00 -03:00
+date: 2011-04-06 00:00:00 -07:00
 default_executable:
 dependencies:
 - !ruby/object:Gem::Dependency
@@ -51,19 +51,19 @@ dependencies:
   type: :runtime
   version_requirements: *id002
 - !ruby/object:Gem::Dependency
-  name: FreedomCoder-rubyzip
+  name: rubyzip
   prerelease: false
   requirement: &id003 !ruby/object:Gem::Requirement
     none: false
     requirements:
     - - ">="
       - !ruby/object:Gem::Version
-        hash: 61
+        hash: 51
         segments:
         - 0
         - 9
-        - 3
-        version: 0.9.3
+        - 4
+        version: 0.9.4
   type: :runtime
   version_requirements: *id003
 - !ruby/object:Gem::Dependency
@@ -108,11 +108,13 @@ extra_rdoc_files:
 - README.rdoc
 files:
 - lib/esearchy/bugmenot.rb
+- lib/esearchy/compare.rb
 - lib/esearchy/docs.rb
 - lib/esearchy/esearchy.rb
 - lib/esearchy/genericengine.rb
 - lib/esearchy/LocalEngines/directory.rb
 - lib/esearchy/localengines.rb
+- lib/esearchy/OtherEngines/amazonwishlist.rb
 - lib/esearchy/OtherEngines/googlegroups.rb
 - lib/esearchy/OtherEngines/ldap.rb
 - lib/esearchy/OtherEngines/pgp.rb