search_logger 0.0.1

Sign up to get free protection for your applications and to get access to all the features.
Files changed (35) hide show
  1. data/.rspec +1 -0
  2. data/.travis.yml +6 -0
  3. data/Gemfile +3 -0
  4. data/Gemfile.lock +36 -0
  5. data/Guardfile +9 -0
  6. data/README +0 -0
  7. data/Rakefile +1 -0
  8. data/bin/search_logger +12 -0
  9. data/lib/search_logger/csv_exporter.rb +20 -0
  10. data/lib/search_logger/exec.rb +131 -0
  11. data/lib/search_logger/google_parser/result.rb +60 -0
  12. data/lib/search_logger/google_parser.rb +59 -0
  13. data/lib/search_logger/persistence.rb +68 -0
  14. data/lib/search_logger/version.rb +3 -0
  15. data/lib/search_logger/xml_parser.rb +15 -0
  16. data/lib/search_logger.rb +11 -0
  17. data/schema.sql +15 -0
  18. data/search_logger.gemspec +26 -0
  19. data/spec/acceptance/google_parser_acceptance_spec.rb +93 -0
  20. data/spec/acceptance/mysql_to_csv_exportation_acceptance_spec.rb +39 -0
  21. data/spec/acceptance/persistence_acceptance_spec.rb +26 -0
  22. data/spec/acceptance/test_acceptance_spec.rb +61 -0
  23. data/spec/acceptance/xml_parser_acceptance_spec.rb +10 -0
  24. data/spec/spec_helper.rb +11 -0
  25. data/spec/support/file_repository/exported_from_persistence.csv +119 -0
  26. data/spec/support/file_repository/google_result.html +115 -0
  27. data/spec/support/file_repository/google_result_2.html +636 -0
  28. data/spec/support/file_repository/rankabove_test.xml +9 -0
  29. data/spec/support/file_repository/sample_mysql_data.rb +6 -0
  30. data/spec/unit/google_parser/google_parser_result_spec.rb +79 -0
  31. data/spec/unit/google_parser_spec.rb +69 -0
  32. data/spec/unit/persistence_spec.rb +86 -0
  33. data/spec/unit/shell_exec_spec.rb +28 -0
  34. data/spec/unit/xml_parser_spec.rb +22 -0
  35. metadata +152 -0
@@ -0,0 +1,61 @@
1
+ require "spec_helper"
2
+
3
+ describe "Test" do
4
+ def load_xml
5
+ xml_parser = SearchLogger::XmlParser.new('spec/support/file_repository/rankabove_test.xml')
6
+ xml_parser.parse
7
+ end
8
+
9
+ def search_google(query_string)
10
+ page_one = SearchLogger::GoogleParser.new.query(query_string).per_page(2).page(1).search
11
+ page_two = SearchLogger::GoogleParser.new.query(query_string).per_page(2).page(2).last_result(page_one).search
12
+ results = []
13
+ position = 1
14
+ (page_one + page_two).each do |e|
15
+ e.position.should == position
16
+ results << e.as_ary
17
+
18
+ position += 1
19
+ end
20
+ results
21
+ end
22
+
23
+ def save_into_mysql(google_results)
24
+ persistence = SearchLogger::Persistence.new
25
+ persistence.data(google_results).table('google_results').save
26
+ end
27
+
28
+ def mysql_data_equals_csv_exported?(mysql, csv)
29
+ correct_order = %w(keyword position url title description)
30
+ csv.each_with_index do |v, i|
31
+ if v == csv.first
32
+ v.join.should == correct_order.join
33
+ else
34
+ v.join.should == correct_order.map { |e| mysql[i-1][e.gsub(/(keyword)/, 'searched_\1').to_sym] }.join
35
+ end
36
+ end
37
+ end
38
+
39
+ def export_to_csv_file
40
+ csv_file = File.expand_path("../../support/file_repository/exported_from_persistence.csv", __FILE__)
41
+ data = DummyMysql.load_data
42
+
43
+ File.delete csv_file if File.exists? csv_file
44
+ CSVExporter.new.export data, to: csv_file
45
+ File.exists?(csv_file).should be_true
46
+
47
+ saved_data = CSV.parse File.read(csv_file)
48
+ mysql_data_equals_csv_exported?(data, saved_data)
49
+ end
50
+
51
+ it "load XML, search Google, save into MySQL and export CSV file" do
52
+ xml = load_xml
53
+ xml.should have(5).items
54
+ xml.each do |value|
55
+ google_results = search_google(value)
56
+ google_results.should be_kind_of Array
57
+ save_into_mysql(google_results)
58
+ end
59
+ export_to_csv_file
60
+ end
61
+ end
@@ -0,0 +1,10 @@
1
+ # encoding: utf-8
2
+ require "spec_helper"
3
+
4
+ describe "XML parser" do
5
+ subject { SearchLogger::XmlParser.new('spec/support/file_repository/rankabove_test.xml') }
6
+
7
+ it "loads a XML file and extracts its keywords into an array" do
8
+ subject.parse.should == ['seo software', 'ipad', 'muffuletta manhattanization', 'cheap motels', 'שפות תכנות']
9
+ end
10
+ end
@@ -0,0 +1,11 @@
1
+ require "rubygems"
2
+ require "bundler/setup"
3
+ require "nokogiri"
4
+
5
+ Dir["lib/**/*.rb"].each { |f| require "./"+f }
6
+ Dir["spec/support/**/*.rb"].each { |f| require "./"+f }
7
+
8
+ RSpec.configure do |config|
9
+ config.filter_run wip: true
10
+ config.run_all_when_everything_filtered = true
11
+ end
@@ -0,0 +1,119 @@
1
+ keyword,position,url,title,description
2
+ amazon,1,www.github.com,This is a title,First description.
3
+ amazon,2,www.github.com,This is the second title,Second description.
4
+ amazon,3,www.github.com,This is the third title,Third description.
5
+ seo software,1,http://www.traffictravis.com/,Free SEO Software | The Best PPC & SEO Management Tool -Traffic ...,""
6
+ seo software,2,http://www.ibusinesspromoter.com/seo-tools/top-10-seo-software,SEO software - Top 10 ranking guarantee - Search engine ...,""
7
+ seo software,3,http://www.seoscheduler.com/,SEO Software - Do Your Own Search Engine Optimization | SEO ...,""
8
+ seo software,4,http://www.link-assistant.com/,SEO Software and SEO Tools | Top 10 Rank Guarantee | SEO ...,""
9
+ ipad,1,http://www.apple.com/ipad/,Apple - iPad 2 - Now with iOS 5 and iCloud.,""
10
+ ipad,2,http://store.apple.com/us/browse/home/shop_ipad/family/ipad,Buy iPad 2 Now,""
11
+ ipad,3,"","",""
12
+ ipad,4,http://en.wikipedia.org/wiki/IPad,"iPad - Wikipedia, the free encyclopedia",""
13
+ ipad,5,/search?q=ipad&num=2&hl=en&ie=UTF-8&prmd=ivnsr&source=univ&tbm=nws&tbo=u&sa=X&ei=KMMxT4zJCsyisQKgq52UBw&ved=0CEkQqAI,News for ipad,""
14
+ ipad,6,http://www.cnet.com/apple-ipad/,"Apple iPad tablet: reviews, news, photos, and videos - CNET.com",""
15
+ ipad,7,http://gizmodo.com/5458382/8-things-that-suck-about-the-ipad,8 Things That Suck About the iPad,""
16
+ muffuletta manhattanization,1,http://stackoverflow.com/questions/7332107/ruby-doesnt-treat-hebrew-letters-well,xml - Ruby doesn't treat hebrew letters well - Stack Overflow,""
17
+ muffuletta manhattanization,2,http://rubyonrails.resourcezen.com/ruby-doesn-t-treat-hebrew-letters-well,Ruby doesn't treat hebrew letters well | Ruby on Rails,""
18
+ muffuletta manhattanization,3,http://stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Stack Overflow,""
19
+ muffuletta manhattanization,4,https://facebook.stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Facebook Stack Overflow,""
20
+ cheap motels,1,http://www.motels.com/,Discount Hotels Motels - Cheap Rooms Online - your key to happy ...,""
21
+ cheap motels,2,http://www.motelplanet.com/,"Motels Cheap - Discount Motel Rates, Reservation & Guides",""
22
+ cheap motels,3,http://www.travelocity.com/Hotels,"Hotels, Motels and Inns - Find Cheap Hotels | Travelocity",""
23
+ cheap motels,4,http://www.motel6.com/,Motel 6 - Find Discount Motels Nationwide & Book Motel Reservations,""
24
+ שפות תכנות,1,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפת תכנות – ויקיפדיה‎,""
25
+ שפות תכנות,2,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%95%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות – ויקיפדיה‎,""
26
+ שפות תכנות,3,http://www.underwar.co.il/tag/%D7%A9%D7%A4%D7%95%D7%AA-%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות‎,""
27
+ שפות תכנות,4,http://www.tapuz.co.il/Forums2008/ForumPage.aspx?ForumId=89,פורום שפות תכנות - תפוז פורומים‎,""
28
+ seo software,1,http://www.traffictravis.com/,Free SEO Software | The Best PPC & SEO Management Tool -Traffic ...,""
29
+ seo software,2,http://www.ibusinesspromoter.com/seo-tools/top-10-seo-software,SEO software - Top 10 ranking guarantee - Search engine ...,""
30
+ seo software,3,http://www.seoscheduler.com/,SEO Software - Do Your Own Search Engine Optimization | SEO ...,""
31
+ seo software,4,http://www.link-assistant.com/,SEO Software and SEO Tools | Top 10 Rank Guarantee | SEO ...,""
32
+ ipad,1,http://www.apple.com/ipad/,Apple - iPad 2 - Now with iOS 5 and iCloud.,""
33
+ ipad,2,http://store.apple.com/us/browse/home/shop_ipad/family/ipad,Buy iPad 2 Now,""
34
+ ipad,3,"","",""
35
+ ipad,4,http://en.wikipedia.org/wiki/IPad,"iPad - Wikipedia, the free encyclopedia",""
36
+ ipad,5,/search?q=ipad&num=2&hl=en&ie=UTF-8&prmd=ivnsr&source=univ&tbm=nws&tbo=u&sa=X&ei=UcMxT5_OPKWlsQL8iKiZBw&ved=0CEkQqAI,News for ipad,""
37
+ ipad,6,http://www.cnet.com/apple-ipad/,"Apple iPad tablet: reviews, news, photos, and videos - CNET.com",""
38
+ ipad,7,http://gizmodo.com/5458382/8-things-that-suck-about-the-ipad,8 Things That Suck About the iPad,""
39
+ muffuletta manhattanization,1,http://stackoverflow.com/questions/7332107/ruby-doesnt-treat-hebrew-letters-well,xml - Ruby doesn't treat hebrew letters well - Stack Overflow,""
40
+ muffuletta manhattanization,2,http://rubyonrails.resourcezen.com/ruby-doesn-t-treat-hebrew-letters-well,Ruby doesn't treat hebrew letters well | Ruby on Rails,""
41
+ muffuletta manhattanization,3,http://stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Stack Overflow,""
42
+ muffuletta manhattanization,4,https://facebook.stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Facebook Stack Overflow,""
43
+ cheap motels,1,http://www.motels.com/,Discount Hotels Motels - Cheap Rooms Online - your key to happy ...,""
44
+ cheap motels,2,http://www.motelplanet.com/,"Motels Cheap - Discount Motel Rates, Reservation & Guides",""
45
+ cheap motels,3,http://www.travelocity.com/Hotels,"Hotels, Motels and Inns - Find Cheap Hotels | Travelocity",""
46
+ cheap motels,4,http://www.motel6.com/,Motel 6 - Find Discount Motels Nationwide & Book Motel Reservations,""
47
+ שפות תכנות,1,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפת תכנות – ויקיפדיה‎,""
48
+ שפות תכנות,2,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%95%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות – ויקיפדיה‎,""
49
+ שפות תכנות,3,http://www.underwar.co.il/tag/%D7%A9%D7%A4%D7%95%D7%AA-%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות‎,""
50
+ שפות תכנות,4,http://www.tapuz.co.il/Forums2008/ForumPage.aspx?ForumId=89,פורום שפות תכנות - תפוז פורומים‎,""
51
+ seo software,1,http://www.traffictravis.com/,Free SEO Software | The Best PPC & SEO Management Tool -Traffic ...,""
52
+ seo software,2,http://www.ibusinesspromoter.com/seo-tools/top-10-seo-software,SEO software - Top 10 ranking guarantee - Search engine ...,""
53
+ seo software,3,http://www.seoscheduler.com/,SEO Software - Do Your Own Search Engine Optimization | SEO ...,""
54
+ seo software,4,http://www.link-assistant.com/,SEO Software and SEO Tools | Top 10 Rank Guarantee | SEO ...,""
55
+ ipad,1,http://www.apple.com/ipad/,Apple - iPad 2 - Now with iOS 5 and iCloud.,""
56
+ ipad,2,http://store.apple.com/us/browse/home/shop_ipad/family/ipad,Buy iPad 2 Now,""
57
+ ipad,3,"","",""
58
+ ipad,4,http://en.wikipedia.org/wiki/IPad,"iPad - Wikipedia, the free encyclopedia",""
59
+ ipad,5,/search?q=ipad&num=2&hl=en&ie=UTF-8&prmd=ivnsr&source=univ&tbm=nws&tbo=u&sa=X&ei=esMxT7CRM6aksQLn49HeBg&ved=0CEkQqAI,News for ipad,""
60
+ ipad,6,http://www.cnet.com/apple-ipad/,"Apple iPad tablet: reviews, news, photos, and videos - CNET.com",""
61
+ ipad,7,http://gizmodo.com/5458382/8-things-that-suck-about-the-ipad,8 Things That Suck About the iPad,""
62
+ muffuletta manhattanization,1,http://stackoverflow.com/questions/7332107/ruby-doesnt-treat-hebrew-letters-well,xml - Ruby doesn't treat hebrew letters well - Stack Overflow,""
63
+ muffuletta manhattanization,2,http://rubyonrails.resourcezen.com/ruby-doesn-t-treat-hebrew-letters-well,Ruby doesn't treat hebrew letters well | Ruby on Rails,""
64
+ muffuletta manhattanization,3,http://stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Stack Overflow,""
65
+ muffuletta manhattanization,4,https://facebook.stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Facebook Stack Overflow,""
66
+ cheap motels,1,http://www.motels.com/,Discount Hotels Motels - Cheap Rooms Online - your key to happy ...,""
67
+ cheap motels,2,http://www.motelplanet.com/,"Motels Cheap - Discount Motel Rates, Reservation & Guides",""
68
+ cheap motels,3,http://www.travelocity.com/Hotels,"Hotels, Motels and Inns - Find Cheap Hotels | Travelocity",""
69
+ cheap motels,4,http://www.motel6.com/,Motel 6 - Find Discount Motels Nationwide & Book Motel Reservations,""
70
+ שפות תכנות,1,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפת תכנות – ויקיפדיה‎,""
71
+ שפות תכנות,2,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%95%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות – ויקיפדיה‎,""
72
+ שפות תכנות,3,http://www.underwar.co.il/tag/%D7%A9%D7%A4%D7%95%D7%AA-%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות‎,""
73
+ שפות תכנות,4,http://www.tapuz.co.il/Forums2008/ForumPage.aspx?ForumId=89,פורום שפות תכנות - תפוז פורומים‎,""
74
+ seo software,1,http://www.traffictravis.com/,Free SEO Software | The Best PPC & SEO Management Tool -Traffic ...,""
75
+ seo software,2,http://www.ibusinesspromoter.com/seo-tools/top-10-seo-software,SEO software - Top 10 ranking guarantee - Search engine ...,""
76
+ seo software,3,http://www.seoscheduler.com/,SEO Software - Do Your Own Search Engine Optimization | SEO ...,""
77
+ seo software,4,http://www.link-assistant.com/,SEO Software and SEO Tools | Top 10 Rank Guarantee | SEO ...,""
78
+ ipad,1,http://www.apple.com/ipad/,Apple - iPad 2 - Now with iOS 5 and iCloud.,""
79
+ ipad,2,http://store.apple.com/us/browse/home/shop_ipad/family/ipad,Buy iPad 2 Now,""
80
+ ipad,3,"","",""
81
+ ipad,4,http://en.wikipedia.org/wiki/IPad,"iPad - Wikipedia, the free encyclopedia",""
82
+ ipad,5,/search?q=ipad&num=2&hl=en&ie=UTF-8&prmd=ivnsr&source=univ&tbm=nws&tbo=u&sa=X&ei=4sMxT4vGGOXjsQLUtriXBw&ved=0CEkQqAI,News for ipad,""
83
+ ipad,6,http://www.cnet.com/apple-ipad/,"Apple iPad tablet: reviews, news, photos, and videos - CNET.com",""
84
+ ipad,7,http://gizmodo.com/5458382/8-things-that-suck-about-the-ipad,8 Things That Suck About the iPad,""
85
+ muffuletta manhattanization,1,http://stackoverflow.com/questions/7332107/ruby-doesnt-treat-hebrew-letters-well,xml - Ruby doesn't treat hebrew letters well - Stack Overflow,""
86
+ muffuletta manhattanization,2,http://rubyonrails.resourcezen.com/ruby-doesn-t-treat-hebrew-letters-well,Ruby doesn't treat hebrew letters well | Ruby on Rails,""
87
+ muffuletta manhattanization,3,http://stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Stack Overflow,""
88
+ muffuletta manhattanization,4,https://facebook.stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Facebook Stack Overflow,""
89
+ cheap motels,1,http://www.motels.com/,Discount Hotels Motels - Cheap Rooms Online - your key to happy ...,""
90
+ cheap motels,2,http://www.motelplanet.com/,"Motels Cheap - Discount Motel Rates, Reservation & Guides",""
91
+ cheap motels,3,http://www.travelocity.com/Hotels,"Hotels, Motels and Inns - Find Cheap Hotels | Travelocity",""
92
+ cheap motels,4,http://www.motel6.com/,Motel 6 - Find Discount Motels Nationwide & Book Motel Reservations,""
93
+ שפות תכנות,1,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפת תכנות – ויקיפדיה‎,""
94
+ שפות תכנות,2,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%95%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות – ויקיפדיה‎,""
95
+ שפות תכנות,3,http://www.underwar.co.il/tag/%D7%A9%D7%A4%D7%95%D7%AA-%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות‎,""
96
+ שפות תכנות,4,http://www.tapuz.co.il/Forums2008/ForumPage.aspx?ForumId=89,פורום שפות תכנות - תפוז פורומים‎,""
97
+ seo software,1,http://www.traffictravis.com/,Free SEO Software | The Best PPC & SEO Management Tool -Traffic ...,""
98
+ seo software,2,http://www.ibusinesspromoter.com/seo-tools/top-10-seo-software,SEO software - Top 10 ranking guarantee - Search engine ...,""
99
+ seo software,3,http://www.seoscheduler.com/,SEO Software - Do Your Own Search Engine Optimization | SEO ...,""
100
+ seo software,4,http://www.link-assistant.com/,SEO Software and SEO Tools | Top 10 Rank Guarantee | SEO ...,""
101
+ ipad,1,http://www.apple.com/ipad/,Apple - iPad 2 - Now with iOS 5 and iCloud.,""
102
+ ipad,2,http://store.apple.com/us/browse/home/shop_ipad/family/ipad,Buy iPad 2 Now,""
103
+ ipad,3,"","",""
104
+ ipad,4,http://en.wikipedia.org/wiki/IPad,"iPad - Wikipedia, the free encyclopedia",""
105
+ ipad,5,/search?q=ipad&num=2&hl=en&ie=UTF-8&prmd=ivnsr&source=univ&tbm=nws&tbo=u&sa=X&ei=8ckxT-62LuOesQLo7_mhBw&ved=0CEkQqAI,News for ipad,""
106
+ ipad,6,http://www.cnet.com/apple-ipad/,"Apple iPad tablet: reviews, news, photos, and videos - CNET.com",""
107
+ ipad,7,http://gizmodo.com/5458382/8-things-that-suck-about-the-ipad,8 Things That Suck About the iPad,""
108
+ muffuletta manhattanization,1,http://stackoverflow.com/questions/7332107/ruby-doesnt-treat-hebrew-letters-well,xml - Ruby doesn't treat hebrew letters well - Stack Overflow,""
109
+ muffuletta manhattanization,2,http://rubyonrails.resourcezen.com/ruby-doesn-t-treat-hebrew-letters-well,Ruby doesn't treat hebrew letters well | Ruby on Rails,""
110
+ muffuletta manhattanization,3,http://stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Stack Overflow,""
111
+ muffuletta manhattanization,4,https://facebook.stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Facebook Stack Overflow,""
112
+ cheap motels,1,http://www.motels.com/,Discount Hotels Motels - Cheap Rooms Online - your key to happy ...,""
113
+ cheap motels,2,http://www.motelplanet.com/,"Motels Cheap - Discount Motel Rates, Reservation & Guides",""
114
+ cheap motels,3,http://www.travelocity.com/Hotels,"Hotels, Motels and Inns - Find Cheap Hotels | Travelocity",""
115
+ cheap motels,4,http://www.motel6.com/,Motel 6 - Find Discount Motels Nationwide & Book Motel Reservations,""
116
+ שפות תכנות,1,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפת תכנות – ויקיפדיה‎,""
117
+ שפות תכנות,2,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%95%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות – ויקיפדיה‎,""
118
+ שפות תכנות,3,http://www.underwar.co.il/tag/%D7%A9%D7%A4%D7%95%D7%AA-%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות‎,""
119
+ שפות תכנות,4,http://www.tapuz.co.il/Forums2008/ForumPage.aspx?ForumId=89,פורום שפות תכנות - תפוז פורומים‎,""