search_logger 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (35) hide show
  1. data/.rspec +1 -0
  2. data/.travis.yml +6 -0
  3. data/Gemfile +3 -0
  4. data/Gemfile.lock +36 -0
  5. data/Guardfile +9 -0
  6. data/README +0 -0
  7. data/Rakefile +1 -0
  8. data/bin/search_logger +12 -0
  9. data/lib/search_logger/csv_exporter.rb +20 -0
  10. data/lib/search_logger/exec.rb +131 -0
  11. data/lib/search_logger/google_parser/result.rb +60 -0
  12. data/lib/search_logger/google_parser.rb +59 -0
  13. data/lib/search_logger/persistence.rb +68 -0
  14. data/lib/search_logger/version.rb +3 -0
  15. data/lib/search_logger/xml_parser.rb +15 -0
  16. data/lib/search_logger.rb +11 -0
  17. data/schema.sql +15 -0
  18. data/search_logger.gemspec +26 -0
  19. data/spec/acceptance/google_parser_acceptance_spec.rb +93 -0
  20. data/spec/acceptance/mysql_to_csv_exportation_acceptance_spec.rb +39 -0
  21. data/spec/acceptance/persistence_acceptance_spec.rb +26 -0
  22. data/spec/acceptance/test_acceptance_spec.rb +61 -0
  23. data/spec/acceptance/xml_parser_acceptance_spec.rb +10 -0
  24. data/spec/spec_helper.rb +11 -0
  25. data/spec/support/file_repository/exported_from_persistence.csv +119 -0
  26. data/spec/support/file_repository/google_result.html +115 -0
  27. data/spec/support/file_repository/google_result_2.html +636 -0
  28. data/spec/support/file_repository/rankabove_test.xml +9 -0
  29. data/spec/support/file_repository/sample_mysql_data.rb +6 -0
  30. data/spec/unit/google_parser/google_parser_result_spec.rb +79 -0
  31. data/spec/unit/google_parser_spec.rb +69 -0
  32. data/spec/unit/persistence_spec.rb +86 -0
  33. data/spec/unit/shell_exec_spec.rb +28 -0
  34. data/spec/unit/xml_parser_spec.rb +22 -0
  35. metadata +152 -0
@@ -0,0 +1,61 @@
1
+ require "spec_helper"
2
+
3
+ describe "Test" do
4
+ def load_xml
5
+ xml_parser = SearchLogger::XmlParser.new('spec/support/file_repository/rankabove_test.xml')
6
+ xml_parser.parse
7
+ end
8
+
9
+ def search_google(query_string)
10
+ page_one = SearchLogger::GoogleParser.new.query(query_string).per_page(2).page(1).search
11
+ page_two = SearchLogger::GoogleParser.new.query(query_string).per_page(2).page(2).last_result(page_one).search
12
+ results = []
13
+ position = 1
14
+ (page_one + page_two).each do |e|
15
+ e.position.should == position
16
+ results << e.as_ary
17
+
18
+ position += 1
19
+ end
20
+ results
21
+ end
22
+
23
+ def save_into_mysql(google_results)
24
+ persistence = SearchLogger::Persistence.new
25
+ persistence.data(google_results).table('google_results').save
26
+ end
27
+
28
+ def mysql_data_equals_csv_exported?(mysql, csv)
29
+ correct_order = %w(keyword position url title description)
30
+ csv.each_with_index do |v, i|
31
+ if v == csv.first
32
+ v.join.should == correct_order.join
33
+ else
34
+ v.join.should == correct_order.map { |e| mysql[i-1][e.gsub(/(keyword)/, 'searched_\1').to_sym] }.join
35
+ end
36
+ end
37
+ end
38
+
39
+ def export_to_csv_file
40
+ csv_file = File.expand_path("../../support/file_repository/exported_from_persistence.csv", __FILE__)
41
+ data = DummyMysql.load_data
42
+
43
+ File.delete csv_file if File.exists? csv_file
44
+ CSVExporter.new.export data, to: csv_file
45
+ File.exists?(csv_file).should be_true
46
+
47
+ saved_data = CSV.parse File.read(csv_file)
48
+ mysql_data_equals_csv_exported?(data, saved_data)
49
+ end
50
+
51
+ it "load XML, search Google, save into MySQL and export CSV file" do
52
+ xml = load_xml
53
+ xml.should have(5).items
54
+ xml.each do |value|
55
+ google_results = search_google(value)
56
+ google_results.should be_kind_of Array
57
+ save_into_mysql(google_results)
58
+ end
59
+ export_to_csv_file
60
+ end
61
+ end
@@ -0,0 +1,10 @@
1
+ # encoding: utf-8
2
+ require "spec_helper"
3
+
4
+ describe "XML parser" do
5
+ subject { SearchLogger::XmlParser.new('spec/support/file_repository/rankabove_test.xml') }
6
+
7
+ it "loads a XML file and extracts its keywords into an array" do
8
+ subject.parse.should == ['seo software', 'ipad', 'muffuletta manhattanization', 'cheap motels', 'שפות תכנות']
9
+ end
10
+ end
@@ -0,0 +1,11 @@
1
+ require "rubygems"
2
+ require "bundler/setup"
3
+ require "nokogiri"
4
+
5
+ Dir["lib/**/*.rb"].each { |f| require "./"+f }
6
+ Dir["spec/support/**/*.rb"].each { |f| require "./"+f }
7
+
8
+ RSpec.configure do |config|
9
+ config.filter_run wip: true
10
+ config.run_all_when_everything_filtered = true
11
+ end
@@ -0,0 +1,119 @@
1
+ keyword,position,url,title,description
2
+ amazon,1,www.github.com,This is a title,First description.
3
+ amazon,2,www.github.com,This is the second title,Second description.
4
+ amazon,3,www.github.com,This is the third title,Third description.
5
+ seo software,1,http://www.traffictravis.com/,Free SEO Software | The Best PPC & SEO Management Tool -Traffic ...,""
6
+ seo software,2,http://www.ibusinesspromoter.com/seo-tools/top-10-seo-software,SEO software - Top 10 ranking guarantee - Search engine ...,""
7
+ seo software,3,http://www.seoscheduler.com/,SEO Software - Do Your Own Search Engine Optimization | SEO ...,""
8
+ seo software,4,http://www.link-assistant.com/,SEO Software and SEO Tools | Top 10 Rank Guarantee | SEO ...,""
9
+ ipad,1,http://www.apple.com/ipad/,Apple - iPad 2 - Now with iOS 5 and iCloud.,""
10
+ ipad,2,http://store.apple.com/us/browse/home/shop_ipad/family/ipad,Buy iPad 2 Now,""
11
+ ipad,3,"","",""
12
+ ipad,4,http://en.wikipedia.org/wiki/IPad,"iPad - Wikipedia, the free encyclopedia",""
13
+ ipad,5,/search?q=ipad&num=2&hl=en&ie=UTF-8&prmd=ivnsr&source=univ&tbm=nws&tbo=u&sa=X&ei=KMMxT4zJCsyisQKgq52UBw&ved=0CEkQqAI,News for ipad,""
14
+ ipad,6,http://www.cnet.com/apple-ipad/,"Apple iPad tablet: reviews, news, photos, and videos - CNET.com",""
15
+ ipad,7,http://gizmodo.com/5458382/8-things-that-suck-about-the-ipad,8 Things That Suck About the iPad,""
16
+ muffuletta manhattanization,1,http://stackoverflow.com/questions/7332107/ruby-doesnt-treat-hebrew-letters-well,xml - Ruby doesn't treat hebrew letters well - Stack Overflow,""
17
+ muffuletta manhattanization,2,http://rubyonrails.resourcezen.com/ruby-doesn-t-treat-hebrew-letters-well,Ruby doesn't treat hebrew letters well | Ruby on Rails,""
18
+ muffuletta manhattanization,3,http://stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Stack Overflow,""
19
+ muffuletta manhattanization,4,https://facebook.stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Facebook Stack Overflow,""
20
+ cheap motels,1,http://www.motels.com/,Discount Hotels Motels - Cheap Rooms Online - your key to happy ...,""
21
+ cheap motels,2,http://www.motelplanet.com/,"Motels Cheap - Discount Motel Rates, Reservation & Guides",""
22
+ cheap motels,3,http://www.travelocity.com/Hotels,"Hotels, Motels and Inns - Find Cheap Hotels | Travelocity",""
23
+ cheap motels,4,http://www.motel6.com/,Motel 6 - Find Discount Motels Nationwide & Book Motel Reservations,""
24
+ שפות תכנות,1,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפת תכנות – ויקיפדיה‎,""
25
+ שפות תכנות,2,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%95%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות – ויקיפדיה‎,""
26
+ שפות תכנות,3,http://www.underwar.co.il/tag/%D7%A9%D7%A4%D7%95%D7%AA-%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות‎,""
27
+ שפות תכנות,4,http://www.tapuz.co.il/Forums2008/ForumPage.aspx?ForumId=89,פורום שפות תכנות - תפוז פורומים‎,""
28
+ seo software,1,http://www.traffictravis.com/,Free SEO Software | The Best PPC & SEO Management Tool -Traffic ...,""
29
+ seo software,2,http://www.ibusinesspromoter.com/seo-tools/top-10-seo-software,SEO software - Top 10 ranking guarantee - Search engine ...,""
30
+ seo software,3,http://www.seoscheduler.com/,SEO Software - Do Your Own Search Engine Optimization | SEO ...,""
31
+ seo software,4,http://www.link-assistant.com/,SEO Software and SEO Tools | Top 10 Rank Guarantee | SEO ...,""
32
+ ipad,1,http://www.apple.com/ipad/,Apple - iPad 2 - Now with iOS 5 and iCloud.,""
33
+ ipad,2,http://store.apple.com/us/browse/home/shop_ipad/family/ipad,Buy iPad 2 Now,""
34
+ ipad,3,"","",""
35
+ ipad,4,http://en.wikipedia.org/wiki/IPad,"iPad - Wikipedia, the free encyclopedia",""
36
+ ipad,5,/search?q=ipad&num=2&hl=en&ie=UTF-8&prmd=ivnsr&source=univ&tbm=nws&tbo=u&sa=X&ei=UcMxT5_OPKWlsQL8iKiZBw&ved=0CEkQqAI,News for ipad,""
37
+ ipad,6,http://www.cnet.com/apple-ipad/,"Apple iPad tablet: reviews, news, photos, and videos - CNET.com",""
38
+ ipad,7,http://gizmodo.com/5458382/8-things-that-suck-about-the-ipad,8 Things That Suck About the iPad,""
39
+ muffuletta manhattanization,1,http://stackoverflow.com/questions/7332107/ruby-doesnt-treat-hebrew-letters-well,xml - Ruby doesn't treat hebrew letters well - Stack Overflow,""
40
+ muffuletta manhattanization,2,http://rubyonrails.resourcezen.com/ruby-doesn-t-treat-hebrew-letters-well,Ruby doesn't treat hebrew letters well | Ruby on Rails,""
41
+ muffuletta manhattanization,3,http://stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Stack Overflow,""
42
+ muffuletta manhattanization,4,https://facebook.stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Facebook Stack Overflow,""
43
+ cheap motels,1,http://www.motels.com/,Discount Hotels Motels - Cheap Rooms Online - your key to happy ...,""
44
+ cheap motels,2,http://www.motelplanet.com/,"Motels Cheap - Discount Motel Rates, Reservation & Guides",""
45
+ cheap motels,3,http://www.travelocity.com/Hotels,"Hotels, Motels and Inns - Find Cheap Hotels | Travelocity",""
46
+ cheap motels,4,http://www.motel6.com/,Motel 6 - Find Discount Motels Nationwide & Book Motel Reservations,""
47
+ שפות תכנות,1,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפת תכנות – ויקיפדיה‎,""
48
+ שפות תכנות,2,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%95%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות – ויקיפדיה‎,""
49
+ שפות תכנות,3,http://www.underwar.co.il/tag/%D7%A9%D7%A4%D7%95%D7%AA-%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות‎,""
50
+ שפות תכנות,4,http://www.tapuz.co.il/Forums2008/ForumPage.aspx?ForumId=89,פורום שפות תכנות - תפוז פורומים‎,""
51
+ seo software,1,http://www.traffictravis.com/,Free SEO Software | The Best PPC & SEO Management Tool -Traffic ...,""
52
+ seo software,2,http://www.ibusinesspromoter.com/seo-tools/top-10-seo-software,SEO software - Top 10 ranking guarantee - Search engine ...,""
53
+ seo software,3,http://www.seoscheduler.com/,SEO Software - Do Your Own Search Engine Optimization | SEO ...,""
54
+ seo software,4,http://www.link-assistant.com/,SEO Software and SEO Tools | Top 10 Rank Guarantee | SEO ...,""
55
+ ipad,1,http://www.apple.com/ipad/,Apple - iPad 2 - Now with iOS 5 and iCloud.,""
56
+ ipad,2,http://store.apple.com/us/browse/home/shop_ipad/family/ipad,Buy iPad 2 Now,""
57
+ ipad,3,"","",""
58
+ ipad,4,http://en.wikipedia.org/wiki/IPad,"iPad - Wikipedia, the free encyclopedia",""
59
+ ipad,5,/search?q=ipad&num=2&hl=en&ie=UTF-8&prmd=ivnsr&source=univ&tbm=nws&tbo=u&sa=X&ei=esMxT7CRM6aksQLn49HeBg&ved=0CEkQqAI,News for ipad,""
60
+ ipad,6,http://www.cnet.com/apple-ipad/,"Apple iPad tablet: reviews, news, photos, and videos - CNET.com",""
61
+ ipad,7,http://gizmodo.com/5458382/8-things-that-suck-about-the-ipad,8 Things That Suck About the iPad,""
62
+ muffuletta manhattanization,1,http://stackoverflow.com/questions/7332107/ruby-doesnt-treat-hebrew-letters-well,xml - Ruby doesn't treat hebrew letters well - Stack Overflow,""
63
+ muffuletta manhattanization,2,http://rubyonrails.resourcezen.com/ruby-doesn-t-treat-hebrew-letters-well,Ruby doesn't treat hebrew letters well | Ruby on Rails,""
64
+ muffuletta manhattanization,3,http://stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Stack Overflow,""
65
+ muffuletta manhattanization,4,https://facebook.stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Facebook Stack Overflow,""
66
+ cheap motels,1,http://www.motels.com/,Discount Hotels Motels - Cheap Rooms Online - your key to happy ...,""
67
+ cheap motels,2,http://www.motelplanet.com/,"Motels Cheap - Discount Motel Rates, Reservation & Guides",""
68
+ cheap motels,3,http://www.travelocity.com/Hotels,"Hotels, Motels and Inns - Find Cheap Hotels | Travelocity",""
69
+ cheap motels,4,http://www.motel6.com/,Motel 6 - Find Discount Motels Nationwide & Book Motel Reservations,""
70
+ שפות תכנות,1,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפת תכנות – ויקיפדיה‎,""
71
+ שפות תכנות,2,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%95%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות – ויקיפדיה‎,""
72
+ שפות תכנות,3,http://www.underwar.co.il/tag/%D7%A9%D7%A4%D7%95%D7%AA-%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות‎,""
73
+ שפות תכנות,4,http://www.tapuz.co.il/Forums2008/ForumPage.aspx?ForumId=89,פורום שפות תכנות - תפוז פורומים‎,""
74
+ seo software,1,http://www.traffictravis.com/,Free SEO Software | The Best PPC & SEO Management Tool -Traffic ...,""
75
+ seo software,2,http://www.ibusinesspromoter.com/seo-tools/top-10-seo-software,SEO software - Top 10 ranking guarantee - Search engine ...,""
76
+ seo software,3,http://www.seoscheduler.com/,SEO Software - Do Your Own Search Engine Optimization | SEO ...,""
77
+ seo software,4,http://www.link-assistant.com/,SEO Software and SEO Tools | Top 10 Rank Guarantee | SEO ...,""
78
+ ipad,1,http://www.apple.com/ipad/,Apple - iPad 2 - Now with iOS 5 and iCloud.,""
79
+ ipad,2,http://store.apple.com/us/browse/home/shop_ipad/family/ipad,Buy iPad 2 Now,""
80
+ ipad,3,"","",""
81
+ ipad,4,http://en.wikipedia.org/wiki/IPad,"iPad - Wikipedia, the free encyclopedia",""
82
+ ipad,5,/search?q=ipad&num=2&hl=en&ie=UTF-8&prmd=ivnsr&source=univ&tbm=nws&tbo=u&sa=X&ei=4sMxT4vGGOXjsQLUtriXBw&ved=0CEkQqAI,News for ipad,""
83
+ ipad,6,http://www.cnet.com/apple-ipad/,"Apple iPad tablet: reviews, news, photos, and videos - CNET.com",""
84
+ ipad,7,http://gizmodo.com/5458382/8-things-that-suck-about-the-ipad,8 Things That Suck About the iPad,""
85
+ muffuletta manhattanization,1,http://stackoverflow.com/questions/7332107/ruby-doesnt-treat-hebrew-letters-well,xml - Ruby doesn't treat hebrew letters well - Stack Overflow,""
86
+ muffuletta manhattanization,2,http://rubyonrails.resourcezen.com/ruby-doesn-t-treat-hebrew-letters-well,Ruby doesn't treat hebrew letters well | Ruby on Rails,""
87
+ muffuletta manhattanization,3,http://stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Stack Overflow,""
88
+ muffuletta manhattanization,4,https://facebook.stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Facebook Stack Overflow,""
89
+ cheap motels,1,http://www.motels.com/,Discount Hotels Motels - Cheap Rooms Online - your key to happy ...,""
90
+ cheap motels,2,http://www.motelplanet.com/,"Motels Cheap - Discount Motel Rates, Reservation & Guides",""
91
+ cheap motels,3,http://www.travelocity.com/Hotels,"Hotels, Motels and Inns - Find Cheap Hotels | Travelocity",""
92
+ cheap motels,4,http://www.motel6.com/,Motel 6 - Find Discount Motels Nationwide & Book Motel Reservations,""
93
+ שפות תכנות,1,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפת תכנות – ויקיפדיה‎,""
94
+ שפות תכנות,2,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%95%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות – ויקיפדיה‎,""
95
+ שפות תכנות,3,http://www.underwar.co.il/tag/%D7%A9%D7%A4%D7%95%D7%AA-%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות‎,""
96
+ שפות תכנות,4,http://www.tapuz.co.il/Forums2008/ForumPage.aspx?ForumId=89,פורום שפות תכנות - תפוז פורומים‎,""
97
+ seo software,1,http://www.traffictravis.com/,Free SEO Software | The Best PPC & SEO Management Tool -Traffic ...,""
98
+ seo software,2,http://www.ibusinesspromoter.com/seo-tools/top-10-seo-software,SEO software - Top 10 ranking guarantee - Search engine ...,""
99
+ seo software,3,http://www.seoscheduler.com/,SEO Software - Do Your Own Search Engine Optimization | SEO ...,""
100
+ seo software,4,http://www.link-assistant.com/,SEO Software and SEO Tools | Top 10 Rank Guarantee | SEO ...,""
101
+ ipad,1,http://www.apple.com/ipad/,Apple - iPad 2 - Now with iOS 5 and iCloud.,""
102
+ ipad,2,http://store.apple.com/us/browse/home/shop_ipad/family/ipad,Buy iPad 2 Now,""
103
+ ipad,3,"","",""
104
+ ipad,4,http://en.wikipedia.org/wiki/IPad,"iPad - Wikipedia, the free encyclopedia",""
105
+ ipad,5,/search?q=ipad&num=2&hl=en&ie=UTF-8&prmd=ivnsr&source=univ&tbm=nws&tbo=u&sa=X&ei=8ckxT-62LuOesQLo7_mhBw&ved=0CEkQqAI,News for ipad,""
106
+ ipad,6,http://www.cnet.com/apple-ipad/,"Apple iPad tablet: reviews, news, photos, and videos - CNET.com",""
107
+ ipad,7,http://gizmodo.com/5458382/8-things-that-suck-about-the-ipad,8 Things That Suck About the iPad,""
108
+ muffuletta manhattanization,1,http://stackoverflow.com/questions/7332107/ruby-doesnt-treat-hebrew-letters-well,xml - Ruby doesn't treat hebrew letters well - Stack Overflow,""
109
+ muffuletta manhattanization,2,http://rubyonrails.resourcezen.com/ruby-doesn-t-treat-hebrew-letters-well,Ruby doesn't treat hebrew letters well | Ruby on Rails,""
110
+ muffuletta manhattanization,3,http://stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Stack Overflow,""
111
+ muffuletta manhattanization,4,https://facebook.stackoverflow.com/tags/hebrew/hot?filter=year,Hottest 'hebrew' Answers - Facebook Stack Overflow,""
112
+ cheap motels,1,http://www.motels.com/,Discount Hotels Motels - Cheap Rooms Online - your key to happy ...,""
113
+ cheap motels,2,http://www.motelplanet.com/,"Motels Cheap - Discount Motel Rates, Reservation & Guides",""
114
+ cheap motels,3,http://www.travelocity.com/Hotels,"Hotels, Motels and Inns - Find Cheap Hotels | Travelocity",""
115
+ cheap motels,4,http://www.motel6.com/,Motel 6 - Find Discount Motels Nationwide & Book Motel Reservations,""
116
+ שפות תכנות,1,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפת תכנות – ויקיפדיה‎,""
117
+ שפות תכנות,2,http://he.wikipedia.org/wiki/%D7%A9%D7%A4%D7%95%D7%AA_%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות – ויקיפדיה‎,""
118
+ שפות תכנות,3,http://www.underwar.co.il/tag/%D7%A9%D7%A4%D7%95%D7%AA-%D7%AA%D7%9B%D7%A0%D7%95%D7%AA,שפות תכנות‎,""
119
+ שפות תכנות,4,http://www.tapuz.co.il/Forums2008/ForumPage.aspx?ForumId=89,פורום שפות תכנות - תפוז פורומים‎,""