getter_cyndi5 0.0.1 → 0.0.6
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/bin/getter_cyndi5 +7 -1
- data/lib/getter_cyndi5.rb +11 -4
- data/lib/getter_cyndi5/parser.rb +7 -2
- data/lib/getter_cyndi5/product.rb +10 -0
- data/lib/getter_cyndi5/retriever.rb +1 -0
- metadata +60 -3
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 1cd951e59fcde272f1b72e45d7a7f935a966e193bdf9b91bd219864cdf00db22
|
4
|
+
data.tar.gz: 60023272d347c7d374ec501559d547c5d5fcdfd0998bc3936b23935633a5b86a
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 24f20cbe4de2956352b27c1603d726c6797b2022db27b9afd0a531058645d5cd481dd283bb57e823d0faa223d67f02bb58e7e54af2b333752dbaafb18bb0d298
|
7
|
+
data.tar.gz: d175ff2ce3b5bb583dd574455c73dd63d098780c6f5d304ee9d84744be9901ea4b7025a49450973aa3c979671c3f7864ac958c3c062747b1540b5e1a59df2a2c
|
data/bin/getter_cyndi5
CHANGED
@@ -1,4 +1,10 @@
|
|
1
1
|
#!/usr/bin/env ruby
|
2
2
|
|
3
3
|
require 'getter_cyndi5'
|
4
|
-
|
4
|
+
base_url = ARGV[0] || 'https://thehappyco.com'
|
5
|
+
products_page_path = ARGV[1] || '/kelly/products'
|
6
|
+
item_row_selector = ARGV[2] || '.item-row'
|
7
|
+
item_anchor_selector = ARGV[3] || 'div > div.product-desc.text-center > div.product-title > h3 > a'
|
8
|
+
mode = (ARGV[4] || '2').to_i
|
9
|
+
filename = ARGV[5] || './tmp/document1.html'
|
10
|
+
GetterCyndi5.go(base_url, products_page_path, item_row_selector, item_anchor_selector, mode, filename)
|
data/lib/getter_cyndi5.rb
CHANGED
@@ -3,20 +3,27 @@ class GetterCyndi5
|
|
3
3
|
# Getter
|
4
4
|
#
|
5
5
|
# Example:
|
6
|
-
# >> GetterCyndi5.go(base_url = 'https://thehappyco.com', products_page_path = '/kelly/products', item_row_selector = '.item-row', item_anchor_selector = 'div > div.product-desc.text-center > div.product-title > h3 > a', mode =
|
6
|
+
# >> GetterCyndi5.go(base_url = 'https://thehappyco.com', products_page_path = '/kelly/products', item_row_selector = '.item-row', item_anchor_selector = 'div > div.product-desc.text-center > div.product-title > h3 > a', mode = 2, './tmp/document1.html')
|
7
7
|
# Arguments:
|
8
8
|
# base_url: (String)
|
9
9
|
# products_page_path: (String)
|
10
10
|
# item_row_selector: (String)
|
11
11
|
# item_anchor_selector: (String)
|
12
|
-
# mode: (Integer)
|
12
|
+
# mode: (Integer) 0 = retrieve and parse without saving HTML document to file, 1 = retrieve and parse saving HTML document to file, 2 = load and parse HTML document from file
|
13
13
|
# filename: (String)
|
14
14
|
|
15
|
-
def self.go(base_url
|
15
|
+
def self.go(base_url, products_page_path, item_row_selector, item_anchor_selector, mode, filename)
|
16
|
+
all_products = products(base_url, products_page_path, item_row_selector, item_anchor_selector, mode, filename)
|
17
|
+
all_products.each do |product|
|
18
|
+
puts "#{product.name} :-: #{product.url}"
|
19
|
+
end
|
20
|
+
end
|
21
|
+
|
22
|
+
def self.products(base_url, products_page_path, item_row_selector, item_anchor_selector, mode, filename)
|
16
23
|
retriever = Retriever.new(base_url, products_page_path, item_row_selector, mode, filename)
|
17
24
|
retriever.retrieve
|
18
25
|
parser = Parser.new(retriever.document, base_url, item_row_selector, item_anchor_selector)
|
19
|
-
parser.parse
|
26
|
+
products = parser.parse
|
20
27
|
end
|
21
28
|
end
|
22
29
|
|
data/lib/getter_cyndi5/parser.rb
CHANGED
@@ -1,9 +1,12 @@
|
|
1
|
+
require 'getter_cyndi5/product'
|
1
2
|
class GetterCyndi5::Parser
|
3
|
+
attr_reader :products
|
2
4
|
def initialize(document, base_url, item_row_selector, item_anchor_selector)
|
3
5
|
@document = document
|
4
6
|
@base_url = base_url
|
5
7
|
@item_row_selector = item_row_selector
|
6
8
|
@item_anchor_selector = item_anchor_selector
|
9
|
+
@products = []
|
7
10
|
end
|
8
11
|
|
9
12
|
def parse
|
@@ -12,7 +15,9 @@ class GetterCyndi5::Parser
|
|
12
15
|
product_element = item_row.css(@item_anchor_selector)[0]
|
13
16
|
product_name = product_element.text
|
14
17
|
product_url = "#{@base_url}#{product_element.attributes['href']}"
|
15
|
-
|
18
|
+
product = GetterCyndi5::Product.new(product_name, product_url)
|
19
|
+
products.append(product)
|
16
20
|
end
|
21
|
+
products
|
17
22
|
end
|
18
|
-
end
|
23
|
+
end
|
metadata
CHANGED
@@ -1,15 +1,71 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: getter_cyndi5
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.0.
|
4
|
+
version: 0.0.6
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Cyndi Cavanaugh
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2021-03-
|
12
|
-
dependencies:
|
11
|
+
date: 2021-03-12 00:00:00.000000000 Z
|
12
|
+
dependencies:
|
13
|
+
- !ruby/object:Gem::Dependency
|
14
|
+
name: httparty
|
15
|
+
requirement: !ruby/object:Gem::Requirement
|
16
|
+
requirements:
|
17
|
+
- - '='
|
18
|
+
- !ruby/object:Gem::Version
|
19
|
+
version: 0.18.1
|
20
|
+
type: :runtime
|
21
|
+
prerelease: false
|
22
|
+
version_requirements: !ruby/object:Gem::Requirement
|
23
|
+
requirements:
|
24
|
+
- - '='
|
25
|
+
- !ruby/object:Gem::Version
|
26
|
+
version: 0.18.1
|
27
|
+
- !ruby/object:Gem::Dependency
|
28
|
+
name: nokogiri
|
29
|
+
requirement: !ruby/object:Gem::Requirement
|
30
|
+
requirements:
|
31
|
+
- - '='
|
32
|
+
- !ruby/object:Gem::Version
|
33
|
+
version: 1.11.1
|
34
|
+
type: :runtime
|
35
|
+
prerelease: false
|
36
|
+
version_requirements: !ruby/object:Gem::Requirement
|
37
|
+
requirements:
|
38
|
+
- - '='
|
39
|
+
- !ruby/object:Gem::Version
|
40
|
+
version: 1.11.1
|
41
|
+
- !ruby/object:Gem::Dependency
|
42
|
+
name: watir
|
43
|
+
requirement: !ruby/object:Gem::Requirement
|
44
|
+
requirements:
|
45
|
+
- - '='
|
46
|
+
- !ruby/object:Gem::Version
|
47
|
+
version: 6.18.0
|
48
|
+
type: :runtime
|
49
|
+
prerelease: false
|
50
|
+
version_requirements: !ruby/object:Gem::Requirement
|
51
|
+
requirements:
|
52
|
+
- - '='
|
53
|
+
- !ruby/object:Gem::Version
|
54
|
+
version: 6.18.0
|
55
|
+
- !ruby/object:Gem::Dependency
|
56
|
+
name: webdrivers
|
57
|
+
requirement: !ruby/object:Gem::Requirement
|
58
|
+
requirements:
|
59
|
+
- - '='
|
60
|
+
- !ruby/object:Gem::Version
|
61
|
+
version: 4.6.0
|
62
|
+
type: :runtime
|
63
|
+
prerelease: false
|
64
|
+
version_requirements: !ruby/object:Gem::Requirement
|
65
|
+
requirements:
|
66
|
+
- - '='
|
67
|
+
- !ruby/object:Gem::Version
|
68
|
+
version: 4.6.0
|
13
69
|
description: A simple getter cyndi5 gem
|
14
70
|
email: cynthiacavanaugh1@gmail.com
|
15
71
|
executables:
|
@@ -20,6 +76,7 @@ files:
|
|
20
76
|
- bin/getter_cyndi5
|
21
77
|
- lib/getter_cyndi5.rb
|
22
78
|
- lib/getter_cyndi5/parser.rb
|
79
|
+
- lib/getter_cyndi5/product.rb
|
23
80
|
- lib/getter_cyndi5/retriever.rb
|
24
81
|
homepage: https://cyndicavanaugh.com
|
25
82
|
licenses:
|