googscrape 0.0.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (3) hide show
  1. checksums.yaml +7 -0
  2. data/lib/google_image_scrape.rb +39 -0
  3. metadata +85 -0
checksums.yaml ADDED
@@ -0,0 +1,7 @@
1
+ ---
2
+ SHA256:
3
+ metadata.gz: c2a3e5e68a8d4368ec2a4f507bef8a20119f2298118a1562ac4f610f3b02c3ab
4
+ data.tar.gz: 829e29903853c24f6d2e6277d576bdf85df9557a5291470a4b69bb6462aeff46
5
+ SHA512:
6
+ metadata.gz: 4537cf48b5c8710b32f238a50e20a8c6886ef79fe15f8d611fa9230929a9ee15b05ca6ae485692813eba6755ef4a623d43226af48909ba97dacc5c920360c2a0
7
+ data.tar.gz: 86a5c66ac1c7e7aa7c8f6e692a4ec542569e0dde25ecf125bea9af485c8ff72f996db459b1120f63e32cf014aedae58ce771b36ca98d5f0c3ad5ea6046994ccd
@@ -0,0 +1,39 @@
1
+ require 'nokogiri'
2
+ require 'json'
3
+
4
# Extracts artwork entries from a saved HTML page and dumps them to a JSON file.
#
# Relies on `nokogiri` and `json` being required by the enclosing file.
class GoogleImageScrape
  class << self
    # Parses the HTML in +source_file+, collects one entry per element whose
    # class attribute starts with "klitem", and writes the result as pretty
    # printed JSON to ./results.json (relative to the current working directory).
    #
    # Each entry has the keys :name, :extensions, :link and :image. Any piece of
    # markup that is absent yields nil for that key instead of aborting the run;
    # :link is always a string because the href is appended to the Google origin.
    #
    # @param source_file [String] path to the HTML file to read
    # @return [nil] the return value of the final `puts`
    # @raise [SystemCallError] if +source_file+ cannot be read or the output
    #   file cannot be written
    def scrape_images(source_file)
      doc = Nokogiri::HTML(File.read(source_file))

      artworks = doc.css('[class^="klitem"]').map { |artwork| build_entry(artwork) }

      output_file_path = './results.json'
      File.write(output_file_path, JSON.pretty_generate({ artworks: artworks }))

      puts "Results saved to file: #{output_file_path}."
    end

    private

    # Builds the hash describing a single "klitem" element.
    def build_entry(artwork)
      extensions_element = artwork.at_css('[class^="ellip"]')
      # at_css returns nil when nothing matches; an item without a thumbnail
      # must not raise NoMethodError and discard every other result.
      image_element = artwork.at_css('[class^="rISBZc"]')

      {
        name: artwork['aria-label']&.strip,
        extensions: extensions_element&.text&.strip&.split(','),
        # A missing href interpolates as "", leaving just the origin.
        link: "https://www.google.com#{artwork['href']}",
        image: image_element&.[]('src')
      }
    end
  end
end
metadata ADDED
@@ -0,0 +1,85 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: googscrape
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.0.2
5
+ platform: ruby
6
+ authors:
7
+ - MK
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2024-08-02 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: nokogiri
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - ">="
18
+ - !ruby/object:Gem::Version
19
+ version: '0'
20
+ type: :runtime
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - ">="
25
+ - !ruby/object:Gem::Version
26
+ version: '0'
27
+ - !ruby/object:Gem::Dependency
28
+ name: rake
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - ">="
32
+ - !ruby/object:Gem::Version
33
+ version: '0'
34
+ type: :development
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - ">="
39
+ - !ruby/object:Gem::Version
40
+ version: '0'
41
+ - !ruby/object:Gem::Dependency
42
+ name: rspec
43
+ requirement: !ruby/object:Gem::Requirement
44
+ requirements:
45
+ - - ">="
46
+ - !ruby/object:Gem::Version
47
+ version: '0'
48
+ type: :development
49
+ prerelease: false
50
+ version_requirements: !ruby/object:Gem::Requirement
51
+ requirements:
52
+ - - ">="
53
+ - !ruby/object:Gem::Version
54
+ version: '0'
55
+ description: google image marquee scraper.
56
+ email: ''
57
+ executables: []
58
+ extensions: []
59
+ extra_rdoc_files: []
60
+ files:
61
+ - lib/google_image_scrape.rb
62
+ homepage: https://rubygems.org/gems/google_image_scrape
63
+ licenses:
64
+ - GPL-2.0
65
+ metadata: {}
66
+ post_install_message:
67
+ rdoc_options: []
68
+ require_paths:
69
+ - lib
70
+ required_ruby_version: !ruby/object:Gem::Requirement
71
+ requirements:
72
+ - - ">="
73
+ - !ruby/object:Gem::Version
74
+ version: '0'
75
+ required_rubygems_version: !ruby/object:Gem::Requirement
76
+ requirements:
77
+ - - ">="
78
+ - !ruby/object:Gem::Version
79
+ version: '0'
80
+ requirements: []
81
+ rubygems_version: 3.3.15
82
+ signing_key:
83
+ specification_version: 4
84
+ summary: scrape google image marquees.
85
+ test_files: []