web-scrapper-gems 1.0.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/lib/web-scrapper-gems.rb +52 -0
- metadata +44 -0
checksums.yaml
ADDED
@@ -0,0 +1,7 @@
|
|
1
|
+
---
|
2
|
+
SHA256:
|
3
|
+
metadata.gz: a3d9fdb997818912f6fa9c059fa3697659eec8d5df82e6d0c11491707c622a6d
|
4
|
+
data.tar.gz: f5a1d48a4f60f03374a91afb078e5a69e610184c5801b32cb184b718e6207fdd
|
5
|
+
SHA512:
|
6
|
+
metadata.gz: 9b9fb89e949bfc72e5efecc898caf5726232f105675401acdb28e0a0a9f9bee9d305c255b8d78400ce33c7f352c1d263e8e8237e68f2ccc74e04f16241a3ecbe
|
7
|
+
data.tar.gz: a8b5ad10e645ca91e9369f910587003c79e117d2de8694011ed2bd57d78a1c73104c9a33c262d95ad5921446cafc5e2625cdfce76c82dc98b26d2d2095cba1eb
|
@@ -0,0 +1,52 @@
|
|
1
|
+
# Pitchapa Sae-lim
|
2
|
+
# 6210546421
|
3
|
+
require "nokogiri"
|
4
|
+
require "open-uri"
|
5
|
+
require "uri"
|
6
|
+
|
7
|
+
class WebScrapper
|
8
|
+
def self.scrapper
|
9
|
+
alphabets_list = ('A'..'Z').to_a.unshift('NUMBER')
|
10
|
+
alphabets_list.each do |alphabet|
|
11
|
+
open_set_website = URI.open("https://www.set.or.th/set/commonslookup.do?language=th&country=TH&prefix=#{alphabet}")
|
12
|
+
get_link = Nokogiri::HTML(open_set_website)
|
13
|
+
|
14
|
+
get_href = get_link.css("td a")
|
15
|
+
get_href.each do |each_href|
|
16
|
+
h = each_href.attributes["href"].value.gsub("companyprofile", "companyhighlight")
|
17
|
+
get_h = "https://www.set.or.th#{h}"
|
18
|
+
open_each_href = URI.open(get_h)
|
19
|
+
html = Nokogiri::HTML(open_each_href)
|
20
|
+
name_company = html.css("h3").text
|
21
|
+
begin
|
22
|
+
td_list = [5, 4, 3, 2]
|
23
|
+
list_assets_value = Array.new
|
24
|
+
td_list.each do |i|
|
25
|
+
assets_value = html.css("td[#{i}]").first.text
|
26
|
+
list_assets_value.push(assets_value)
|
27
|
+
end
|
28
|
+
list_assets_value_2 = Array.new
|
29
|
+
list_assets_value.each do |x|
|
30
|
+
list_assets_value_2.push(x.gsub("\u00A0", ''))
|
31
|
+
end
|
32
|
+
empty_str = list_assets_value_2[0].gsub("\u00A0", '')
|
33
|
+
if list_assets_value_2[0] != ''
|
34
|
+
assets_value = list_assets_value_2[0]
|
35
|
+
elsif list_assets_value_2[0] == nil
|
36
|
+
assets_value = list_assets_value_2[1]
|
37
|
+
else
|
38
|
+
if empty_str == ''
|
39
|
+
assets_value = "don't have assets value."
|
40
|
+
end
|
41
|
+
end
|
42
|
+
if list_assets_value_2.all?('')
|
43
|
+
assets_value = "don't have assets value."
|
44
|
+
end
|
45
|
+
rescue => exception
|
46
|
+
assets_value = "don't have assets value."
|
47
|
+
end
|
48
|
+
puts "#{name_company} : #{assets_value}"
|
49
|
+
end
|
50
|
+
end
|
51
|
+
end
|
52
|
+
end
|
metadata
ADDED
@@ -0,0 +1,44 @@
|
|
1
|
+
--- !ruby/object:Gem::Specification
|
2
|
+
name: web-scrapper-gems
|
3
|
+
version: !ruby/object:Gem::Version
|
4
|
+
version: 1.0.0
|
5
|
+
platform: ruby
|
6
|
+
authors:
|
7
|
+
- Pitchapa SAE-LIM 6210546421
|
8
|
+
autorequire:
|
9
|
+
bindir: bin
|
10
|
+
cert_chain: []
|
11
|
+
date: 2021-01-31 00:00:00.000000000 Z
|
12
|
+
dependencies: []
|
13
|
+
description: a simple ruby script to read and extract current assets of stock Delta
|
14
|
+
in set.or.th
|
15
|
+
email: pitchapa.sae@ku.th
|
16
|
+
executables: []
|
17
|
+
extensions: []
|
18
|
+
extra_rdoc_files: []
|
19
|
+
files:
|
20
|
+
- lib/web-scrapper-gems.rb
|
21
|
+
homepage: https://rubygems.org/gems/web-scrapper-gems
|
22
|
+
licenses:
|
23
|
+
- MIT
|
24
|
+
metadata: {}
|
25
|
+
post_install_message:
|
26
|
+
rdoc_options: []
|
27
|
+
require_paths:
|
28
|
+
- lib
|
29
|
+
required_ruby_version: !ruby/object:Gem::Requirement
|
30
|
+
requirements:
|
31
|
+
- - ">="
|
32
|
+
- !ruby/object:Gem::Version
|
33
|
+
version: '0'
|
34
|
+
required_rubygems_version: !ruby/object:Gem::Requirement
|
35
|
+
requirements:
|
36
|
+
- - ">="
|
37
|
+
- !ruby/object:Gem::Version
|
38
|
+
version: '0'
|
39
|
+
requirements: []
|
40
|
+
rubygems_version: 3.1.4
|
41
|
+
signing_key:
|
42
|
+
specification_version: 4
|
43
|
+
summary: Print all stock data and assets value.
|
44
|
+
test_files: []
|