harunica 0.0.2 → 0.0.3
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/lib/harunica/scraping/list_page.rb +2 -1
- data/lib/harunica/scraping/video_page.rb +25 -2
- data/lib/harunica/version.rb +1 -1
- metadata +1 -1
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 3fb99a2e1aae906ff21da91d172ad06caf8be866
|
4
|
+
data.tar.gz: 4843a6ce8ed8fe305fbedff69f895fa109440601
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 56f209aa18c8c22683c9223469e913fe5db031f8bfa2371ba9833e52905050e2e440da2471a0b287797685354cadc91ce6e722e54a28051c00271bfa28b1625b
|
7
|
+
data.tar.gz: 8906adaa556c268ead5e1a43de586adaeb67b260fdb300bf64164574a1c2f8d1a1eafb2fff06b06c1cca00ea94bd8fb082ee5c0ebe9fe7b37c23442b248902c4
|
@@ -31,7 +31,8 @@ module Harunica
|
|
31
31
|
def video_pages
|
32
32
|
@video_pages ||= html.doc.css(VIDEO_SELECTORS.join(' ')).map do |e|
|
33
33
|
url = html.url.base + e.css('.itemContent .itemTitle a')[0].attr('href')
|
34
|
-
|
34
|
+
thumb_url = e.css('.videoList01Wrap .uadWrap .itemThumbBox .thumb')[0].attr('src')
|
35
|
+
VideoPage.new(Html.new(url), thumb_url)
|
35
36
|
end
|
36
37
|
end
|
37
38
|
|
@@ -9,15 +9,38 @@ module Harunica
|
|
9
9
|
'strong[itemprop="name"]'
|
10
10
|
]
|
11
11
|
|
12
|
-
|
12
|
+
TITLE_SELECTORS = [
|
13
|
+
'head',
|
14
|
+
'meta[property="og:title"]'
|
15
|
+
]
|
16
|
+
|
17
|
+
DESC_SELECTORS = [
|
18
|
+
'#des_short',
|
19
|
+
'p:last-child'
|
20
|
+
]
|
13
21
|
|
14
|
-
|
22
|
+
attr_reader :html, :thumbnail_url
|
23
|
+
|
24
|
+
def initialize(html, thumbnail_url)
|
15
25
|
@html = html
|
26
|
+
@thumbnail_url = thumbnail_url
|
16
27
|
end
|
17
28
|
|
18
29
|
def author
|
19
30
|
@author ||= html.doc.css(AUTHOR_SELECTORS.join(' '))[0].content
|
20
31
|
end
|
32
|
+
|
33
|
+
def title
|
34
|
+
@title ||= html.doc.css(TITLE_SELECTORS.join(' '))[0].attr('content')
|
35
|
+
end
|
36
|
+
|
37
|
+
def description
|
38
|
+
@description ||= html.doc.css(DESC_SELECTORS.join(' '))[0].content
|
39
|
+
end
|
40
|
+
|
41
|
+
def url
|
42
|
+
html.url
|
43
|
+
end
|
21
44
|
end
|
22
45
|
end
|
23
46
|
end
|
data/lib/harunica/version.rb
CHANGED