baidu 0.2.1 → 0.2.2

This diff shows the changes between two publicly available versions of a package that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.
Files changed (2)
  1. data/lib/baidu.rb +11 -8
  2. metadata +1 -1
@@ -8,22 +8,25 @@ class Baidu
8
8
  @baseuri = "http://www.baidu.com/s?rn=#{@perpage}&wd="
9
9
  end
10
10
  def query(query)
11
- @uri = @baseuri+URI.encode(Iconv.conv('GBK','UTF-8',query))
11
+ @uri = @baseuri+URI.encode(query.encode('GBK'))
12
12
  @page = @a.get @uri
13
13
  self.clean
14
- @number = number
14
+ @number = self.number
15
15
  @maxpage = (@number / @perpage.to_f).round
16
16
  @maxpage =10 if @maxpage>10
17
17
  @currpage =0
18
18
  end
19
- def how_many_pages(url)
20
- self.query("site:#{url}")
19
+ def how_many_pages(uri)
20
+ self.query("site:#{uri}")
21
+ return self.number
21
22
  end
22
- def how_many_links
23
- self.query("domain:\"#{link}\"")
23
+ def how_many_links(uri)
24
+ self.query("domain:\"#{uri}\"")
25
+ return self.number
24
26
  end
25
27
  def how_many_pages_with(url,string)
26
28
  self.query("site:#{url} inurl:#{string}")
29
+ return self.number
27
30
  end
28
31
  def rank(host)
29
32
  @page.search("//table[@class=\"result\"]").each do |table|
@@ -47,7 +50,7 @@ class Baidu
47
50
  return true
48
51
  end
49
52
  def clean
50
- @page.body = Iconv.conv('UTF-16','GBK//IGNORE',@page.body)
51
- @page.body.gsub! ("[\U0080-\U2C77]+",'') //mechanize will be confuzed without removing the few characters
53
+ @page.body.encode!('UTF-8','GBK')
54
+ @page.body.gsub! ("[\U0080-\U2C77]+") #mechanize will be confuzed without removing the few characters
52
55
  end
53
56
  end
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: baidu
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.2.1
4
+ version: 0.2.2
5
5
  prerelease:
6
6
  platform: ruby
7
7
  authors: