RubyGems - meiriyigua - Versions diffs - 0.0.1 - Mend

meiriyigua 0.0.1

Files changed (18) hide show

checksums.yaml +15 -0
data/.gitignore +20 -0
data/Gemfile +4 -0
data/LICENSE.txt +22 -0
data/README.md +29 -0
data/Rakefile +1 -0
data/lib/meiriyigua/baidu_crawl.rb +41 -0
data/lib/meiriyigua/config.rb +36 -0
data/lib/meiriyigua/crawl_client.rb +32 -0
data/lib/meiriyigua/detail_crawl.rb +160 -0
data/lib/meiriyigua/list_crawl.rb +97 -0
data/lib/meiriyigua/models.rb +47 -0
data/lib/meiriyigua/post_client.rb +105 -0
data/lib/meiriyigua/version.rb +4 -0
data/lib/meiriyigua.rb +43 -0
data/meiriyigua.gemspec +28 -0
data/set.yml.example +22 -0
metadata +144 -0

checksums.yaml ADDED Viewed

@@ -0,0 +1,15 @@
+---
+!binary "U0hBMQ==":
+  metadata.gz: !binary |-
+    N2VhZDc2ODBjYTliYzkxMTliNzQyNDYyNmZiZGI3NGM3YTJkZmM3MA==
+  data.tar.gz: !binary |-
+    YmZlZjE0YTE4N2U2ODY1ZDdkNTAwOTRiNjE5YjMyMTMwZWJlMjU1Mg==
+SHA512:
+  metadata.gz: !binary |-
+    YWE3NmNlYmIwYjExZTA3MDIxOWRmMTc4NDMxYWEwMmJmNDEzNTE3OTcxYzMy
+    ZGViMjNiNGZlZDkyYTBhZDBkZWJkNTgxNGNiYzkyNDMxN2UxZTg5ZmMzODgx
+    NDdjYWFmYmYzZjlkYTE4MGExNDQ2N2ZlMzYzNzdhMTRiNjRmZGE=
+  data.tar.gz: !binary |-
+    ZmI0MTQ2MzJmZDgyOTcyNzRlMGEwNDMwNDQ5OWMwNDRhOTZiMTA0MWM4NTg3
+    ODk4NWJmMmVlMzJjMWNkODMxMDZjZmJlZGRkNzg0ZWJkNWJmNGVjNDNmOGFk
+    MmMxMjdkNTk1NjFmYWQwYmVlZDBjYWIwNTcwNTk1OTQwNGJjN2U=

data/.gitignore ADDED Viewed

@@ -0,0 +1,20 @@
+*.gem
+*.rbc
+.bundle
+.config
+.yardoc
+Gemfile.lock
+InstalledFiles
+_yardoc
+coverage
+doc/
+lib/bundler/man
+pkg
+rdoc
+spec/reports
+test/tmp
+test/version_tmp
+tmp
+*.db
+set.yml

data/Gemfile ADDED Viewed

@@ -0,0 +1,4 @@
+# Fetch gems over TLS so downloads cannot be tampered with in transit.
+source 'https://rubygems.org'
+# Specify your gem's dependencies in meiriyigua.gemspec
+gemspec

data/LICENSE.txt ADDED Viewed

@@ -0,0 +1,22 @@
+Copyright (c) 2014 mangege
+MIT License
+Permission is hereby granted, free of charge, to any person obtaining
+a copy of this software and associated documentation files (the
+"Software"), to deal in the Software without restriction, including
+without limitation the rights to use, copy, modify, merge, publish,
+distribute, sublicense, and/or sell copies of the Software, and to
+permit persons to whom the Software is furnished to do so, subject to
+the following conditions:
+The above copyright notice and this permission notice shall be
+included in all copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
+MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
+LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
+OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
+WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.

data/README.md ADDED Viewed

@@ -0,0 +1,29 @@
+# Meiriyigua
+TODO: Write a gem description
+## Installation
+Add this line to your application's Gemfile:
+    gem 'meiriyigua'
+And then execute:
+    $ bundle
+Or install it yourself as:
+    $ gem install meiriyigua
+## Usage
+TODO: Write usage instructions here
+## Contributing
+1. Fork it
+2. Create your feature branch (`git checkout -b my-new-feature`)
+3. Commit your changes (`git commit -am 'Add some feature'`)
+4. Push to the branch (`git push origin my-new-feature`)
+5. Create new Pull Request

data/Rakefile ADDED Viewed

	@@ -0,0 +1 @@
1	+ require "bundler/gem_tasks"

data/lib/meiriyigua/baidu_crawl.rb ADDED Viewed

@@ -0,0 +1,41 @@
+# -*- encoding : utf-8 -*-
+require 'meiriyigua/crawl_client'
+require 'meiriyigua/models'
+module Meiriyigua
+  class BaiduCrawl
+    include Meiriyigua::Models
+    def initialize
+      @agent = CrawlClient.create_agent
+    end
+    def run
+      UrlRecord.all(:baidu_at => nil).each do |url_record|
+        page_record = url_record.page_record
+        baidu_intro = get_intro(page_record.title)
+        CrawlClient.random_sleep
+        if baidu_intro.empty?
+          print "抓取百度简介 #{url_record.url} "
+          puts "失败"
+        else
+          page_record.baidu_intro = baidu_intro
+          page_record.save
+          url_record.baidu_at = Time.now
+          url_record.save
+          print "抓取百度简介 #{url_record.url} "
+          puts "成功"
+        end
+      end
+    end
+    def get_intro(title)
+      page = @agent.get('http://www.baidu.com/')
+      sleep 1
+      search_form = page.form_with(:name => "f1")
+      search_form.field_with(:name => "wd").value = title
+      search_results = @agent.submit search_form
+      search_results.search('div.c-container:first-of-type div.c-abstract').text
+    end
+  end
+end

data/lib/meiriyigua/config.rb ADDED Viewed

@@ -0,0 +1,36 @@
+# -*- encoding : utf-8 -*-
+require 'uri'
+require 'yaml'
+module Meiriyigua
+  class Config
+    class << self
+      def load
+        YAML::ENGINE.yamler = 'syck'
+        @@hashs = YAML.load(File.read "#{Dir.pwd}/set.yml")
+      end
+      def site_host
+        URI(login_url).host
+      end
+      {login_url: '提交地址',
+       username: '用户名',
+       password: '密码',
+       encode: '编码',
+       day_num: '每天发布',
+       post_time: '发布延时',
+       update_time: '监控延时'}.each do |k, v|
+         define_method(k) do
+           @@hashs['基础'][v]
+         end
+       end
+       def categories
+         @@hashs['栏目']
+       end
+    end
+    self.load
+  end
+end

data/lib/meiriyigua/crawl_client.rb ADDED Viewed

@@ -0,0 +1,32 @@
+# -*- encoding : utf-8 -*-
+require 'mechanize'
+module Meiriyigua
+  class CrawlClient
+    USER_AGENTS = [
+      "Mozilla/5.0 (Macintosh; U; Intel Mac OS X 10.6; en-US; rv:1.9.2) Gecko/20100115 Firefox/3.6",
+      "Mozilla/5.0 (Macintosh; U; Intel Mac OS X 10_6_2; de-at) AppleWebKit/531.21.8 (KHTML, like Gecko) Version/4.0.4 Safari/531.21.10",
+      "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_2) AppleWebKit/534.51.22 (KHTML, like Gecko) Version/5.1.1 Safari/534.51.22",
+      "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/29.0.1547.32 Safari/537.36",
+      "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1)",
+      "Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; .NET CLR 1.1.4322; .NET CLR 2.0.50727)",
+      "Mozilla/5.0 (compatible; MSIE 8.0; Windows NT 5.1; Trident/4.0; .NET CLR 1.1.4322; .NET CLR 2.0.50727)",
+      "Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0)",
+    ]
+    def self.create_agent
+      Mechanize.new do |a|
+        a.user_agent = USER_AGENTS.shuffle.first
+        a.max_history = 1
+      end
+    end
+    def self.random_sleep
+      sleep(rand(1..3))
+    end
+    def self.set_page_encoding(page)
+      page.encoding = 'gbk' if page.encoding.downcase == 'gb2312'
+    end
+  end
+end

data/lib/meiriyigua/detail_crawl.rb ADDED Viewed

@@ -0,0 +1,160 @@
+# -*- encoding : utf-8 -*-
+require 'meiriyigua/crawl_client'
+require 'meiriyigua/models'
+module Meiriyigua
+  class DetailCrawl
+    include Meiriyigua::Models
+    def initialize(detail_urls)
+      @detail_urls = detail_urls
+      @agent = CrawlClient.create_agent
+    end
+    def run
+      while !@detail_urls.empty?
+        uri = URI(@detail_urls.pop)
+        handle_url(uri)
+      end
+    end
+    def handle_url(uri)
+      if UrlRecord.exist_url?(uri.to_s)
+        #print "抓取详情页 #{uri.to_s} "
+        #puts "重复,跳过"
+        return
+      end
+      page = @agent.get(uri)
+      CrawlClient.set_page_encoding(page)
+      name = uri.host.to_s.split('.')[1]
+      url_record = UrlRecord.new
+      url_record.url = uri.to_s
+      url_record.detail_at = Time.now
+      page_record = PageRecord.new
+      url_record.page_record = page_record
+      page_record = send("handle_#{name}", page, page_record)
+      if page_record.nil?
+        print "抓取详情页 #{uri.to_s} "
+        puts "失败"
+      else
+        print "抓取详情页 #{uri.to_s} "
+        if url_record.save
+          puts "成功"
+        else
+          puts "保存失败"
+        end
+      end
+      CrawlClient.random_sleep
+    end
+    def handle_1234wg(page, page_record)
+      page_record.title = page.search('td[width="583"] > font > strong font').text.strip
+      return if page_record.title.empty?
+      page_record.category = page.search('body > table[background="/images/hgf-4.gif"] td[style="padding-left:6px;"] a:last-of-type').text
+      page_record.content = strip_content(page.search('td#intro'))
+      filename = page.search('td[valign="top"] > script:last-of-type').text.split(',')[1][6..-2]
+      page_record.downloads = "http://dx2down.bugwg.com:801/#{URI.escape filename}"
+      page_record
+    end
+    def handle_qh24(page, page_record)
+      page_record.title = page.search('//*[@id="sintro"]/h1/text()').text.strip
+      return if page_record.title.empty?
+      page_record.category = page.search('h2.classname > a:last-of-type').text
+      page_record.content = strip_content(page.search('div.cnt'))
+      page_record.downloads = join_downloads(page.search('div#intext dd a').collect{|a| a['href']})
+      page_record
+    end
+    def handle_nanawg(page, page_record)
+      page_record.title = page.search('div.right_tit').text.strip
+      return if page_record.title.empty?
+      page_record.category = page.search('div#index3 a:last-of-type').text
+      page_record.content = page.search('div.rightsum_text4').text
+      page_record.downloads = join_downloads(page.search('ul.ul2 a').collect{|a| a['href'] =~ /^http/ ? a['href'] : "http://www.nanawg.com#{a['href']}"})
+      page_record
+    end
+    def handle_ucbug(page, page_record)
+      page_record.title = page.search('div.spmain_1 a').text.strip
+      return if page_record.title.empty?
+      page_record.category = page.search('div.slhead_1 a:last-of-type').text
+      page_record.content = page.search('div.spmain_5').text
+      page_record.downloads = join_downloads(page.search('ul.ul_Address a').collect{|a| a['href']})
+      page_record
+    end
+    def handle_gg1z(page, page_record)
+      page_record.title = page.search('div.software-info > div.cp-top > h3').text.strip
+      return if page_record.title.empty?
+      page_record.category = page.search('div.nav-breadcrumb a:nth-last-of-type(2)').text
+      content = page.search('div.cp-main > div.cp-main')
+      content.search('font[color="red"]').remove
+      page_record.content = strip_content(content)
+      downloads = page.search('ul.download-list a').collect{|a| "http://www.gg1z.com#{a['href']}"}
+      downloads = [downloads.first, downloads.last].uniq
+      final_downloads = []
+      downloads.each do |down|
+        down_page = @agent.get(down, nil, page.uri.to_s)
+        CrawlClient.set_page_encoding(down_page)
+        final_downloads.concat( down_page.search('div.downarea a').collect{|a| a['href'] =~ /^http/ ? a['href'] : "http://www.gg1z.com#{a['href']}"} )
+      end
+      page_record.downloads = join_downloads(final_downloads)
+      page_record
+    end
+    def handle_dongdongwg(page, page_record)
+      page_record.title = page.search('//div[@class="pageMainArea"]/h1/text()').text.strip
+      return if page_record.title.empty?
+      page_record.category = page.search('span.current1 a:last-of-type').text
+      content = page.search('div#mainSoftIntro')
+      content.search('p:last-of-type').remove
+      page_record.content = strip_content(content)
+      page_record.downloads = join_downloads(page.search('ul.downlistbox a').collect{|a| a['href']})
+      page_record
+    end
+    def handle_uuuwg(page, page_record)
+      page_record.title = page.search('div.spmain_1').text.strip
+      return if page_record.title.empty?
+      page_record.category = page.search('div.slhead_1 a:last-of-type').text
+      page_record.content = strip_content(page.search('div.spmain_5'))
+      page_record.downloads = join_downloads(page.search('ul.spmain_3_2 > li:last-of-type a').collect{|a| a['href']})
+      page_record
+    end
+    def handle_xixiwg(page, page_record)
+      page_record.title = page.search('div.r2 h2').text.strip
+      return if page_record.title.empty?
+      page_record.category = page.search('div.location a:last-of-type').text
+      page_record.content = strip_content(page.search('div#intro'))
+      filename = page.search('div.xzk script:last-of-type').text.split(',')[1].strip[6..-3]
+      page_record.downloads = "http://dxdown1.xixiwg.com/#{URI.escape filename}"
+      page_record
+    end
+    def handle_xiaolinzi(page, page_record)
+      page_record.title = page.search('div.dlbt_wz').text.strip
+      return if page_record.title.empty?
+      page_record.category = page.search('div.head_dh a:last-of-type').text
+      page_record.content = strip_content(page.search('div#content_all'))
+      page_record.downloads = join_downloads(page.search('div.dl_link_bd a[target="_blank"]').collect{|a| a['href']})
+      page_record
+    end
+    def strip_content(content)
+      content.text
+    end
+    def join_downloads(downloads)
+      downloads.uniq.join('#!#')
+    end
+  end
+end

data/lib/meiriyigua/list_crawl.rb ADDED Viewed

@@ -0,0 +1,97 @@
+# -*- encoding : utf-8 -*-
+require 'meiriyigua/crawl_client'
+module Meiriyigua
+  class ListCrawl
+    attr_reader :detail_urls
+    def initialize
+      @list_urls = Queue.new
+      @detail_urls = Queue.new
+      @agent = CrawlClient.create_agent
+      init_url
+    end
+    def run
+      while !@list_urls.empty?
+        uri = URI(@list_urls.pop)
+        handle_url(uri)
+      end
+    end
+    def handle_url(uri)
+      page = @agent.get(uri)
+      CrawlClient.set_page_encoding(page)
+      name = uri.host.to_s.split('.')[1]
+      urls = send("handle_#{name}", page)
+      if urls.empty?
+        print "抓取列表页 #{uri.to_s} "
+        puts "失败"
+      else
+        urls.each {|a| @detail_urls << a}
+        print "抓取列表页 #{uri.to_s} "
+        puts "成功"
+      end
+      CrawlClient.random_sleep
+    end
+    def handle_1234wg(page)
+      urls = page.search('td[width="470"] a[href^="/1234/"]')
+      urls.collect {|a| "http://www.1234wg.com#{a['href']}" }
+    end
+    def handle_qh24(page)
+      urls = page.search('div#downhot table a')
+      urls.collect{|a| "http://www.qh24.com#{a['href']}"}
+    end
+    def handle_nanawg(page)
+      urls = page.search('td[width="362"] a:last-of-type')
+      urls.collect{|a| "http://www.nanawg.com#{a['href']}"}
+    end
+    def handle_ucbug(page)
+      urls = page.search('li.slmain2_2_2 a')
+      urls.collect{|a| a['href']}
+    end
+    def handle_gg1z(page)
+      urls = page.search('span.app-name a')
+      urls.collect{|a| "http://www.gg1z.com#{a['href']}"}
+    end
+    def handle_dongdongwg(page)
+      urls = page.search('span.list_title > a')
+      urls.collect{|a| "http://www.dongdongwg.com#{a['href']}"}
+    end
+    def handle_uuuwg(page)
+      urls = page.search('table.main_table tr > td:nth-child(2) a')
+      urls.collect{|a| "http://www.uuuwg.com#{a['href']}"}
+    end
+    def handle_xixiwg(page)
+      urls = page.search('div.entry > h2 > a')
+      urls.collect{|a| "http://www.xixiwg.com#{a['href']}"}
+    end
+    def handle_xiaolinzi(page)
+      urls = page.search('td.rewid1 > a')
+      urls.collect{|a| "http://www.xiaolinzi.com#{a['href']}"}
+    end
+    private
+    def init_url
+      @list_urls << 'http://www.1234wg.com/new.html'
+      @list_urls << 'http://www.qh24.com/new.html'
+      @list_urls << 'http://www.nanawg.com/soft/html/newlist-1.html'
+      @list_urls << 'http://www.ucbug.com/new.html'
+      @list_urls << 'http://www.gg1z.com/soft/html/newlist-1.html'
+      @list_urls << 'http://www.dongdongwg.com/soft/html/newlist-1.html'
+      @list_urls << 'http://www.uuuwg.com/newlist.html'
+      @list_urls << 'http://www.xixiwg.com/new/'
+      @list_urls << 'http://www.xiaolinzi.com/update/'
+    end
+  end
+end

data/lib/meiriyigua/models.rb ADDED Viewed

@@ -0,0 +1,47 @@
+# -*- encoding : utf-8 -*-
+require 'data_mapper'
+#DataMapper::Logger.new($stdout, :debug)
+# Ask DataMapper to raise when a save fails.
+DataMapper::Model.raise_on_save_failure = true
+# The SQLite database file data.db lives in the current working directory.
+DataMapper.setup(:default, "sqlite://#{Dir.pwd}/data.db")
+module Meiriyigua
+  # Persistent models shared by the crawlers and the publisher.
+  module Models
+    # One crawled detail page URL plus the time each processing stage
+    # (detail crawl, Baidu lookup, publishing) was recorded for it.
+    class UrlRecord
+      include DataMapper::Resource
+      property :id, Serial
+      property :url, String, length: 1024
+      property :detail_at, DateTime
+      property :baidu_at, DateTime
+      property :publish_at, DateTime
+      property :created_at, DateTime
+      property :updated_at, DateTime
+      has 1, :page_record
+      # @param url [String] URL to look up
+      # @return [Boolean] true when at least one record has this URL
+      def self.exist_url?(url)
+        self.count(url: url) > 0
+      end
+    end
+    # Content extracted from a detail page, owned by its UrlRecord.
+    class PageRecord
+      include DataMapper::Resource
+      property :id, Serial
+      property :title, String, length: 1024
+      property :category, String, length: 1024
+      property :content, Text
+      # Download links; DetailCrawl joins several links with '#!#'.
+      property :downloads, Text
+      property :baidu_intro, Text
+      property :created_at, DateTime
+      property :updated_at, DateTime
+      belongs_to :url_record
+    end
+  end
+end
+# Both calls run after the model classes above have been defined.
+DataMapper.finalize
+DataMapper.auto_upgrade!

data/lib/meiriyigua/post_client.rb ADDED Viewed

@@ -0,0 +1,105 @@
+# -*- encoding : utf-8 -*-
+require 'meiriyigua/models'
+require 'meiriyigua/config'
+require 'meiriyigua/crawl_client'
+module Meiriyigua
+  class PostClient
+    include Meiriyigua::Models
+    ZHS = 0x4e00..0x9fff
+    attr_reader :category_ids
+    def initialize
+      @agent = CrawlClient.create_agent
+      @category_ids = {}
+      login
+      check_category
+    end
+    def run
+      today_count = UrlRecord.count(:publish_at.gte => Date.today)
+      if today_count >= Meiriyigua::Config.day_num
+        return
+      end
+      time_limit = Time.now - 60 * Meiriyigua::Config.post_time.to_i
+      UrlRecord.all(:detail_at.lte => time_limit, :baidu_at.not => nil, :publish_at => nil).each do |url_record|
+        today_count += 1
+        if today_count >= Meiriyigua::Config.day_num
+          return
+        end
+        page_record = url_record.page_record
+        if post_news(page_record, @category_ids[URI(url_record.url).host])
+          url_record.publish_at = Time.now
+          url_record.save
+          print "发布 #{url_record.url} "
+          puts "成功"
+        else
+          print "发布 #{url_record.url} "
+          puts "失败"
+        end
+        sleep 1
+      end
+    end
+    def login
+      page = @agent.get(Meiriyigua::Config.login_url)
+      login_form = page.form_with(name: 'login')
+      login_form.field_with(name: 'ad_name').value = Meiriyigua::Config.username
+      login_form.field_with(name: 'ad_pwd').value = Meiriyigua::Config.password
+      login_results = @agent.submit(login_form)
+      login_results.search('a[href="/admin/admin.php/Index/index"]').size > 0
+    end
+    def check_category
+      page = @agent.get "http://#{Meiriyigua::Config.site_host}/admin/admin.php/News/add"
+      options = page.search('select#news_type > option').collect{|o| [o.text.strip, o['value'].to_i]}
+      options = Hash[options]
+      Meiriyigua::Config.categories.each do |host, name|
+        unless options.keys.include?(name)
+          @category_ids[host] = options[name]
+          @agent.post("http://#{Meiriyigua::Config.site_host}/admin/admin.php/NewsType/add", news_type: name)
+        end
+      end
+      load_category_ids
+    end
+    def post_news(page_record, category_id)
+      post_params = {}
+      post_params['news_tit'] = "#{page_record.category}最新版辅助外挂免费下载 #{page_record.title}"
+      post_params['author'] = random_zh
+      post_params['click'] = rand(600..13000)
+      post_params['biaoqian'] = page_record.category
+      post_params['download_url'] = page_record.downloads.split('#!#')[0..1].join('|')
+      post_params['news_type'] = category_id
+      post_params['jianjie'] = page_record.content.to_s[0..16]
+      post_params['editorValue'] = "<pre>#{page_record.content} \r\n\r\n 提示一:\r\n#{page_record.baidu_intro}</pre>"
+      result_page = @agent.post("http://#{Meiriyigua::Config.site_host}/admin/admin.php/News/insert", post_params)
+      !result_page.search('script').text.index('/admin/admin.php/News/index').nil?
+    end
+    private
+    def random_zh
+      s = ""
+      rand(2..4).times do
+        s << rand(ZHS)
+      end
+      s
+    end
+    def load_category_ids
+      page = @agent.get "http://#{Meiriyigua::Config.site_host}/admin/admin.php/News/add"
+      options = page.search('select#news_type > option').collect{|o| [o.text.strip, o['value'].to_i]}
+      options = Hash[options]
+      Meiriyigua::Config.categories.each do |host, name|
+        @category_ids[host] = options[name]
+      end
+    end
+  end
+end

data/lib/meiriyigua/version.rb ADDED Viewed

@@ -0,0 +1,4 @@
+# -*- encoding : utf-8 -*-
+module Meiriyigua
+  # Gem version; meiriyigua.gemspec reads it as spec.version.
+  VERSION = "0.0.1"
+end

data/lib/meiriyigua.rb ADDED Viewed

@@ -0,0 +1,43 @@
+# -*- encoding : utf-8 -*-
+require "meiriyigua/version"
+require 'meiriyigua/config'
+require "meiriyigua/list_crawl"
+require "meiriyigua/detail_crawl"
+require "meiriyigua/baidu_crawl"
+require "meiriyigua/post_client"
+module Meiriyigua
+  def run
+    while true
+      begin
+        threads = []
+        threads << Thread.new do
+          list_crawl = ListCrawl.new
+          list_crawl.run
+          detail_crawl = DetailCrawl.new(list_crawl.detail_urls)
+          detail_crawl.run
+          sleep(Meiriyigua::Config.update_time.to_i * 60)
+        end
+        threads << Thread.new do
+          baidu_crawl = BaiduCrawl.new
+          baidu_crawl.run
+          sleep(Meiriyigua::Config.update_time.to_i * 60)
+        end
+        threads << Thread.new do
+          post_client = PostClient.new
+          post_client.run
+          sleep(Meiriyigua::Config.post_time.to_i * 60)
+        end
+        threads.each { |thr| thr.join }
+      rescue
+        puts "出错了 #{$!.message}"
+      end
+      sleep 60*10
+    end
+  end
+  module_function :run
+end
+Meiriyigua.run

data/meiriyigua.gemspec ADDED Viewed

@@ -0,0 +1,28 @@
+# coding: utf-8
+# Put this gem's lib directory on the load path so the version file below
+# can be required.
+lib = File.expand_path('../lib', __FILE__)
+$LOAD_PATH.unshift(lib) unless $LOAD_PATH.include?(lib)
+require 'meiriyigua/version'
+Gem::Specification.new do |spec|
+  spec.name          = "meiriyigua"
+  spec.version       = Meiriyigua::VERSION
+  spec.authors       = ["mangege"]
+  spec.email         = ["cxh116@126.com"]
+  # NOTE(review): description and summary are the literal text "nil", which
+  # looks like an unfilled placeholder; confirm and replace with real text.
+  spec.description   = %q{nil}
+  spec.summary       = %q{nil}
+  spec.homepage      = "http://github.com/mangege"
+  spec.license       = "MIT"
+  # The file list comes from the output of `git ls-files`, split on the
+  # input record separator.
+  spec.files         = `git ls-files`.split($/)
+  spec.executables   = spec.files.grep(%r{^bin/}) { |f| File.basename(f) }
+  spec.test_files    = spec.files.grep(%r{^(test|spec|features)/})
+  spec.require_paths = ["lib"]
+  # Runtime: HTTP crawling (mechanize) and SQLite persistence via DataMapper.
+  spec.add_runtime_dependency "mechanize", '~> 2.7'
+  spec.add_runtime_dependency "sqlite3", '~> 1.3'
+  spec.add_runtime_dependency "data_mapper", '~> 1.2'
+  spec.add_runtime_dependency "dm-sqlite-adapter", '~> 1.2'
+  spec.add_development_dependency "bundler", "~> 1.3"
+  spec.add_development_dependency "rake"
+end

data/set.yml.example ADDED Viewed

@@ -0,0 +1,22 @@
+保留头:
+    勿删除: 0
+基础:
+    提交地址: http://www.meiriyigua.com/admin/admin.php
+    用户名: admin
+    密码: admin888
+    编码: utf8
+    每天发布: 300
+    发布延时: 60
+    监控延时: 30
+栏目:
+    www.1234wg.com: 1234外挂网
+    www.qh24.com: 艾艾游戏网
+    www.nanawg.com: 娜娜网
+    www.ucbug.com: ucbug游戏网
+    www.gg1z.com: 挂挂一族
+    www.dongdongwg.com: 东东游戏网
+    www.uuuwg.com: 西西游戏网
+    www.xixiwg.com: 西西外挂网
+    www.xiaolinzi.com: 小林子软件站

metadata ADDED Viewed

@@ -0,0 +1,144 @@
+--- !ruby/object:Gem::Specification
+name: meiriyigua
+version: !ruby/object:Gem::Version
+  version: 0.0.1
+platform: ruby
+authors:
+- mangege
+autorequire:
+bindir: bin
+cert_chain: []
+date: 2014-04-07 00:00:00.000000000 Z
+dependencies:
+- !ruby/object:Gem::Dependency
+  name: mechanize
+  requirement: !ruby/object:Gem::Requirement
+    requirements:
+    - - ~>
+      - !ruby/object:Gem::Version
+        version: '2.7'
+  type: :runtime
+  prerelease: false
+  version_requirements: !ruby/object:Gem::Requirement
+    requirements:
+    - - ~>
+      - !ruby/object:Gem::Version
+        version: '2.7'
+- !ruby/object:Gem::Dependency
+  name: sqlite3
+  requirement: !ruby/object:Gem::Requirement
+    requirements:
+    - - ~>
+      - !ruby/object:Gem::Version
+        version: '1.3'
+  type: :runtime
+  prerelease: false
+  version_requirements: !ruby/object:Gem::Requirement
+    requirements:
+    - - ~>
+      - !ruby/object:Gem::Version
+        version: '1.3'
+- !ruby/object:Gem::Dependency
+  name: data_mapper
+  requirement: !ruby/object:Gem::Requirement
+    requirements:
+    - - ~>
+      - !ruby/object:Gem::Version
+        version: '1.2'
+  type: :runtime
+  prerelease: false
+  version_requirements: !ruby/object:Gem::Requirement
+    requirements:
+    - - ~>
+      - !ruby/object:Gem::Version
+        version: '1.2'
+- !ruby/object:Gem::Dependency
+  name: dm-sqlite-adapter
+  requirement: !ruby/object:Gem::Requirement
+    requirements:
+    - - ~>
+      - !ruby/object:Gem::Version
+        version: '1.2'
+  type: :runtime
+  prerelease: false
+  version_requirements: !ruby/object:Gem::Requirement
+    requirements:
+    - - ~>
+      - !ruby/object:Gem::Version
+        version: '1.2'
+- !ruby/object:Gem::Dependency
+  name: bundler
+  requirement: !ruby/object:Gem::Requirement
+    requirements:
+    - - ~>
+      - !ruby/object:Gem::Version
+        version: '1.3'
+  type: :development
+  prerelease: false
+  version_requirements: !ruby/object:Gem::Requirement
+    requirements:
+    - - ~>
+      - !ruby/object:Gem::Version
+        version: '1.3'
+- !ruby/object:Gem::Dependency
+  name: rake
+  requirement: !ruby/object:Gem::Requirement
+    requirements:
+    - - ! '>='
+      - !ruby/object:Gem::Version
+        version: '0'
+  type: :development
+  prerelease: false
+  version_requirements: !ruby/object:Gem::Requirement
+    requirements:
+    - - ! '>='
+      - !ruby/object:Gem::Version
+        version: '0'
+description: nil
+email:
+- cxh116@126.com
+executables: []
+extensions: []
+extra_rdoc_files: []
+files:
+- .gitignore
+- Gemfile
+- LICENSE.txt
+- README.md
+- Rakefile
+- lib/meiriyigua.rb
+- lib/meiriyigua/baidu_crawl.rb
+- lib/meiriyigua/config.rb
+- lib/meiriyigua/crawl_client.rb
+- lib/meiriyigua/detail_crawl.rb
+- lib/meiriyigua/list_crawl.rb
+- lib/meiriyigua/models.rb
+- lib/meiriyigua/post_client.rb
+- lib/meiriyigua/version.rb
+- meiriyigua.gemspec
+- set.yml.example
+homepage: http://github.com/mangege
+licenses:
+- MIT
+metadata: {}
+post_install_message:
+rdoc_options: []
+require_paths:
+- lib
+required_ruby_version: !ruby/object:Gem::Requirement
+  requirements:
+  - - ! '>='
+    - !ruby/object:Gem::Version
+      version: '0'
+required_rubygems_version: !ruby/object:Gem::Requirement
+  requirements:
+  - - ! '>='
+    - !ruby/object:Gem::Version
+      version: '0'
+requirements: []
+rubyforge_project:
+rubygems_version: 2.2.2
+signing_key:
+specification_version: 4
+summary: nil
+test_files: []