RubyGems - jekyll-import - Versions diffs - 0.1.0.beta3 → 0.1.0.beta4 - Mend

jekyll-import 0.1.0.beta3 → 0.1.0.beta4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (50)

checksums.yaml +6 -14
data/History.markdown +18 -0
data/README.markdown +12 -1
data/jekyll-import.gemspec +31 -25
data/lib/jekyll-import.rb +50 -1
data/lib/jekyll-import/importer.rb +11 -0
data/lib/jekyll-import/importers.rb +10 -0
data/lib/jekyll-import/importers/csv.rb +50 -0
data/lib/jekyll-import/importers/drupal6.rb +139 -0
data/lib/jekyll-import/importers/drupal7.rb +102 -0
data/lib/jekyll-import/importers/enki.rb +76 -0
data/lib/jekyll-import/importers/google_reader.rb +68 -0
data/lib/jekyll-import/importers/joomla.rb +83 -0
data/lib/jekyll-import/importers/jrnl.rb +127 -0
data/lib/jekyll-import/importers/marley.rb +72 -0
data/lib/jekyll-import/importers/mephisto.rb +109 -0
data/lib/jekyll-import/importers/mt.rb +169 -0
data/lib/jekyll-import/importers/posterous.rb +139 -0
data/lib/jekyll-import/importers/rss.rb +71 -0
data/lib/jekyll-import/importers/s9y.rb +67 -0
data/lib/jekyll-import/importers/textpattern.rb +76 -0
data/lib/jekyll-import/importers/tumblr.rb +265 -0
data/lib/jekyll-import/importers/typo.rb +89 -0
data/lib/jekyll-import/importers/wordpress.rb +323 -0
data/lib/jekyll-import/importers/wordpressdotcom.rb +97 -0
data/lib/jekyll/commands/import.rb +1 -0
data/test/helper.rb +3 -1
data/test/test_jrnl_importer.rb +39 -0
data/test/test_mt_importer.rb +16 -16
data/test/test_tumblr_importer.rb +61 -0
data/test/test_wordpress_importer.rb +1 -1
data/test/test_wordpressdotcom_importer.rb +1 -1
metadata +53 -32
data/lib/jekyll/jekyll-import/csv.rb +0 -30
data/lib/jekyll/jekyll-import/drupal6.rb +0 -112
data/lib/jekyll/jekyll-import/drupal7.rb +0 -74
data/lib/jekyll/jekyll-import/enki.rb +0 -49
data/lib/jekyll/jekyll-import/google_reader.rb +0 -61
data/lib/jekyll/jekyll-import/joomla.rb +0 -53
data/lib/jekyll/jekyll-import/marley.rb +0 -52
data/lib/jekyll/jekyll-import/mephisto.rb +0 -84
data/lib/jekyll/jekyll-import/mt.rb +0 -142
data/lib/jekyll/jekyll-import/posterous.rb +0 -122
data/lib/jekyll/jekyll-import/rss.rb +0 -63
data/lib/jekyll/jekyll-import/s9y.rb +0 -59
data/lib/jekyll/jekyll-import/textpattern.rb +0 -58
data/lib/jekyll/jekyll-import/tumblr.rb +0 -242
data/lib/jekyll/jekyll-import/typo.rb +0 -69
data/lib/jekyll/jekyll-import/wordpress.rb +0 -299
data/lib/jekyll/jekyll-import/wordpressdotcom.rb +0 -84

data/lib/jekyll/jekyll-import/mt.rb DELETED Viewed

@@ -1,142 +0,0 @@
-# Created by Nick Gerakines, open source and publicly available under the
-# MIT license. Use this module at your own risk.
-# I'm an Erlang/Perl/C++ guy so please forgive my dirty Ruby.
-require 'rubygems'
-require 'sequel'
-require 'fileutils'
-require 'safe_yaml'
-# NOTE: This converter requires Sequel and the MySQL gems.
-# The MySQL gem can be difficult to install on OS X. Once you have MySQL
-# installed, running the following commands should work:
-# $ sudo gem install sequel
-# $ sudo gem install mysql -- --with-mysql-config=/usr/local/mysql/bin/mysql_config
-module JekyllImport
-  module MT
-    STATUS_DRAFT = 1
-    STATUS_PUBLISHED = 2
-    MORE_CONTENT_SEPARATOR = '<!--more-->'
-    def self.default_options
-      {
-        :blog_id => nil,
-        :categories => true,
-        :dest_encoding => 'utf-8',
-        :src_encoding => 'utf-8'
-      }
-    end
-    # By default this migrator will include posts for all your MovableType blogs.
-    # Specify a single blog by providing blog_id.
-    # Main migrator function. Call this to perform the migration.
-    #
-    # dbname::  The name of the database
-    # user::    The database user name
-    # pass::    The database user's password
-    # host::    The address of the MySQL database host. Default: 'localhost'
-    # options:: A hash of configuration options
-    #
-    # Supported options are:
-    #
-    # :blog_id::        Specify a single MovableType blog to export by providing blog_id.
-    #                   Default: nil, importer will include posts for all blogs.
-    # :categories::     If true, save the post's categories in its
-    #                   YAML front matter. Default: true
-    # :src_encoding::   Encoding of strings from the database. Default: UTF-8
-    #                   If your output contains mangled characters, set src_encoding to
-    #                   something appropriate for your database charset.
-    # :dest_encoding::  Encoding of output strings. Default: UTF-8
-    def self.process(dbname, user, pass, host = 'localhost', options = {})
-      options = default_options.merge(options)
-      db = Sequel.mysql(dbname, :user => user, :password => pass, :host => host)
-      post_categories = db[:mt_placement].join(:mt_category, :category_id => :placement_category_id)
-      FileUtils.mkdir_p "_posts"
-      posts = db[:mt_entry]
-      posts = posts.filter(:entry_blog_id => options[:blog_id]) if options[:blog_id]
-      posts.each do |post|
-        categories = post_categories.filter(
-          :mt_placement__placement_entry_id => post[:entry_id]
-        ).map {|ea| encode(ea[:category_basename], options) }
-        file_name = post_file_name(post, options)
-        data = post_metadata(post, options)
-        data['categories'] = categories if !categories.empty? && options[:categories]
-        yaml_front_matter = data.delete_if { |k,v| v.nil? || v == '' }.to_yaml
-        content = post_content(post, options)
-        File.open("_posts/#{file_name}", "w") do |f|
-          f.puts yaml_front_matter
-          f.puts "---"
-          f.puts encode(content, options)
-        end
-      end
-    end
-    # Extracts metadata for YAML front matter from post
-    def self.post_metadata(post, options = default_options)
-      metadata = {
-        'layout' => 'post',
-        'title' => encode(post[:entry_title], options),
-        'date' => post[:entry_authored_on].strftime("%Y-%m-%d %H:%M:%S %z"),
-        'excerpt' => encode(post[:entry_excerpt], options),
-        'mt_id' => post[:entry_id]
-      }
-      metadata['published'] = false if post[:entry_status] != STATUS_PUBLISHED
-      metadata
-    end
-    # Extracts text body from post
-    def self.post_content(post, options = default_options)
-      if post[:entry_text_more].strip.empty?
-        post[:entry_text]
-      else
-        post[:entry_text] + "\n\n#{MORE_CONTENT_SEPARATOR}\n\n" + post[:entry_text_more]
-      end
-    end
-    def self.post_file_name(post, options = default_options)
-      date = post[:entry_authored_on]
-      slug = post[:entry_basename]
-      file_ext = suffix(post[:entry_convert_breaks])
-      "#{date.strftime('%Y-%m-%d')}-#{slug}.#{file_ext}"
-    end
-    def self.encode(str, options = default_options)
-      if str.respond_to?(:encoding)
-        str.encode(options[:dest_encoding], options[:src_encoding])
-      else
-        str
-      end
-    end
-    # Maps MovableType's entry_convert_breaks value to a file extension:
-    # "markdown" (also used for nil or "__default__"), "textile", or "html";
-    # any other value is returned unchanged and used as the extension.
-    def self.suffix(entry_type)
-      if entry_type.nil? || entry_type.include?("markdown") || entry_type.include?("__default__")
-        # The markdown plugin I have saves this as
-        # "markdown_with_smarty_pants", so I just look for "markdown".
-        "markdown"
-      elsif entry_type.include?("textile")
-        # This is saved as "textile_2" on my installation of MT 5.1.
-        "textile"
-      elsif entry_type == "0" || entry_type.include?("richtext")
-        # Richtext looks to me like it's saved as HTML, so I include it here.
-        "html"
-      else
-        # Other values might need custom work.
-        entry_type
-      end
-    end
-  end
-end

data/lib/jekyll/jekyll-import/posterous.rb DELETED Viewed

@@ -1,122 +0,0 @@
-require 'rubygems'
-require 'jekyll'
-require 'fileutils'
-require 'net/http'
-require 'uri'
-require "json"
-# ruby -r 'jekyll/jekyll-import/posterous' -e 'JekyllImport::Posterous.process(email, pass, api_key)'
-# Other arguments are optional; the default values are:
-# * :include_imgs => false         # should images be downloaded as well?
-# * :blog         => 'primary'     # which blog to import, if you have more than one.
-# * :base_path    => '/'           # prefix for image URLs, e.g. if images are served from a different host.
-# For example, to download images as well as your posts, use the above command with
-# ....process(email, pass, api_key, :include_imgs => true)
-module JekyllImport
-  module Posterous
-    def self.fetch(uri_str, limit = 10)
-      # TODO: raise a more specific exception class than ArgumentError.
-      raise ArgumentError, 'Stuck in a redirect loop. Please double check your email and password' if limit == 0
-      response = nil
-      Net::HTTP.start('posterous.com') do |http|
-        req = Net::HTTP::Get.new(uri_str)
-        req.basic_auth @email, @pass
-        response = http.request(req)
-      end
-      case response
-        when Net::HTTPSuccess     then response
-        when Net::HTTPRedirection then fetch(response['location'], limit - 1)
-        else response.error!
-      end
-    end
-    def self.fetch_images(directory, imgs)
-      def self.fetch_one(url, limit = 10)
-        raise ArgumentError, 'HTTP redirect too deep' if limit == 0
-        response = Net::HTTP.get_response(URI.parse(url))
-        case response
-        when Net::HTTPSuccess     then response.body
-        when Net::HTTPRedirection then self.fetch_one(response['location'], limit - 1)
-        else
-          response.error!
-        end
-      end
-      FileUtils.mkdir_p directory
-      urls = Array.new
-      imgs.each do |img|
-        fullurl = img["full"]["url"]
-        uri = URI.parse(fullurl)
-        imgname = uri.path.split("/")[-1]
-        imgdata = self.fetch_one(fullurl)
-        open(directory + "/" + imgname, "wb") do |file|
-          file.write imgdata
-        end
-        urls.push(directory + "/" + imgname)
-      end
-      return urls
-    end
-    def self.process(email, pass, api_token, opts={})
-      @email, @pass, @api_token = email, pass, api_token
-      defaults = { :include_imgs => false, :blog => 'primary', :base_path => '/' }
-      opts = defaults.merge(opts)
-      FileUtils.mkdir_p "_posts"
-      posts = JSON.parse(self.fetch("/api/v2/users/me/sites/#{opts[:blog]}/posts?api_token=#{@api_token}").body)
-      page = 1
-      while posts.any?
-        posts.each do |post|
-          title = post["title"]
-          slug = title.gsub(/[^[:alnum:]]+/, '-').downcase
-          date = Date.parse(post["display_date"])
-          content = post["body_html"]
-          published = !post["is_private"]
-          basename = "%02d-%02d-%02d-%s" % [date.year, date.month, date.day, slug]
-          name = basename + '.html'
-          # Images:
-          if opts[:include_imgs]
-            post_imgs = post["media"]["images"]
-            if post_imgs.any?
-              img_dir = "imgs/%s" % basename
-              img_urls = self.fetch_images(img_dir, post_imgs)
-              img_urls.map! do |url|
-                '<li><img src="' + opts[:base_path] + url + '"></li>'
-              end
-              imgcontent = "<ol>\n" + img_urls.join("\n") + "</ol>\n"
-              # filter out "posterous-content", replacing with imgs:
-              content = content.sub(/\<p\>\[\[posterous-content:[^\]]+\]\]\<\/p\>/, imgcontent)
-            end
-          end
-          # Get the relevant fields as a hash, delete empty fields and convert
-          # to YAML for the header
-          data = {
-             'layout' => 'post',
-             'title' => title.to_s,
-             'published' => published
-           }.delete_if { |k,v| v.nil? || v == ''}.to_yaml
-          # Write out the data and content to file
-          File.open("_posts/#{name}", "w") do |f|
-            f.puts data
-            f.puts "---"
-            f.puts content
-          end
-        end
-        page += 1
-        posts = JSON.parse(self.fetch("/api/v2/users/me/sites/#{opts[:blog]}/posts?api_token=#{@api_token}&page=#{page}").body)
-      end
-    end
-  end
-end

data/lib/jekyll/jekyll-import/rss.rb DELETED Viewed

@@ -1,63 +0,0 @@
-# Created by Kendall Buchanan (https://github.com/kendagriff) on 2011-12-22.
-# Use at your own risk. The end.
-#
-# Usage:
-#   (URL)
-#   ruby -r 'jekyll/jekyll-import/rss' -e "JekyllImport::RSS.process(:source => 'http://yourdomain.com/your-favorite-feed.xml')"
-#
-#   (Local file)
-#   ruby -r 'jekyll/jekyll-import/rss' -e "JekyllImport::RSS.process(:source => './somefile/on/your/computer.xml')"
-require 'rss/1.0'
-require 'rss/2.0'
-require 'open-uri'
-require 'fileutils'
-require 'safe_yaml'
-module JekyllImport
-  module RSS
-    def self.validate(options)
-      if !options[:source]
-        abort "Missing mandatory option --source."
-      end
-    end
-    # Process the import.
-    #
-    # options - a Hash; options[:source] is a URL or a local file path String.
-    #
-    # Returns nothing.
-    def self.process(options)
-      validate(options)
-      source = options[:source]
-      content = ""
-      open(source) { |s| content = s.read }
-      rss = ::RSS::Parser.parse(content, false)
-      raise "There doesn't appear to be any RSS items at the source (#{source}) provided." unless rss
-      rss.items.each do |item|
-        formatted_date = item.date.strftime('%Y-%m-%d')
-        post_name = item.title.split(%r{ |!|/|:|&|-|$|,}).map do |i|
-          i.downcase if i != ''
-        end.compact.join('-')
-        name = "#{formatted_date}-#{post_name}"
-        header = {
-          'layout' => 'post',
-          'title' => item.title
-        }
-        FileUtils.mkdir_p("_posts")
-        File.open("_posts/#{name}.html", "w") do |f|
-          f.puts header.to_yaml
-          f.puts "---\n\n"
-          f.puts item.description
-        end
-      end
-    end
-  end
-end

data/lib/jekyll/jekyll-import/s9y.rb DELETED Viewed

@@ -1,59 +0,0 @@
-# Migrator to import entries from a Serendipity (S9Y) blog
-#
-# Entries can be exported from http://blog.example.com/rss.php?version=2.0&all=1
-#
-# Usage:
-# ruby -r 'jekyll/jekyll-import/s9y' -e 'JekyllImport::S9Y.process(:source => "http://blog.example.com/rss.php?version=2.0&all=1")'
-require 'open-uri'
-require 'rss'
-require 'fileutils'
-require 'yaml'
-module JekyllImport
-  module S9Y
-    def self.validate(options)
-      if !options[:source]
-        abort "Missing mandatory option --source, e.g. --source \"http://blog.example.com/rss.php?version=2.0&all=1\""
-      end
-    end
-    def self.process(options)
-      validate(options)
-      FileUtils.mkdir_p("_posts")
-      source = options[:source]
-      text = ''
-      open(source) { |line| text = line.read }
-      rss = RSS::Parser.parse(text)
-      rss.items.each do |item|
-        post_url = item.link.match('.*(/archives/.*)')[1]
-        categories = item.categories.collect { |c| c.content }
-        content = item.content_encoded.strip
-        date = item.date
-        slug = item.link.match('.*/archives/[0-9]+-(.*)\.html')[1]
-        name = "%02d-%02d-%02d-%s.markdown" % [date.year, date.month, date.day,
-                                               slug]
-        data = {
-          'layout' => 'post',
-          'title' => item.title,
-          'categories' => categories,
-          'permalink' => post_url,
-          's9y_link' => item.link,
-          'date' => item.date,
-        }.delete_if { |k,v| v.nil? || v == '' }.to_yaml
-        # Write out the data and content to file
-        File.open("_posts/#{name}", "w") do |f|
-          f.puts data
-          f.puts "---"
-          f.puts content
-        end
-      end
-    end
-  end
-end

data/lib/jekyll/jekyll-import/textpattern.rb DELETED Viewed

@@ -1,58 +0,0 @@
-require 'rubygems'
-require 'sequel'
-require 'fileutils'
-require 'safe_yaml'
-# NOTE: This converter requires Sequel and the MySQL gems.
-# The MySQL gem can be difficult to install on OS X. Once you have MySQL
-# installed, running the following commands should work:
-# $ sudo gem install sequel
-# $ sudo gem install mysql -- --with-mysql-config=/usr/local/mysql/bin/mysql_config
-module JekyllImport
-  module TextPattern
-    # Reads a MySQL database via Sequel and creates a post file for each post.
-    # The only posts selected are those with a status of 4 or 5, which means
-    # "live" and "sticky" respectively.
-    # Other statuses are 1 => draft, 2 => hidden and 3 => pending.
-    QUERY = "SELECT Title, \
-                    url_title, \
-                    Posted, \
-                    Body, \
-                    Keywords \
-             FROM textpattern \
-             WHERE Status = '4' OR \
-                   Status = '5'"
-    def self.process(dbname, user, pass, host = 'localhost')
-      db = Sequel.mysql(dbname, :user => user, :password => pass, :host => host, :encoding => 'utf8')
-      FileUtils.mkdir_p "_posts"
-      db[QUERY].each do |post|
-        # Get required fields and construct Jekyll compatible name.
-        title = post[:Title]
-        slug = post[:url_title]
-        date = post[:Posted]
-        content = post[:Body]
-        name = [date.strftime("%Y-%m-%d"), slug].join('-') + ".textile"
-        # Get the relevant fields as a hash, delete empty fields and convert
-        # to YAML for the header.
-        data = {
-           'layout' => 'post',
-           'title' => title.to_s,
-           'tags' => post[:Keywords].split(',')
-         }.delete_if { |k,v| v.nil? || v == ''}.to_yaml
-        # Write out the data and content to file.
-        File.open("_posts/#{name}", "w") do |f|
-          f.puts data
-          f.puts "---"
-          f.puts content
-        end
-      end
-    end
-  end
-end