RubyGems - robi - Versions diffs - 0.0.1 - Mend

robi 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9) hide show

checksums.yaml ADDED Viewed

@@ -0,0 +1,7 @@
+---
+SHA1:
+  metadata.gz: 67c9217164cb562bda4b90c2330e8ed7f8a3dc70
+  data.tar.gz: eddff5c9f49640c852d3992f22464d27a95a98d3
+SHA512:
+  metadata.gz: 2e441b7ea0deb38e1b07e5352081cfeebbe5a71b9b9b32612d2ed7725854ce5a9ff0b7c80e6656edb2692365d8a080fa43e5ad716b61d889632486b228d68d53
+  data.tar.gz: c05727623b778fa1a16f1e78ae0b585bde44cc473c0a3fab29762852f98c407c3d66f310e67d63af2d72b6e1cc32b9a528e724ad52864e3b72e97f45f4139d66

data/bin/robi ADDED Viewed

@@ -0,0 +1,13 @@
+#!/usr/bin/env ruby
+require 'robi'
+require 'optparser'
+opts = OptParser.parse
+Robi.new(
+  opts[:subreddit],
+  opts[:type]
+).bundle(
+  opts[:count]
+)

data/lib/optparser.rb ADDED Viewed

@@ -0,0 +1,37 @@
+require 'optparse'
+module OptParser
+  TYPES = %i(hot new rising controversial top gilded).freeze
+  def self.parse
+    opt = {}
+    OptionParser.new { |options|
+      options.banner = 'Usage: robi SUBREDDIT [-t TYPE] [-c COUNT]'
+      opt[:subreddit] = ARGV.first
+      opt[:type] = :hot
+      opt[:count] = 25
+      options.on('-t', '--type TYPE', 'top, new, etc. (default hot)') { |type|
+        opt[:type] = type.downcase.to_sym
+      }
+      options.on('-c', '--count COUNT', 'Max number of posts (default 25)') { |count|
+        opt[:count] = count.to_i
+      }
+      options.on('-h', '--help', 'Display this screen') {
+        puts options
+        exit
+      }
+    }.parse!
+    raise 'No subreddit specified' if opt[:subreddit].nil?
+    raise "Subreddit name must be raw ('funny' or 'pics')" if opt[:subreddit].include?('/')
+    raise "Type must be one of {#{TYPES.join(', ')}}" unless TYPES.include?(opt[:type])
+    raise 'Count must be at least 1' if opt[:count] < 1
+    opt
+  end
+end

data/lib/robi/compiler.rb ADDED Viewed

@@ -0,0 +1,179 @@
+require 'nokogiri'
+require 'fileutils'
+class Robi
+  class Compiler
+    def initialize(dest_dir, stylesheet_source)
+      @dest_dir = dest_dir
+      @html_file = 'index.html'
+      @stylesheet_source = stylesheet_source
+      @stylesheet_file = File.basename(@stylesheet_source)
+      @table_of_contents_file = 'tableofcontents.ncx'
+      @metadata_file = 'metadata.opf'
+    end
+    def compile(title, posts)
+      puts '  Building HTML...'
+      html = build_html(title, posts)
+      puts '  Building metadata...'
+      metadata = build_metadata(title)
+      puts '  Building Table of Contents...'
+      table_of_contents = build_table_of_contents(title, posts)
+      puts '  Assembling files...'
+      assemble(metadata, html, table_of_contents)
+      "#{@dest_dir}/#{@metadata_file}"
+    end
+    def build_html(title, posts)
+      Nokogiri::HTML::Builder.new(encoding: 'utf-8') { |doc|
+        doc.html {
+          doc.head {
+            doc.title { doc.text title }
+            doc.link(
+              rel: 'stylesheet',
+              href: @stylesheet_file,
+              type: 'text/css'
+            )
+          }
+          doc.body {
+            doc.div(id: 'titlepage') {
+              doc.h1 { doc.text title }
+              doc.h2 {
+                unit = simple_plural('post', posts.size)
+                doc.text "#{posts.size} #{unit}"
+              }
+            }
+            doc.div(id: 'tableofcontents') {
+              doc.h1 { doc.text 'Posts' }
+              doc.ol {
+                posts.each do |post|
+                  doc.li {
+                    doc.a(href: "##{post.uid}") {
+                      doc.text post.title
+                    }
+                  }
+                end
+              }
+            }
+            doc.div(id: 'postwrapper') {
+              posts.each do |post|
+                doc.div(class: 'post', id: post.uid) {
+                  doc.h1 { doc.text post.title }
+                  doc.h2 { doc.text "by #{post.author}" }
+                  doc.div {
+                    body = Nokogiri::HTML::DocumentFragment.parse(post.body)
+                    doc << body.content
+                  }
+                }
+              end
+            }
+          }
+        }
+      }.to_html
+    end
+    def build_metadata(title)
+      Nokogiri::XML::Builder.new { |xml|
+        xml.root {
+          xml.package(
+            :'unique-identifier' => title,
+            :'xmlns:opf' => 'http://www.idpf.org/2007/opf',
+            :'xmlns:asd' => 'http://www.idpf.org/asdfaf'
+          ) {
+            xml.metadata {
+              xml.send(
+                :'dc-metadata',
+                :'xmlns:dc' => 'http://purl.org/metadata/dublin_core',
+                :'xmlns:oebpackage' => 'http://openebook.org/namespaces/oeb-package/1.0/'
+              ) {
+                xml.send(:'dc:Title', title)
+                xml.send(:'dc:Language', 'en')
+                xml.send(:'dc:Creator', 'Reddit')
+                xml.send(:'x-metadata')
+              }
+            }
+            xml.manifest {
+              # xml.item(
+              #   :id => 'content',
+              #   :'media-type' => 'text/x-oeb1-document',
+              #   :href => "#{HTML}#tableofcontents"
+              # )
+              xml.item(
+                :id => 'ncx',
+                :'media-type' => 'application/x-dtbncx+xml',
+                :href => @table_of_contents_file
+              )
+              xml.item(
+                :id => 'text',
+                :'media-type' => 'text/x-oeb1-document',
+                :href => "#{@html_file}"
+              )
+            }
+            xml.spine(toc: 'ncx')  {
+              # xml.itemref(idref: 'content')
+              xml.itemref(idref: 'text')
+            }
+            xml.guide {
+              xml.reference(type: 'toc', title: 'Table of Contents', href: @table_of_contents_file)
+              xml.reference(type: 'text', title: title, href: @html_file)
+            }
+          }
+        }
+      }.to_xml
+    end
+    def build_table_of_contents(title, posts)
+      Nokogiri::XML::Builder.new { |xml|
+        xml.doc.create_internal_subset(
+          'ncx',
+          '-//NISO//DTD ncx 2005-1//EN',
+          'http://www.daisy.org/z3986/2005/ncx-2005-1.dtd'
+        )
+        xml.ncx(xmlns: 'http://www.daisy.org/z3986/2005/ncx/', version: '2005-1') {
+          xml.docTitle {
+            xml.text_ title
+          }
+          xml.navMap {
+            # xml.navPoint(id: 'toc', playOrder: 1) {
+            #   xml.navLabel {
+            #     xml.text_ 'Table of Contents'
+            #   }
+            #   xml.content(src: @html_file)
+            # }
+            posts.zip(1..Float::INFINITY).each do |post, index|
+              xml.navPoint(id: post.uid, playOrder: index) {
+                xml.navLabel {
+                  xml.text_ post.title
+                }
+                xml.content(src: "#{@html_file}##{post.uid}")
+              }
+            end
+          }
+        }
+      }.to_xml
+    end
+    def assemble(metadata, html, table_of_contents)
+      Dir.mkdir(@dest_dir) unless Dir.exist?(@dest_dir)
+      File.open("#{@dest_dir}/#{@html_file}", 'w') { |file| file.write(html) }
+      File.open("#{@dest_dir}/#{@metadata_file}",  'w') { |file| file.write(metadata) }
+      File.open("#{@dest_dir}/#{@table_of_contents_file}",  'w') { |file| file.write(table_of_contents) }
+      FileUtils.cp(@stylesheet_source, "#{@dest_dir}/#{@stylesheet_file}")
+    end
+    def simple_plural(word, count)
+      if count.abs > 1
+        "#{word}s"
+      else
+        word
+      end
+    end
+  end
+end

data/lib/robi/fetcher.rb ADDED Viewed

@@ -0,0 +1,46 @@
+require 'net/http'
+require 'json'
+require 'pp'
+require 'robi/post'
+class Robi
+  class Fetcher
+    HTTP_SUCCESS = %w(200).map(&:freeze).freeze
+    HTTP_REDIRECT = %w(301 302).map(&:freeze).freeze
+    def initialize(subreddit, type)
+      @uri = URI("https://reddit.com/r/#{subreddit}/#{type}/.json")
+    end
+    def fetch(count)
+      puts "  Connecting to #{@uri}..."
+      response = Net::HTTP.get_response(@uri)
+      while HTTP_REDIRECT.include?(response.code)
+        @uri = URI(response.header['location'])
+        puts "  Redirecting to #{@uri}..."
+        response = Net::HTTP.get_response(@uri)
+      end
+      unless HTTP_SUCCESS.include?(response.code)
+        raise "Received response code #{response.code}: #{response.msg}"
+      end
+      json = response.body
+      puts '  Extracting content...'
+      obj = JSON.parse(json)
+      extract(count, obj)
+    end
+    def extract(count, obj)
+      obj['data']['children']
+        .map { |post| post['data'] }
+        .reject { |post| post['stickied'] }
+        .reject { |post| post['selftext'].empty? }
+        .first(count)
+        .map { |post| Post.from_json_hash(post) }
+    end
+  end
+end

data/lib/robi/post.rb ADDED Viewed

@@ -0,0 +1,49 @@
+require 'time'
+class Robi
+  class Post
+    attr_reader(
+      *%i(
+        uid
+        title
+        author
+        date body
+        comment_count
+        points
+      )
+    )
+    def initialize(
+      uid,
+      title,
+      author,
+      timestamp,
+      body,
+      comment_count,
+      points
+    )
+      @uid = uid.to_s
+      @title = title.to_s
+      @author = author.to_s
+      @date = Time.at(timestamp.to_i)
+      @body = body.to_s
+      @comment_count = comment_count.to_i
+      @points = points
+    end
+    def self.from_json_hash(hash)
+      new(
+        *hash.values_at(
+          *%w(
+            name
+            title
+            author
+            created
+            selftext_html
+            num_comments
+            score
+          )
+        )
+      )
+    end
+  end
+end

data/lib/robi.rb ADDED Viewed

@@ -0,0 +1,41 @@
+require 'time'
+require 'robi/fetcher'
+require 'robi/compiler'
+class Robi
+  def initialize(subreddit, type)
+    @subreddit = subreddit
+    @type = type
+  end
+  def bundle(count)
+    id = [@subreddit, @type, Time.now.strftime('%Y-%m-%d-%H%M')]
+    title_string = id.join(' ')
+    title_slug = id.join('_')
+    dest_dir = "./#{title_slug}"
+    if Dir.exist?(dest_dir) && (Dir.entries(dest_dir) - %w(. ..)).any?
+      raise "#{dest_dir} not empty"
+    end
+    puts 'Locating kindlegen'
+    kindlegen_found = system('which kindlegen')
+    abort unless kindlegen_found
+    puts "\nFetching posts"
+    posts = Fetcher.new(@subreddit, @type).fetch(count)
+    puts "\nCompiling to eBook source"
+    stylesheet = File.expand_path('stylesheet.css', "#{File.dirname(__FILE__)}/static")
+    metadata_file = Compiler.new(dest_dir, stylesheet)
+                                    .compile(title_string, posts)
+    puts "\nInvoking kindlegen"
+    outfile = "#{File.dirname(metadata_file)}/output.mobi"
+    system("kindlegen #{metadata_file} -o output.mobi")
+    raise 'kindlegen failed to output eBook' unless File.exist?(outfile)
+    FileUtils.mv(outfile, "./#{title_slug}.mobi")
+  end
+end

data/lib/static/stylesheet.css ADDED Viewed

@@ -0,0 +1,23 @@
+/* Headings are centred. */
+h1 {
+    text-align: center;
+}
+h2 {
+    text-align: center;
+}
+h3 {
+    text-align: center;
+}
+/* Title page: pushed down the page and followed by a page break. */
+#titlepage {
+    page-break-after: always;
+    padding-top: 40%;
+}
+/* List of posts: ends with a page break; the list is inset on both sides. */
+#tableofcontents {
+    page-break-after: always;
+}
+#tableofcontents ol {
+    margin: 0 10%;
+}
+/* Each post is followed by a page break. */
+.post {
+    page-break-after: always;
+}

metadata ADDED Viewed

@@ -0,0 +1,71 @@
+--- !ruby/object:Gem::Specification
+name: robi
+version: !ruby/object:Gem::Version
+  version: 0.0.1
+platform: ruby
+authors:
+- Andrew Tolvstad
+autorequire:
+bindir: bin
+cert_chain: []
+date: 2016-12-02 00:00:00.000000000 Z
+dependencies:
+- !ruby/object:Gem::Dependency
+  name: nokogiri
+  requirement: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '1.6'
+    - - ">="
+      - !ruby/object:Gem::Version
+        version: 1.6.8
+  type: :runtime
+  prerelease: false
+  version_requirements: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '1.6'
+    - - ">="
+      - !ruby/object:Gem::Version
+        version: 1.6.8
+description: Compile Reddit to Kindle eBooks
+email: tolvstaa@oregonstate.edu
+executables:
+- robi
+extensions: []
+extra_rdoc_files: []
+files:
+- bin/robi
+- lib/optparser.rb
+- lib/robi.rb
+- lib/robi/compiler.rb
+- lib/robi/fetcher.rb
+- lib/robi/post.rb
+- lib/static/stylesheet.css
+homepage: https://github.com/Inityx/robi
+licenses:
+- Apache-2.0
+metadata: {}
+post_install_message:
+rdoc_options: []
+require_paths:
+- lib
+required_ruby_version: !ruby/object:Gem::Requirement
+  requirements:
+  - - ">="
+    - !ruby/object:Gem::Version
+      version: '0'
+required_rubygems_version: !ruby/object:Gem::Requirement
+  requirements:
+  - - ">="
+    - !ruby/object:Gem::Version
+      version: '0'
+requirements: []
+rubyforge_project:
+rubygems_version: 2.5.2
+signing_key:
+specification_version: 4
+summary: Robi
+test_files: []