RubyGems - nytimes_cli - Versions diffs - 0.1.8 - Mend

nytimes_cli 0.1.8

Files changed (11) hide show

checksums.yaml +7 -0
data/bin/console +14 -0
data/bin/nytimes_cli +10 -0
data/bin/setup +8 -0
data/lib/article.rb +84 -0
data/lib/nytimes_cli/cli.rb +163 -0
data/lib/nytimes_cli/navagation.rb +32 -0
data/lib/nytimes_cli/version.rb +3 -0
data/lib/nytimes_cli.rb +0 -0
data/lib/scraper.rb +69 -0
metadata +177 -0

checksums.yaml ADDED Viewed

@@ -0,0 +1,7 @@
+---
+SHA1:
+  metadata.gz: 485c4d2f7a55939cdd8e07e1d4dfa0abb180527d
+  data.tar.gz: ee2ad28060dbcb739b3c3578ffbf42066768f9a3
+SHA512:
+  metadata.gz: 66367a084ca445b35f9474dd40d25e395637078836dbf8cd6df71d7b837a9d27cc9d134f99c458d1a84551f363b76fcd036f73dc7753aa9b2ee40a3706ff3b17
+  data.tar.gz: 7e0e385204a68906811263591d24ad0102a37b4783dd0fe0a0b9aa95bbbb72c3fb0303f1f314a39c6aba77ae4f70e8db1251942c931341ae36d93578dd545a7c

data/bin/console ADDED Viewed

@@ -0,0 +1,14 @@
+#!/usr/bin/env ruby
+require "bundler/setup"
+require "nytimes_cli"
+# You can add fixtures and/or initialization code here to make experimenting
+# with your gem easier. You can also use a different console, if you like.
+# (If you use this, don't forget to add pry to your Gemfile!)
+# require "pry"
+# Pry.start
+require "irb"
+IRB.start

data/bin/nytimes_cli ADDED Viewed

@@ -0,0 +1,10 @@
+#!/usr/bin/env ruby
+require 'require_all'
+require_rel '../lib'
+NytimesCli::CLI.new.call

data/bin/setup ADDED Viewed

@@ -0,0 +1,8 @@
+#!/usr/bin/env bash
+set -euo pipefail
+IFS=$'\n\t'
+set -vx
+bundle install
+# Do any other automated setup that you need to do here

data/lib/article.rb ADDED Viewed

@@ -0,0 +1,84 @@
+class Article
+  attr_accessor :title, :author, :url, :story
+  @@articles = []
+  def initialize(title = nil, url = nil, author = nil,  story =  nil)
+    @title = title
+    @author = author
+    @url = url
+    @story = story
+  end
+  def self.create_articles_from_array(array)
+    array.each do |article|
+      title = article[:title]
+      url = article[:url]
+      a =  Article.new(title, url)
+      @@articles << a
+    end
+    @@articles
+  end
+  def self.all
+    @@articles
+  end
+  def self.create_article_from_hash(hash)
+    a = Article.new
+    a.title = hash[:title]
+    a.url = hash[:url]
+    a.author = hash[:author]
+    string = hash[:story]
+    a.story = self.word_wrap(hash[:story])
+    a
+  end
+  def self.word_wrap(text)
+    paragraphs = []
+    paragraphs = text.split(/\n/)
+    finshed_text = ""
+    paragraphs.each do |p|
+      final_p = self.p_wrap(p, 78)
+      finshed_text << "\n" + final_p
+    end
+    finshed_text
+  end
+#following method was taken from https://www.safaribooksonline.com/library/view/ruby-cookbook/0596523696/ch01s15.html
+  def self.p_wrap(s, width=78)
+    lines = []
+    line = ""
+    s.split(/\s+/).each do |word|
+      if line.size + word.size >= width
+        lines << line
+        line = word
+      elsif line.empty?
+       line = word
+      else
+       line << " " << word
+     end
+     end
+     lines << line if line
+    return lines.join "\n"
+  end
+end

data/lib/nytimes_cli/cli.rb ADDED Viewed

@@ -0,0 +1,163 @@
+# cli controller
+class NytimesCli::CLI
+  attr_accessor :index
+  def call
+    puts ""
+    puts ""
+    puts "Welcome to Nytimes CLI"
+    puts "All articles © The New York Times"
+    puts "http://www.nytimes.com"
+    puts ""
+    puts ""
+    front
+    puts ""
+    puts ""
+    puts "There are currently " + num_articles + " articles on the front page of nytimes.com."
+    puts ""
+    num = get_articles.length
+    index(num)
+    interface_logic
+  end
+  def get_articles_from_front_page
+    array = Scraper.scrape_front_page
+    articles = Article.create_articles_from_array(array)
+    articles
+  end
+  def num_articles
+    get_articles.length.to_s
+  end
+  def input_to_index(num)
+    num.to_i - 1
+  end
+  def front
+    print_articles(0, 9)
+  end
+  #TODO
+  def print_articles(first_index, last_index )
+    array = get_articles_from_front_page
+    a = array[first_index..last_index]
+    a.each do |article|
+      all_articles = get_articles
+      i = all_articles.index(article) + 1
+      puts  i.to_s + ". " + article.title
+    end
+    puts ""
+    puts ""
+  end
+  def index(num)
+    @index = Navagation.new(num)
+  end
+  def get_articles
+    Article.all
+  end
+  def get_article_url(num)
+    i = input_to_index(num)
+    a = get_articles[i]
+    a.url
+  end
+  def get_article(url)
+    hash = Scraper.scrape_article(url)
+    article = Article.create_article_from_hash(hash)
+  end
+  def print_article(num)
+    url = get_article_url(num)
+    a = get_article(url)
+    puts ""
+    puts ""
+    puts a.title
+    puts ""
+    puts a.author
+    puts ""
+    puts a.story
+    puts ""
+    puts ""
+    puts "Link to nytimes.com: " + a.url
+    puts ""
+    puts ""
+  end
+  def show_manual
+    puts "man   ->  displays manual"
+    puts "front ->  shows first ten headlines"
+    puts "more  ->  shows 10 more headlines"
+    puts "less  ->  shows previous 10 headlines"
+    puts "exit  ->  terminates program"
+    puts ""
+    puts ""
+    puts "All articles © The New York Times"
+    puts "http://www.nytimes.com"
+    puts ""
+    puts ""
+  end
+  def more
+    @index.more
+    print_articles(@index.start_index, @index.end_index)
+  end
+  def less
+    @index.less
+    print_articles(@index.start_index, @index.end_index)
+  end
+  def interface_logic
+     while true
+      puts "Enter the number you would like to read or 'man' to see a list of commands."
+      answer = gets.chomp
+      if answer.upcase == "EXIT"
+        puts ""
+        puts "Ciao. Auf Wiedersehen. Goodbye."
+        puts ""
+        puts ""
+        exit
+      elsif answer.to_i.class == Fixnum && answer.to_i != 0
+        print_article(answer)
+      elsif answer.upcase == "MAN"
+        show_manual
+      elsif answer.upcase == "MORE"
+        more
+      elsif answer.upcase == "LESS"
+        less
+      elsif answer.upcase == "FRONT"
+        print_articles(0, 9)
+      else
+        puts ""
+        puts ""
+        puts "That was not a valid entry. Please try again."
+        puts ""
+        puts ""
+      end
+    end
+  end
+end

data/lib/nytimes_cli/navagation.rb ADDED Viewed

@@ -0,0 +1,32 @@
+class Navagation
+  attr_accessor :start_index, :end_index, :articles_length
+  def initialize(length)
+    @start_index = 0
+    @end_index = 9
+    @articles_length = length
+  end
+   def more
+    if @end_index + 10 < @articles_length
+      @start_index += 10
+      @end_index += 10
+    else
+      @start_index = @articles_length - 9
+      @end_index = @articles_length
+    end
+  end
+  def less
+    if @start_index >= 10
+      @start_index -= 10
+      @end_index = @start_index + 9
+    else
+      @start_index = 0
+      @end_index = 9
+    end
+  end
+end

data/lib/nytimes_cli/version.rb ADDED Viewed

@@ -0,0 +1,3 @@
+module NytimesCli
+  VERSION = "0.1.8"
+end

data/lib/nytimes_cli.rb ADDED Viewed

File without changes

data/lib/scraper.rb ADDED Viewed

@@ -0,0 +1,69 @@
+require 'mechanize'
+class Scraper
+  attr_accessor :title, :url, :author, :story
+  BASE_URL = "http://www.nytimes.com"
+  def self.scrape_front_page
+    agent = Mechanize.new
+    index = agent.get(BASE_URL)
+    front_page_articles = []
+    index.css(".story-heading").each do |story|
+      val =  story.css("a").text
+      next if val.nil? || val == false || val == ""
+      hash = {
+         :title => story.css("a").text.strip,
+         :url => story.css('a').attribute('href').value
+      }
+      front_page_articles  << hash
+    end
+    front_page_articles
+   end
+  def self.scrape_article(url)
+    agent = Mechanize.new
+    article = agent.get(url)
+    stories = []
+    story_hash = {}
+    title = article.search("//*[@id='headline']").text
+    author = article.search('.byline-author').text
+    story_hash[:title] = title
+    story_hash[:author] = author
+    story_hash[:url] =  url
+    article_string = ""
+    article.search(".story-body *").each do |paragraph|
+     if  !article_string.include?(paragraph.children.text)
+      if paragraph.name == "p" && paragraph.children.text != "Advertisement"
+         article_string << paragraph.children.text + "\n" + "\n"
+      elsif paragraph.name == "h4" && !paragraph.children.text.nil?
+         article_string << paragraph.children.text + "\n" + "\n"
+      end
+     end
+    end
+    story_hash[:story] = article_string
+    story_hash
+  end
+end

metadata ADDED Viewed

@@ -0,0 +1,177 @@
+--- !ruby/object:Gem::Specification
+name: nytimes_cli
+version: !ruby/object:Gem::Version
+  version: 0.1.8
+platform: ruby
+authors:
+- interestinall
+autorequire:
+bindir: bin
+cert_chain: []
+date: 2016-06-08 00:00:00.000000000 Z
+dependencies:
+- !ruby/object:Gem::Dependency
+  name: bundler
+  requirement: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '1.12'
+  type: :development
+  prerelease: false
+  version_requirements: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '1.12'
+- !ruby/object:Gem::Dependency
+  name: rake
+  requirement: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '10.0'
+  type: :development
+  prerelease: false
+  version_requirements: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '10.0'
+- !ruby/object:Gem::Dependency
+  name: rspec
+  requirement: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '3.0'
+  type: :development
+  prerelease: false
+  version_requirements: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '3.0'
+- !ruby/object:Gem::Dependency
+  name: require_all
+  requirement: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '1.3'
+    - - ">="
+      - !ruby/object:Gem::Version
+        version: 1.3.3
+  type: :development
+  prerelease: false
+  version_requirements: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '1.3'
+    - - ">="
+      - !ruby/object:Gem::Version
+        version: 1.3.3
+- !ruby/object:Gem::Dependency
+  name: mechanize
+  requirement: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '2.7'
+    - - ">="
+      - !ruby/object:Gem::Version
+        version: 2.7.4
+  type: :development
+  prerelease: false
+  version_requirements: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '2.7'
+    - - ">="
+      - !ruby/object:Gem::Version
+        version: 2.7.4
+- !ruby/object:Gem::Dependency
+  name: require_all
+  requirement: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '1.3'
+    - - ">="
+      - !ruby/object:Gem::Version
+        version: 1.3.3
+  type: :runtime
+  prerelease: false
+  version_requirements: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '1.3'
+    - - ">="
+      - !ruby/object:Gem::Version
+        version: 1.3.3
+- !ruby/object:Gem::Dependency
+  name: mechanize
+  requirement: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '2.7'
+    - - ">="
+      - !ruby/object:Gem::Version
+        version: 2.7.4
+  type: :runtime
+  prerelease: false
+  version_requirements: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '2.7'
+    - - ">="
+      - !ruby/object:Gem::Version
+        version: 2.7.4
+description: Allows users to browse nytimes.com and read articles from the command
+  line.
+email:
+- justin.lefurjah@gmail.com
+executables:
+- nytimes_cli
+extensions: []
+extra_rdoc_files: []
+files:
+- bin/console
+- bin/nytimes_cli
+- bin/setup
+- lib/article.rb
+- lib/nytimes_cli.rb
+- lib/nytimes_cli/cli.rb
+- lib/nytimes_cli/navagation.rb
+- lib/nytimes_cli/version.rb
+- lib/scraper.rb
+homepage: https://github.com/interestinall/nytimes_cli
+licenses:
+- MIT
+metadata: {}
+post_install_message:
+rdoc_options: []
+require_paths:
+- lib
+required_ruby_version: !ruby/object:Gem::Requirement
+  requirements:
+  - - ">="
+    - !ruby/object:Gem::Version
+      version: '0'
+required_rubygems_version: !ruby/object:Gem::Requirement
+  requirements:
+  - - ">="
+    - !ruby/object:Gem::Version
+      version: '0'
+requirements: []
+rubyforge_project:
+rubygems_version: 2.6.4
+signing_key:
+specification_version: 4
+summary: Command line interface for nytimes.com
+test_files: []