RubyGems - insta_scrape - Versions diffs - 1.1.0 → 1.1.1 - Mend

insta_scrape 1.1.0 → 1.1.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (6) hide show

checksums.yaml CHANGED

@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz: 05c519af7d4c14f15487b131afd234e2cd0c6435
-  data.tar.gz: 66aee1224c0a0c9d931f864d331d698f35b0b60d
+  metadata.gz: 0c55fecbadd0f789dfa52d2d26dab8175fb7acdd
+  data.tar.gz: ed3fa91e7b6422f435e6095d67a5abb175702b41
 SHA512:
-  metadata.gz: 8f5bb16a646d4a73f1b226b206d19b53edf5b8cc9b1bb88b6ac27bf9b302bc39096eee6a367870553a07f2b8560946fc6cc0cc1c1f36ce1d1a5a1e112caa13a8
-  data.tar.gz: 50a190f914e87580b97293595cc60bc78a0f037871b9a0a11b9ca0bbb33cef8af5c3571fd4087c3ea5c093b003da8bf4711bdfbdbadc78932563a46f5efe1fd5
+  metadata.gz: 135f7ac6592b5a7f03d04874af4341f472d9e30b6e6378a6a6219ef2854fdba2f4f4a494d1ab3daa5145a7c36f7d5a4722cf6723b74920453dca7ce2b31f4426
+  data.tar.gz: 13287580a7b8731f3ffaa29cfe4b2acec51bb14d40e76bed5d4af2b16ce74a613860d268f245c776c25f8a227bc1b85591553081ef21d2cff2b81432527dc4e0

data/README.md CHANGED

@@ -1,4 +1,5 @@
-[![Build Status](https://travis-ci.org/dannyvassallo/insta_scrape.svg?branch=master)](https://travis-ci.org/dannyvassallo/insta_scrape)[![Gem Version](https://badge.fury.io/rb/insta_scrape.svg)](https://badge.fury.io/rb/insta_scrape)
+[![Build Status](https://travis-ci.org/dannyvassallo/insta_scrape.svg?branch=master)](https://travis-ci.org/dannyvassallo/insta_scrape)[![Gem Version](https://badge.fury.io/rb/insta_scrape.svg)](https://badge.fury.io/rb/insta_scrape)![](http://ruby-gem-downloads-badge.herokuapp.com/insta_scrape?type=total&color=brightgreen)
 ![alt text](https://s3-us-west-2.amazonaws.com/instascrape/instascrapelogo.png "logo")
 # InstaScrape
@@ -7,7 +8,8 @@ This gem is dependent on Capybara, PhantomJS, and Poltergeist.
 Using this gem you can access multiple facets of the instagram API without needing authorization, most importantly the hashtag.
-v.1.1.0 introducing "long_scrape" methods! Now with more instgram posts!
+v.1.1.0 introducing "long_scrape" methods! Now with more instagram posts!
+v.1.1.1 introducing "long_scrape" methods! Now with more instagram posts!
 ## Note
@@ -41,6 +43,23 @@ Or install it yourself as:
 Long scrape methods take two arguments -- (hashtag || username, time_in_seconds)
 Each other method accepts only one argument - a hashtag or a username.
+An additional feature has been added to grab some extra meta information (dates) from the posts.
+While this feature makes the scrape perform much slower, you can opt in to using it with
+the following option as a second or third argument on most methods:
+`include_meta_data: true`
+For Example:
+```
+InstaScrape.hashtag("foofighters", include_meta_data: true)
+#OR
+InstaScrape.long_scrape_hashtag("foofighters", 30, include_meta_data: true)
+```
+If you call the methods without this option, you won't get the additional meta information.
 ####Long Scrape Methods
 ```ruby
@@ -174,4 +193,3 @@ Bug reports and pull requests are welcome on GitHub at https://github.com/dannyv
 ## License
 The gem is available as open source under the terms of the [MIT License](http://opensource.org/licenses/MIT).

data/lib/insta_scrape.rb CHANGED

@@ -4,29 +4,29 @@ module InstaScrape
   extend Capybara::DSL
   #get a hashtag
-  def self.hashtag(hashtag)
+  def self.hashtag(hashtag, include_meta_data: false)
     visit "https://www.instagram.com/explore/tags/#{hashtag}/"
     @posts = []
-    scrape_posts
+    scrape_posts(include_meta_data: include_meta_data)
   end
   #long scrape a hashtag
-  def self.long_scrape_hashtag(hashtag, scrape_length)
+  def self.long_scrape_hashtag(hashtag, scrape_length, include_meta_data: false)
     visit "https://www.instagram.com/explore/tags/#{hashtag}/"
     @posts = []
-    long_scrape_posts(scrape_length)
+    long_scrape_posts(scrape_length, include_meta_data: include_meta_data)
   end
   #long scrape a user's posts
-  def self.long_scrape_user_posts(username, scrape_length)
+  def self.long_scrape_user_posts(username, scrape_length, include_meta_data: false)
     @posts = []
-    long_scrape_user_posts_method(username, scrape_length)
+    long_scrape_user_posts_method(username, scrape_length, include_meta_data: include_meta_data)
   end
   #get user info and posts
-  def self.long_scrape_user_info_and_posts(username, scrape_length)
+  def self.long_scrape_user_info_and_posts(username, scrape_length, include_meta_data: false)
     scrape_user_info(username)
-    long_scrape_user_posts_method(username, scrape_length)
+    long_scrape_user_posts_method(username, scrape_length, include_meta_data: include_meta_data)
     @user = InstaScrape::InstagramUserWithPosts.new(username, @image, @post_count, @follower_count, @following_count, @description, @posts)
   end
@@ -37,15 +37,15 @@ module InstaScrape
   end
   #get user info and posts
-  def self.user_info_and_posts(username)
+  def self.user_info_and_posts(username, include_meta_data: false)
     scrape_user_info(username)
-    scrape_user_posts(username)
+    scrape_user_posts(username, include_meta_data: false)
     @user = InstaScrape::InstagramUserWithPosts.new(username, @image, @post_count, @follower_count, @following_count, @description, @posts)
   end
   #get user posts only
-  def self.user_posts(username)
-    scrape_user_posts(username)
+  def self.user_posts(username, include_meta_data: false)
+    scrape_user_posts(username, include_meta_data: include_meta_data)
   end
   #get user follower count
@@ -74,14 +74,21 @@ module InstaScrape
   private
   #post iteration method
-  def self.iterate_through_posts
-    all("article div div div a").each do |post|
+  def self.iterate_through_posts(include_meta_data:)
+    posts = all("article div div div a").collect do |post|
+      { link: post["href"],
+        image: post.find("img")["src"]}
+    end
-      link = post["href"]
-      image = post.find("img")["src"]
-      info = InstaScrape::InstagramPost.new(link, image)
+    posts.each do |post|
+      if include_meta_data
+        visit(post[:link])
+        date = page.find('time')["datetime"]
+        info = InstaScrape::InstagramPost.new(post[:link], post[:image], date)
+      else
+        info = InstaScrape::InstagramPost.new(post[:link], post[:image])
+      end
       @posts << info
     end
     #log
@@ -108,7 +115,7 @@ module InstaScrape
   end
   #scrape posts
-  def self.scrape_posts
+  def self.scrape_posts(include_meta_data:)
     begin
       page.find('a', :text => "Load more", exact: true).click
       max_iteration = 10
@@ -120,15 +127,15 @@ module InstaScrape
         page.execute_script "window.scrollTo(0,(document.body.scrollHeight - 5000));"
         sleep 0.1
       end
-      iterate_through_posts
+      iterate_through_posts(include_meta_data: include_meta_data)
     rescue Capybara::ElementNotFound => e
       begin
-        iterate_through_posts
+        iterate_through_posts(include_meta_data: include_meta_data)
       end
     end
   end
-  def self.long_scrape_posts(scrape_length_in_seconds)
+  def self.long_scrape_posts(scrape_length_in_seconds, include_meta_data:)
     begin
       page.find('a', :text => "Load more", exact: true).click
       max_iteration = (scrape_length_in_seconds / 0.3)
@@ -145,24 +152,24 @@ module InstaScrape
         @loader << "."
         system "clear"
       end
-      iterate_through_posts
+      iterate_through_posts(include_meta_data: include_meta_data)
     rescue Capybara::ElementNotFound => e
       begin
-        iterate_through_posts
+        iterate_through_posts(include_meta_data: include_meta_data)
       end
     end
   end
-  def self.long_scrape_user_posts_method(username, scrape_length_in_seconds)
+  def self.long_scrape_user_posts_method(username, scrape_length_in_seconds, include_meta_data:)
     @posts = []
     visit "https://www.instagram.com/#{username}/"
-    long_scrape_posts(scrape_length_in_seconds)
+    long_scrape_posts(scrape_length_in_seconds, include_meta_data: include_meta_data)
   end
-  def self.scrape_user_posts(username)
+  def self.scrape_user_posts(username, include_meta_data:)
     @posts = []
     visit "https://www.instagram.com/#{username}/"
-    scrape_posts
+    scrape_posts(include_meta_data: include_meta_data)
   end
   #post logger

data/lib/insta_scrape/version.rb CHANGED

@@ -1,3 +1,3 @@
 module InstaScrape
-  VERSION = "1.1.0"
+  VERSION = "1.1.1"
 end

data/lib/models/instagram_post.rb CHANGED

@@ -1,7 +1,8 @@
 class InstaScrape::InstagramPost
-  attr_accessor :link, :image
-  def initialize(link, image)
+  attr_accessor :link, :image, :date
+  def initialize(link, image, date=nil)
     @image = image
     @link = link
+    @date = date
   end
 end

metadata CHANGED

@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: insta_scrape
 version: !ruby/object:Gem::Version
-  version: 1.1.0
+  version: 1.1.1
 platform: ruby
 authors:
 - dannyvassallo
 autorequire:
 bindir: exe
 cert_chain: []
-date: 2016-06-13 00:00:00.000000000 Z
+date: 2016-12-14 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: bundler