pluto 1.0.1 → 1.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
data/lib/pluto/schema.rb DELETED
@@ -1,139 +0,0 @@
1
-
2
- module Pluto
3
-
4
- class CreateDb < ActiveRecord::Migration
5
-
6
- def up
7
- create_table :sites do |t|
8
- t.string :title, :null => false # e.g Planet Ruby, Planet JavaScript, etc.
9
- t.string :key, :null => false # e.g. ruby, js, etc.
10
-
11
- ############
12
- # filters (site-wide)
13
- t.string :includes # regex
14
- t.string :excludes # regex
15
-
16
- ######################
17
- # for auto-update of feed list/site config
18
-
19
- t.string :url # source url for auto-update (optional)
20
-
21
- ## note: make sure to use same fields for update check as feed
22
-
23
- t.datetime :fetched # last fetched/checked date -- make not null ??
24
- t.integer :http_code # last http status code e.g. 200,404,etc.
25
- t.string :http_etag # last http header etag
26
- ## note: save last-modified header as text (not datetime) - pass through as is
27
- t.string :http_last_modified # last http header last-modified - note: save header as plain text!!! pass along in next request as-is
28
- t.string :http_server # last http server header if present
29
-
30
- # note: do NOT store body content (that is, text) and md5 digest
31
- # use git! and github! commit will be http_etag!!
32
-
33
- t.datetime :fetched # last fetched/checked date
34
-
35
- #############
36
- # more fields
37
-
38
- t.timestamps # created_at, updated_at
39
- end
40
-
41
- create_table :subscriptions do |t| # has_many join table (sites/feeds)
42
- t.references :site, :null => false
43
- t.references :feed, :null => false
44
- t.timestamps
45
- end
46
-
47
- create_table :feeds do |t|
48
- t.string :title # user supplied title
49
- t.string :auto_title # "fallback" - auto(fill) title from feed
50
-
51
- t.string :title2 # user supplied title2
52
- t.string :auto_title2 # "fallback" - auto(fill) title2 from feed e.g. subtitle (atom)
53
-
54
- t.string :url # user supplied site url
55
- t.string :auto_url # "fallback" - auto(fill) url from feed
56
-
57
- t.string :feed_url # user supplied feed url
58
- t.string :auto_feed_url # "fallback" - auto discovery feed url from (site) url
59
-
60
- t.text :summary # e.g. description (rss)
61
-
62
- t.string :generator # feed generator (e.g. wordpress, etc.) from feed
63
-
64
- t.datetime :published # from feed published(atom)+ pubDate(rss)
65
- t.datetime :built # from feed lastBuiltDate(rss)
66
- t.datetime :touched # from feed updated(atom)
67
-
68
- ### extras (move to array for custom fields or similar??)
69
- t.string :github # github handle (optional)
70
- t.string :twitter # twitter handle (optional)
71
- t.string :avatar # gravator or hackergotchi handle (optional)
72
-
73
- ### add class/kind field e.g.
74
- # - personal feed/blog/site, that is, individual author
75
- # - team blog/site
76
- # - org (anization) or com(pany blog/site)
77
- # - newsfeed (composite)
78
- # - other (link blog?, podcast?) - why? why not??
79
-
80
- ############
81
- # filters
82
- t.string :includes # regex
83
- t.string :excludes # regex
84
- # todo: add generic filter list e.g. t.string :filters (comma,pipe or space separated method names?)
85
-
86
- # -- our own (meta) fields
87
- t.datetime :last_published # cache last (latest) published for items
88
-
89
- t.string :key, :null => false
90
- t.string :format # e.g. atom (1.0), rss 2.0, rss 0.7 etc.
91
-
92
- t.integer :http_code # last http status code e.g. 200,404,etc.
93
- t.string :http_etag # last http header etag
94
- ## note: save last-modified header as text (not datetime) - pass through as is
95
- t.string :http_last_modified # last http header last-modified - note: save header as plain text!!! pass along in next request as-is
96
- t.string :http_server # last http server header if present
97
-
98
- t.string :md5 # md5 hash of body
99
- t.text :body # last http response body (complete feed!)
100
-
101
- t.datetime :fetched # last fetched/checked date
102
-
103
- t.timestamps # created_at, updated_at
104
- end
105
-
106
-
107
- create_table :items do |t|
108
- t.string :guid
109
- t.string :url
110
-
111
- ## note: title may contain more than 255 chars!! use text for sure!
112
- ## e.g. Rails Girls blog has massive titles in feed
113
-
114
- t.text :title # todo: add some :null => false ??
115
- t.text :summary # e.g. description (rss), summary (atom)
116
- t.text :content
117
-
118
- t.datetime :published # from feed (published) + pubDate(rss)
119
- t.datetime :touched # from feed updated (atom)
120
-
121
- ## todo: add :last_updated_at ?? (NOTE: updated_at already take by auto-timestamps)
122
- t.references :feed, :null => false
123
-
124
- t.datetime :fetched # last fetched/check date
125
- t.timestamps # created_at, updated_at
126
-
127
- ## t.string :author
128
- ## todo: add author/authors, category/categories
129
- end
130
-
131
- end
132
-
133
- def down
134
- raise ActiveRecord::IrreversibleMigration
135
- end
136
-
137
- end # class CreateDb
138
-
139
- end # module Pluto
@@ -1,102 +0,0 @@
1
- module Pluto
2
-
3
- class Subscriber
4
-
5
- include LogUtils::Logging
6
-
7
- include Models
8
-
9
- def debug=(value) @debug = value; end
10
- def debug?() @debug || false; end
11
-
12
-
13
- def update_subscriptions( config, opts={} )
14
- # !!!! -- depreciated API - remove - do NOT use anymore
15
- puts "*** warn - [Pluto::Subscriber] depreciated API -- use update_subscriptions_for( site_key )"
16
- update_subscriptions_for( 'planet', config, opts ) # default to planet site_key
17
- end
18
-
19
-
20
- def update_subscriptions_for( site_key, config, opts={} )
21
- site_attribs = {
22
- title: config['title'] || config['name'], # support either title or name
23
- url: config['source'] || config['url'] # support source or url for source url for auto-update (optional)
24
- }
25
-
26
- logger.debug "site_attribs: #{site_attribs.inspect}"
27
-
28
- site_rec = Site.find_by_key( site_key )
29
- if site_rec.nil?
30
- site_rec = Site.new
31
- site_attribs[ :key ] = site_key
32
-
33
- ## use object_id: site.id and object_type: Site
34
- ## change - model/table/schema!!!
35
- Activity.create!( text: "new site >#{site_key}< - #{site_attribs[ :title ]}" )
36
- end
37
- site_rec.update_attributes!( site_attribs )
38
-
39
- # -- log update activity
40
- Activity.create!( text: "update subscriptions >#{site_key}<" )
41
-
42
- # clean out subscriptions and add again
43
- logger.debug "before site.subscriptions.delete_all - count: #{site_rec.subscriptions.count}"
44
- site_rec.subscriptions.destroy_all # note: use destroy_all NOT delete_all (delete_all tries by default only nullify)
45
- logger.debug "after site.subscriptions.delete_all - count: #{site_rec.subscriptions.count}"
46
-
47
- config.each do |key, value|
48
-
49
- ## todo: downcase key - why ??? why not???
50
-
51
- # skip "top-level" feed keys e.g. title, etc. or planet planet sections (e.g. planet,defaults)
52
- next if ['title','title2','name',
53
- 'source', 'url',
54
- 'include','includes','exclude','excludes',
55
- 'feeds',
56
- 'planet','defaults'].include?( key )
57
-
58
- ### todo/check:
59
- ## check value - must be hash
60
- # check if url or feed_url present
61
- # that is, check for required props/key-value pairs
62
-
63
- feed_key = key.to_s.dup
64
- feed_hash = value
65
-
66
- # todo/fix: use title from feed?
67
- # e.g. fill up auto_title, auto_url, etc.
68
-
69
- feed_attribs = {
70
- feed_url: feed_hash[ 'feed' ] || feed_hash[ 'feed_url' ],
71
- url: feed_hash[ 'link' ] || feed_hash[ 'url' ],
72
- title: feed_hash[ 'title' ] || feed_hash[ 'name' ],
73
- title2: feed_hash[ 'title2' ],
74
- includes: feed_hash[ 'includes' ] || feed_hash[ 'include' ],
75
- excludes: feed_hash[ 'excludes' ] || feed_hash[ 'exclude' ]
76
- }
77
-
78
- puts "Updating feed subscription >#{feed_key}< - >#{feed_attribs[:feed_url]}<..."
79
-
80
- feed_rec = Feed.find_by_key( feed_key )
81
- if feed_rec.nil?
82
- feed_rec = Feed.new
83
- feed_attribs[ :key ] = feed_key
84
-
85
- ## use object_id: feed.id and object_type: Feed
86
- ## change - model/table/schema!!!
87
- ## todo: add parent_action_id - why? why not?
88
- Activity.create!( text: "new feed >#{feed_key}< - #{feed_attribs[ :title ]}" )
89
- end
90
-
91
- feed_rec.update_attributes!( feed_attribs )
92
-
93
- # add subscription record
94
- # note: subscriptions get cleaned out on update first (see above)
95
- site_rec.subscriptions.create!( feed_id: feed_rec.id )
96
- end
97
-
98
- end # method update_subscriptions
99
-
100
- end # class Subscriber
101
-
102
- end # module Pluto
@@ -1,25 +0,0 @@
1
-
2
-
3
- task :env do
4
- LogUtils::Logger.root.level = :debug
5
-
6
- Pluto.connect!
7
- end
8
-
9
-
10
- #########
11
- # for debugging
12
-
13
- desc 'pluto - debug site setup'
14
- task :site => :env do
15
- site = Pluto::Models::Site.first # FIX: for now assume one planet per DB (fix later; allow planet key or similar)
16
- if site.present?
17
- puts "site found:"
18
- pp site
19
- else
20
- puts "no site found"
21
- end
22
- end
23
-
24
- ### todo: add new task :sites
25
-
@@ -1,40 +0,0 @@
1
-
2
-
3
- desc 'pluto -=- setup/update feed subscriptions'
4
- task :setup => :env do
5
-
6
- ## check if PLANET key passed in
7
- if ENV['PLANET'].present?
8
- key = ENV['PLANET']
9
- puts "setup planet for key >#{key}<"
10
- else
11
- puts 'no PLANET=key passed along; try defaults'
12
- # try pluto.yml or planet.yml if exist
13
-
14
- if File.exists?( './pluto.ini' ) || File.exists?( './pluto.yml' ) # check if pluto.yml exists, if yes add/use it
15
- key ='pluto'
16
- elsif File.exists?( './planet.ini' ) || File.exists?( './planet.yml' ) # check if planet.yml exists, if yes add/use it
17
- key = 'planet'
18
- else
19
- puts '*** note: no arg passed in; no pluto.ini|yml or planet.ini|yml found in working folder'
20
- end
21
- end
22
-
23
-
24
- config_path = "./#{key}.ini"
25
- if File.exists?( config_path )
26
- config = INI.load_file( config_path )
27
- else ## assume .yml
28
- config_path = "./#{key}.yml"
29
- config = YAML.load_file( config_path )
30
- end
31
-
32
-
33
- puts "dump planet setup settings >#{config_path}<:"
34
- pp config
35
-
36
- # note: allow multiple planets (sites) for a single install
37
- Pluto::Subscriber.new.update_subscriptions_for( key, config )
38
-
39
- puts 'Done.'
40
- end
@@ -1,10 +0,0 @@
1
-
2
-
3
- desc 'pluto - show planet (feed) stats'
4
- task :stats => :env do
5
- puts "stats:"
6
- puts " Feeds: #{Pluto::Models::Feed.count}"
7
- puts " Items: #{Pluto::Models::Item.count}"
8
- puts " Sites: #{Pluto::Models::Site.count}"
9
- puts " Subscriptions: #{Pluto::Models::Subscription.count}"
10
- end
@@ -1,24 +0,0 @@
1
-
2
-
3
- desc 'pluto -=- update planet (site configs)'
4
- task :update_sites => :env do
5
-
6
- Pluto.update_sites # update all site configs if source (url) present/specified
7
-
8
- puts 'Done (Update Sites).'
9
- end
10
-
11
-
12
- desc 'pluto -=- update planet (feeds)'
13
- task :update_feeds => :env do
14
-
15
- Pluto.update_feeds
16
-
17
- puts 'Done (Update Feeds).'
18
- end
19
-
20
-
21
- desc 'pluto -=- update planet (site configs + feeds)'
22
- task :update => [:update_sites, :update_feeds] do
23
- puts 'Done.'
24
- end
data/lib/pluto/updater.rb DELETED
@@ -1,50 +0,0 @@
1
- module Pluto
2
-
3
- class Updater
4
-
5
- include LogUtils::Logging
6
-
7
- ### fix!!!!!: change config to text - yes/no - why? why not??
8
- # or pass along struct
9
- # - with hash and text and format(e.g. ini/yml) as fields???
10
- #
11
- # - why? - we need to get handle on md5 digest/hash plus on plain text, ideally to store in db
12
- ## - pass along unparsed text!! - not hash struct
13
- # - will get saved in db plus we need to generate md5 hash
14
- # - add filename e.g. ruby.ini|ruby.conf|ruby.yml as opt ??
15
- # or add config format as opt e.g. ini or yml?
16
-
17
- def initialize( opts, config )
18
- @opts = opts
19
- @config = config
20
- end
21
-
22
- attr_reader :opts, :config
23
-
24
- def run( arg )
25
- arg = arg.downcase.gsub('.ini','').gsub('.yml','') # remove file extension if present
26
-
27
- update_for( arg )
28
- end
29
-
30
- def update_for( site_key )
31
- ###################
32
- # step 1) update subscriptions
33
- subscriber = Subscriber.new
34
-
35
- # pass along debug/verbose setting/switch
36
- subscriber.debug = true if opts.verbose?
37
- subscriber.update_subscriptions_for( site_key, config )
38
-
39
- ##############################
40
- # step 2) update feeds
41
- refresher = Refresher.new
42
-
43
- # pass along debug/verbose setting/switch
44
- refresher.debug = true if opts.verbose?
45
- refresher.update_feeds_for( site_key )
46
- end # method run
47
-
48
- end # class Updater
49
-
50
- end # module Pluto
data/lib/pluto/version.rb DELETED
@@ -1,4 +0,0 @@
1
-
2
- module Pluto
3
- VERSION = '1.0.1'
4
- end
data/test/helper.rb DELETED
@@ -1,18 +0,0 @@
1
- ## $:.unshift(File.dirname(__FILE__))
2
-
3
-
4
- ## minitest setup
5
-
6
- # require 'minitest/unit'
7
- require 'minitest/autorun'
8
-
9
- # include MiniTest::Unit # lets us use TestCase instead of MiniTest::Unit::TestCase
10
-
11
-
12
- ## our own code
13
-
14
- require 'pluto'
15
-
16
-
17
- LogUtils::Logger.root.level = :debug
18
-
data/test/test_helpers.rb DELETED
@@ -1,15 +0,0 @@
1
- # encoding: UTF-8
2
-
3
- ###
4
- # to run use
5
- # ruby -I ./lib -I ./test test/test_rss.rb
6
- # or better
7
- # rake test
8
-
9
- require 'helper'
10
-
11
- class TestHelper < MiniTest::Unit::TestCase
12
-
13
- ## add some tests; to be done
14
-
15
- end # class TestHelper