twitter_ebooks 2.0.3 → 2.0.4
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/Gemfile.lock +12 -12
- data/bin/ebooks +21 -6
- data/data/ANC-all-count.txt +297241 -0
- data/data/stopwords.txt +204 -0
- data/data/wordfreq.json +1 -0
- data/lib/twitter_ebooks/bot.rb +25 -7
- data/lib/twitter_ebooks/markov.rb +55 -63
- data/lib/twitter_ebooks/model.rb +57 -74
- data/lib/twitter_ebooks/nlp.rb +90 -55
- data/lib/twitter_ebooks/version.rb +1 -1
- data/script/process_anc_data.rb +19 -0
- data/skeleton/Procfile +1 -1
- data/skeleton/bots.rb +0 -6
- data/skeleton/corpus/README.md +1 -1
- data/skeleton/run.rb +9 -0
- data/test/keywords.rb +18 -0
- data/twitter_ebooks.gemspec +3 -5
- metadata +13 -40
- data/skeleton/model/README.md +0 -1
data/Gemfile.lock
CHANGED
@@ -1,15 +1,15 @@
|
|
1
1
|
PATH
|
2
2
|
remote: .
|
3
3
|
specs:
|
4
|
-
twitter_ebooks (2.0.
|
4
|
+
twitter_ebooks (2.0.3)
|
5
|
+
bloomfilter-rb
|
5
6
|
engtagger
|
7
|
+
fast-stemmer
|
6
8
|
gingerice
|
9
|
+
highscore
|
7
10
|
htmlentities
|
8
|
-
|
9
|
-
ruby-stemmer
|
11
|
+
minitest
|
10
12
|
rufus-scheduler
|
11
|
-
tactful_tokenizer
|
12
|
-
tokenizer
|
13
13
|
tweetstream
|
14
14
|
twitter
|
15
15
|
|
@@ -19,6 +19,8 @@ GEM
|
|
19
19
|
addressable (2.3.5)
|
20
20
|
atomic (1.1.14)
|
21
21
|
awesome_print (1.2.0)
|
22
|
+
bloomfilter-rb (2.1.1)
|
23
|
+
redis
|
22
24
|
cookiejar (0.3.0)
|
23
25
|
daemons (1.1.9)
|
24
26
|
em-http-request (1.0.3)
|
@@ -37,25 +39,23 @@ GEM
|
|
37
39
|
eventmachine (1.0.3)
|
38
40
|
faraday (0.8.8)
|
39
41
|
multipart-post (~> 1.2.0)
|
42
|
+
fast-stemmer (1.0.2)
|
40
43
|
gingerice (1.2.1)
|
41
44
|
addressable
|
42
45
|
awesome_print
|
46
|
+
highscore (1.1.0)
|
47
|
+
whatlanguage (>= 1.0.0)
|
43
48
|
htmlentities (4.3.1)
|
44
49
|
http_parser.rb (0.5.3)
|
45
|
-
linguistics (2.0.2)
|
46
|
-
loggability (~> 0.5)
|
47
|
-
loggability (0.8.1)
|
48
50
|
minitest (5.0.8)
|
49
51
|
multi_json (1.8.2)
|
50
52
|
multipart-post (1.2.0)
|
51
|
-
|
53
|
+
redis (3.0.5)
|
52
54
|
rufus-scheduler (3.0.2)
|
53
55
|
tzinfo
|
54
56
|
simple_oauth (0.2.0)
|
55
|
-
tactful_tokenizer (0.0.2)
|
56
57
|
thread_safe (0.1.3)
|
57
58
|
atomic
|
58
|
-
tokenizer (0.1.1)
|
59
59
|
tweetstream (2.5.0)
|
60
60
|
daemons (~> 1.1)
|
61
61
|
em-http-request (~> 1.0.2)
|
@@ -68,11 +68,11 @@ GEM
|
|
68
68
|
simple_oauth (~> 0.2)
|
69
69
|
tzinfo (1.1.0)
|
70
70
|
thread_safe (~> 0.1)
|
71
|
+
whatlanguage (1.0.5)
|
71
72
|
yajl-ruby (1.1.0)
|
72
73
|
|
73
74
|
PLATFORMS
|
74
75
|
ruby
|
75
76
|
|
76
77
|
DEPENDENCIES
|
77
|
-
minitest
|
78
78
|
twitter_ebooks!
|
data/bin/ebooks
CHANGED
@@ -44,11 +44,7 @@ module Ebooks
|
|
44
44
|
end
|
45
45
|
|
46
46
|
def self.gen(model_path, input)
|
47
|
-
|
48
|
-
model = nil;
|
49
|
-
puts Benchmark.measure {
|
50
|
-
model = Model.load(model_path)
|
51
|
-
}
|
47
|
+
model = Model.load(model_path)
|
52
48
|
if input && !input.empty?
|
53
49
|
puts "@cmd " + model.markov_response(input, 135)
|
54
50
|
else
|
@@ -56,16 +52,33 @@ module Ebooks
|
|
56
52
|
end
|
57
53
|
end
|
58
54
|
|
55
|
+
def self.score(model_path, input)
|
56
|
+
model = Model.load(model_path)
|
57
|
+
model.score_interest(input)
|
58
|
+
end
|
59
|
+
|
59
60
|
def self.archive(username, outpath)
|
60
61
|
Archiver.new(username, outpath).fetch_tweets
|
61
62
|
end
|
62
63
|
|
64
|
+
def self.tweet(modelpath, username)
|
65
|
+
load File.join(APP_PATH, 'bots.rb')
|
66
|
+
model = Model.load(modelpath)
|
67
|
+
statement = model.markov_statement
|
68
|
+
log "@#{username}: #{statement}"
|
69
|
+
bot = Bot.get(username)
|
70
|
+
bot.configure
|
71
|
+
bot.tweet(statement)
|
72
|
+
end
|
73
|
+
|
63
74
|
def self.command(args)
|
64
75
|
usage = """Usage:
|
65
76
|
ebooks new <reponame>
|
66
77
|
ebooks consume <corpus_path> [...]
|
67
|
-
ebooks gen <
|
78
|
+
ebooks gen <model_path> [input]
|
79
|
+
ebooks score <model_path> <input>
|
68
80
|
ebooks archive <@user> <outpath>
|
81
|
+
ebooks tweet <model_path> <@bot>
|
69
82
|
"""
|
70
83
|
|
71
84
|
if args.length == 0
|
@@ -77,7 +90,9 @@ module Ebooks
|
|
77
90
|
when "new" then new(args[1])
|
78
91
|
when "consume" then consume(args[1..-1])
|
79
92
|
when "gen" then gen(args[1], args[2..-1].join(' '))
|
93
|
+
when "score" then score(args[1], args[2..-1].join(' '))
|
80
94
|
when "archive" then archive(args[1], args[2])
|
95
|
+
when "tweet" then tweet(args[1], args[2])
|
81
96
|
end
|
82
97
|
end
|
83
98
|
end
|