twexicon 0.1.7.1 → 0.1.8

This diff shows the changes between two publicly available versions of a package that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA1:
3
- metadata.gz: 8628e88177bf13abeb0aabcdf40f85829cf3234b
4
- data.tar.gz: 0dfa52e2ed29c01ec14b575587f5b9ee038a81fa
3
+ metadata.gz: 166ba87d5e9f7c5039ffc03a8a9b74aaf25d6599
4
+ data.tar.gz: c3f0f992b626d751057db8850589fec2c5fdb47f
5
5
  SHA512:
6
- metadata.gz: dffb2fbd8eaa81c1550aef0ccac4d745a3595ae43cd5cff2729cc1ffa9f5a21cc61b5488865af8e0184166ceb2fb58d5ca6359bd63164eb2425eea070de22799
7
- data.tar.gz: 60c9217cf1fe43793c4d474d56d00bd668dd60d2e4f57bc72d7473392f57291484e1c0d4cb27bcc710d93906f751ea19f731bcf91cbfbfa7281f2eb3d0f81cdb
6
+ metadata.gz: a575dc49c0ee39ee40b0501cc65d1d47d7567ea035cac6a2c02ebeb26712be09edeeaffc893c2f13c009bed0bfbf2960ccb38df66d0923e1b6fa1944a9d57bd0
7
+ data.tar.gz: 521809c9442611e804c9b36d4affa9534f7c002a8089011eb5c200757914f456e8a50e64c4b7450380b1850ffb4fc5fbe12836275c67df6b1ef267ad16b88624
@@ -13,7 +13,7 @@ class Twexicon::Analyzer
13
13
  until quit
14
14
  @input = nil
15
15
  @int = ""
16
- puts "What would you like to do next? For options, type 'help'."
16
+ puts "\nWhat would you like to do next? For options, type 'help'."
17
17
  until is_valid?
18
18
  @input = gets.strip.gsub(/\W/, "").downcase
19
19
  end
@@ -69,14 +69,16 @@ class Twexicon::Analyzer
69
69
  end
70
70
  end
71
71
 
72
- # 38 words from https://en.wikipedia.org/wiki/Most_common_words_in_English –– Left out some common yet still interesting ones (People, Good, Think, Work, First, One, Two, Want, New, Give, Know)
72
+ # Words from https://en.wikipedia.org/wiki/Most_common_words_in_English –– Left out some common yet still interesting ones (People, Good, Think, Work, First, One, Two, Want, New, Give, Know)
73
73
  COMMON_WORDS = ["A", "About", "An", "And", "Are", "As", "At", "Be", "Been", "But", "By", "For", "From", "Get", "Had", "Has", "Have", "In", "Into", "Is", "It", "It's", "Its", "Just", "Not", "Of", "On", "Or", "Say", "So", "Some", "That", "The", "There", "These", "This", "Those", "To", "Up", "With", "I", "My", "Your", "They", "He", "You", "Do", "His", "We", "Her", "She", "Will", "All", "Would", "Their", "What", "Out", "If", "Who", "Which", "Go", "Me", "When", "Make", "Can", "Time", "No", "Him", "Take", "Year", "Could", "Them", "See", "Other", "Than", "Then", "Now", "Look", "Only", "Come", "Over", "Also", "Back", "After", "Use", "How", "Our", "Well", "Way", "Even", "Because", "Any", "Day", "Most", "Us",
74
74
  # other additions
75
- "Wouldn't", "Couldn't", "Shouldn't", "Mustn't", "Would've", "Could've", "Should've", "Must've", "Hadn't", "Wasn't", "Weren't", "Ain't", "Aint", "Here", "Seem", "Seems", "That's", "Took", "Much", "More", "You're", "We're", "We've", "I've", "I'm",
75
+ "Wouldn't", "Couldn't", "Shouldn't", "Mustn't", "Would've", "Could've", "Should've", "Must've", "Hadn't", "Wasn't", "Weren't", "Ain't", "Aint", "Here", "Seem", "Seems", "That's", "Took", "Much", "More", "You're", "We're", "We've", "I've", "I'm", "Don't", "Got", "Soon",
76
76
  # contraction endings until I fix the parsing error
77
77
  "Re", "Ll", "Ve",
78
78
  # Letters until I fix the contraction parsing error
79
- "B", "C", "D", "E", "F", "G", "H", "J", "K", "L", "M", "N", "O", "P", "Q", "R", "S", "T", "U", "V", "W", "X", "Y", "Z"]
79
+ "B", "C", "D", "E", "F", "G", "H", "J", "K", "L", "M", "N", "O", "P", "Q", "R", "S", "T", "U", "V", "W", "X", "Y", "Z",
80
+ # Common words in other languages that *aren't* uncommon English words (so, "Con" doesn't count)
81
+ "En"]
80
82
 
81
83
  def get_words
82
84
  words = {}
@@ -93,15 +95,17 @@ class Twexicon::Analyzer
93
95
  end
94
96
  words.each do |w, n| # Create strings for the words that occur >1 times
95
97
  case n
96
- when 1..9 then word_array << "0#{n}x #{w}"
97
- when 10..99 then word_array << "#{n}x #{w}"
98
+ when 1..9 then word_array << "000#{n}x #{w}"
99
+ when 10..99 then word_array << "00#{n}x #{w}"
100
+ when 100..999 then word_array << "0#{n}x #{w}"
101
+ when 1000..9999 then word_array << "#{n}x #{w}"
98
102
  end
99
103
  end
100
104
  if word_array.empty?
101
105
  puts "\nIt appears that @#{username} is not much of a talker."
102
106
  else
103
107
  puts "\n@#{username}'s current favorite word(s):"
104
- puts word_array.sort.reverse.take(10)
108
+ puts word_array.sort.reverse.each{|w| w.sub!(/^0+/, "")}.take(10)
105
109
  end
106
110
  end
107
111
 
@@ -14,12 +14,12 @@ class Twexicon::Scraper
14
14
  tweets.each do |num, tweet|
15
15
  t = tweet.keys[0].dup
16
16
  t.scan(/pic.twitter.com\/\w{10}/){|p| tweet.values[0][:pix] << p.strip}.gsub!(/pic.twitter.com\/\w{10}/, " ")
17
- t.scan(/https?:\/\/[\w\.\?\=\&\-\/\#]+/){|w| tweet.values[0][:links] << w.strip}.gsub!(/https?:\/\/[\w\.\?\=\&\-\/\#]+/, " ")
17
+ t.scan(/https?:\/\/[\w\.\?\=\&\-\/\#\:]+/){|w| tweet.values[0][:links] << w.strip}.gsub!(/https?:\/\/[\w\.\?\=\&\-\/\#\:]+/, " ")
18
18
  t.scan(/#\w+/){|h| tweet.values[0][:hashtags] << h.gsub(/\W/, "").prepend("#")}.gsub!(/#\w+/, " ")
19
19
  t.scan(/@\w+/){|u| tweet.values[0][:usernames] << u.gsub(/\W/, "").prepend("@")}.gsub!(/@\w+/, " ")
20
- t.scan(/(\d+[:\.\b]?\d*)+/){|n| tweet.values[0][:numbers] << n.first.gsub(/(^\W+|\W+$)/, "")}.gsub!(/(\d+[:\.\b]?\d*)+/, " ")
21
- t.scan(/(\b[A-Z][\.\b][A-Z][\.\b][A-Z][\.\b]|\b[A-Z][\.\b][A-Z][\.\b])/){|a| tweet.values[0][:acronyms] << a.first.strip}.gsub!(/(\b[A-Z][\.\b][A-Z][\.\b][A-Z][\.\b]|\b[A-Z][\.\b][A-Z][\.\b])/, " ")
22
- t.scan(/(([A-Z]+\W){2,}|[A-Z]{4,}\W)/){|s| tweet.values[0][:shouts] << s.first.gsub(/\W/, " ").strip}.gsub!(/(([A-Z]+\W){2,}|[A-Z]{4,}\W)/, " ")
20
+ t.scan(/(\d+[:\.\ ]?\d*)+/){|n| tweet.values[0][:numbers] << n.first.gsub(/(^\W+|\W+$)/, "")}.gsub!(/(\d+[:\.\ ]?\d*)+/, " ")
21
+ t.scan(/(\b[A-Z][\.\ ][A-Z][\.\ ][A-Z][\.\ ]|\b[A-Z][\.\ ][A-Z][\.\ ])/){|a| tweet.values[0][:acronyms] << a.first.strip}.gsub!(/(\b[A-Z][\.\ ][A-Z][\.\ ][A-Z][\.\ ]|\b[A-Z][\.\ ][A-Z][\.\ ])/, " ")
22
+ t.scan(/(([A-Z]+[\s\,\&\:\-]+){2,}|[A-Z]{4,}\W)/){|s| tweet.values[0][:shouts] << s.first.gsub(/\W/, " ").strip}.gsub!(/(([A-Z]+[\s\,\&\:\-]+){2,}|[A-Z]{4,}\W)/, " ")
23
23
  t.scan(/\b[A-Z]{2,3}\b/){|a| tweet.values[0][:acronyms] << a.strip}.gsub!(/\b[A-Z]{2,3}\b/, " ")
24
24
  t.scan(/\w+['\/]?\w*/){|w| tweet.values[0][:words] << w.strip}.gsub!(/\w+['\/]?\w*/, " ")
25
25
  end
@@ -1,3 +1,3 @@
1
1
  module Twexicon
2
- VERSION = "0.1.7.1"
2
+ VERSION = "0.1.8"
3
3
  end
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: twexicon
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.1.7.1
4
+ version: 0.1.8
5
5
  platform: ruby
6
6
  authors:
7
7
  - Gabe Jackson