RubyGems - zhongwen_tools - Versions diffs - 0.3.5 → 0.4.0 - Mend

zhongwen_tools 0.3.5 → 0.4.0

Files changed (8) hide show

checksums.yaml +4 -4
data/README.md +20 -17
data/lib/zhongwen_tools/string/ruby18.rb +6 -0
data/lib/zhongwen_tools/string.rb +9 -0
data/lib/zhongwen_tools/version.rb +1 -1
data/test/test_romanization.rb +3 -2
data/test/test_string.rb +4 -0
metadata +2 -2

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz: 922f41394b5974c16b42521d9a203ac31876272e
-  data.tar.gz: 8390da15a9a05b60703c661ec117b77da2a52edb
+  metadata.gz: 9aaee7db1f2f9b57eb3119302933bd0650f3f00d
+  data.tar.gz: ce9e4f18cae127abd60fc4dc664453586029fa0e
 SHA512:
-  metadata.gz: a4b14a2962e68f69dfa4fbeb20731ed1c067f0110eefd7711c09f4bce2f4450a71fbad9912eb68154415ea106a263c4b79a173f68c142da66bffae52f6e9cb5a
-  data.tar.gz: c5d4b6cfe2d3be093b6852d89fecfbf6b995818f6f134341b920372cbb8c9d93d604fff9df2c2cfd49694238ec6ba991304b38960c7c1d29ab275072f61a9e17
+  metadata.gz: 4f1fde8db869e573f9e066cf1bf8687724e165b972e886e924f346d96a3bbaf4b210f1f2478f405494f2865b92f9f26e1e71e9ecb29cdb84f459e6a8314fb55e
+  data.tar.gz: 881dd5bb06c31500f55e3bf7ce925634f64e46fe7184c2beffe639c24d6eb7884b9ba002ec55931ec25ff9c00dff8d75199f55a4b7b46d62ca2afa90e91056bf

data/README.md CHANGED Viewed

@@ -44,23 +44,29 @@ ZhongwenTools includes the following modules:
 ### ZhongwenTools::String: useful string functions for Chinese.
-    ZhongwenTools::String.ascii? 'hello'    #=> true #non-multibyle strings
-    ZhongwenTools::String.multibyte? '中文'  #=> true #multibtye strings
-    ZhongwenTools::String.halfwidth?
-    ZhongwenTools::String.fullwidth?
-    ZhongwenTools::String.to_halfwidth
-    ZhongwenTools::String.uri_encode  #=> just because I'm lazy
-    ZhongwenTools::Unicode.to_codepoint
-    ZhongwenTools::Unicode.to_unicode --> converts from unicode codepoint.
-    ZhongwenTools::String.downcase --> does pinyin/ lowercase
-    ZhongwenTools::String.upcase --> does pinyin uppercase
-    ZhongwenTools::String.capitalize ---> does pinyin / fullwidth capitalization
+    ZhongwenTools::String.ascii? 'hello'              #=> true #non-multibyte strings
+    ZhongwenTools::String.multibyte? '中文'           #=> true #multibyte strings
+    ZhongwenTools::String.halfwidth? 'hello'          #=> true
+    ZhongwenTools::String.fullwidth? 'ｈｅｌｌｏ'     #=> true
+    ZhongwenTools::String.to_halfwidth 'ｈｅｌｌｏ'   #=> 'hello'
+    ZhongwenTools::String.uri_encode '我太懒'            #=>
+    ZhongwenTools::Unicode.to_codepoint '中文'           #=> '\u4e2d\u6587'
+    ZhongwenTools::Unicode.from_codepoint '\u4e2d\u6587' #=> '中文' #converts string from a utf-8 codepoint.
     ZhongwenTools::String.has_zh? '1月'     #=> true
     ZhongwenTools::String.is_zh? '1月'      #=> false can't be mixed.
     ZhongwenTools::String.is_zhs? '中国'    #=> true
     ZhongwenTools::String.is_zht? '中国'    #=> false
+    ZhongwenTools::String.has_zh_punctuation? '你在哪里？'     #=> true
+    ZhongwenTools::String.strip_zh_punctuation '你在哪里？'      #=> '你在哪里'
+#### The following capitalization methods work for pinyin. [TODO]
+    ZhongwenTools::String.downcase 'Qǐng wèn...'  #=> --> does pinyin/ lowercase
+    ZhongwenTools::String.upcase --> does pinyin uppercase
+    ZhongwenTools::String.capitalize ---> does pinyin / fullwidth capitalization
 #### Ruby 1.8 safe methods
     ZhongwenTools::String.chars '中文' #=> ['中','文']
     ZhongwenTools::String.size '中文'  #=> 2
@@ -68,7 +74,7 @@ ZhongwenTools includes the following modules:
     ZhongwenTools::Unicode.to_utf8 '\x{D6D0}\x{CEC4}' => '中文'
-###Numbers
+### Numbers
 Functions for converting to and from Chinese numbers.
     ZhongwenTools::Number.number_zht 12000        #=> '一萬二千'
@@ -77,7 +83,7 @@ Functions for converting to and from Chinese numbers.
     ZhongwenTools::Number.number_to_int '四十二'  #=> 42
     ZhongwenTools::Number.number? '四十二'        #=> true
-###Integers
+### Integers
 Monkey-patch your integers for Chinese.
     class Integer
@@ -122,7 +128,7 @@ scripts. It **does not convert Chinese characters to pinyin** (see ZhongwenTools
     str.pyn? #=> true
-### Conversion
+### Conversion [TODO]
 Functions for converting between scripts (e.g. traditional Chinese to
 simplified Chinese) and between chinese and romanization systems (e.g.
 Chinese to pinyin).
@@ -139,9 +145,6 @@ Chinese to pinyin).
 ###Tone Sandhi
 Some functions for predicting / converting to tone sandhi
-##Plugins
-Zhongwen Tools tries to avoid having many dependencies. Functionality
-that requires an external dependency is packaged as a separate gem.
 ## TODO
 1. A trad/simp script converter

data/lib/zhongwen_tools/string/ruby18.rb CHANGED Viewed

@@ -67,5 +67,11 @@ module ZhongwenTools
       !str[regex[:punc]].nil?
     end
+    def strip_zh_punctuation(str = nil)
+      str ||= self
+      str.gsub(self.convert_regex(UNICODE_REGEX[:punc]), '')
+    end
   end
 end

data/lib/zhongwen_tools/string.rb CHANGED Viewed

@@ -33,6 +33,12 @@ module ZhongwenTools
       !str[UNICODE_REGEX[:punc]].nil?
     end
+    def strip_zh_punctuation(str = nil)
+      str ||= self
+      str.gsub(UNICODE_REGEX[:punc], '')
+    end
     def size(str = nil)
       str ||= self
       str.chars.size
@@ -142,6 +148,9 @@ module ZhongwenTools
     def self.has_zh?(*args)
       Basement.new.has_zh?(*args)
     end
+    def self.strip_zh_punctuation(*args)
+      Basement.new.strip_zh_punctuation(*args)
+    end
     def self.has_zh_punctuation?(*args)
       Basement.new.has_zh_punctuation?(*args)
     end

data/lib/zhongwen_tools/version.rb CHANGED Viewed

@@ -1,3 +1,3 @@
 module ZhongwenTools
-  VERSION = "0.3.5"
+  VERSION = "0.4.0"
 end

data/test/test_romanization.rb CHANGED Viewed

@@ -13,10 +13,10 @@ class TestRomanization < Minitest::Test
   def test_pinyin
     assert_equal 'Zhōng wén','Zhong1 wen2'.to_pinyin
     assert_equal 'Zhōngwén', 'Zhong1-wen2'.to_pinyin
-    #binding.pry
     assert_equal "Tiān'ānmén",'Tian1an1men2'.to_pinyin
+    assert_equal @alabo[:py], @alabo[:pyn].to_pinyin
-    #skip
+    #wg -> py not yet implemented
     #mzd = "Mao Tse-tung"
     #assert_equal "Mao Zedong", mzd.to_pinyin(:wg)
   end
@@ -72,5 +72,6 @@ class TestRomanization < Minitest::Test
     @mzd2 = 'Mao2 Ze2-dong1'
     @py = 'nǐ hǎo'
     @sent = 'Qing3 hui2-da2 wo3 de5 wen4-ti2 .'
+    @alabo = {:pyn => 'A1-la1-bo2', :py => 'Ālābó'}
   end
 end

data/test/test_string.rb CHANGED Viewed

@@ -99,10 +99,14 @@ class TestString < Minitest::Test
     assert_equal '羊', ZhongwenTools::String.from_codepoint('\\u7f8a')
   end
   def test_punctuation
     assert ZhongwenTools::String.has_zh_punctuation?(@zh_punc)
     assert @zh_punc.has_zh_punctuation?
+    refute ZhongwenTools::String.strip_zh_punctuation(@zh_punc) == @zh_punc, "#{@zh_punc} should not equal #{ZhongwenTools::String.strip_zh_punctuation(@zh_punc)}"
+    refute @zh_punc.strip_zh_punctuation == @zh_punc, "#{@zh_punc} should not equal #{ @zh_punc.strip_zh_punctuation} "
   end
   def setup

metadata CHANGED Viewed

@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: zhongwen_tools
 version: !ruby/object:Gem::Version
-  version: 0.3.5
+  version: 0.4.0
 platform: ruby
 authors:
 - Steven Daniels
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2014-03-03 00:00:00.000000000 Z
+date: 2014-03-06 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: rake