mmfont 1.0.0 → 1.0.1
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/.travis.yml +8 -0
- data/README.md +12 -5
- data/Rakefile +15 -2
- data/lib/mmfont.rb +132 -109
- data/lib/mmfont/version.rb +1 -1
- data/mmfont.gemspec +15 -11
- data/test/mmfont_test.rb +36 -5
- metadata +47 -4
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: e7b124a6538ddef586194fb379400390ba0ee2e2
|
4
|
+
data.tar.gz: 7dff56edbafabc021330e64ea270de10d3f58f91
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: c8566c36a0d2d32c8cbb8b910637e203d230fbc6b206df86823530565df22ed1f0130fc2f634cc7de1949fd6725c0eb6a775c54b33a9be36dd516f2de232a45e
|
7
|
+
data.tar.gz: dac924ce21d5c6e7a55bfa32b38681d769d59921940d5080948194f8427aa73a94d46f78862385c77430ee21a9ce81cca457dd2fb3c3188705d5d6efde2e3b90
|
data/.travis.yml
ADDED
data/README.md
CHANGED
@@ -1,6 +1,13 @@
|
|
1
1
|
# Mmfont
|
2
2
|
|
3
|
-
|
3
|
+
[![Build Status](https://travis-ci.org/yelinaung/mmfont.svg)](https://travis-ci.org/yelinaung/mmfont)
|
4
|
+
[![Gem Version](https://badge.fury.io/rb/mmfont.svg)](http://badge.fury.io/rb/mmfont)
|
5
|
+
[![Dependency Status](https://gemnasium.com/yelinaung/mmfont.svg)](https://gemnasium.com/yelinaung/mmfont)
|
6
|
+
[![Inline docs](http://inch-ci.org/github/yelinaung/mmfont.png?branch=master)](http://inch-ci.org/github/yelinaung/mmfont)
|
7
|
+
|
8
|
+
A simple gem which converts zawgyi1 <=> unicode strings. It uses the rules from [paytan](https://github.com/trhura/paytan) and basically, the ruby converter.
|
9
|
+
It's written with TDD. Special thanks to [@steveklabnik](https://github.com/steveklabnik) for his tutorials [How I Start Ruby](http://www.howistart.org/posts/ruby/1).
|
10
|
+
|
4
11
|
|
5
12
|
## Installation
|
6
13
|
|
@@ -13,13 +20,13 @@ gem 'mmfont'
|
|
13
20
|
And then execute:
|
14
21
|
|
15
22
|
```bash
|
16
|
-
|
23
|
+
$ bundle
|
17
24
|
```
|
18
25
|
|
19
26
|
Or install it yourself as:
|
20
27
|
|
21
28
|
```bash
|
22
|
-
|
29
|
+
$ gem install mmfont
|
23
30
|
```
|
24
31
|
|
25
32
|
## Usage
|
@@ -37,14 +44,14 @@ a.zg12uni51("မဂၤလာပါ") # returns unicode strings "မင်္
|
|
37
44
|
|
38
45
|
## Is it fast ?
|
39
46
|
I am not sure. But of course, Ruby is basically slow, regardless of implementations, compared to Nodejs, Go, Rust etc.
|
40
|
-
|
47
|
+
Some benchmarks, maybe ?
|
41
48
|
|
42
49
|
## TODO
|
43
50
|
- ~~Write TESTS!~~
|
44
51
|
|
45
52
|
## Contributing
|
46
53
|
|
47
|
-
1. Fork it ( https://github.com/
|
54
|
+
1. Fork it ( https://github.com/yelinaung/mmfont )
|
48
55
|
2. Create your feature branch (`git checkout -b my-new-feature`)
|
49
56
|
3. Commit your changes (`git commit -am 'Add some feature'`)
|
50
57
|
4. Push to the branch (`git push origin my-new-feature`)
|
data/Rakefile
CHANGED
@@ -1,9 +1,22 @@
|
|
1
|
-
require
|
1
|
+
require 'bundler/gem_tasks'
|
2
2
|
|
3
|
-
require
|
3
|
+
require 'rake/testtask'
|
4
|
+
require 'rubocop/rake_task'
|
4
5
|
|
5
6
|
Rake::TestTask.new do |t|
|
7
|
+
t.libs << 'lib'
|
8
|
+
t.libs << 'spec'
|
6
9
|
t.test_files = FileList['test/*_test.rb']
|
7
10
|
end
|
8
11
|
|
12
|
+
# Run robocop
|
13
|
+
desc 'Run RuboCop on the lib directory'
|
14
|
+
RuboCop::RakeTask.new(:rubocop) do |task|
|
15
|
+
task.patterns = ['lib/**/*.rb']
|
16
|
+
# only show the files with failures
|
17
|
+
task.formatters = ['files']
|
18
|
+
# don't abort rake on failure
|
19
|
+
task.fail_on_error = false
|
20
|
+
end
|
21
|
+
|
9
22
|
task default: :test
|
data/lib/mmfont.rb
CHANGED
@@ -1,4 +1,30 @@
|
|
1
|
-
|
1
|
+
#--
|
2
|
+
# Copyright (c) 2014 Ye Lin Aung
|
3
|
+
# Zawgyi<>Unicode converter python module
|
4
|
+
# Based on rules from Parabaik Myanmar Text Converter
|
5
|
+
# Copyright (C) 2014 Ngwe Tun (Solveware Solution)
|
6
|
+
#
|
7
|
+
# Permission is hereby granted, free of charge, to any person obtaining
|
8
|
+
# a copy of this software and associated documentation files (the
|
9
|
+
# "Software"), to deal in the Software without restriction, including
|
10
|
+
# without limitation the rights to use, copy, modify, merge, publish,
|
11
|
+
# distribute, sublicense, and/or sell copies of the Software, and to
|
12
|
+
# permit persons to whom the Software is furnished to do so, subject to
|
13
|
+
# the following conditions:
|
14
|
+
#
|
15
|
+
# The above copyright notice and this permission notice shall be
|
16
|
+
# included in all copies or substantial portions of the Software.
|
17
|
+
#
|
18
|
+
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
|
19
|
+
# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
20
|
+
# MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
|
21
|
+
# NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
|
22
|
+
# LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
|
23
|
+
# OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
|
24
|
+
# WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
25
|
+
#--
|
26
|
+
|
27
|
+
require 'mmfont/version'
|
2
28
|
|
3
29
|
# Mmfont module
|
4
30
|
module Mmfont
|
@@ -7,115 +33,112 @@ module Mmfont
|
|
7
33
|
# Convert given text from unicode to zawgyi
|
8
34
|
def uni512zg1(input_text)
|
9
35
|
output_text = input_text
|
10
|
-
output_text = output_text.gsub(/\u104e\u1004\u103a\u1038
|
11
|
-
output_text = output_text.gsub(/\u102b\u103a
|
12
|
-
output_text = output_text.gsub(/\u102d\u1036
|
13
|
-
output_text = output_text.gsub(/\u103f
|
14
|
-
output_text = output_text.gsub(/(?<=\u102f)\u1037
|
15
|
-
output_text = output_text.gsub(/(?<=\u102f\u1036)\u1037
|
16
|
-
output_text = output_text.gsub(/(?<=\u1030)\u1037
|
17
|
-
output_text = output_text.gsub(/(?<=\u1030\u1036)\u1037
|
18
|
-
output_text = output_text.gsub(/(?<=\u1014)\u1037
|
19
|
-
output_text = output_text.gsub(/(?<=\u1014[\u103a\u1032])\u1037
|
20
|
-
output_text = output_text.gsub(/(?<=\u103b)\u1037
|
21
|
-
output_text = output_text.gsub(/(?<=\u103b[\u1032\u1036])\u1037
|
22
|
-
output_text = output_text.gsub(/(?<=\u103d)\u1037
|
23
|
-
output_text = output_text.gsub(/(?<=\u103d[\u1032])\u1037
|
24
|
-
output_text = output_text.gsub(/(?<=[\u103b\u103c\u103d])\u102f
|
25
|
-
output_text = output_text.gsub(/(?<=[\u103b\u103c\u103d][\u102d\u1036])\u102f
|
26
|
-
output_text = output_text.gsub(/(?<=(\u1039[\u1000-\u1021]))\u102f
|
27
|
-
output_text = output_text.gsub(/(?<=(\u1039[\u1000-\u1021])[\u102d\u1036])\u102f
|
28
|
-
output_text = output_text.gsub(/(?<=[\u100a\u100c\u1020\u1025\u1029])\u102f
|
29
|
-
output_text = output_text.gsub(/(?<=[\u100a\u100c\u1020\u1025\u1029][\u102d\u1036])\u102f
|
30
|
-
output_text = output_text.gsub(/(?<=[\u103b\u103c])\u1030
|
31
|
-
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103d])\u1030
|
32
|
-
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103e])\u1030
|
33
|
-
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u102d\u1036])\u1030
|
34
|
-
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103d][\u103e])\u1030
|
35
|
-
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103d][\u102d\u1036])\u1030
|
36
|
-
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103e][\u102d\u1036])\u1030
|
37
|
-
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103d][\u103e][\u102d\u1036])\u1030
|
38
|
-
output_text = output_text.gsub(/(?<=(\u1039[\u1000-\u1021]))\u1030
|
39
|
-
output_text = output_text.gsub(/(?<=(\u1039[\u1000-\u1021])[\u102d\u1036])\u1030
|
40
|
-
output_text = output_text.gsub(/(?<=[\u100a\u100c\u1020\u1025\u1029])\u1030
|
41
|
-
output_text = output_text.gsub(/(?<=[\u100a\u100c\u1020\u1025\u1029][\u102d\u1036])\u1030
|
42
|
-
output_text = output_text.gsub(/(?<=\u103c)\u103e
|
43
|
-
output_text = output_text.gsub(/\u1009(?=[\u103a])
|
44
|
-
output_text = output_text.gsub(/\u1009(?=\u1039[\u1000-\u1021])
|
45
|
-
output_text = output_text.gsub(/([\u1000-\u1021\u1029])((?:\u1039[\u1000-\u1021])?)((?:[\u103b-\u103e\u1087]
|
46
|
-
output_text = output_text.gsub(/([\u1000-\u1021\u1029])((?:\u1039[\u1000-\u1021\u1000-\u1021])?)(\u103c)
|
47
|
-
output_text = output_text.gsub(/\u1004\u103a\u1039
|
48
|
-
output_text = output_text.gsub(/(\u1064)((?:\u1031)?)((?:\u103c)?)([\u1000-\u1021])\u102d
|
49
|
-
output_text = output_text.gsub(/(\u1064)((?:\u1031)?)((?:\u103c)?)([\u1000-\u1021])\u102e
|
50
|
-
output_text = output_text.gsub(/(\u1064)((?:\u1031)?)((?:\u103c)?)([\u1000-\u1021])\u1036
|
51
|
-
output_text = output_text.gsub(/(\u1064)((?:\u1031)?)((?:\u103c)?)([\u1000-\u1021])
|
52
|
-
output_text = output_text.gsub(/\u100a(?=[\u1039\u102f\u1030])
|
53
|
-
output_text = output_text.gsub(/\u100a
|
54
|
-
output_text = output_text.gsub(/\u101b(?=[\u102f\u1030])
|
55
|
-
output_text = output_text.gsub(/\u101b
|
56
|
-
output_text = output_text.gsub(/\u1014(?=[\u1039\u103d\u103e\u102f\u1030])
|
57
|
-
output_text = output_text.gsub(/\u1014
|
58
|
-
output_text = output_text.gsub(/\u1039\u1000
|
59
|
-
output_text = output_text.gsub(/\u1039\u1001
|
60
|
-
output_text = output_text.gsub(/\u1039\u1002
|
61
|
-
output_text = output_text.gsub(/\u1039\u1003
|
62
|
-
output_text = output_text.gsub(/\u1039\u1005
|
63
|
-
output_text = output_text.gsub(/\u1039\u1006
|
64
|
-
output_text = output_text.gsub(/(?<=[\u1001\u1002\u1004\u1005\u1007\u1012\u1013\u108f\u1015\u1016\u1017\u1019\u101d])\u1066
|
65
|
-
output_text = output_text.gsub(/\u1039\u1007
|
66
|
-
output_text = output_text.gsub(/\u1039\u1008
|
67
|
-
output_text = output_text.gsub(/\u1039\u100f
|
68
|
-
output_text = output_text.gsub(/\u1039\u1010
|
69
|
-
output_text = output_text.gsub(/(?<=[\u1001\u1002\u1004\u1005\u1007\u1012\u1013\u108f\u1015\u1016\u1017\u1019\u101d])\u1071
|
70
|
-
output_text = output_text.gsub(/\u1039\u1011
|
71
|
-
output_text = output_text.gsub(/(?<=[\u1001\u1002\u1004\u1005\u1007\u1012\u1013\u108f\u1015\u1016\u1017\u1019\u101d])\u1073
|
72
|
-
output_text = output_text.gsub(/\u1039\u1012
|
73
|
-
output_text = output_text.gsub(/\u1039\u1013
|
74
|
-
output_text = output_text.gsub(/\u1039\u1014
|
75
|
-
output_text = output_text.gsub(/\u1039\u1015
|
76
|
-
output_text = output_text.gsub(/\u1039\u1016
|
77
|
-
output_text = output_text.gsub(/\u1039\u1017
|
78
|
-
output_text = output_text.gsub(/\u1039\u1018
|
79
|
-
output_text = output_text.gsub(/\u1039\u1019
|
80
|
-
output_text = output_text.gsub(/\u1039\u101c
|
81
|
-
output_text = output_text.gsub(/\u100f\u1039\u100d
|
82
|
-
output_text = output_text.gsub(/\u100b\u1039\u100c
|
83
|
-
output_text = output_text.gsub(/\u1039\u100c
|
84
|
-
output_text = output_text.gsub(/\u100b\u1039\u100b
|
85
|
-
output_text = output_text.gsub(/\u1039\u100b
|
86
|
-
output_text = output_text.gsub(/\u100e\u1039\u100d
|
87
|
-
output_text = output_text.gsub(/\u100d\u1039\u100d
|
88
|
-
output_text = output_text.gsub(/\u1009(?=\u103a)
|
89
|
-
output_text = output_text.gsub(/\u1025(?=[\u1039\u102f\u1030])
|
90
|
-
output_text = output_text.gsub(/\u1025
|
91
|
-
output_text = output_text.gsub(/\u103a
|
92
|
-
output_text = output_text.gsub(/\u103b\u103d\u103e
|
93
|
-
output_text = output_text.gsub(/\u103d\u103e
|
94
|
-
output_text = output_text.gsub(/\u103b
|
95
|
-
output_text = output_text.gsub(/\u103c
|
96
|
-
output_text = output_text.gsub(/\u103d
|
97
|
-
output_text = output_text.gsub(/\u103e
|
98
|
-
output_text = output_text.gsub(/\u103a(?=[\u103c\u103d\u108a])
|
99
|
-
output_text = output_text.gsub(/(?<=\u100a(?:[\u102d\u102e\u1036\u108b\u108c\u108d\u108e]))\u103d
|
100
|
-
output_text = output_text.gsub(/(?<=\u100a)\u103d
|
101
|
-
output_text = output_text.gsub(/\u103b(?=[\u1000\u1003\u1006\u100f\u1010\u1011\u1018\u101a\u101c\u101e\u101f\u1021])
|
102
|
-
output_text = output_text.gsub(/\u107e([\u1000-\u1021\u108f])(?=[\u102d\u102e\u1036\u108b\u108c\u108d\u108e])
|
103
|
-
output_text = output_text.gsub(/\u107e([\u1000-\u1021\u108f])(?=[\u103c\u108a])
|
104
|
-
output_text = output_text.gsub(/\u103b([\u1000-\u1021\u108f])(?=[\u102d\u102e\u1036\u108b\u108c\u108d\u108e])
|
105
|
-
output_text = output_text.gsub(/\u103b([\u1000-\u1021\u108f])(?=[\u103c\u108a])
|
106
|
-
output_text = output_text.gsub(/(?<=\u1014)\u1037
|
107
|
-
output_text = output_text.gsub(/(?<=\u1014[\u103a\u1032])\u1037
|
108
|
-
output_text = output_text.gsub(/(?<=\u1033)\u1094
|
109
|
-
output_text = output_text.gsub(/(?<=\u1033[\u1036])\u1094
|
110
|
-
output_text = output_text.gsub(/(?<=\u1034)\u1094
|
111
|
-
output_text = output_text.gsub(/(?<=\u1034[\u1036])\u1094
|
112
|
-
output_text = output_text.gsub(/(?<=[\u103c\u103d\u108a])\u1037
|
113
|
-
output_text = output_text.gsub(/(?<=[\u103c\u103d\u108a][\u1032])\u1037
|
114
|
-
# 'return' is not necessary but it's there to prevent 'end' from auto-indent
|
115
|
-
return output_text
|
36
|
+
output_text = output_text.gsub(/\u104e\u1004\u103a\u1038/, "\u104e")
|
37
|
+
output_text = output_text.gsub(/\u102b\u103a/, "\u105a")
|
38
|
+
output_text = output_text.gsub(/\u102d\u1036/, "\u108e")
|
39
|
+
output_text = output_text.gsub(/\u103f/, "\u1086")
|
40
|
+
output_text = output_text.gsub(/(?<=\u102f)\u1037/, "\u1094")
|
41
|
+
output_text = output_text.gsub(/(?<=\u102f\u1036)\u1037/, "\u1094")
|
42
|
+
output_text = output_text.gsub(/(?<=\u1030)\u1037/, "\u1094")
|
43
|
+
output_text = output_text.gsub(/(?<=\u1030\u1036)\u1037/, "\u1094")
|
44
|
+
output_text = output_text.gsub(/(?<=\u1014)\u1037/, "\u1094")
|
45
|
+
output_text = output_text.gsub(/(?<=\u1014[\u103a\u1032])\u1037/, "\u1094")
|
46
|
+
output_text = output_text.gsub(/(?<=\u103b)\u1037/, "\u1095")
|
47
|
+
output_text = output_text.gsub(/(?<=\u103b[\u1032\u1036])\u1037/, "\u1095")
|
48
|
+
output_text = output_text.gsub(/(?<=\u103d)\u1037/, "\u1095")
|
49
|
+
output_text = output_text.gsub(/(?<=\u103d[\u1032])\u1037/, "\u1095")
|
50
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c\u103d])\u102f/, "\u1033")
|
51
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c\u103d][\u102d\u1036])\u102f/, "\u1033")
|
52
|
+
output_text = output_text.gsub(/(?<=(\u1039[\u1000-\u1021]))\u102f/, "\u1033")
|
53
|
+
output_text = output_text.gsub(/(?<=(\u1039[\u1000-\u1021])[\u102d\u1036])\u102f/, "\u1033")
|
54
|
+
output_text = output_text.gsub(/(?<=[\u100a\u100c\u1020\u1025\u1029])\u102f/, "\u1033")
|
55
|
+
output_text = output_text.gsub(/(?<=[\u100a\u100c\u1020\u1025\u1029][\u102d\u1036])\u102f/, "\u1033")
|
56
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c])\u1030/, "\u1034")
|
57
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103d])\u1030/, "\u1034")
|
58
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103e])\u1030/, "\u1034")
|
59
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u102d\u1036])\u1030/, "\u1034")
|
60
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103d][\u103e])\u1030/, "\u1034")
|
61
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103d][\u102d\u1036])\u1030/, "\u1034")
|
62
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103e][\u102d\u1036])\u1030/, "\u1034")
|
63
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103d][\u103e][\u102d\u1036])\u1030/, "\u1034")
|
64
|
+
output_text = output_text.gsub(/(?<=(\u1039[\u1000-\u1021]))\u1030/, "\u1034")
|
65
|
+
output_text = output_text.gsub(/(?<=(\u1039[\u1000-\u1021])[\u102d\u1036])\u1030/, "\u1034")
|
66
|
+
output_text = output_text.gsub(/(?<=[\u100a\u100c\u1020\u1025\u1029])\u1030/, "\u1034")
|
67
|
+
output_text = output_text.gsub(/(?<=[\u100a\u100c\u1020\u1025\u1029][\u102d\u1036])\u1030/, "\u1034")
|
68
|
+
output_text = output_text.gsub(/(?<=\u103c)\u103e/, "\u1087")
|
69
|
+
output_text = output_text.gsub(/\u1009(?=[\u103a])/, "\u1025")
|
70
|
+
output_text = output_text.gsub(/\u1009(?=\u1039[\u1000-\u1021])/, "\u1025")
|
71
|
+
output_text = output_text.gsub(/([\u1000-\u1021\u1029])((?:\u1039[\u1000-\u1021])?)((?:[\u103b-\u103e\u1087])?)\u1031/, "\u1031\\1\\2\\3")
|
72
|
+
output_text = output_text.gsub(/([\u1000-\u1021\u1029])((?:\u1039[\u1000-\u1021\u1000-\u1021])?)(\u103c)/, "\\3\\1\\2")
|
73
|
+
output_text = output_text.gsub(/\u1004\u103a\u1039/, "\u1064")
|
74
|
+
output_text = output_text.gsub(/(\u1064)((?:\u1031)?)((?:\u103c)?)([\u1000-\u1021])\u102d/, "\\2\\3\\4\u108b")
|
75
|
+
output_text = output_text.gsub(/(\u1064)((?:\u1031)?)((?:\u103c)?)([\u1000-\u1021])\u102e/, "\\2\\3\\4\u108c")
|
76
|
+
output_text = output_text.gsub(/(\u1064)((?:\u1031)?)((?:\u103c)?)([\u1000-\u1021])\u1036/, "\\2\\3\\4\u108d")
|
77
|
+
output_text = output_text.gsub(/(\u1064)((?:\u1031)?)((?:\u103c)?)([\u1000-\u1021])/, "\\2\\3\\4\u1064")
|
78
|
+
output_text = output_text.gsub(/\u100a(?=[\u1039\u102f\u1030])/, "\u106b")
|
79
|
+
output_text = output_text.gsub(/\u100a/, "\u100a")
|
80
|
+
output_text = output_text.gsub(/\u101b(?=[\u102f\u1030])/, "\u1090")
|
81
|
+
output_text = output_text.gsub(/\u101b/, "\u101b")
|
82
|
+
output_text = output_text.gsub(/\u1014(?=[\u1039\u103d\u103e\u102f\u1030])/, "\u108f")
|
83
|
+
output_text = output_text.gsub(/\u1014/, "\u1014")
|
84
|
+
output_text = output_text.gsub(/\u1039\u1000/, "\u1060")
|
85
|
+
output_text = output_text.gsub(/\u1039\u1001/, "\u1061")
|
86
|
+
output_text = output_text.gsub(/\u1039\u1002/, "\u1062")
|
87
|
+
output_text = output_text.gsub(/\u1039\u1003/, "\u1063")
|
88
|
+
output_text = output_text.gsub(/\u1039\u1005/, "\u1065")
|
89
|
+
output_text = output_text.gsub(/\u1039\u1006/, "\u1066")
|
90
|
+
output_text = output_text.gsub(/(?<=[\u1001\u1002\u1004\u1005\u1007\u1012\u1013\u108f\u1015\u1016\u1017\u1019\u101d])\u1066/, "\u1067")
|
91
|
+
output_text = output_text.gsub(/\u1039\u1007/, "\u1068")
|
92
|
+
output_text = output_text.gsub(/\u1039\u1008/, "\u1069")
|
93
|
+
output_text = output_text.gsub(/\u1039\u100f/, "\u1070")
|
94
|
+
output_text = output_text.gsub(/\u1039\u1010/, "\u1071")
|
95
|
+
output_text = output_text.gsub(/(?<=[\u1001\u1002\u1004\u1005\u1007\u1012\u1013\u108f\u1015\u1016\u1017\u1019\u101d])\u1071/, "\u1072")
|
96
|
+
output_text = output_text.gsub(/\u1039\u1011/, "\u1073")
|
97
|
+
output_text = output_text.gsub(/(?<=[\u1001\u1002\u1004\u1005\u1007\u1012\u1013\u108f\u1015\u1016\u1017\u1019\u101d])\u1073/, "\u1074")
|
98
|
+
output_text = output_text.gsub(/\u1039\u1012/, "\u1075")
|
99
|
+
output_text = output_text.gsub(/\u1039\u1013/, "\u1076")
|
100
|
+
output_text = output_text.gsub(/\u1039\u1014/, "\u1077")
|
101
|
+
output_text = output_text.gsub(/\u1039\u1015/, "\u1078")
|
102
|
+
output_text = output_text.gsub(/\u1039\u1016/, "\u1079")
|
103
|
+
output_text = output_text.gsub(/\u1039\u1017/, "\u107a")
|
104
|
+
output_text = output_text.gsub(/\u1039\u1018/, "\u107b")
|
105
|
+
output_text = output_text.gsub(/\u1039\u1019/, "\u107c")
|
106
|
+
output_text = output_text.gsub(/\u1039\u101c/, "\u1085")
|
107
|
+
output_text = output_text.gsub(/\u100f\u1039\u100d/, "\u1091")
|
108
|
+
output_text = output_text.gsub(/\u100b\u1039\u100c/, "\u1092")
|
109
|
+
output_text = output_text.gsub(/\u1039\u100c/, "\u106d")
|
110
|
+
output_text = output_text.gsub(/\u100b\u1039\u100b/, "\u1097")
|
111
|
+
output_text = output_text.gsub(/\u1039\u100b/, "\u106c")
|
112
|
+
output_text = output_text.gsub(/\u100e\u1039\u100d/, "\u106f")
|
113
|
+
output_text = output_text.gsub(/\u100d\u1039\u100d/, "\u106e")
|
114
|
+
output_text = output_text.gsub(/\u1009(?=\u103a)/, "\u1025")
|
115
|
+
output_text = output_text.gsub(/\u1025(?=[\u1039\u102f\u1030])/, "\u106a")
|
116
|
+
output_text = output_text.gsub(/\u1025/, "\u1025")
|
117
|
+
output_text = output_text.gsub(/\u103a/, "\u1039")
|
118
|
+
output_text = output_text.gsub(/\u103b\u103d\u103e/, "\u107d\u108a")
|
119
|
+
output_text = output_text.gsub(/\u103d\u103e/, "\u108a")
|
120
|
+
output_text = output_text.gsub(/\u103b/, "\u103a")
|
121
|
+
output_text = output_text.gsub(/\u103c/, "\u103b")
|
122
|
+
output_text = output_text.gsub(/\u103d/, "\u103c")
|
123
|
+
output_text = output_text.gsub(/\u103e/, "\u103d")
|
124
|
+
output_text = output_text.gsub(/\u103a(?=[\u103c\u103d\u108a])/, "\u107d")
|
125
|
+
output_text = output_text.gsub(/(?<=\u100a(?:[\u102d\u102e\u1036\u108b\u108c\u108d\u108e]))\u103d/, "\u1087")
|
126
|
+
output_text = output_text.gsub(/(?<=\u100a)\u103d/, "\u1087")
|
127
|
+
output_text = output_text.gsub(/\u103b(?=[\u1000\u1003\u1006\u100f\u1010\u1011\u1018\u101a\u101c\u101e\u101f\u1021])/, "\u107e")
|
128
|
+
output_text = output_text.gsub(/\u107e([\u1000-\u1021\u108f])(?=[\u102d\u102e\u1036\u108b\u108c\u108d\u108e])/, "\u1080\\1")
|
129
|
+
output_text = output_text.gsub(/\u107e([\u1000-\u1021\u108f])(?=[\u103c\u108a])/, "\u1082\\1")
|
130
|
+
output_text = output_text.gsub(/\u103b([\u1000-\u1021\u108f])(?=[\u102d\u102e\u1036\u108b\u108c\u108d\u108e])/, "\u107f\\1")
|
131
|
+
output_text = output_text.gsub(/\u103b([\u1000-\u1021\u108f])(?=[\u103c\u108a])/, "\u1081\\1")
|
132
|
+
output_text = output_text.gsub(/(?<=\u1014)\u1037/, "\u1094")
|
133
|
+
output_text = output_text.gsub(/(?<=\u1014[\u103a\u1032])\u1037/, "\u1094")
|
134
|
+
output_text = output_text.gsub(/(?<=\u1033)\u1094/, "\u1095")
|
135
|
+
output_text = output_text.gsub(/(?<=\u1033[\u1036])\u1094/, "\u1095")
|
136
|
+
output_text = output_text.gsub(/(?<=\u1034)\u1094/, "\u1095")
|
137
|
+
output_text = output_text.gsub(/(?<=\u1034[\u1036])\u1094/, "\u1095")
|
138
|
+
output_text = output_text.gsub(/(?<=[\u103c\u103d\u108a])\u1037/, "\u1095")
|
139
|
+
output_text = output_text.gsub(/(?<=[\u103c\u103d\u108a][\u1032])\u1037/, "\u1095")
|
116
140
|
end # end of uni to zg1
|
117
141
|
|
118
|
-
# Convert given text from zawgyi to unicode
|
119
142
|
def zg12uni51(input_text)
|
120
143
|
output_text = input_text
|
121
144
|
output_text = output_text.gsub(/\u106a/ ,"\u1009")
|
@@ -127,7 +150,7 @@ module Mmfont
|
|
127
150
|
output_text = output_text.gsub(/\u108f/ ,"\u1014")
|
128
151
|
output_text = output_text.gsub(/\u1012/ ,"\u1012")
|
129
152
|
output_text = output_text.gsub(/\u1013/ ,"\u1013")
|
130
|
-
output_text = output_text.gsub(/[\u103d\u1087]/ ,"\
|
153
|
+
output_text = output_text.gsub(/[\u103d\u1087]/ ,"\u103e")
|
131
154
|
output_text = output_text.gsub(/\u103c/ ,"\u103d")
|
132
155
|
output_text = output_text.gsub(/[\u103b\u107e\u107f\u1080\u1081\u1082\u1083\u1084]/ ,"\u103c")
|
133
156
|
output_text = output_text.gsub(/[\u103a\u107d]/ ,"\u103b")
|
data/lib/mmfont/version.rb
CHANGED
data/mmfont.gemspec
CHANGED
@@ -1,23 +1,27 @@
|
|
1
|
-
#
|
1
|
+
# encoding: utf-8
|
2
2
|
lib = File.expand_path('../lib', __FILE__)
|
3
3
|
$LOAD_PATH.unshift(lib) unless $LOAD_PATH.include?(lib)
|
4
4
|
require 'mmfont/version'
|
5
5
|
|
6
6
|
Gem::Specification.new do |spec|
|
7
|
-
spec.name =
|
7
|
+
spec.name = 'mmfont'
|
8
8
|
spec.version = Mmfont::VERSION
|
9
|
-
spec.authors = [
|
10
|
-
spec.email = [
|
11
|
-
spec.summary =
|
12
|
-
spec.description =
|
13
|
-
spec.homepage =
|
14
|
-
spec.license =
|
9
|
+
spec.authors = ['Ye Lin Aung']
|
10
|
+
spec.email = ['me@yelinaung.com']
|
11
|
+
spec.summary = 'Myanmar font converter.'
|
12
|
+
spec.description = 'Myanmar font toolkit in Ruby.'
|
13
|
+
spec.homepage = 'https://github.com/yelinaung/mmfont'
|
14
|
+
spec.license = 'MIT'
|
15
15
|
|
16
16
|
spec.files = `git ls-files -z`.split("\x0")
|
17
17
|
spec.executables = spec.files.grep(%r{^bin/}) { |f| File.basename(f) }
|
18
18
|
spec.test_files = spec.files.grep(%r{^(test|spec|features)/})
|
19
|
-
spec.require_paths = [
|
19
|
+
spec.require_paths = ['lib']
|
20
20
|
|
21
|
-
spec.
|
22
|
-
spec.
|
21
|
+
spec.add_dependency 'coveralls'
|
22
|
+
spec.add_dependency 'rubocop'
|
23
|
+
|
24
|
+
spec.add_development_dependency 'bundler', '~> 1.6'
|
25
|
+
spec.add_development_dependency 'rake', '~> 10.0'
|
26
|
+
spec.add_development_dependency 'minitest'
|
23
27
|
end
|
data/test/mmfont_test.rb
CHANGED
@@ -1,14 +1,45 @@
|
|
1
|
-
|
2
|
-
require "mmfont"
|
1
|
+
# encoding: utf-8
|
3
2
|
|
4
|
-
|
3
|
+
#--
|
4
|
+
# Copyright (c) 2014 Ye Lin Aung
|
5
|
+
# Zawgyi<>Unicode converter python module
|
6
|
+
# Based on rules from Parabaik Myanmar Text Converter
|
7
|
+
# Copyright (C) 2014 Ngwe Tun (Solveware Solution)
|
8
|
+
#
|
9
|
+
# Permission is hereby granted, free of charge, to any person obtaining
|
10
|
+
# a copy of this software and associated documentation files (the
|
11
|
+
# "Software"), to deal in the Software without restriction, including
|
12
|
+
# without limitation the rights to use, copy, modify, merge, publish,
|
13
|
+
# distribute, sublicense, and/or sell copies of the Software, and to
|
14
|
+
# permit persons to whom the Software is furnished to do so, subject to
|
15
|
+
# the following conditions:
|
16
|
+
#
|
17
|
+
# The above copyright notice and this permission notice shall be
|
18
|
+
# included in all copies or substantial portions of the Software.
|
19
|
+
#
|
20
|
+
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
|
21
|
+
# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
22
|
+
# MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
|
23
|
+
# NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
|
24
|
+
# LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
|
25
|
+
# OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
|
26
|
+
# WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
27
|
+
#--
|
28
|
+
|
29
|
+
require 'minitest/autorun'
|
30
|
+
require 'mmfont'
|
31
|
+
require 'coveralls'
|
32
|
+
Coveralls.wear!
|
33
|
+
|
34
|
+
class MmfontTest < Minitest::Test
|
5
35
|
# unicode converting test
|
6
36
|
def test_convert_uni512zg1
|
7
|
-
assert_equal
|
37
|
+
assert_equal 'မဂၤလာပါ', Mmfont::Converter.new.uni512zg1('မင်္ဂလာပါ')
|
8
38
|
end
|
9
39
|
|
10
40
|
# zawgyi converting test
|
11
41
|
def test_convert_zg12uni51
|
12
|
-
assert_equal
|
42
|
+
assert_equal 'မင်္ဂလာပါ', Mmfont::Converter.new.zg12uni51('မဂၤလာပါ')
|
43
|
+
assert_equal 'ဘောလုံးကန်တာမှ ကောင်းဦးမယ်', Mmfont::Converter.new.zg12uni51('ေဘာလုံးကန္တာမွ ေကာင္းဦးမယ္')
|
13
44
|
end
|
14
45
|
end
|
metadata
CHANGED
@@ -1,15 +1,43 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: mmfont
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 1.0.
|
4
|
+
version: 1.0.1
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Ye Lin Aung
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date:
|
11
|
+
date: 2015-02-17 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
|
+
- !ruby/object:Gem::Dependency
|
14
|
+
name: coveralls
|
15
|
+
requirement: !ruby/object:Gem::Requirement
|
16
|
+
requirements:
|
17
|
+
- - ">="
|
18
|
+
- !ruby/object:Gem::Version
|
19
|
+
version: '0'
|
20
|
+
type: :runtime
|
21
|
+
prerelease: false
|
22
|
+
version_requirements: !ruby/object:Gem::Requirement
|
23
|
+
requirements:
|
24
|
+
- - ">="
|
25
|
+
- !ruby/object:Gem::Version
|
26
|
+
version: '0'
|
27
|
+
- !ruby/object:Gem::Dependency
|
28
|
+
name: rubocop
|
29
|
+
requirement: !ruby/object:Gem::Requirement
|
30
|
+
requirements:
|
31
|
+
- - ">="
|
32
|
+
- !ruby/object:Gem::Version
|
33
|
+
version: '0'
|
34
|
+
type: :runtime
|
35
|
+
prerelease: false
|
36
|
+
version_requirements: !ruby/object:Gem::Requirement
|
37
|
+
requirements:
|
38
|
+
- - ">="
|
39
|
+
- !ruby/object:Gem::Version
|
40
|
+
version: '0'
|
13
41
|
- !ruby/object:Gem::Dependency
|
14
42
|
name: bundler
|
15
43
|
requirement: !ruby/object:Gem::Requirement
|
@@ -38,6 +66,20 @@ dependencies:
|
|
38
66
|
- - "~>"
|
39
67
|
- !ruby/object:Gem::Version
|
40
68
|
version: '10.0'
|
69
|
+
- !ruby/object:Gem::Dependency
|
70
|
+
name: minitest
|
71
|
+
requirement: !ruby/object:Gem::Requirement
|
72
|
+
requirements:
|
73
|
+
- - ">="
|
74
|
+
- !ruby/object:Gem::Version
|
75
|
+
version: '0'
|
76
|
+
type: :development
|
77
|
+
prerelease: false
|
78
|
+
version_requirements: !ruby/object:Gem::Requirement
|
79
|
+
requirements:
|
80
|
+
- - ">="
|
81
|
+
- !ruby/object:Gem::Version
|
82
|
+
version: '0'
|
41
83
|
description: Myanmar font toolkit in Ruby.
|
42
84
|
email:
|
43
85
|
- me@yelinaung.com
|
@@ -46,6 +88,7 @@ extensions: []
|
|
46
88
|
extra_rdoc_files: []
|
47
89
|
files:
|
48
90
|
- ".gitignore"
|
91
|
+
- ".travis.yml"
|
49
92
|
- Gemfile
|
50
93
|
- LICENSE.txt
|
51
94
|
- README.md
|
@@ -54,7 +97,7 @@ files:
|
|
54
97
|
- lib/mmfont/version.rb
|
55
98
|
- mmfont.gemspec
|
56
99
|
- test/mmfont_test.rb
|
57
|
-
homepage:
|
100
|
+
homepage: https://github.com/yelinaung/mmfont
|
58
101
|
licenses:
|
59
102
|
- MIT
|
60
103
|
metadata: {}
|
@@ -74,7 +117,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
74
117
|
version: '0'
|
75
118
|
requirements: []
|
76
119
|
rubyforge_project:
|
77
|
-
rubygems_version: 2.
|
120
|
+
rubygems_version: 2.4.5
|
78
121
|
signing_key:
|
79
122
|
specification_version: 4
|
80
123
|
summary: Myanmar font converter.
|