mmfont 1.0.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/.gitignore +17 -0
- data/Gemfile +4 -0
- data/LICENSE.txt +22 -0
- data/README.md +54 -0
- data/Rakefile +9 -0
- data/lib/mmfont.rb +195 -0
- data/lib/mmfont/version.rb +4 -0
- data/mmfont.gemspec +23 -0
- data/test/mmfont_test.rb +14 -0
- metadata +82 -0
checksums.yaml
ADDED
@@ -0,0 +1,7 @@
|
|
1
|
+
---
|
2
|
+
SHA1:
|
3
|
+
metadata.gz: e9616736a86649aa0a6730aa46a1fdd489adb416
|
4
|
+
data.tar.gz: bab6eb66a15d489df115a9a21d9583ad619f55d4
|
5
|
+
SHA512:
|
6
|
+
metadata.gz: af9d4d91c5e63d44dbccb04bb78da4bcc95c395dc9e3ec228ff3da45087737b667e17fbceee3dd46e8901953693c1d85ba638c54cc0c475d61d33f899aa5ec1c
|
7
|
+
data.tar.gz: 21152c8d37eea994963dae6d9cb89dfd46757500fea5f3275017e292e1d6694b0be2823e9dd06e2f2dbfff249e5e15a958cdec47e6900484e2c93ec4db66779a
|
data/.gitignore
ADDED
data/Gemfile
ADDED
data/LICENSE.txt
ADDED
@@ -0,0 +1,22 @@
|
|
1
|
+
Copyright (c) 2014 Ye Lin Aung
|
2
|
+
|
3
|
+
MIT License
|
4
|
+
|
5
|
+
Permission is hereby granted, free of charge, to any person obtaining
|
6
|
+
a copy of this software and associated documentation files (the
|
7
|
+
"Software"), to deal in the Software without restriction, including
|
8
|
+
without limitation the rights to use, copy, modify, merge, publish,
|
9
|
+
distribute, sublicense, and/or sell copies of the Software, and to
|
10
|
+
permit persons to whom the Software is furnished to do so, subject to
|
11
|
+
the following conditions:
|
12
|
+
|
13
|
+
The above copyright notice and this permission notice shall be
|
14
|
+
included in all copies or substantial portions of the Software.
|
15
|
+
|
16
|
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
|
17
|
+
EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
18
|
+
MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
|
19
|
+
NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
|
20
|
+
LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
|
21
|
+
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
|
22
|
+
WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
data/README.md
ADDED
@@ -0,0 +1,54 @@
|
|
1
|
+
# Mmfont
|
2
|
+
|
3
|
+
A simple gem which converts zawgyi1 <=> unicode strings.
|
4
|
+
|
5
|
+
## Installation
|
6
|
+
|
7
|
+
Add this line to your application's Gemfile:
|
8
|
+
|
9
|
+
```ruby
|
10
|
+
gem 'mmfont'
|
11
|
+
```
|
12
|
+
|
13
|
+
And then execute:
|
14
|
+
|
15
|
+
```bash
|
16
|
+
$ bundle
|
17
|
+
```
|
18
|
+
|
19
|
+
Or install it yourself as:
|
20
|
+
|
21
|
+
```bash
|
22
|
+
$ gem install mmfont
|
23
|
+
```
|
24
|
+
|
25
|
+
## Usage
|
26
|
+
|
27
|
+
```ruby
|
28
|
+
require 'mmfont'
|
29
|
+
|
30
|
+
a = Mmfont::Converter.new
|
31
|
+
|
32
|
+
a.uni512zg1("မင်္ဂလာပါ") # returns zg strings "မဂၤလာပါ"
|
33
|
+
|
34
|
+
a.zg12uni51("မဂၤလာပါ") # returns unicode strings "မင်္ဂလာပါ"
|
35
|
+
|
36
|
+
```
|
37
|
+
|
38
|
+
## Is it fast ?
|
39
|
+
I am not sure. But of course, Ruby is basically slow, regardless of implementations, compared to Nodejs, Go, Rust etc.
|
40
|
+
Feel free to send me some bunchmarks.
|
41
|
+
|
42
|
+
## TODO
|
43
|
+
- ~~Write TESTS!~~
|
44
|
+
|
45
|
+
## Contributing
|
46
|
+
|
47
|
+
1. Fork it ( https://github.com/[my-github-username]/mmfont/fork )
|
48
|
+
2. Create your feature branch (`git checkout -b my-new-feature`)
|
49
|
+
3. Commit your changes (`git commit -am 'Add some feature'`)
|
50
|
+
4. Push to the branch (`git push origin my-new-feature`)
|
51
|
+
5. Create a new Pull Request
|
52
|
+
|
53
|
+
## License
|
54
|
+
MIT
|
data/Rakefile
ADDED
data/lib/mmfont.rb
ADDED
@@ -0,0 +1,195 @@
|
|
1
|
+
require "mmfont/version"
|
2
|
+
|
3
|
+
# Mmfont module
|
4
|
+
module Mmfont
|
5
|
+
# Your code goes here...
|
6
|
+
class Converter
|
7
|
+
# Convert given text from unicode to zawgyi
|
8
|
+
def uni512zg1(input_text)
|
9
|
+
output_text = input_text
|
10
|
+
output_text = output_text.gsub(/\u104e\u1004\u103a\u1038/ ,"\u104e")
|
11
|
+
output_text = output_text.gsub(/\u102b\u103a/ ,"\u105a")
|
12
|
+
output_text = output_text.gsub(/\u102d\u1036/ ,"\u108e")
|
13
|
+
output_text = output_text.gsub(/\u103f/ ,"\u1086")
|
14
|
+
output_text = output_text.gsub(/(?<=\u102f)\u1037/ ,"\u1094")
|
15
|
+
output_text = output_text.gsub(/(?<=\u102f\u1036)\u1037/ ,"\u1094")
|
16
|
+
output_text = output_text.gsub(/(?<=\u1030)\u1037/ ,"\u1094")
|
17
|
+
output_text = output_text.gsub(/(?<=\u1030\u1036)\u1037/ ,"\u1094")
|
18
|
+
output_text = output_text.gsub(/(?<=\u1014)\u1037/ ,"\u1094")
|
19
|
+
output_text = output_text.gsub(/(?<=\u1014[\u103a\u1032])\u1037/ ,"\u1094")
|
20
|
+
output_text = output_text.gsub(/(?<=\u103b)\u1037/ ,"\u1095")
|
21
|
+
output_text = output_text.gsub(/(?<=\u103b[\u1032\u1036])\u1037/ ,"\u1095")
|
22
|
+
output_text = output_text.gsub(/(?<=\u103d)\u1037/ ,"\u1095")
|
23
|
+
output_text = output_text.gsub(/(?<=\u103d[\u1032])\u1037/ ,"\u1095")
|
24
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c\u103d])\u102f/ ,"\u1033")
|
25
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c\u103d][\u102d\u1036])\u102f/ ,"\u1033")
|
26
|
+
output_text = output_text.gsub(/(?<=(\u1039[\u1000-\u1021]))\u102f/ ,"\u1033")
|
27
|
+
output_text = output_text.gsub(/(?<=(\u1039[\u1000-\u1021])[\u102d\u1036])\u102f/ ,"\u1033")
|
28
|
+
output_text = output_text.gsub(/(?<=[\u100a\u100c\u1020\u1025\u1029])\u102f/ ,"\u1033")
|
29
|
+
output_text = output_text.gsub(/(?<=[\u100a\u100c\u1020\u1025\u1029][\u102d\u1036])\u102f/ ,"\u1033")
|
30
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c])\u1030/ ,"\u1034")
|
31
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103d])\u1030/ ,"\u1034")
|
32
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103e])\u1030/ ,"\u1034")
|
33
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u102d\u1036])\u1030/ ,"\u1034")
|
34
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103d][\u103e])\u1030/ ,"\u1034")
|
35
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103d][\u102d\u1036])\u1030/ ,"\u1034")
|
36
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103e][\u102d\u1036])\u1030/ ,"\u1034")
|
37
|
+
output_text = output_text.gsub(/(?<=[\u103b\u103c][\u103d][\u103e][\u102d\u1036])\u1030/ ,"\u1034")
|
38
|
+
output_text = output_text.gsub(/(?<=(\u1039[\u1000-\u1021]))\u1030/ ,"\u1034")
|
39
|
+
output_text = output_text.gsub(/(?<=(\u1039[\u1000-\u1021])[\u102d\u1036])\u1030/ ,"\u1034")
|
40
|
+
output_text = output_text.gsub(/(?<=[\u100a\u100c\u1020\u1025\u1029])\u1030/ ,"\u1034")
|
41
|
+
output_text = output_text.gsub(/(?<=[\u100a\u100c\u1020\u1025\u1029][\u102d\u1036])\u1030/ ,"\u1034")
|
42
|
+
output_text = output_text.gsub(/(?<=\u103c)\u103e/ ,"\u1087")
|
43
|
+
output_text = output_text.gsub(/\u1009(?=[\u103a])/ ,"\u1025")
|
44
|
+
output_text = output_text.gsub(/\u1009(?=\u1039[\u1000-\u1021])/ ,"\u1025")
|
45
|
+
output_text = output_text.gsub(/([\u1000-\u1021\u1029])((?:\u1039[\u1000-\u1021])?)((?:[\u103b-\u103e\u1087]*)?)\u1031/ ,"\u1031\\1\\2\\3")
|
46
|
+
output_text = output_text.gsub(/([\u1000-\u1021\u1029])((?:\u1039[\u1000-\u1021\u1000-\u1021])?)(\u103c)/ ,"\\3\\1\\2")
|
47
|
+
output_text = output_text.gsub(/\u1004\u103a\u1039/ ,"\u1064")
|
48
|
+
output_text = output_text.gsub(/(\u1064)((?:\u1031)?)((?:\u103c)?)([\u1000-\u1021])\u102d/ ,"\\2\\3\\4\u108b")
|
49
|
+
output_text = output_text.gsub(/(\u1064)((?:\u1031)?)((?:\u103c)?)([\u1000-\u1021])\u102e/ ,"\\2\\3\\4\u108c")
|
50
|
+
output_text = output_text.gsub(/(\u1064)((?:\u1031)?)((?:\u103c)?)([\u1000-\u1021])\u1036/ ,"\\2\\3\\4\u108d")
|
51
|
+
output_text = output_text.gsub(/(\u1064)((?:\u1031)?)((?:\u103c)?)([\u1000-\u1021])/ ,"\\2\\3\\4\u1064")
|
52
|
+
output_text = output_text.gsub(/\u100a(?=[\u1039\u102f\u1030])/ ,"\u106b")
|
53
|
+
output_text = output_text.gsub(/\u100a/ ,"\u100a")
|
54
|
+
output_text = output_text.gsub(/\u101b(?=[\u102f\u1030])/ ,"\u1090")
|
55
|
+
output_text = output_text.gsub(/\u101b/ ,"\u101b")
|
56
|
+
output_text = output_text.gsub(/\u1014(?=[\u1039\u103d\u103e\u102f\u1030])/ ,"\u108f")
|
57
|
+
output_text = output_text.gsub(/\u1014/ ,"\u1014")
|
58
|
+
output_text = output_text.gsub(/\u1039\u1000/ ,"\u1060")
|
59
|
+
output_text = output_text.gsub(/\u1039\u1001/ ,"\u1061")
|
60
|
+
output_text = output_text.gsub(/\u1039\u1002/ ,"\u1062")
|
61
|
+
output_text = output_text.gsub(/\u1039\u1003/ ,"\u1063")
|
62
|
+
output_text = output_text.gsub(/\u1039\u1005/ ,"\u1065")
|
63
|
+
output_text = output_text.gsub(/\u1039\u1006/ ,"\u1066")
|
64
|
+
output_text = output_text.gsub(/(?<=[\u1001\u1002\u1004\u1005\u1007\u1012\u1013\u108f\u1015\u1016\u1017\u1019\u101d])\u1066/ ,"\u1067")
|
65
|
+
output_text = output_text.gsub(/\u1039\u1007/ ,"\u1068")
|
66
|
+
output_text = output_text.gsub(/\u1039\u1008/ ,"\u1069")
|
67
|
+
output_text = output_text.gsub(/\u1039\u100f/ ,"\u1070")
|
68
|
+
output_text = output_text.gsub(/\u1039\u1010/ ,"\u1071")
|
69
|
+
output_text = output_text.gsub(/(?<=[\u1001\u1002\u1004\u1005\u1007\u1012\u1013\u108f\u1015\u1016\u1017\u1019\u101d])\u1071/ ,"\u1072")
|
70
|
+
output_text = output_text.gsub(/\u1039\u1011/ ,"\u1073")
|
71
|
+
output_text = output_text.gsub(/(?<=[\u1001\u1002\u1004\u1005\u1007\u1012\u1013\u108f\u1015\u1016\u1017\u1019\u101d])\u1073/ ,"\u1074")
|
72
|
+
output_text = output_text.gsub(/\u1039\u1012/ ,"\u1075")
|
73
|
+
output_text = output_text.gsub(/\u1039\u1013/ ,"\u1076")
|
74
|
+
output_text = output_text.gsub(/\u1039\u1014/ ,"\u1077")
|
75
|
+
output_text = output_text.gsub(/\u1039\u1015/ ,"\u1078")
|
76
|
+
output_text = output_text.gsub(/\u1039\u1016/ ,"\u1079")
|
77
|
+
output_text = output_text.gsub(/\u1039\u1017/ ,"\u107a")
|
78
|
+
output_text = output_text.gsub(/\u1039\u1018/ ,"\u107b")
|
79
|
+
output_text = output_text.gsub(/\u1039\u1019/ ,"\u107c")
|
80
|
+
output_text = output_text.gsub(/\u1039\u101c/ ,"\u1085")
|
81
|
+
output_text = output_text.gsub(/\u100f\u1039\u100d/ ,"\u1091")
|
82
|
+
output_text = output_text.gsub(/\u100b\u1039\u100c/ ,"\u1092")
|
83
|
+
output_text = output_text.gsub(/\u1039\u100c/ ,"\u106d")
|
84
|
+
output_text = output_text.gsub(/\u100b\u1039\u100b/ ,"\u1097")
|
85
|
+
output_text = output_text.gsub(/\u1039\u100b/ ,"\u106c")
|
86
|
+
output_text = output_text.gsub(/\u100e\u1039\u100d/ ,"\u106f")
|
87
|
+
output_text = output_text.gsub(/\u100d\u1039\u100d/ ,"\u106e")
|
88
|
+
output_text = output_text.gsub(/\u1009(?=\u103a)/ ,"\u1025")
|
89
|
+
output_text = output_text.gsub(/\u1025(?=[\u1039\u102f\u1030])/ ,"\u106a")
|
90
|
+
output_text = output_text.gsub(/\u1025/ ,"\u1025")
|
91
|
+
output_text = output_text.gsub(/\u103a/ ,"\u1039")
|
92
|
+
output_text = output_text.gsub(/\u103b\u103d\u103e/ ,"\u107d\u108a")
|
93
|
+
output_text = output_text.gsub(/\u103d\u103e/ ,"\u108a")
|
94
|
+
output_text = output_text.gsub(/\u103b/ ,"\u103a")
|
95
|
+
output_text = output_text.gsub(/\u103c/ ,"\u103b")
|
96
|
+
output_text = output_text.gsub(/\u103d/ ,"\u103c")
|
97
|
+
output_text = output_text.gsub(/\u103e/ ,"\u103d")
|
98
|
+
output_text = output_text.gsub(/\u103a(?=[\u103c\u103d\u108a])/ ,"\u107d")
|
99
|
+
output_text = output_text.gsub(/(?<=\u100a(?:[\u102d\u102e\u1036\u108b\u108c\u108d\u108e]))\u103d/ ,"\u1087")
|
100
|
+
output_text = output_text.gsub(/(?<=\u100a)\u103d/ ,"\u1087")
|
101
|
+
output_text = output_text.gsub(/\u103b(?=[\u1000\u1003\u1006\u100f\u1010\u1011\u1018\u101a\u101c\u101e\u101f\u1021])/ ,"\u107e")
|
102
|
+
output_text = output_text.gsub(/\u107e([\u1000-\u1021\u108f])(?=[\u102d\u102e\u1036\u108b\u108c\u108d\u108e])/ ,"\u1080\\1")
|
103
|
+
output_text = output_text.gsub(/\u107e([\u1000-\u1021\u108f])(?=[\u103c\u108a])/ ,"\u1082\\1")
|
104
|
+
output_text = output_text.gsub(/\u103b([\u1000-\u1021\u108f])(?=[\u102d\u102e\u1036\u108b\u108c\u108d\u108e])/ ,"\u107f\\1")
|
105
|
+
output_text = output_text.gsub(/\u103b([\u1000-\u1021\u108f])(?=[\u103c\u108a])/ ,"\u1081\\1")
|
106
|
+
output_text = output_text.gsub(/(?<=\u1014)\u1037/ ,"\u1094")
|
107
|
+
output_text = output_text.gsub(/(?<=\u1014[\u103a\u1032])\u1037/ ,"\u1094")
|
108
|
+
output_text = output_text.gsub(/(?<=\u1033)\u1094/ ,"\u1095")
|
109
|
+
output_text = output_text.gsub(/(?<=\u1033[\u1036])\u1094/ ,"\u1095")
|
110
|
+
output_text = output_text.gsub(/(?<=\u1034)\u1094/ ,"\u1095")
|
111
|
+
output_text = output_text.gsub(/(?<=\u1034[\u1036])\u1094/ ,"\u1095")
|
112
|
+
output_text = output_text.gsub(/(?<=[\u103c\u103d\u108a])\u1037/ ,"\u1095")
|
113
|
+
output_text = output_text.gsub(/(?<=[\u103c\u103d\u108a][\u1032])\u1037/ ,"\u1095")
|
114
|
+
# 'return' is not necessary but it's there to prevent 'end' from auto-indent
|
115
|
+
return output_text
|
116
|
+
end # end of uni to zg1
|
117
|
+
|
118
|
+
# Convert given text from zawgyi to unicode
|
119
|
+
def zg12uni51(input_text)
|
120
|
+
output_text = input_text
|
121
|
+
output_text = output_text.gsub(/\u106a/ ,"\u1009")
|
122
|
+
output_text = output_text.gsub(/\u1025(?=[\u1039\u102c])/ ,"\u1009")
|
123
|
+
output_text = output_text.gsub(/\u1025\u102e/ ,"\u1026")
|
124
|
+
output_text = output_text.gsub(/\u106b/ ,"\u100a")
|
125
|
+
output_text = output_text.gsub(/\u1090/ ,"\u101b")
|
126
|
+
output_text = output_text.gsub(/\u1040/ ,"\u1040")
|
127
|
+
output_text = output_text.gsub(/\u108f/ ,"\u1014")
|
128
|
+
output_text = output_text.gsub(/\u1012/ ,"\u1012")
|
129
|
+
output_text = output_text.gsub(/\u1013/ ,"\u1013")
|
130
|
+
output_text = output_text.gsub(/[\u103d\u1087]/ ,"\u103d")
|
131
|
+
output_text = output_text.gsub(/\u103c/ ,"\u103d")
|
132
|
+
output_text = output_text.gsub(/[\u103b\u107e\u107f\u1080\u1081\u1082\u1083\u1084]/ ,"\u103c")
|
133
|
+
output_text = output_text.gsub(/[\u103a\u107d]/ ,"\u103b")
|
134
|
+
output_text = output_text.gsub(/\u103d\u103b/ ,"\u103b\u103d")
|
135
|
+
output_text = output_text.gsub(/\u108a/ ,"\u103d\u103d")
|
136
|
+
output_text = output_text.gsub(/\u103d\u103d/ ,"\u103d\u103d")
|
137
|
+
output_text = output_text.gsub(/((?:\u1031)?)((?:\u103c)?)([\u1000-\u1021])\u1064/ ,"\u1064\\1\\2\\3")
|
138
|
+
output_text = output_text.gsub(/((?:\u1031)?)((?:\u103c)?)([\u1000-\u1021])\u108b/ ,"\u1064\\1\\2\\3\u102d")
|
139
|
+
output_text = output_text.gsub(/((?:\u1031)?)((?:\u103c)?)([\u1000-\u1021])\u108c/ ,"\u1064\\1\\2\\3\u102e")
|
140
|
+
output_text = output_text.gsub(/((?:\u1031)?)((?:\u103c)?)([\u1000-\u1021])\u108d/ ,"\u1064\\1\\2\\3\u1036")
|
141
|
+
output_text = output_text.gsub(/\u105a/ ,"\u102b\u103a")
|
142
|
+
output_text = output_text.gsub(/\u108e/ ,"\u102d\u1036")
|
143
|
+
output_text = output_text.gsub(/\u1033/ ,"\u102f")
|
144
|
+
output_text = output_text.gsub(/\u1034/ ,"\u1030")
|
145
|
+
output_text = output_text.gsub(/\u1088/ ,"\u103d\u102f")
|
146
|
+
output_text = output_text.gsub(/\u1089/ ,"\u103d\u1030")
|
147
|
+
output_text = output_text.gsub(/\u1039/ ,"\u103a")
|
148
|
+
output_text = output_text.gsub(/[\u1094\u1095]/ ,"\u1037")
|
149
|
+
output_text = output_text.gsub(/([\u1000-\u1021])([\u102c\u102d\u102e\u1032\u1036]){1,2}([\u1060\u1061\u1062\u1063\u1065\u1066\u1067\u1068\u1069\u1070\u1071\u1072\u1073\u1074\u1075\u1076\u1077\u1078\u1079\u107a\u107b\u107c\u1085])/ ,"\\1\\3\\2")
|
150
|
+
output_text = output_text.gsub(/\u1064/ ,"\u1004\u103a\u1039")
|
151
|
+
output_text = output_text.gsub(/\u104e/ ,"\u104e\u1004\u103a\u1038")
|
152
|
+
output_text = output_text.gsub(/\u1086/ ,"\u103f")
|
153
|
+
output_text = output_text.gsub(/\u1060/ ,"\u1039\u1000")
|
154
|
+
output_text = output_text.gsub(/\u1061/ ,"\u1039\u1001")
|
155
|
+
output_text = output_text.gsub(/\u1062/ ,"\u1039\u1002")
|
156
|
+
output_text = output_text.gsub(/\u1063/ ,"\u1039\u1003")
|
157
|
+
output_text = output_text.gsub(/\u1065/ ,"\u1039\u1005")
|
158
|
+
output_text = output_text.gsub(/[\u1066\u1067]/ ,"\u1039\u1006")
|
159
|
+
output_text = output_text.gsub(/\u1068/ ,"\u1039\u1007")
|
160
|
+
output_text = output_text.gsub(/\u1069/ ,"\u1039\u1008")
|
161
|
+
output_text = output_text.gsub(/\u106c/ ,"\u1039\u100b")
|
162
|
+
output_text = output_text.gsub(/\u1070/ ,"\u1039\u100f")
|
163
|
+
output_text = output_text.gsub(/[\u1071\u1072]/ ,"\u1039\u1010")
|
164
|
+
output_text = output_text.gsub(/[\u1073\u1074]/ ,"\u1039\u1011")
|
165
|
+
output_text = output_text.gsub(/\u1075/ ,"\u1039\u1012")
|
166
|
+
output_text = output_text.gsub(/\u1076/ ,"\u1039\u1013")
|
167
|
+
output_text = output_text.gsub(/\u1077/ ,"\u1039\u1014")
|
168
|
+
output_text = output_text.gsub(/\u1078/ ,"\u1039\u1015")
|
169
|
+
output_text = output_text.gsub(/\u1079/ ,"\u1039\u1016")
|
170
|
+
output_text = output_text.gsub(/\u107a/ ,"\u1039\u1017")
|
171
|
+
output_text = output_text.gsub(/\u107b/ ,"\u1039\u1018")
|
172
|
+
output_text = output_text.gsub(/\u107c/ ,"\u1039\u1019")
|
173
|
+
output_text = output_text.gsub(/\u1085/ ,"\u1039\u101c")
|
174
|
+
output_text = output_text.gsub(/\u106d/ ,"\u1039\u100c")
|
175
|
+
output_text = output_text.gsub(/\u1091/ ,"\u100f\u1039\u100d")
|
176
|
+
output_text = output_text.gsub(/\u1092/ ,"\u100b\u1039\u100c")
|
177
|
+
output_text = output_text.gsub(/\u1097/ ,"\u100b\u1039\u100b")
|
178
|
+
output_text = output_text.gsub(/\u106f/ ,"\u100e\u1039\u100d")
|
179
|
+
output_text = output_text.gsub(/\u106e/ ,"\u100d\u1039\u100d")
|
180
|
+
output_text = output_text.gsub(/(\u103c)([\u1000-\u1021])((?:\u1039[\u1000-\u1021])?)/ ,"\\2\\3\\1")
|
181
|
+
output_text = output_text.gsub(/(\u103d)(\u103d)([\u103b\u103c])/ ,"\\3\\2\\1")
|
182
|
+
output_text = output_text.gsub(/(\u103d)([\u103b\u103c])/ ,"\\2\\1")
|
183
|
+
output_text = output_text.gsub(/(\u103d)([\u103b\u103c])/ ,"\\2\\1")
|
184
|
+
output_text = output_text.gsub(/(?<=([\u1000-\u101c\u101e-\u102a\u102c\u102e-\u103d\u104c-\u109f]))(\u1040)(?=\s)?/ ,"\u101d")
|
185
|
+
output_text = output_text.gsub(/(?<=(\u101d))(\u1040)(?=\s)?/ ,"\u101d")
|
186
|
+
output_text = output_text.gsub(/(?<=([\u1000-\u101c\u101e-\u102a\u102c\u102e-\u103d\u104c-\u109f\s]))(\u1047)/ ,"\u101b")
|
187
|
+
output_text = output_text.gsub(/(\u1047)(?=[\u1000-\u101c\u101e-\u102a\u102c\u102e-\u103d\u104c-\u109f\s])/ ,"\u101b")
|
188
|
+
output_text = output_text.gsub(/((?:\u1031)?)([\u1000-\u1021])((?:\u1039[\u1000-\u1021])?)((?:[\u102d\u102e\u1032])?)([\u1036\u1037\u1038]{0,2})([\u103b-\u103d]{0,3})((?:[\u102f\u1030])?)([\u1036\u1037\u1038]{0,2})((?:[\u102d\u102e\u1032])?)/ ,"\\2\\3\\6\\1\\4\\9\\7\\5\\8")
|
189
|
+
output_text = output_text.gsub(/\u1036\u102f/ ,"\u102f\u1036")
|
190
|
+
output_text = output_text.gsub(/(\u103a)(\u1037)/ ,"\\2\\1")
|
191
|
+
# 'return' is not necessary but it's there to prevent 'end' from auto-indent
|
192
|
+
return output_text
|
193
|
+
end # end of zg1 to uni
|
194
|
+
end # end of class
|
195
|
+
end # end of module
|
data/mmfont.gemspec
ADDED
@@ -0,0 +1,23 @@
|
|
1
|
+
# coding: utf-8
|
2
|
+
lib = File.expand_path('../lib', __FILE__)
|
3
|
+
$LOAD_PATH.unshift(lib) unless $LOAD_PATH.include?(lib)
|
4
|
+
require 'mmfont/version'
|
5
|
+
|
6
|
+
Gem::Specification.new do |spec|
|
7
|
+
spec.name = "mmfont"
|
8
|
+
spec.version = Mmfont::VERSION
|
9
|
+
spec.authors = ["Ye Lin Aung"]
|
10
|
+
spec.email = ["me@yelinaung.com"]
|
11
|
+
spec.summary = %q{Myanmar font converter.}
|
12
|
+
spec.description = %q{Myanmar font toolkit in Ruby.}
|
13
|
+
spec.homepage = ""
|
14
|
+
spec.license = "MIT"
|
15
|
+
|
16
|
+
spec.files = `git ls-files -z`.split("\x0")
|
17
|
+
spec.executables = spec.files.grep(%r{^bin/}) { |f| File.basename(f) }
|
18
|
+
spec.test_files = spec.files.grep(%r{^(test|spec|features)/})
|
19
|
+
spec.require_paths = ["lib"]
|
20
|
+
|
21
|
+
spec.add_development_dependency "bundler", "~> 1.6"
|
22
|
+
spec.add_development_dependency "rake", "~> 10.0"
|
23
|
+
end
|
data/test/mmfont_test.rb
ADDED
@@ -0,0 +1,14 @@
|
|
1
|
+
require "minitest/autorun"
|
2
|
+
require "mmfont"
|
3
|
+
|
4
|
+
class MmfontTest < MiniTest::Unit::TestCase
|
5
|
+
# unicode converting test
|
6
|
+
def test_convert_uni512zg1
|
7
|
+
assert_equal "မဂၤလာပါ", Mmfont::Converter.new.uni512zg1("မင်္ဂလာပါ")
|
8
|
+
end
|
9
|
+
|
10
|
+
# zawgyi converting test
|
11
|
+
def test_convert_zg12uni51
|
12
|
+
assert_equal "မင်္ဂလာပါ", Mmfont::Converter.new.zg12uni51("မဂၤလာပါ")
|
13
|
+
end
|
14
|
+
end
|
metadata
ADDED
@@ -0,0 +1,82 @@
|
|
1
|
+
--- !ruby/object:Gem::Specification
|
2
|
+
name: mmfont
|
3
|
+
version: !ruby/object:Gem::Version
|
4
|
+
version: 1.0.0
|
5
|
+
platform: ruby
|
6
|
+
authors:
|
7
|
+
- Ye Lin Aung
|
8
|
+
autorequire:
|
9
|
+
bindir: bin
|
10
|
+
cert_chain: []
|
11
|
+
date: 2014-07-26 00:00:00.000000000 Z
|
12
|
+
dependencies:
|
13
|
+
- !ruby/object:Gem::Dependency
|
14
|
+
name: bundler
|
15
|
+
requirement: !ruby/object:Gem::Requirement
|
16
|
+
requirements:
|
17
|
+
- - "~>"
|
18
|
+
- !ruby/object:Gem::Version
|
19
|
+
version: '1.6'
|
20
|
+
type: :development
|
21
|
+
prerelease: false
|
22
|
+
version_requirements: !ruby/object:Gem::Requirement
|
23
|
+
requirements:
|
24
|
+
- - "~>"
|
25
|
+
- !ruby/object:Gem::Version
|
26
|
+
version: '1.6'
|
27
|
+
- !ruby/object:Gem::Dependency
|
28
|
+
name: rake
|
29
|
+
requirement: !ruby/object:Gem::Requirement
|
30
|
+
requirements:
|
31
|
+
- - "~>"
|
32
|
+
- !ruby/object:Gem::Version
|
33
|
+
version: '10.0'
|
34
|
+
type: :development
|
35
|
+
prerelease: false
|
36
|
+
version_requirements: !ruby/object:Gem::Requirement
|
37
|
+
requirements:
|
38
|
+
- - "~>"
|
39
|
+
- !ruby/object:Gem::Version
|
40
|
+
version: '10.0'
|
41
|
+
description: Myanmar font toolkit in Ruby.
|
42
|
+
email:
|
43
|
+
- me@yelinaung.com
|
44
|
+
executables: []
|
45
|
+
extensions: []
|
46
|
+
extra_rdoc_files: []
|
47
|
+
files:
|
48
|
+
- ".gitignore"
|
49
|
+
- Gemfile
|
50
|
+
- LICENSE.txt
|
51
|
+
- README.md
|
52
|
+
- Rakefile
|
53
|
+
- lib/mmfont.rb
|
54
|
+
- lib/mmfont/version.rb
|
55
|
+
- mmfont.gemspec
|
56
|
+
- test/mmfont_test.rb
|
57
|
+
homepage: ''
|
58
|
+
licenses:
|
59
|
+
- MIT
|
60
|
+
metadata: {}
|
61
|
+
post_install_message:
|
62
|
+
rdoc_options: []
|
63
|
+
require_paths:
|
64
|
+
- lib
|
65
|
+
required_ruby_version: !ruby/object:Gem::Requirement
|
66
|
+
requirements:
|
67
|
+
- - ">="
|
68
|
+
- !ruby/object:Gem::Version
|
69
|
+
version: '0'
|
70
|
+
required_rubygems_version: !ruby/object:Gem::Requirement
|
71
|
+
requirements:
|
72
|
+
- - ">="
|
73
|
+
- !ruby/object:Gem::Version
|
74
|
+
version: '0'
|
75
|
+
requirements: []
|
76
|
+
rubyforge_project:
|
77
|
+
rubygems_version: 2.2.2
|
78
|
+
signing_key:
|
79
|
+
specification_version: 4
|
80
|
+
summary: Myanmar font converter.
|
81
|
+
test_files:
|
82
|
+
- test/mmfont_test.rb
|