interscript 0.1.1 → 0.1.2

Sign up to get free protection for your applications and to get access to all the features.
@@ -0,0 +1,105 @@
1
+ ---
2
+ authority_id: icao
3
+ id: 9303
4
+ language: per
5
+ source_script: Arab
6
+ destination_script: Latn
7
+ name: ICAO Doc 9303 Machine Readable Travel Documents Part 3 -- Persian Arabic to Latin
8
+ url: https://www.icao.int/publications/pages/publication.aspx?docnum=9303
9
+ creation_date: 2015
10
+ description: |
11
+ Part 3 defines specifications that are common to TD1, TD2 and TD3
12
+ size machine readable travel documents (MRTDs) including those
13
+ necessary for global interoperability using visual inspection and
14
+ machine readable (optical character recognition) means.
15
+
16
+ Since only Latin-alphabet characters are allowed in the VIZ, if
17
+ mandatory data elements are in a national language that does not use
18
+ the Latin alphabet, a transcription or transliteration shall also be
19
+ provided.
20
+
21
+ This document defines the transliteration mappings used to produce
22
+ this transcription or transliteration.
23
+ tests:
24
+ - source:
25
+ expected:
26
+ map:
27
+ # https://www.icao.int/publications/Documents/9303_p3_cons_en.pdf
28
+ characters:
29
+
30
+ "\u0027": "" # '
31
+ "\u0621": "XE" # ء
32
+ "\u0622": "XAA" # آ
33
+ "\u0623": "XAE" # أ
34
+ "\u0624": "U" # ؤ
35
+ "\u0625": "I" # إ
36
+ "\u0626": "XI" # ئ
37
+ "\u0627": "A" # ا
38
+ "\u0628": "B" # ب
39
+ "\u0629": "P" # ة
40
+ "\u062A": "T" # ت
41
+ "\u062B": "XTH" # ث
42
+ "\u062C": "J" # ج
43
+ "\u062D": "XH" # ح
44
+ "\u062E": "XKH" # خ
45
+ "\u062F": "D" # د
46
+ "\u0630": "XDH" # ذ
47
+ "\u0631": "R" # ر
48
+ "\u0632": "Z" # ز
49
+ "\u0633": "S" # س
50
+ "\u0634": "XSH" # ش
51
+ "\u0635": "XSS" # ص
52
+ "\u0636": "XDZ" # ض
53
+ "\u0637": "XTT" # ط
54
+ "\u0638": "XZZ" # ظ
55
+ "\u0639": "E" # ع
56
+ "\u063A": "G" # غ
57
+ "\u0641": "F" # ف
58
+ "\u0642": "Q" # ق
59
+ "\u0643": "K" # ك
60
+ "\u0644": "L" # ل
61
+ "\u0645": "M" # م
62
+ "\u0646": "N" # ن
63
+ "\u0647": "H" # ه
64
+ "\u0648": "W" # و
65
+ "\u0649": "XAY" # ى
66
+ "\u064A": "Y" # ي
67
+ "\u064B": "F" # ً
68
+ "\u064C": "N" # ٌ
69
+ "\u064D": "K" # ٍ
70
+ "\u064E": "A" # َ
71
+ "\u064F": "U" # ُ
72
+ "\u0650": "I" # ِ
73
+ "\u0652": "O" # ْ
74
+ "\u0670": "" # ٰ (superscript alef)
75
+ "\u0671": "XXA" # ٱ
76
+ "\u0679": "XXT" # ٹ
77
+ "\u067C": "XRT" # ټ
78
+ "\u067E": "P" # پ
79
+ "\u0681": "XKE" # ځ
80
+ "\u0685": "XXH" # څ
81
+ "\u0686": "XC" # چ
82
+ "\u0688": "XXD" # ڈ
83
+ "\u0689": "XDR" # ډ
84
+ "\u0691": "XXR" # ڑ
85
+ "\u0693": "XRR" # ړ
86
+ "\u0696": "XRX" # ږ
87
+ "\u0698": "XJ" # ژ
88
+ "\u069A": "XXS" # ښ
89
+ "\u06A9": "XKK" # ک
90
+ "\u06AB": "XXK" # ګ
91
+ "\u06AD": "XNG" # ڭ
92
+ "\u06AF": "XGG" # گ
93
+ "\u06BA": "XNN" # ں
94
+ "\u06BC": "XXN" # ڼ
95
+ "\u06BE": "XDO" # ھ
96
+ "\u06C0": "XYH" # ۀ
97
+ "\u06C1": "XXG" # ہ
98
+ "\u06C2": "XGE" # ۂ
99
+ "\u06C3": "XTG" # ۃ
100
+ "\u06CC": "XYA" # ی
101
+ "\u06CD": "XXY" # ۍ
102
+ "\u06D0": "Y" # ې
103
+ "\u06D2": "XYB" # ے
104
+ "\u06D3": "XBE" # ۓ
105
+
@@ -0,0 +1,119 @@
1
+ ---
2
+ authority_id: icao
3
+ id: 9303
4
+ language: rus
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: ICAO Doc 9303 Machine Readable Travel Documents Part 3 -- Russian Cyrillic to Latin
8
+ url: https://www.icao.int/publications/pages/publication.aspx?docnum=9303
9
+ creation_date: 2015
10
+ description: |
11
+ Part 3 defines specifications that are common to TD1, TD2 and TD3
12
+ size machine readable travel documents (MRTDs) including those
13
+ necessary for global interoperability using visual inspection and
14
+ machine readable (optical character recognition) means.
15
+
16
+ Since only Latin-alphabet characters are allowed in the VIZ, if
17
+ mandatory data elements are in a national language that does not use
18
+ the Latin alphabet, a transcription or transliteration shall also be
19
+ provided.
20
+
21
+ This document defines the transliteration mappings used to produce
22
+ this transcription or transliteration.
23
+ tests:
24
+ - source:
25
+ expected:
26
+ map:
27
+ # https://www.icao.int/publications/Documents/9303_p3_cons_en.pdf
28
+ characters:
29
+ "\u0027": "" # '
30
+ "\u0410": "A" # А
31
+ "\u0411": "B" # Б
32
+ "\u0414": "D" # Д
33
+ "\u0401": "E" # Ё
34
+ "\u0415": "E" # Е
35
+ "\u042D": "E" # Э
36
+ "\u0424": "F" # Ф
37
+ "\u0413": "G" # Г
38
+ "\u0418": "I" # И
39
+ "\u0419": "I" # Й
40
+ "\u041A": "K" # К
41
+ "\u041B": "L" # Л
42
+ "\u041C": "M" # М
43
+ "\u041D": "N" # Н
44
+ "\u041E": "O" # О
45
+ "\u041F": "P" # П
46
+ "\u0420": "R" # Р
47
+ "\u0421": "S" # С
48
+ "\u0422": "T" # Т
49
+ "\u0423": "U" # У
50
+ "\u0412": "V" # В
51
+ "\u042B": "Y" # Ы
52
+ "\u0417": "Z" # З
53
+ "\u0427": "CH" # Ч
54
+ "\u042F": "IA" # Я
55
+ "\u042E": "IU" # Ю
56
+ "\u0425": "KH" # Х
57
+ "\u0428": "SH" # Ш
58
+ "\u0429": "SHCH" # Щ
59
+ "\u0426": "TS" # Ц
60
+ "\u0416": "ZH" # Ж
61
+ "\u0490": "G" # Ґ
62
+ "\u040E": "U" # Ў
63
+ "\u046A": "U" # Ѫ
64
+ "\u0402": "D" # Ђ
65
+ "\u0405": "DZ" # Ѕ
66
+ "\u0408": "J" # Ј
67
+ "\u0409": "LJ" # Љ
68
+ "\u040A": "NJ" # Њ
69
+ "\u04BA": "C" # Һ
70
+ "\u040F": "DZ" # Џ
71
+ "\u0404": "IE" # Є
72
+ "\u0407": "I" # Ї
73
+ "\u0403": "G" # Ѓ
74
+
75
+ "\u0430": "a" # а
76
+ "\u0431": "b" # б
77
+ "\u0434": "d" # д
78
+ "\u0451": "e" # ё
79
+ "\u0435": "e" # е
80
+ "\u044D": "e" # э
81
+ "\u0444": "f" # ф
82
+ "\u0433": "g" # г
83
+ "\u0438": "i" # и
84
+ "\u0439": "i" # й
85
+ "\u043A": "k" # к
86
+ "\u043B": "l" # л
87
+ "\u043C": "m" # м
88
+ "\u043D": "n" # н
89
+ "\u043E": "o" # о
90
+ "\u043F": "p" # п
91
+ "\u0440": "r" # р
92
+ "\u0441": "s" # с
93
+ "\u0442": "t" # т
94
+ "\u0443": "u" # у
95
+ "\u0432": "v" # в
96
+ "\u044B": "y" # ы
97
+ "\u0437": "z" # з
98
+ "\u0447": "ch" # ч
99
+ "\u044F": "ia" # я
100
+ "\u044E": "iu" # ю
101
+ "\u0445": "kh" # х
102
+ "\u0448": "sh" # ш
103
+ "\u0449": "shch" # щ
104
+ "\u0446": "ts" # ц
105
+ "\u0436": "zh" # ж
106
+ "\u0491": "g" # ґ
107
+ "\u045E": "u" # ў
108
+ "\u046B": "u" # ѫ
109
+ "\u0452": "d" # ђ
110
+ "\u0455": "dz" # ѕ
111
+ "\u0458": "j" # ј
112
+ "\u0459": "lj" # љ
113
+ "\u045A": "nj" # њ
114
+ "\u04BB": "c" # һ
115
+ "\u045F": "dz" # џ
116
+ "\u0454": "ie" # є
117
+ "\u0457": "i" # ї
118
+ "\u0453": "g" # ѓ
119
+
@@ -0,0 +1,118 @@
1
+ ---
2
+ authority_id: icao
3
+ id: 9303
4
+ language: srp
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: ICAO Doc 9303 Machine Readable Travel Documents Part 3 -- Serbian Cyrillic to Latin
8
+ url: https://www.icao.int/publications/pages/publication.aspx?docnum=9303
9
+ creation_date: 2015
10
+ description: |
11
+ Part 3 defines specifications that are common to TD1, TD2 and TD3
12
+ size machine readable travel documents (MRTDs) including those
13
+ necessary for global interoperability using visual inspection and
14
+ machine readable (optical character recognition) means.
15
+
16
+ Since only Latin-alphabet characters are allowed in the VIZ, if
17
+ mandatory data elements are in a national language that does not use
18
+ the Latin alphabet, a transcription or transliteration shall also be
19
+ provided.
20
+
21
+ This document defines the transliteration mappings used to produce
22
+ this transcription or transliteration.
23
+ tests:
24
+ - source:
25
+ expected:
26
+ map:
27
+ # https://www.icao.int/publications/Documents/9303_p3_cons_en.pdf
28
+ characters:
29
+ "\u0027": "" # '
30
+ "\u0410": "A" # А
31
+ "\u0411": "B" # Б
32
+ "\u0414": "D" # Д
33
+ "\u0401": "E" # Ё
34
+ "\u0415": "E" # Е
35
+ "\u042D": "E" # Э
36
+ "\u0424": "F" # Ф
37
+ "\u0413": "H" # Г
38
+ "\u0418": "I" # И
39
+ "\u0419": "I" # Й
40
+ "\u041A": "K" # К
41
+ "\u041B": "L" # Л
42
+ "\u041C": "M" # М
43
+ "\u041D": "N" # Н
44
+ "\u041E": "O" # О
45
+ "\u041F": "P" # П
46
+ "\u0420": "R" # Р
47
+ "\u0421": "S" # С
48
+ "\u0422": "T" # Т
49
+ "\u0423": "U" # У
50
+ "\u0412": "V" # В
51
+ "\u042B": "Y" # Ы
52
+ "\u0417": "Z" # З
53
+ "\u0427": "C" # Ч
54
+ "\u042F": "IA" # Я
55
+ "\u042E": "IU" # Ю
56
+ "\u0425": "H" # Х
57
+ "\u0428": "S" # Ш
58
+ "\u0429": "SHCH" # Щ
59
+ "\u0426": "C" # Ц
60
+ "\u0416": "Z" # Ж
61
+ "\u0490": "G" # Ґ
62
+ "\u040E": "U" # Ў
63
+ "\u046A": "U" # Ѫ
64
+ "\u0402": "D" # Ђ
65
+ "\u0405": "DZ" # Ѕ
66
+ "\u0408": "J" # Ј
67
+ "\u0409": "LJ" # Љ
68
+ "\u040A": "NJ" # Њ
69
+ "\u04BA": "C" # Һ
70
+ "\u040F": "DZ" # Џ
71
+ "\u0404": "IE" # Є
72
+ "\u0407": "I" # Ї
73
+ "\u0403": "G" # Ѓ
74
+
75
+ "\u0430": "a" # а
76
+ "\u0431": "b" # б
77
+ "\u0434": "d" # д
78
+ "\u0451": "e" # ё
79
+ "\u0435": "e" # е
80
+ "\u044D": "e" # э
81
+ "\u0444": "f" # ф
82
+ "\u0433": "h" # г
83
+ "\u0438": "i" # и
84
+ "\u0439": "i" # й
85
+ "\u043A": "k" # к
86
+ "\u043B": "l" # л
87
+ "\u043C": "m" # м
88
+ "\u043D": "n" # н
89
+ "\u043E": "o" # о
90
+ "\u043F": "p" # п
91
+ "\u0440": "r" # р
92
+ "\u0441": "s" # с
93
+ "\u0442": "t" # т
94
+ "\u0443": "u" # у
95
+ "\u0432": "v" # в
96
+ "\u044B": "y" # ы
97
+ "\u0437": "z" # з
98
+ "\u0447": "c" # ч
99
+ "\u044F": "ia" # я
100
+ "\u044E": "iu" # ю
101
+ "\u0445": "h" # х
102
+ "\u0448": "s" # ш
103
+ "\u0449": "shch" # щ
104
+ "\u0446": "c" # ц
105
+ "\u0436": "z" # ж
106
+ "\u0491": "g" # ґ
107
+ "\u045E": "u" # ў
108
+ "\u046B": "u" # ѫ
109
+ "\u0452": "d" # ђ
110
+ "\u0455": "dz" # ѕ
111
+ "\u0458": "j" # ј
112
+ "\u0459": "lj" # љ
113
+ "\u045A": "nj" # њ
114
+ "\u04BB": "c" # һ
115
+ "\u045F": "dz" # џ
116
+ "\u0454": "ie" # є
117
+ "\u0457": "i" # ї
118
+ "\u0453": "g" # ѓ
@@ -0,0 +1,121 @@
1
+ ---
2
+ authority_id: icao
3
+ id: 9303
4
+ language: ukr
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: ICAO Doc 9303 Machine Readable Travel Documents Part 3 -- Ukrainian Cyrillic to Latin
8
+ url: https://www.icao.int/publications/pages/publication.aspx?docnum=9303
9
+ creation_date: 2015
10
+ description: |
11
+ Part 3 defines specifications that are common to TD1, TD2 and TD3
12
+ size machine readable travel documents (MRTDs) including those
13
+ necessary for global interoperability using visual inspection and
14
+ machine readable (optical character recognition) means.
15
+
16
+ Since only Latin-alphabet characters are allowed in the VIZ, if
17
+ mandatory data elements are in a national language that does not use
18
+ the Latin alphabet, a transcription or transliteration shall also be
19
+ provided.
20
+
21
+ This document defines the transliteration mappings used to produce
22
+ this transcription or transliteration.
23
+ tests:
24
+ - source:
25
+ expected:
26
+
27
+ map:
28
+ # https://www.icao.int/publications/Documents/9303_p3_cons_en.pdf
29
+ characters:
30
+ "\u0027": "" # '
31
+ "\u0410": "A" # А
32
+ "\u0411": "B" # Б
33
+ "\u0414": "D" # Д
34
+ "\u0401": "E" # Ё
35
+ "\u0415": "E" # Е
36
+ "\u042D": "E" # Э
37
+ "\u0424": "F" # Ф
38
+ "\u0413": "G" # Г
39
+ "\u0418": "Y" # И
40
+ "\u0419": "I" # Й
41
+ "\u041A": "K" # К
42
+ "\u041B": "L" # Л
43
+ "\u041C": "M" # М
44
+ "\u041D": "N" # Н
45
+ "\u041E": "O" # О
46
+ "\u041F": "P" # П
47
+ "\u0420": "R" # Р
48
+ "\u0421": "S" # С
49
+ "\u0422": "T" # Т
50
+ "\u0423": "U" # У
51
+ "\u0412": "V" # В
52
+ "\u042B": "Y" # Ы
53
+ "\u0417": "Z" # З
54
+ "\u0427": "CH" # Ч
55
+ "\u042F": "IA" # Я
56
+ "\u042E": "IU" # Ю
57
+ "\u0425": "KH" # Х
58
+ "\u0428": "SH" # Ш
59
+ "\u0429": "SHCH" # Щ
60
+ "\u0426": "TS" # Ц
61
+ "\u0416": "ZH" # Ж
62
+ "\u0490": "G" # Ґ
63
+ "\u040E": "U" # Ў
64
+ "\u046A": "U" # Ѫ
65
+ "\u0402": "D" # Ђ
66
+ "\u0405": "DZ" # Ѕ
67
+ "\u0408": "J" # Ј
68
+ "\u0409": "LJ" # Љ
69
+ "\u040A": "NJ" # Њ
70
+ "\u04BA": "C" # Һ
71
+ "\u040F": "DZ" # Џ
72
+ "\u0404": "IE" # Є
73
+ "\u0407": "I" # Ї
74
+ "\u0403": "G" # Ѓ
75
+ "\u0406": "I" # І
76
+
77
+ "\u0430": "a" # а
78
+ "\u0431": "b" # б
79
+ "\u0434": "d" # д
80
+ "\u0451": "e" # ё
81
+ "\u0435": "e" # е
82
+ "\u044D": "e" # э
83
+ "\u0444": "f" # ф
84
+ "\u0433": "g" # г
85
+ "\u0438": "y" # и
86
+ "\u0439": "i" # й
87
+ "\u043A": "k" # к
88
+ "\u043B": "l" # л
89
+ "\u043C": "m" # м
90
+ "\u043D": "n" # н
91
+ "\u043E": "o" # о
92
+ "\u043F": "p" # п
93
+ "\u0440": "r" # р
94
+ "\u0441": "s" # с
95
+ "\u0442": "t" # т
96
+ "\u0443": "u" # у
97
+ "\u0432": "v" # в
98
+ "\u044B": "y" # ы
99
+ "\u0437": "z" # з
100
+ "\u0447": "ch" # ч
101
+ "\u044F": "ia" # я
102
+ "\u044E": "iu" # ю
103
+ "\u0445": "kh" # х
104
+ "\u0448": "sh" # ш
105
+ "\u0449": "shch" # щ
106
+ "\u0446": "ts" # ц
107
+ "\u0436": "zh" # ж
108
+ "\u0491": "g" # ґ
109
+ "\u045E": "u" # ў
110
+ "\u046B": "u" # ѫ
111
+ "\u0452": "d" # ђ
112
+ "\u0455": "dz" # ѕ
113
+ "\u0458": "j" # ј
114
+ "\u0459": "lj" # љ
115
+ "\u045A": "nj" # њ
116
+ "\u04BB": "c" # һ
117
+ "\u045F": "dz" # џ
118
+ "\u0454": "ie" # є
119
+ "\u0457": "i" # ї
120
+ "\u0453": "g" # ѓ
121
+