text-hyphen 1.4.1 → 1.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (79) hide show
  1. checksums.yaml +7 -0
  2. data/.standard.yml +5 -0
  3. data/Code-of-Conduct.md +73 -0
  4. data/Contributing.md +68 -0
  5. data/History.md +139 -0
  6. data/Licence.md +159 -0
  7. data/Manifest.txt +12 -5
  8. data/README.md +81 -0
  9. data/Rakefile +68 -19
  10. data/bin/ruby-hyphen +0 -0
  11. data/lib/text/hyphen/language/1.8/de1.rb +1307 -571
  12. data/lib/text/hyphen/language/1.8/en_us.rb +412 -453
  13. data/lib/text/hyphen/language/1.8/fr.rb +128 -334
  14. data/lib/text/hyphen/language/1.8/la.rb +1 -0
  15. data/lib/text/hyphen/language/1.8/lt.rb +115 -0
  16. data/lib/text/hyphen/language/1.8/pt.rb +2 -1
  17. data/lib/text/hyphen/language/1.8/sk.rb +277 -0
  18. data/lib/text/hyphen/language/1.9/ca.rb +2 -1
  19. data/lib/text/hyphen/language/1.9/cs.rb +2 -1
  20. data/lib/text/hyphen/language/1.9/da.rb +2 -1
  21. data/lib/text/hyphen/language/1.9/de1.rb +1382 -646
  22. data/lib/text/hyphen/language/1.9/de2.rb +110 -109
  23. data/lib/text/hyphen/language/1.9/en_uk.rb +2 -1
  24. data/lib/text/hyphen/language/1.9/en_us.rb +412 -454
  25. data/lib/text/hyphen/language/1.9/es.rb +2 -1
  26. data/lib/text/hyphen/language/1.9/et.rb +6 -5
  27. data/lib/text/hyphen/language/1.9/eu.rb +4 -3
  28. data/lib/text/hyphen/language/1.9/fi.rb +3 -2
  29. data/lib/text/hyphen/language/1.9/fr.rb +136 -343
  30. data/lib/text/hyphen/language/1.9/ga.rb +27 -26
  31. data/lib/text/hyphen/language/1.9/hr.rb +6 -5
  32. data/lib/text/hyphen/language/1.9/hsb.rb +3 -2
  33. data/lib/text/hyphen/language/1.9/hu1.rb +3 -2
  34. data/lib/text/hyphen/language/1.9/hu2.rb +5 -4
  35. data/lib/text/hyphen/language/1.9/ia.rb +2 -1
  36. data/lib/text/hyphen/language/1.9/id.rb +8 -7
  37. data/lib/text/hyphen/language/1.9/is.rb +2 -1
  38. data/lib/text/hyphen/language/1.9/it.rb +74 -74
  39. data/lib/text/hyphen/language/1.9/la.rb +54 -53
  40. data/lib/text/hyphen/language/1.9/lt.rb +116 -0
  41. data/lib/text/hyphen/language/1.9/mn.rb +7 -6
  42. data/lib/text/hyphen/language/1.9/nl.rb +2 -1
  43. data/lib/text/hyphen/language/1.9/no1.rb +3 -2
  44. data/lib/text/hyphen/language/1.9/no2.rb +3 -2
  45. data/lib/text/hyphen/language/1.9/pl.rb +2 -1
  46. data/lib/text/hyphen/language/1.9/pt.rb +3 -2
  47. data/lib/text/hyphen/language/1.9/ru.rb +2 -1
  48. data/lib/text/hyphen/language/1.9/sk.rb +280 -0
  49. data/lib/text/hyphen/language/1.9/sv.rb +4 -3
  50. data/lib/text/hyphen/language/cs.rb +1 -1
  51. data/lib/text/hyphen/language/de.rb +2 -1
  52. data/lib/text/hyphen/language/de1.rb +1 -1
  53. data/lib/text/hyphen/language/de2.rb +1 -1
  54. data/lib/text/hyphen/language/en_us.rb +1 -1
  55. data/lib/text/hyphen/language/eu.rb +1 -1
  56. data/lib/text/hyphen/language/fr.rb +1 -1
  57. data/lib/text/hyphen/language/hu.rb +1 -1
  58. data/lib/text/hyphen/language/hu1.rb +1 -1
  59. data/lib/text/hyphen/language/hu2.rb +1 -1
  60. data/lib/text/hyphen/language/is.rb +1 -1
  61. data/lib/text/hyphen/language/lt.rb +4 -0
  62. data/lib/text/hyphen/language/ms.rb +3 -3
  63. data/lib/text/hyphen/language/nl.rb +1 -1
  64. data/lib/text/hyphen/language/no.rb +1 -1
  65. data/lib/text/hyphen/language/sk.rb +4 -0
  66. data/lib/text/hyphen/language.rb +45 -45
  67. data/lib/text/hyphen.rb +139 -97
  68. data/lib/text-hyphen.rb +1 -1
  69. data/test/data/bug_9807_latin1.rb +2 -2
  70. data/test/data/bug_9807_utf-8.rb +1 -1
  71. data/test/test_bugs.rb +14 -13
  72. data/test/test_text_hyphen.rb +31 -21
  73. metadata +146 -96
  74. data/.autotest +0 -23
  75. data/.gemtest +0 -0
  76. data/History.rdoc +0 -99
  77. data/License.rdoc +0 -159
  78. data/README.rdoc +0 -95
  79. data/text-hyphen.gemspec +0 -51
@@ -1,4 +1,5 @@
1
1
  # -*- encoding: utf-8 -*-
2
+
2
3
  # Hyphenation patterns for Text::Hyphen in Ruby: Irish Gaelic
3
4
  # Converted from the TeX hyphenation/gahyph.tex file, by Kevin P. Scannell
4
5
  # <scannell@slu.edu> (2004).
@@ -13,37 +14,37 @@
13
14
  # modify it under the terms of the GNU General Public License
14
15
  # as published by the Free Software Foundation; either version 2
15
16
  # of the License, or (at your option) any later version.
16
- #
17
+ #
17
18
  # This program is distributed in the hope that it will be useful,
18
19
  # but WITHOUT ANY WARRANTY; without even the implied warranty of
19
20
  # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
20
21
  # GNU General Public License for more details.
21
- #
22
- #%% ====================================================================
23
- #%% @TeX-hyphen-file{
24
- #%% author = "Kevin P. Scannell",
25
- #%% version = "1.0",
26
- #%% date = "23 January 2004",
27
- #%% time = "15:46:12 CST",
28
- #%% filename = "gahyph.tex",
29
- #%% email = "scannell@slu.edu",
30
- #%% codetable = "ISO/ASCII",
31
- #%% keywords = "TeX, hyphen, Irish, Gaeilge",
32
- #%% supported = "yes",
33
- #%% abstract = "Hyphenation patterns for Irish (Gaeilge)",
34
- #%% docstring = "This file contains the hyphenation patterns
35
- #%% for the Irish language",
36
- #%% }
37
- #%% ====================================================================
22
+ #
23
+ # %% ====================================================================
24
+ # %% @TeX-hyphen-file{
25
+ # %% author = "Kevin P. Scannell",
26
+ # %% version = "1.0",
27
+ # %% date = "23 January 2004",
28
+ # %% time = "15:46:12 CST",
29
+ # %% filename = "gahyph.tex",
30
+ # %% email = "scannell@slu.edu",
31
+ # %% codetable = "ISO/ASCII",
32
+ # %% keywords = "TeX, hyphen, Irish, Gaeilge",
33
+ # %% supported = "yes",
34
+ # %% abstract = "Hyphenation patterns for Irish (Gaeilge)",
35
+ # %% docstring = "This file contains the hyphenation patterns
36
+ # %% for the Irish language",
37
+ # %% }
38
+ # %% ====================================================================
38
39
  #
39
40
  # See the web page http://borel.slu.edu/fleiscin/index.html
40
41
  # for more information on how these patterns were generated.
41
- #
42
- # Please report incorrect hyphenations to the author at the
42
+ #
43
+ # Please report incorrect hyphenations to the author at the
43
44
  # email address above.
44
- #message{Hyphenation patterns `gahyph.tex' Version 1.0 <2004/01/22>}
45
+ # message{Hyphenation patterns `gahyph.tex' Version 1.0 <2004/01/22>}
45
46
  #++
46
- require 'text/hyphen/language'
47
+ require "text/hyphen/language"
47
48
 
48
49
  Text::Hyphen::Language::GA = Text::Hyphen::Language.new do |lang|
49
50
  lang.encoding "UTF-8"
@@ -593,10 +594,10 @@ veant5 vear3 vearn6 3v4ei veil5b v3eo véar6 véis5 véist6 5v6ial 3v4ini vios5
593
594
  vir5 virg6 v6íc v3la 3vol4 volt3 vuít5 x3ac x5ai x5aí
594
595
  PATTERNS
595
596
 
596
- # See the web page cited above for descriptions of these ambiguities.
597
- # These cover capitalized versions, *including* eclipsed capitals
598
- # 2004-01-25: 46 of them coming from 23 classes modulo
599
- # lenition/eclipsis
597
+ # See the web page cited above for descriptions of these ambiguities.
598
+ # These cover capitalized versions, *including* eclipsed capitals
599
+ # 2004-01-25: 46 of them coming from 23 classes modulo
600
+ # lenition/eclipsis
600
601
  lang.exceptions <<-EXCEPTIONS
601
602
  bhrachtaí mbrachtaí cháintí gcáintí cheiltí gceiltí chistí gcistí choirtí
602
603
  gcoirtí chreataí gcreataí dhoirteá dhoirtear dhoirtí doirtear ndoirteá
@@ -1,4 +1,5 @@
1
1
  # -*- encoding: utf-8 -*-
2
+
2
3
  # Hyphenation patterns for Text::Hyphen in Ruby: Croatian
3
4
  # Converted from the TeX hyphenation/bahyph.tex file, by Marinovi\'c Igor
4
5
  # (1994 - 1996).
@@ -6,19 +7,19 @@
6
7
  # The original copyright holds and is reproduced in the source to this file.
7
8
  # The Ruby version of these patterns are copyright 2004 Austin Ziegler.
8
9
  #--
9
- # Hyphenation patterns for Croatian language words for use with
10
- # T1 encoding, which is supported in DC fonts.
10
+ # Hyphenation patterns for Croatian language words for use with
11
+ # T1 encoding, which is supported in DC fonts.
11
12
  # These can also be used with OT1 encoding.
12
13
  #
13
- # The first version was realized in late 1994.
14
+ # The first version was realized in late 1994.
14
15
  # Second, much more improved version was realized in the beginning of 1996.
15
16
  # Date of the last change: 19.03.1996.
16
17
  #
17
18
  # Marinovi\'c Igor
18
19
  # migor@student.math.hr
19
- #
20
+ #
20
21
  #++
21
- require 'text/hyphen/language'
22
+ require "text/hyphen/language"
22
23
 
23
24
  Text::Hyphen::Language::HR = Text::Hyphen::Language.new do |lang|
24
25
  encoding "UTF-8"
@@ -1,4 +1,5 @@
1
1
  # -*- encoding: utf-8 -*-
2
+
2
3
  # Hyphenation patterns for Text::Hyphen in Ruby: Upper Sorbian
3
4
  # Converted from the TeX hyphenation/bahyph.tex file, by E. Werner (1997).
4
5
  #
@@ -12,10 +13,10 @@
12
13
  # \message{Hyphenation patterns for Upper Sorbian, E. Werner}
13
14
  # \message{Completely new revision 1997, March 22}
14
15
  #++
15
- require 'text/hyphen/language'
16
+ require "text/hyphen/language"
16
17
 
17
18
  Text::Hyphen::Language::HSB = Text::Hyphen::Language.new do |lang|
18
- lang.encoding "UTF-8"
19
+ lang.encoding "UTF-8"
19
20
  lang.patterns <<-PATTERNS
20
21
  % ě
21
22
 
@@ -1,4 +1,5 @@
1
1
  # -*- encoding: utf-8 -*-
2
+
2
3
  # Hyphenation patterns for Text::Hyphen in Ruby: Hungarian
3
4
  # Converted from the TeX hyphenation/huhyph.tex 3.12 file,
4
5
  # by MIKL\'OS Dezs\H o and MAYER Gyula from 1989 - 1998.
@@ -30,11 +31,11 @@
30
31
  # MHSz10 p.8-9. földolgozatlan; cf. p.62.
31
32
  #++
32
33
 
33
- require 'text/hyphen/language'
34
+ require "text/hyphen/language"
34
35
 
35
36
  Text::Hyphen::Language::HU1 = Text::Hyphen::Language.new do |lang|
36
37
  lang.encoding "UTF-8"
37
- lang.isocode = 'hu'
38
+ lang.isocode = "hu"
38
39
  lang.patterns <<-PATTERNS
39
40
  % 1C(s/z/y)V (V <> y)
40
41
  % 1C(f/h/s/z)y occurs at the end of names, so I added some of them
@@ -1,4 +1,5 @@
1
1
  # -*- encoding: utf-8 -*-
2
+
2
3
  # Hyphenation patterns for Text::Hyphen in Ruby: Hungarian
3
4
  # Converted from the TeX hyphenation/huhyphn.tex file, by NAGY Bence
4
5
  # <huhyphn@tipogral.hu>.
@@ -11,15 +12,15 @@
11
12
  # Copyright (C) 2003, NAGY Bence <huhyphn@tipogral.hu>
12
13
  # This file can be distributed under the terms of the
13
14
  # GNU General Public License version 2.
14
- #
15
- # Encoding: Cork/T1/EC
15
+ #
16
+
16
17
  #++
17
18
 
18
- require 'text/hyphen/language'
19
+ require "text/hyphen/language"
19
20
 
20
21
  Text::Hyphen::Language::HU2 = Text::Hyphen::Language.new do |lang|
21
22
  lang.encoding "UTF-8"
22
- lang.isocode 'hu'
23
+ lang.isocode "hu"
23
24
  lang.patterns <<-PATTERNS
24
25
  .a2 .adás1s .ae1 .agyon1 .al1eg .al1e2m .al1e2s .al1ér .al1is .al1os .arc1c
25
26
  .ar2c3ho .atmo1 .az1a2 .az1ám .aze2 .á2 .ál1a2 .ál1e .ál1é2 .ál1i .ál1ok
@@ -1,4 +1,5 @@
1
1
  # -*- encoding: utf-8 -*-
2
+
2
3
  # Hyphenation patterns for Text::Hyphen in Ruby: Interlingua
3
4
  # Converted from the TeX hyphenation/iahyph.tex file, Version 0.2b.
4
5
  # Released 3 July 2001, Created by Peter Kleiweg, kleiweg@let.rug.nl
@@ -16,7 +17,7 @@
16
17
  #
17
18
  # About Interlingua: http://www.interlingua.com/
18
19
  #++
19
- require 'text/hyphen/language'
20
+ require "text/hyphen/language"
20
21
 
21
22
  Text::Hyphen::Language::IA = Text::Hyphen::Language.new do |lang|
22
23
  lang.encoding "UTF-8"
@@ -1,4 +1,5 @@
1
1
  # -*- encoding: utf-8 -*-
2
+
2
3
  # Hyphenation patterns for Text::Hyphen in Ruby
3
4
  # id (Indonesian) and ms (Malay)
4
5
  # Converted from the TeX hyphenation/inhyph.tex file, by Jörg Knappen and
@@ -7,19 +8,19 @@
7
8
  # The original copyright holds and is reproduced in the source to this file.
8
9
  # The Ruby version of these patterns are copyright 2004 Austin Ziegler.
9
10
  #--
10
- # inhyph.tex
11
+ # inhyph.tex
11
12
  # Version 1.3 19-SEP-1997
12
13
  #
13
14
  # Hyphenation patterns for bahasa indonesia (probably also usable
14
15
  # for bahasa melayu)
15
16
  #
16
17
  # (c) Copyright 1996, 1997 Jörg Knappen and Terry Mart
17
- #
18
- # This patterns are free software according to the GNU General Public
18
+ #
19
+ # This patterns are free software according to the GNU General Public
19
20
  # licence version 2, June 1991.
20
21
  #
21
22
  # Please read the GNU licence for details. If you don't receive a GNU
22
- # licence with these patterns, you can obtain it from
23
+ # licence with these patterns, you can obtain it from
23
24
  #
24
25
  # Free Software Foundation, Inc.
25
26
  # 675 Mass Ave, Cambridge, MA 02139, USA
@@ -50,7 +51,7 @@
50
51
  # email : mart@kph.uni-mainz.de
51
52
  #
52
53
  #++
53
- require 'text/hyphen/language'
54
+ require "text/hyphen/language"
54
55
 
55
56
  Text::Hyphen::Language::ID = Text::Hyphen::Language.new do |lang|
56
57
  lang.encoding "UTF-8"
@@ -78,8 +79,8 @@ a2ir % ber-air
78
79
  % Don't overload the exception list...
79
80
  PATTERNS
80
81
 
81
- # Exeptions to the above rules, specially words beginning in ber... and
82
- # ter..
82
+ # Exeptions to the above rules, specially words beginning in ber... and
83
+ # ter..
83
84
  lang.exceptions <<-EXCEPTIONS
84
85
  be-ra-be be-ra-hi be-rak be-ran-da be-ran-dal be-rang be-ra-ngas-an
85
86
  be-rang-sang be-ra-ngus be-ra-ni be-ran-tak-an be-ran-tam be-ran-tas
@@ -1,4 +1,5 @@
1
1
  # -*- encoding: utf-8 -*-
2
+
2
3
  # Hyphenation patterns for Text::Hyphen in Ruby: Icelandic
3
4
  # Converted from the TeX hyphenation/bahyph.tex file, by Jorgen Pind
4
5
  # (1987).
@@ -52,7 +53,7 @@
52
53
  # e.g. that if one wants to use, say, umlaut marks over u or a it is
53
54
  # necessary to write \" a (space before a) or \"{a} instead of PLAINS \"a.
54
55
  #++
55
- require 'text/hyphen/language'
56
+ require "text/hyphen/language"
56
57
 
57
58
  Text::Hyphen::Language::IS = Text::Hyphen::Language.new do |lang|
58
59
  lang.encoding "UTF-8"
@@ -4,7 +4,7 @@
4
4
  # The original copyright holds and is reproduced in the source to this file.
5
5
  # The Ruby version of these patterns are copyright 2004 Austin Ziegler.
6
6
  #--
7
- #%%%%%%%%%%%%%%%%%%%%%%%%%% file ithyph.tex %%%%%%%%%%%%%%%%%%%%%%%%%%%%%
7
+ # %%%%%%%%%%%%%%%%%%%%%%%%%% file ithyph.tex %%%%%%%%%%%%%%%%%%%%%%%%%%%%%
8
8
  #
9
9
  # Prepared by Claudio Beccari e-mail claudio.beccari@polito.it
10
10
  #
@@ -30,7 +30,7 @@
30
30
  #
31
31
  # See comments at the end of the file after the \endinput line
32
32
  #++
33
- require 'text/hyphen/language'
33
+ require "text/hyphen/language"
34
34
 
35
35
  Text::Hyphen::Language::IT = Text::Hyphen::Language.new do |lang|
36
36
  lang.encoding "UTF-8"
@@ -60,75 +60,75 @@ t2t3s 2tv 2tw t2z 2tzk tz2s 2t. 2t'. 2t'' 1v 2vc v2l v2r 2vv 2v. 2v'. 2v''
60
60
  PATTERNS
61
61
  end
62
62
 
63
- # Information
64
- # ON ITALIAN HYPHENATION
65
- #
66
- # I have been working on patterns for the Italian language since 1987; in
67
- # 1992 I published
68
- #
69
- # C. Beccari, "Computer aided hyphenation for Italian and Modern Latin",
70
- # TUG vol. 13, n. 1, pp. 23-33 (1992)
71
- #
72
- # which contained a set of patterns that allowed hyphenation for both
73
- # Italian and Latin; a slightly modified version of the patterns published
74
- # in the above paper is contained in LAHYPH.TEX available on the CTAN
75
- # archives.
76
- #
77
- # This minor revision has been tested with an enlarged set of difficult
78
- # Italian words so as to comply with a larger number of technical words
79
- # with foreign roots. The overall number of patterns is slightly reduced,
80
- # but its strength is increased. As with the previous release hyathi are
81
- # not hyphenated in order to cope with the habits of Italian readers.
82
- # Similarly single vowel internal syllables are avoided.
83
- #
84
- # As the previous versions, this new set of patterns does not contain any
85
- # accented character so that the hyphenation algorithm behaves properly in
86
- # both cases, that is with OT1 and T1 encodings. With the former encoding
87
- # fonts do not contain accented characters, while with the latter accented
88
- # characters are present and sequences such as à map directly to slot "E0
89
- # that contains "agrave".
90
- #
91
- # Of course if you use T1 encoded fonts you get the full power of the
92
- # hyphenation algorithm, while if you use OT1 encoded fonts you miss some
93
- # possible break points; this is not a big inconvenience in Italian
94
- # because:
95
- #
96
- # 1) The Regulation UNI 6015 on accents specifies that compulsory accents
97
- # appear only on the ending vowel of oxitone words; this means that it
98
- # is almost indifferent to have or to miss the T1 encoded fonts because
99
- # the only difference consists in how TeX evaluates the end of the
100
- # word; in practice if you have these special facilities you get
101
- # "qua-li-tà", while if you miss them, you get "qua-lità" (assuming
102
- # that \righthyphenmin > 1).
103
- #
104
- # 2) Optional accents are so rare in Italian, that if you absolutely want
105
- # to use them in those rare instances, and you miss the T1 encoding
106
- # facilities, you should also provide explicit discretionary hyphens as
107
- # in "sé\-gui\-to".
108
- #
109
- # There is no explicit hyphenation exception list because these patterns
110
- # proved to hyphenate correctly a very large set of words suitably chosen
111
- # in order to test them in the most heavy circumstances; these patterns
112
- # were used in the preparation of a number of books and no errors were
113
- # discovered.
114
- #
115
- # Nevertheless if you frequently use technical terms that you want
116
- # hyphenated differently from what is normally done (for example if you
117
- # prefer etymological hyphenation of prefixed and/or suffixed words) you
118
- # should insert a specific hyphenation list in the preamble of your
119
- # document, for example:
120
- #
121
- # \hyphenation{su-per-in-dut-to-re su-per-in-dut-to-ri}
122
- #
123
- # If you use, as you should, the italan option of the babel package, then
124
- # you have available the active charater " that allows you to put
125
- # a discretionary break at a word boundary of a compound word while
126
- # maintaning the hyphenation algorithm on the rest of the word.
127
- #
128
- # Please, read the babel package documentation.
129
- #
130
- # Should you find any word that gets hyphenated in a wrong way, please,
131
- # AFTER CHECKING ON A RELIABLE MODERN DICTIONARY, report to the author,
132
- # preferably by e-mail.
133
- #
134
- # Happy multilingual typesetting!
63
+ # Information
64
+ # ON ITALIAN HYPHENATION
65
+ #
66
+ # I have been working on patterns for the Italian language since 1987; in
67
+ # 1992 I published
68
+ #
69
+ # C. Beccari, "Computer aided hyphenation for Italian and Modern Latin",
70
+ # TUG vol. 13, n. 1, pp. 23-33 (1992)
71
+ #
72
+ # which contained a set of patterns that allowed hyphenation for both
73
+ # Italian and Latin; a slightly modified version of the patterns published
74
+ # in the above paper is contained in LAHYPH.TEX available on the CTAN
75
+ # archives.
76
+ #
77
+ # This minor revision has been tested with an enlarged set of difficult
78
+ # Italian words so as to comply with a larger number of technical words
79
+ # with foreign roots. The overall number of patterns is slightly reduced,
80
+ # but its strength is increased. As with the previous release hyathi are
81
+ # not hyphenated in order to cope with the habits of Italian readers.
82
+ # Similarly single vowel internal syllables are avoided.
83
+ #
84
+ # As the previous versions, this new set of patterns does not contain any
85
+ # accented character so that the hyphenation algorithm behaves properly in
86
+ # both cases, that is with OT1 and T1 encodings. With the former encoding
87
+ # fonts do not contain accented characters, while with the latter accented
88
+ # characters are present and sequences such as à map directly to slot "E0
89
+ # that contains "agrave".
90
+ #
91
+ # Of course if you use T1 encoded fonts you get the full power of the
92
+ # hyphenation algorithm, while if you use OT1 encoded fonts you miss some
93
+ # possible break points; this is not a big inconvenience in Italian
94
+ # because:
95
+ #
96
+ # 1) The Regulation UNI 6015 on accents specifies that compulsory accents
97
+ # appear only on the ending vowel of oxitone words; this means that it
98
+ # is almost indifferent to have or to miss the T1 encoded fonts because
99
+ # the only difference consists in how TeX evaluates the end of the
100
+ # word; in practice if you have these special facilities you get
101
+ # "qua-li-tà", while if you miss them, you get "qua-lità" (assuming
102
+ # that \righthyphenmin > 1).
103
+ #
104
+ # 2) Optional accents are so rare in Italian, that if you absolutely want
105
+ # to use them in those rare instances, and you miss the T1 encoding
106
+ # facilities, you should also provide explicit discretionary hyphens as
107
+ # in "sé\-gui\-to".
108
+ #
109
+ # There is no explicit hyphenation exception list because these patterns
110
+ # proved to hyphenate correctly a very large set of words suitably chosen
111
+ # in order to test them in the most heavy circumstances; these patterns
112
+ # were used in the preparation of a number of books and no errors were
113
+ # discovered.
114
+ #
115
+ # Nevertheless if you frequently use technical terms that you want
116
+ # hyphenated differently from what is normally done (for example if you
117
+ # prefer etymological hyphenation of prefixed and/or suffixed words) you
118
+ # should insert a specific hyphenation list in the preamble of your
119
+ # document, for example:
120
+ #
121
+ # \hyphenation{su-per-in-dut-to-re su-per-in-dut-to-ri}
122
+ #
123
+ # If you use, as you should, the italan option of the babel package, then
124
+ # you have available the active charater " that allows you to put
125
+ # a discretionary break at a word boundary of a compound word while
126
+ # maintaning the hyphenation algorithm on the rest of the word.
127
+ #
128
+ # Please, read the babel package documentation.
129
+ #
130
+ # Should you find any word that gets hyphenated in a wrong way, please,
131
+ # AFTER CHECKING ON A RELIABLE MODERN DICTIONARY, report to the author,
132
+ # preferably by e-mail.
133
+ #
134
+ # Happy multilingual typesetting!
@@ -1,4 +1,5 @@
1
1
  # -*- encoding: utf-8 -*-
2
+
2
3
  # Hyphenation patterns for Text::Hyphen in Ruby: Latin
3
4
  # Converted from the TeX hyphenation/lahyph.tex file, by Claudio Beccari
4
5
  # (1999 - 2001).
@@ -44,9 +45,9 @@
44
45
  #
45
46
  # Information after \endinput.
46
47
  #
47
- #message{Latin Hyphenation Patterns `lahyph' Version 3.0b <2001/11/21>}
48
+ # message{Latin Hyphenation Patterns `lahyph' Version 3.0b <2001/11/21>}
48
49
  #++
49
- require 'text/hyphen/language'
50
+ require "text/hyphen/language"
50
51
 
51
52
  Text::Hyphen::Language::LA = Text::Hyphen::Language.new do |lang|
52
53
  lang.encoding "UTF-8"
@@ -81,54 +82,54 @@ o2r1ue o2r1ui o2r1uo o2r1uu u2r1ua u2r1ue u2r1ui u2r1uo u2r1uu
81
82
  PATTERNS
82
83
  end
83
84
 
84
- # For documentation see:
85
- #
86
- # C. Beccari, "Computer aided hyphenation for Italian and Modern Latin",
87
- # TUG vol. 13, n. 1, pp. 23-33 (1992)
88
- #
89
- # see also
90
- #
91
- # C. Beccari, "Typesetting of ancient languages",
92
- # TUG vol.15, n.1, pp. 9-16 (1994)
93
- #
94
- # In the former paper the code was described as being contained in file
95
- # ITALAT.TEX; this is substantially the same code, but the file has been
96
- # renamed LAHYPH.TEX in accordance with the ISO name for Latin and the
97
- # convention that all hyphenation pattern file names should be formed by the
98
- # agglutination of two letter language ISO code and the abbreviation HYPH.
99
- #
100
- # A corresponding file (ITHYPH.TEX) has been extracted in order to eliminate
101
- # the (few) patterns specific to Latin and leave those specific to Italian;
102
- # ITHYPH.TEX has been further extended with many new patterns in order to
103
- # cope with the many neologisms and technical terms with foreign roots.
104
- #
105
- # Should you find any word that gets hyphenated in a wrong way, please, AFTER
106
- # CHECKING ON A RELIABLE MODERN DICTIONARY, report to the author, preferably
107
- # by e-mail. Please do not report about wrong break points concerning
108
- # prefixes and/or suffixes; see at the bottom of this file.
109
- #
110
- # Compared with the previous versions, this file has been extended so as to
111
- # cope also with the medieval Latin spelling, where the letter `V' played the
112
- # roles of both `U' and `V', as in the Roman times, save that the Romans used
113
- # only capitals. In the middle ages the availability of soft writing supports
114
- # and the necessity of copying books with a reasonable speed, several scripts
115
- # evolved in (practically) all of which there was a lower case alphabet
116
- # different from the upper case one, and where the lower case `v' had the
117
- # rounded shape of our modern lower case `u', and where the Latin diphthongs
118
- # `AE' and `OE', both in upper and lower case, where written as ligatures,
119
- # not to mention the habit of substituting them with their sound, that is a
120
- # simple `E'.
121
- #
122
- # According to Leon Battista Alberti, who in 1466 wrote a book on
123
- # cryptography where he thoroughly analyzed the hyphenation of the Latin
124
- # language of his (still medieval) times, the differences from the Tuscan
125
- # language (the Italian language, as it was named at his time) were very
126
- # limited, in particular for what concerns the handling of the ascending and
127
- # descending diphthongs; in central and northern Europe, and later on in
128
- # North America, the Scholars perceived the above diphthongs as made of two
129
- # distinct vowels; the hyphenation of medieval Latin, therefore, was quite
130
- # different in the northern countries compared to the southern ones, at least
131
- # for what concerns these diphthongs. If you need hyphenation patterns for
132
- # medieval Latin that suite you better according to the habits of northern
133
- # Europe you should resort to the hyphenation patterns prepared by Yannis
134
- # Haralambous (TUGboat, vol.13 n.4 (1992)).
85
+ # For documentation see:
86
+ #
87
+ # C. Beccari, "Computer aided hyphenation for Italian and Modern Latin",
88
+ # TUG vol. 13, n. 1, pp. 23-33 (1992)
89
+ #
90
+ # see also
91
+ #
92
+ # C. Beccari, "Typesetting of ancient languages",
93
+ # TUG vol.15, n.1, pp. 9-16 (1994)
94
+ #
95
+ # In the former paper the code was described as being contained in file
96
+ # ITALAT.TEX; this is substantially the same code, but the file has been
97
+ # renamed LAHYPH.TEX in accordance with the ISO name for Latin and the
98
+ # convention that all hyphenation pattern file names should be formed by the
99
+ # agglutination of two letter language ISO code and the abbreviation HYPH.
100
+ #
101
+ # A corresponding file (ITHYPH.TEX) has been extracted in order to eliminate
102
+ # the (few) patterns specific to Latin and leave those specific to Italian;
103
+ # ITHYPH.TEX has been further extended with many new patterns in order to
104
+ # cope with the many neologisms and technical terms with foreign roots.
105
+ #
106
+ # Should you find any word that gets hyphenated in a wrong way, please, AFTER
107
+ # CHECKING ON A RELIABLE MODERN DICTIONARY, report to the author, preferably
108
+ # by e-mail. Please do not report about wrong break points concerning
109
+ # prefixes and/or suffixes; see at the bottom of this file.
110
+ #
111
+ # Compared with the previous versions, this file has been extended so as to
112
+ # cope also with the medieval Latin spelling, where the letter `V' played the
113
+ # roles of both `U' and `V', as in the Roman times, save that the Romans used
114
+ # only capitals. In the middle ages the availability of soft writing supports
115
+ # and the necessity of copying books with a reasonable speed, several scripts
116
+ # evolved in (practically) all of which there was a lower case alphabet
117
+ # different from the upper case one, and where the lower case `v' had the
118
+ # rounded shape of our modern lower case `u', and where the Latin diphthongs
119
+ # `AE' and `OE', both in upper and lower case, where written as ligatures,
120
+ # not to mention the habit of substituting them with their sound, that is a
121
+ # simple `E'.
122
+ #
123
+ # According to Leon Battista Alberti, who in 1466 wrote a book on
124
+ # cryptography where he thoroughly analyzed the hyphenation of the Latin
125
+ # language of his (still medieval) times, the differences from the Tuscan
126
+ # language (the Italian language, as it was named at his time) were very
127
+ # limited, in particular for what concerns the handling of the ascending and
128
+ # descending diphthongs; in central and northern Europe, and later on in
129
+ # North America, the Scholars perceived the above diphthongs as made of two
130
+ # distinct vowels; the hyphenation of medieval Latin, therefore, was quite
131
+ # different in the northern countries compared to the southern ones, at least
132
+ # for what concerns these diphthongs. If you need hyphenation patterns for
133
+ # medieval Latin that suite you better according to the habits of northern
134
+ # Europe you should resort to the hyphenation patterns prepared by Yannis
135
+ # Haralambous (TUGboat, vol.13 n.4 (1992)).