srx-languagetool 0.7.0 → 0.8.0

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: c277febbbdec765f5eeba65cdc43dd661ddf807a53f2e2858f0e321eccdf3459
4
- data.tar.gz: 34aa30e138bddfacd30ed8f9a48f45d4e91afa5c4e4a789d3208860c1bbd608e
3
+ metadata.gz: f73cebe4cfa7e771e3250f1f1dc13694b6450e19a4f9adf81769c5a75baa76d5
4
+ data.tar.gz: 35f29775c7d85150bc61551e9fb32adcb60cebc392d9d37e01d829b193a7464c
5
5
  SHA512:
6
- metadata.gz: 62a56ee4d2cb0ba5fe16181681561a829f7f59f84155753d896fa6dc6153bd238ed9de8337cea2e75ac6c83e94381d84a0ede80c2bbcff1648fe97c57f3d5fed
7
- data.tar.gz: 66d09127f9eb76307bd38938c619a6099c0ff941bcd3c33b51e4c130c0d4373ea12cdb080bec1aab783e4070c0d5d70fa2e97a4d64d1c394390316630012e0b3
6
+ metadata.gz: 548319e33a292724739e81eb28433594dfea9ec8e9e1fd78366d1847e601a5c6e1521e1fa639bd760fd33ee80d45190a83e92fdcb64d17efae730f5ac7958e6d
7
+ data.tar.gz: b55939faa805e0e5102a8610c4c89571f47c5002d3c7b7dfa26fa9f8785f83ce4083bec63abad845565091ddfad752c2ca6b9599a88be621e5618053ad5b0394
@@ -13,7 +13,7 @@ jobs:
13
13
  ruby-version: 2.7.6
14
14
  - name: Install
15
15
  run: |
16
- gem install bundler -v 2.3.17
16
+ gem install bundler -v 2.3.22
17
17
  bundle install
18
18
  - name: Type check
19
19
  run: bundle exec solargraph typecheck --level typed
data/CHANGELOG.md CHANGED
@@ -1,5 +1,9 @@
1
1
  ## [Unreleased]
2
2
 
3
+ ## [0.8.0] - 2022-09-29
4
+
5
+ - Update rules to LanguageTool 5.9
6
+
3
7
  ## [0.7.0] - 2022-07-04
4
8
 
5
9
  - Update rules to LanguageTool 5.8
data/Gemfile.lock CHANGED
@@ -1,7 +1,7 @@
1
1
  PATH
2
2
  remote: .
3
3
  specs:
4
- srx-languagetool (0.7.0)
4
+ srx-languagetool (0.8.0)
5
5
  srx (< 1.0)
6
6
 
7
7
  GEM
@@ -19,37 +19,37 @@ GEM
19
19
  rexml
20
20
  kramdown-parser-gfm (1.1.0)
21
21
  kramdown (~> 2.0)
22
- minitest (5.16.2)
23
- nokogiri (1.13.6-x86_64-darwin)
22
+ minitest (5.16.3)
23
+ nokogiri (1.13.8-x86_64-darwin)
24
24
  racc (~> 1.4)
25
25
  parallel (1.22.1)
26
- parser (3.1.2.0)
26
+ parser (3.1.2.1)
27
27
  ast (~> 2.4.1)
28
28
  racc (1.6.0)
29
29
  rainbow (3.1.1)
30
30
  rake (13.0.6)
31
- regexp_parser (2.5.0)
31
+ regexp_parser (2.6.0)
32
32
  reverse_markdown (2.1.1)
33
33
  nokogiri
34
34
  rexml (3.2.5)
35
- rspec-expectations (3.11.0)
35
+ rspec-expectations (3.11.1)
36
36
  diff-lcs (>= 1.2.0, < 2.0)
37
37
  rspec-support (~> 3.11.0)
38
- rspec-support (3.11.0)
39
- rubocop (1.31.1)
38
+ rspec-support (3.11.1)
39
+ rubocop (1.36.0)
40
40
  json (~> 2.3)
41
41
  parallel (~> 1.10)
42
- parser (>= 3.1.0.0)
42
+ parser (>= 3.1.2.1)
43
43
  rainbow (>= 2.2.2, < 4.0)
44
44
  regexp_parser (>= 1.8, < 3.0)
45
45
  rexml (>= 3.2.5, < 4.0)
46
- rubocop-ast (>= 1.18.0, < 2.0)
46
+ rubocop-ast (>= 1.20.1, < 2.0)
47
47
  ruby-progressbar (~> 1.7)
48
48
  unicode-display_width (>= 1.4.0, < 3.0)
49
- rubocop-ast (1.18.0)
49
+ rubocop-ast (1.21.0)
50
50
  parser (>= 3.1.1.0)
51
51
  ruby-progressbar (1.11.0)
52
- solargraph (0.45.0)
52
+ solargraph (0.47.1)
53
53
  backport (~> 1.2)
54
54
  benchmark
55
55
  bundler (>= 1.17.2)
@@ -67,8 +67,8 @@ GEM
67
67
  srx (0.6.0)
68
68
  nokogiri (~> 1.11)
69
69
  thor (1.2.1)
70
- tilt (2.0.10)
71
- unicode-display_width (2.2.0)
70
+ tilt (2.0.11)
71
+ unicode-display_width (2.3.0)
72
72
  webrick (1.7.0)
73
73
  yard (0.9.28)
74
74
  webrick (~> 1.7.0)
@@ -87,4 +87,4 @@ DEPENDENCIES
87
87
  srx-languagetool!
88
88
 
89
89
  BUNDLED WITH
90
- 2.3.17
90
+ 2.3.22
@@ -2,6 +2,6 @@
2
2
 
3
3
  module Srx
4
4
  module Languagetool
5
- VERSION = '0.7.0'
5
+ VERSION = '0.8.0'
6
6
  end
7
7
  end
data/lib/srx/segment.srx CHANGED
@@ -1159,7 +1159,7 @@
1159
1159
  <afterbreak>D\.?</afterbreak>
1160
1160
  </rule>
1161
1161
  <rule break="no"><!-- min. -->
1162
- <beforebreak>\b([Aa]vg|[Ee]d|pp|[Vv]iz|i\.?[\s\u00A0]*e|[Vvol]|[Rr]col|maj|Lt|[Ff]ig|[Ff]igs|[Vv]iz|[Vv]ols|[Aa]pprox|[Ii]ncl?|[Aa]cc|Pres|[Cc]orp|[Ee]x|[Cc]onn|[Dd]ept|[Ll]tda|[Mm]in|[Mm]ax|[Gg]ovt|[Rr]etd|lb|lbf|ft|c\.?[\s\u00A0]*f|vs|dia|lbs|\d+-(:?oz|kc|in|h[rp]|ml)|M?sec)\.[\s\u00A0]</beforebreak>
1162
+ <beforebreak>\b([Aa]vg|[Ee]d|pp|[Vv]iz|i\.?[\s\u00A0]*e|[Vvol]|[Rr]col|maj|Lt|[Ff]ig|[Ff]igs|[Vv]iz|[Vv]ols|[Aa]pprox|[Ii]ncl?|[Aa]cc|Pres|[Cc]orp|[Ee]x|[Cc]onn|[Dd]ept|[Ll]tda|[Mm]in|[Mm]ax|[Gg]ovt|[Rr]etd|Ing|lb|lbf|ft|c\.?[\s\u00A0]*f|vs|dia|lbs|\d+-(:?oz|kc|in|h[rp]|ml)|M?sec)\.[\s\u00A0]</beforebreak>
1163
1163
  <afterbreak>[^\p{Lu}]|I</afterbreak>
1164
1164
  </rule>
1165
1165
  <rule break="no"><!-- hr. -->
@@ -1553,6 +1553,10 @@
1553
1553
  <beforebreak>\b[A-Za-z0-9\-]+\.</beforebreak>
1554
1554
  <afterbreak>[A-Za-z0-9\-]+\.(com|net|org|info|de|es|edu|co|eu|nl|io|cn|uk|gov|biz|ca|tk|ru|br|jp|pl)(\.|\b)</afterbreak>
1555
1555
  </rule>
1556
+ <rule break="no"><!-- Abbreviated books of the Bible and biblical apocrypha-->
1557
+ <beforebreak>\b(Ge?n|Ex|Le?v|Nu?m|D(eu)?t|Jo?z|Ri|R[ei]cht|Sa?m|Ko?n|Kr[on]{0,2}|Neh?|Est?|Jb|Ps|Spr?|Pr[ed]{0,2}|H(oog)?l|Je?s|Je?r|Kl(aagl)?|Ez(ech)?|Da?n|Ho?s|Jl|Am|Ob|Mc|Mi[ch]{0,2}|Nah?|Hk|Hab|Zf|[SZ]ef|Ha?g|Zc|Zach|Ma?l|Ma?t|Mk|Mar|Lk|Jh|H(an)?d|Ro?m|Kor|Ga?l|Ef|Fp|Fil|Ko|[CK]ol|Th|Th?e[s]{1,2}|Tm|Ti?t|Fm|Fil(em)?|Hb|Hebr?|Jk|Ja[ck]|Pe?tr?|Joh|Jud|Op(enb)?|Wijsh|Tob|Sir|Bar|Makk)\.\s</beforebreak>
1558
+ <afterbreak></afterbreak>
1559
+ </rule>
1556
1560
  <rule break="no">
1557
1561
  <beforebreak>\b(Drs|Art|Afr|Am|Ar|Br|Cie|Comp|Dhr|([Pp]rof\.)?[Dd]r|Em|Fa|Kon|Bros|Stb)\.\s</beforebreak>
1558
1562
  <afterbreak></afterbreak>
@@ -1578,7 +1582,7 @@
1578
1582
  <afterbreak></afterbreak>
1579
1583
  </rule>
1580
1584
  <rule break="no">
1581
- <beforebreak>\b(arch|archeol|art|bc|betr|bez|bibl|bijl|bijv)\.\s</beforebreak>
1585
+ <beforebreak>\b(arch|archeol|art|bc|bep|betr|bez|bibl|bijl|[Bb]ijv)\.\s</beforebreak>
1582
1586
  <afterbreak></afterbreak>
1583
1587
  </rule>
1584
1588
  <rule break="no">
@@ -1590,15 +1594,15 @@
1590
1594
  <afterbreak></afterbreak>
1591
1595
  </rule>
1592
1596
  <rule break="no">
1593
- <beforebreak>\b(ed|em|enz|etc|ev|excl|fa|fam|fig|fl|fr.)\.\s</beforebreak>
1597
+ <beforebreak>\b(ed|em|enz|etc|ev|[Ee]xcl|fa|fam|fig|fin|fl|fr.)\.\s</beforebreak>
1594
1598
  <afterbreak></afterbreak>
1595
1599
  </rule>
1596
1600
  <rule break="no">
1597
- <beforebreak>\b(geb|get|gld|id|incl|ing|intern|ir|jhr|jkvr)\.\s</beforebreak>
1601
+ <beforebreak>\b(geb|[Gg]em|get|gld|id|[Ii]ncl|ind|inf|ing|intern|inz|ir|jhr|jkvr)\.\s</beforebreak>
1598
1602
  <afterbreak></afterbreak>
1599
1603
  </rule>
1600
1604
  <rule break="no">
1601
- <beforebreak>\b(jl|jr|kr|kt|lab|lic|ll|lt|lw|max|mi|min|mld)\.\s</beforebreak>
1605
+ <beforebreak>\b(jl|jr|kr|kt|lab|lic|ll|lt|lw|max|mevr|mi|[Mm]in|mld)\.\s</beforebreak>
1602
1606
  <afterbreak></afterbreak>
1603
1607
  </rule>
1604
1608
  <rule break="no">
@@ -1606,11 +1610,11 @@
1606
1610
  <afterbreak></afterbreak>
1607
1611
  </rule>
1608
1612
  <rule break="no">
1609
- <beforebreak>\b(opm|org|ov|pag|par|penn|plm|plv)\.\s</beforebreak>
1613
+ <beforebreak>\b(opm|org|ov|pag|par|penn|([1-3][\.e]?)[\s]?pers|plm|plv)\.\s</beforebreak>
1610
1614
  <afterbreak></afterbreak>
1611
1615
  </rule>
1612
1616
  <rule break="no">
1613
- <beforebreak>\b(prov|pseud|qty|red|ref|resp|soc|st|tab|tel|temp|tk)\.\s</beforebreak>
1617
+ <beforebreak>\b(prov|pseud|psych|qty|red|ref|resp|soc|st|tab|tel|temp|tk)\.\s</beforebreak>
1614
1618
  <afterbreak></afterbreak>
1615
1619
  </rule>
1616
1620
  <rule break="no">
@@ -1622,7 +1626,7 @@
1622
1626
  <afterbreak>Chr</afterbreak>
1623
1627
  </rule>
1624
1628
  <rule break="no">
1625
- <beforebreak>\b(uitsl|ver|vgl|vnl|vnw|voorz|ww|zat|zg)\.\s</beforebreak>
1629
+ <beforebreak>\b(uitsl|ver|vgl|vnl|vnw|voorz|ww|zat|[Zz]elfst|zgn?)\.\s</beforebreak>
1626
1630
  <afterbreak></afterbreak>
1627
1631
  </rule>
1628
1632
  <rule break="no">
@@ -4373,7 +4377,7 @@
4373
4377
  <afterbreak>\p{Ll}</afterbreak>
4374
4378
  </rule>
4375
4379
  <rule break="no">
4376
- <beforebreak>\b(уд|ул|уч|физ|х|хор|э)\.\s</beforebreak>
4380
+ <beforebreak>\b(уд|ул|уч|физ|х|хор|э|Эл|эл)\.\s</beforebreak>
4377
4381
  <afterbreak></afterbreak>
4378
4382
  </rule>
4379
4383
  <rule break="no">
@@ -4717,6 +4721,12 @@
4717
4721
  </rule>
4718
4722
  </languagerule>
4719
4723
  <languagerule languagerulename="Spanish">
4724
+
4725
+ <rule break="no">
4726
+ <beforebreak>¿[^?]+:[\s\u00A0]</beforebreak>
4727
+ <afterbreak>.</afterbreak>
4728
+ </rule>
4729
+
4720
4730
  <rule break="no">
4721
4731
  <beforebreak>Yahoo![\s\u00A0]</beforebreak>
4722
4732
  <afterbreak>\p{Ll}</afterbreak>
@@ -4798,7 +4808,7 @@
4798
4808
  </rule>
4799
4809
  <!-- Abbreviations that can finish sentences -->
4800
4810
  <rule break="no">
4801
- <beforebreak>\b([Ee]ds?|[Cc]oords?|grs?|Sr|Jr|Admón|Inc|Co|Hnos|Vda|[VU]d[s]?)\.[\p{Pe}\p{Pf}\p{Pd}"']*[\s\u00A0]</beforebreak>
4811
+ <beforebreak>\b([Ee]ds?|[Cc]oords?|grs?|Sr|Jr|Admón|Inc|Co|Hnos|Vda|[VUuv]d[s]?)\.[\p{Pe}\p{Pf}\p{Pd}"']*[\s\u00A0]</beforebreak>
4802
4812
  <afterbreak>[\-¡¿«»"'\u2018\u201C\p{Ps}\u2012\u2013\u2014\u2015\u2053]*\p{Ll}</afterbreak>
4803
4813
  </rule>
4804
4814
  <!-- Any word in acronyms like U.S.A.F or F. B. I. or C. or c.s.p. or p. e. -->
@@ -4864,14 +4874,18 @@
4864
4874
  </rule>
4865
4875
  <!-- Split at e.g. "1a. Und ..." -->
4866
4876
  <rule break="yes">
4867
- <beforebreak>\d+[a-z]\.[\u00A0\s]</beforebreak>
4877
+ <beforebreak>\d+[a-z]\.[\u00A0\s]{1,2}</beforebreak>
4868
4878
  <afterbreak>\p{Lu}</afterbreak>
4869
4879
  </rule>
4870
4880
  <!-- Don't split at e.g. "d. h." -->
4871
4881
  <rule break="no">
4872
- <beforebreak>[^-\p{L}'’/]\p{L}[\.!?…]['|"|“|«|\)|\]|\}]?[\u00A0\s]</beforebreak>
4882
+ <beforebreak>[^-\p{L}'’/°]\p{L}[\.!?…]['|"|“|«|\)|\]|\}]?[\u00A0\s]</beforebreak>
4873
4883
  <afterbreak></afterbreak>
4874
4884
  </rule>
4885
+ <rule break="no"><!-- special case: "Das 1. Internationale Filmfestival findet nächste Woche statt." -->
4886
+ <beforebreak>([Dd](as|er|ie|iese[rsmn]?|en|em)|[kmsd]?ein(e[rsnm]?)?|am|fürs|ins|zum|im|am|zur) \d+\.[\u00A0\s]+</beforebreak>
4887
+ <afterbreak>[A-ZÄÖÜ].*</afterbreak>
4888
+ </rule>
4875
4889
  <rule break="no">
4876
4890
  <beforebreak>Ust.</beforebreak><!-- needed for German rule UST_ID -->
4877
4891
  <afterbreak>Id</afterbreak>
@@ -4893,11 +4907,11 @@
4893
4907
  <afterbreak>3|4|Buzz|Crozz</afterbreak>
4894
4908
  </rule>
4895
4909
  <rule break="no">
4896
- <beforebreak>[1-3]\.[\u00A0\s]</beforebreak>
4910
+ <beforebreak>[1-3]\.[\u00A0\s]{1,2}</beforebreak>
4897
4911
  <afterbreak>Liga|Bundesliga|(Fußball|Handball|Basketball)(-B|b)undesliga</afterbreak>
4898
4912
  </rule>
4899
4913
  <rule break="no">
4900
- <beforebreak>\d+\.[\u00A0\s]</beforebreak>
4914
+ <beforebreak>\d+\.[\u00A0\s]{1,2}</beforebreak>
4901
4915
  <afterbreak>Klässler[sn]?</afterbreak>
4902
4916
  </rule>
4903
4917
  <rule break="no">
@@ -4912,43 +4926,43 @@
4912
4926
  <!-- Don't split after a white-space followed by a single letter followed
4913
4927
  by a dot followed by another whitespace. e.g. " p. " -->
4914
4928
  <rule break="no">
4915
- <beforebreak>[\u00A0\s]\p{L}\.[\u00A0\s]</beforebreak>
4929
+ <beforebreak>[\u00A0\s]\p{L}\.[\u00A0\s]{1,2}</beforebreak>
4916
4930
  <afterbreak>\p{L}\.</afterbreak>
4917
4931
  </rule>
4918
4932
  <!-- Don't split at "bla bla... yada yada" -->
4919
4933
  <rule break="no">
4920
- <beforebreak>[\[\(]?\.\.\.[\]\)]?[\u00A0\s]</beforebreak>
4934
+ <beforebreak>[\[\(]?\.\.\.[\]\)]?[\u00A0\s]{1,2}</beforebreak>
4921
4935
  <afterbreak>\p{Ll}</afterbreak>
4922
4936
  </rule>
4923
4937
  <!-- Don't split [.?!] when they're quoted -->
4924
4938
  <rule break="no">
4925
- <beforebreak>['"„][\.!?…]['"“«»][\u00A0\s]</beforebreak>
4939
+ <beforebreak>['"„][\.!?…]['"“«»][\u00A0\s]{1,2}</beforebreak>
4926
4940
  <afterbreak></afterbreak>
4927
4941
  </rule>
4928
4942
  <!-- Don't break after quote unless there's a capital letter
4929
4943
  e.g.: "That's right!" he said. -->
4930
4944
  <rule break="no">
4931
- <beforebreak>["'“«»][\u00A0\s]</beforebreak>
4945
+ <beforebreak>["'“«»][\u00A0\s]{1,2}</beforebreak>
4932
4946
  <afterbreak>\p{Ll}</afterbreak>
4933
4947
  </rule>
4934
4948
  <!-- e.g. "Das ist . so." - assume one sentence. -->
4935
4949
  <rule break="no">
4936
- <beforebreak>[\u00A0\s]([\.!?]{1,3}|…)['|"|“|«|\)|\]|\}]?[\u00A0\s]</beforebreak>
4950
+ <beforebreak>[\u00A0\s]([\.!?]{1,3}|…)['|"|“|«|\)|\]|\}]?[\u00A0\s]{1,2}</beforebreak>
4937
4951
  <afterbreak></afterbreak>
4938
4952
  </rule>
4939
4953
  <!-- Numbers, dates e.g. "3.10. datiert" -->
4940
4954
  <rule break="no">
4941
- <beforebreak>\b\d+\.[\u00A0\s]</beforebreak>
4955
+ <beforebreak>\b\d+\.[\u00A0\s]{1,2}</beforebreak>
4942
4956
  <afterbreak>\p{Ll}|\p{Lu}{2,}</afterbreak>
4943
4957
  </rule>
4944
4958
  <!-- z.B. "Das hier ist ein(!) Satz." -->
4945
4959
  <rule break="no">
4946
- <beforebreak>[\(\[][!?]{1,3}[\]\)][\u00A0\s]</beforebreak>
4960
+ <beforebreak>[\(\[][!?]{1,3}[\]\)][\u00A0\s]{1,2}</beforebreak>
4947
4961
  <afterbreak></afterbreak>
4948
4962
  </rule>
4949
4963
  <!-- z.B. "Das hier ist (genau!) ein Satz." -->
4950
4964
  <rule break="no">
4951
- <beforebreak>[!?]{1,3}[\)\]][\u00A0\s]</beforebreak>
4965
+ <beforebreak>[!?]{1,3}[\)\]][\u00A0\s]{1,2}</beforebreak>
4952
4966
  <afterbreak></afterbreak>
4953
4967
  </rule>
4954
4968
  <!-- z.B. "bla (...) blubb" -> kein Satzende -->
@@ -4958,55 +4972,55 @@
4958
4972
  </rule>
4959
4973
  <!-- don't split at cases like "Friedrich II. wird auch..." -->
4960
4974
  <rule break="no">
4961
- <beforebreak>[\u00A0\s ][IVX]+\.[\u00A0\s]</beforebreak>
4975
+ <beforebreak>[\u00A0\s ][IVX]+\.[\u00A0\s]{1,2}</beforebreak>
4962
4976
  <afterbreak>[^\p{Lu}]+</afterbreak>
4963
4977
  </rule>
4964
4978
  <!-- don't split at cases like "im 13. oder 14. Jahrhundert" -->
4965
4979
  <rule break="no">
4966
- <beforebreak>\d+\.[\u00A0\s]</beforebreak>
4980
+ <beforebreak>\d+\.[\u00A0\s]{1,2}</beforebreak>
4967
4981
  <afterbreak>(und|oder|bis)[\u00A0\s]</afterbreak>
4968
4982
  </rule>
4969
4983
  <!-- einige deutsche Monate, vor denen eine Zahl erscheinen kann,
4970
4984
  ohne dass eine Satzgrenze erkannt wird
4971
4985
  (z.B. "am 13. Dezember" -> keine Satzgrenze) -->
4972
4986
  <rule break="no">
4973
- <beforebreak>\d+\.[\u00A0\s]</beforebreak>
4987
+ <beforebreak>\d+\.[\u00A0\s]{1,2}</beforebreak>
4974
4988
  <afterbreak>Januar|Jänner|Februar|März|Merz|April|Mai|Ju[ln]i|August|September|Oktober|November|Dezember</afterbreak>
4975
4989
  </rule>
4976
4990
  <rule break="no">
4977
- <beforebreak>\d+\.[\u00A0\s]</beforebreak>
4991
+ <beforebreak>\d+\.[\u00A0\s]{1,2}</beforebreak>
4978
4992
  <afterbreak>J[aä]n|Febr?|Mär|Apr|Mai|Ju[nl]|Aug|Sept?|Okt|Nov|Dez</afterbreak>
4979
4993
  </rule>
4980
4994
  <rule break="no">
4981
- <beforebreak>(Jan|Jän|Febr?|Mär|Apr|Mai|Ju[nl]|Aug|Sept?|Okt|Nov|Dez)\.[\u00A0\s]</beforebreak>
4995
+ <beforebreak>(Jan|Jän|Febr?|Mär|Apr|Mai|Ju[nl]|Aug|Sept?|Okt|Nov|Dez)\.[\u00A0\s]{1,2}</beforebreak>
4982
4996
  <afterbreak>\d\d(\d\d)?</afterbreak>
4983
4997
  </rule>
4984
4998
  <!-- ähnliche Fälle außerhalb der Monatsnamen -->
4985
4999
  <rule break="no">
4986
- <beforebreak>\d+\.[\u00A0\s]</beforebreak>
5000
+ <beforebreak>\d+\.[\u00A0\s]{1,2}</beforebreak>
4987
5001
  <afterbreak>Amtsperiode|Breitengrads?|Breitengrades|Jubiläum|Jhd?|Jhdts?|Konferenz|(Jahres|Partei)(-K|k)onferenz|Längengrade?s?|Tags?|Tages|(Jahres|Spiel|Partei|Geburts)tag|(Jahres|Spiel|Partei|Geburts)tages|(Jahres|Spiel|Partei|Geburts)tags|Jahrhunderts?|Jahrtausend|Platz|Platzes|Lebensjahrs?|Lebensjahres|Lochs?|Loches|Grads|Grades|Obergeschoss|Stock(werk)?s?|Etage|Klasse|Runde|Bezirk|Etappe|Staffel|Sinfonie</afterbreak>
4988
5002
  </rule>
4989
5003
  <!-- English abbreviations - but these work globally for all languages -->
4990
5004
  <rule break="no">
4991
- <beforebreak>\b(Mrs?|No|pp|St|no|Sr|Jr|[Ss]ek|Bros|etc|[Bb]tw|vs|esp|[Ff]ig|Jan|Feb|Mar|Apr|Ju[nl]|Aug|Sept?|O[ck]t|Nov|Dec|PhD|BSc|BEng|BComp|BArch|al|cf|Inc|Ms|MEng|MSc|MComp|Gen|Sen|Prof|Corp|Co|co|Ltd|Buchst)\.[\u00A0\s]</beforebreak>
5005
+ <beforebreak>\b(Mrs?|No|pp|St|no|Sr|Jr|[Ss]ek|Bros|etc|[Bb]tw|vs|esp|[Ff]ig|Jan|Feb|Mar|Apr|Ju[nl]|Aug|Sept?|O[ck]t|Nov|Dec|PhD|BSc|BEng|BComp|BArch|al|cf|Inc|Ms|MEng|MSc|MComp|Gen|Sen|Prof|Corp|Co|co|Ltd|Buchst)\.[\u00A0\s]{1,2}</beforebreak>
4992
5006
  <afterbreak></afterbreak>
4993
5007
  </rule>
4994
5008
  <!-- Latin abbreviations - but these work globally for all languages -->
4995
5009
  <rule break="no">
4996
- <beforebreak>\b(spp?)\.[\u00A0\s]</beforebreak>
5010
+ <beforebreak>\b(spp?)\.[\u00A0\s]{1,2}</beforebreak>
4997
5011
  <afterbreak></afterbreak>
4998
5012
  </rule>
4999
5013
  <!-- German abbreviations -->
5000
5014
  <rule break="no">
5001
- <beforebreak>\b(betr|Geb|Stk|ggü|Mag|mtl|versch|d|Übers|usw|Bzw|bzw|Ab[hkst]|abzgl|[Ll]tda|[Ee]inschl|[Vv]mtl|Ev|bezgl|Abzw|[Vv]sl|ahd|Akk|aktual|allg|alltagsspr|altdt|alttest|amerikan|Anh|Ank|Anm|Art|autom|Auftragsnr|Az|Bat|bayr|Bde?|bearb|Bed|Bem|bes|bez|Bez|Bhf|bspw|btto|bw|Dtl|Dez)\.[\u00A0\s]</beforebreak>
5015
+ <beforebreak>\b(betr|Geb|Stk|ggü|Mag|mtl|versch|[Ss]tellv|d|Übers|usw|[Bb]zw|Ab[hkst]|[Aa]bzü?gl|[Ll]tda|[Ee]inschl|[Vv]mtl|Ev|bezgl|Abzw|[Vv]sl|ahd|Akk|aktual|allg|alltagsspr|altdt|alttest|amerikan|Anh|Ank|Anm|Art|[Aa]utom|Auftragsnr|Az|Bat|bayr|Bde?|bearb|Bed|Bem|bes|bez|Bez|Bhf|bspw|btto|bw|Dtl|Dez)\.[\u00A0\s]{1,2}</beforebreak>
5002
5016
  <afterbreak></afterbreak>
5003
5017
  </rule>
5004
5018
  <rule break="no">
5005
- <beforebreak>\b(cts?|Ca|ca|chem|chin|Chr|cresc|dat|Dat|desgl|ders|dgl|Dipl|Dir?|Doz?|durchg|durchges|Dr|dt|ebd|Ed|eigtl|Eigtl|eigl|Eigl|akt|Engl|engl|Erg|al|et[cw]|Etw|ev(tl)?|Evtl|Evt|evt|exkl|Expl|Exz)\.[\u00A0\s]</beforebreak>
5019
+ <beforebreak>\b(cts?|[Cc]a|chem|chin|Chr|cresc|[Dd]at|desgl|ders|dgl|Dipl|Dir?|Doz?|durchg|durchges|Dr|dt|ebd|Ed|[Ee]igt?l|akt|[Ee]ngl|Erg|al|et[cw]|Etw|ev|[Ee]vtl?|exkl|Expl|Exz)\.[\u00A0\s]{1,2}</beforebreak>
5006
5020
  <afterbreak></afterbreak>
5007
5021
  </rule>
5008
5022
  <rule break="no">
5009
- <beforebreak>\bDipl\.-[A-Z][a-z]{2,4}\.[\u00A0\s]</beforebreak>
5023
+ <beforebreak>\bDipl\.-[A-Z][a-z]{2,4}\.[\u00A0\s]{1,2}</beforebreak>
5010
5024
  <afterbreak></afterbreak>
5011
5025
  </rule>
5012
5026
  <rule break="no">
@@ -5014,23 +5028,27 @@
5014
5028
  <afterbreak>\p{Ll}</afterbreak>
5015
5029
  </rule>
5016
5030
  <rule break="no">
5017
- <beforebreak>\b(ff|Fa|fachspr|fam|fem|Fem|Fr|franz|frz?|[Aa]ltfranz|frdl|Frl|Fut|Gd|gebr?|Gebr|geh|geleg|gen|Gen|germ|gesch|ges|get|ggf|Ggf|Ggs|ggT|Gr|[Gg]rds|griech)\.[\u00A0\s]</beforebreak>
5031
+ <beforebreak>\b(ff|Fa|fachspr|fam|fem|Fem|Fr|franz|frz?|[Aa]ltfranz|frdl|Frl|Fut|Gd|gebr?|Gebr|geh|geleg|gen|Gen|germ|gesch|ges|get|ggf|Ggf|Ggs|ggT|Gr|[Gg]rds|griech)\.[\u00A0\s]{1,2}</beforebreak>
5018
5032
  <afterbreak></afterbreak>
5019
5033
  </rule>
5020
5034
  <rule break="no">
5021
- <beforebreak>\b(hebr|hg|hl|Hrsg|Hg|hist|hochd|hochspr|Hptst|Hr|hrsg|Allg|IdNr|ill|inkl|incl|Ind|Inf|Ing|ital|Tr|jap|Jb|Jg|Jhd?|Jhdts?|jmd[mns]?|jur|Kap|kart|kath|kfm|kaufm|Kfm|kgl|Kl|Konj|königl|Krs?|Kto)\.[\u00A0\s]</beforebreak>
5035
+ <beforebreak>\b(hebr|hg|hl|Hrsg|Hg|hist|hochd|hochspr|Hptst|Hr|hrsg|Allg|IdNr|ill|inkl|incl|Ind|Inf|Ing|ital|Tr|jap|Jb|Jg|Jhd?|Jhdts?|jmd[mns]?|jur|Kap|kart|kath|kfm|kaufm|Kfm|kgl|Kl|Konj|königl|Krs?|Kto)\.[\u00A0\s]{1,2}</beforebreak>
5022
5036
  <afterbreak></afterbreak>
5023
5037
  </rule>
5024
5038
  <rule break="no">
5025
- <beforebreak>\b([A-ZÖÄÜ][a-zöäüß]+nr|tel|gem|Pat|prov|Betr|lat|lfd|Lit|lt|Lz|Mask|mask|max|Mrd|mdal|me[dt]|phil|mhd|Mio?|mind?|Mo|mod|nachm|nördlBr|neutr|Nhd|Nom|Nrn?|Num|Obj|od|dgl|offz)\.[\u00A0\s]</beforebreak>
5039
+ <beforebreak>\b([A-ZÖÄÜ][a-zöäüß]+nr|tel|[Gg]em|Pat|prov|Betr|lat|lfd|Lit|lt|Lz|Mask|mask|max|Mrd|mdal|me[dt]|phil|mhd|Mio?|mio|mind?|Mo|mod|nachm|nördlBr|neutr|Nhd|Nom|Nrn?|Num|Obj|od|dgl|offz)\.[\u00A0\s]{1,2}</beforebreak>
5026
5040
  <afterbreak></afterbreak>
5027
5041
  </rule>
5028
5042
  <rule break="no">
5029
- <beforebreak>\b(Part|Per[fs]|Pfd|Pl(ur)?|pl|Plusq|Pos|pp|Prä[ps]|Prät|Pro[vf]|rd|reg|resp|Rhld|rit|Sa|südl|Br|se[ln]|Sept|Sing|sign|So|sog|Sp|Std?|stacc|Str|stud|Subst|sva|svw|sZ)\.[\u00A0\s]</beforebreak>
5043
+ <beforebreak>\b(Part|Per[fs]|Pfd|Pl(ur)?|pl|Plusq|Pos|pp|Prä[ps]|Prät|Pro[vf]|rd|reg|resp|Rhld|rit|Sa|südl|Br|se[ln]|Sept|Sing|sign|So|sog|Sp|Std?|stacc|Str|stud|Subst|sva|svw|sZ)\.[\u00A0\s]{1,2}</beforebreak>
5030
5044
  <afterbreak></afterbreak>
5031
5045
  </rule>
5032
5046
  <rule break="no">
5033
- <beforebreak>\b(Tel|teilw|Temp|trans|Tsd|übertr|übl|ff|überarb|ugs|univ|unveränd|urspr|USt|UST|USt\-IdNr|[Aa][bn]schl|sw|kl|[Gg]r|vgl|vll|Vll|vlt|Vlt|vllt|Vllt|Vgl|Vol|vollst|vorm|Vp|Vs|vs|wesentl|wg|Whg|Hd|Ztr|zus|Zus|zzt?|zzgl|zB|zb|Zz|Zt|zw|Min|Bzgl|bzgl|bezügl|Frhr|ggfs|insb|autom|Mw[sS]t)\.[\u00A0\s]</beforebreak>
5047
+ <beforebreak>([A-ZÖÄÜ][a-zöäüß]+str)\.[\u00A0\s]{1,2}</beforebreak>
5048
+ <afterbreak>\p{Ll}</afterbreak>
5049
+ </rule>
5050
+ <rule break="no">
5051
+ <beforebreak>\b(Tel|teilw|Temp|trans|Tsd|übertr|übl|ff|überarb|ugs|univ|unveränd|urspr|USt|UST|USt\-IdNr|[Aa][bn]schl|sw|kl|[Gg]r|vgl|vll|Vll|vlt|Vlt|vllt|Vllt|Vgl|Vol|vollst|vorm|Vp|Vs|vs|wesentl|wg|Whg|Hd|Ztr|zus|Zus|zzt?|zzgl|zB|zb|Zz|Zt|zw|Min|Bzgl|bzgl|bezügl|Frhr|ggfs|insb|autom|Mw[sS]t)\.[\u00A0\s]{1,2}</beforebreak>
5034
5052
  <afterbreak></afterbreak>
5035
5053
  </rule>
5036
5054
  <!-- Break rules -->
@@ -5043,7 +5061,7 @@
5043
5061
  <afterbreak>\p{Lu}[^\p{Lu}]</afterbreak>
5044
5062
  </rule>
5045
5063
  <rule break="yes">
5046
- <beforebreak>[\u00A0\s]\p{L}[\.!?…][\u00A0\s]</beforebreak>
5064
+ <beforebreak>[\u00A0\s]\p{L}[\.!?…][\u00A0\s]{1,2}</beforebreak>
5047
5065
  <afterbreak>\p{Lu}\p{Ll}</afterbreak>
5048
5066
  </rule>
5049
5067
  <!-- z.B. 2 sentences: “Liebst du mich?” “Ja!” -->
@@ -5262,6 +5280,18 @@
5262
5280
  <beforebreak>[\s\u00A0]</beforebreak>
5263
5281
  <afterbreak>[»”’"'›]</afterbreak>
5264
5282
  </rule>
5283
+ <rule break="no">
5284
+ <beforebreak>ambass|cuil|p|liv|assoc|bibl|ENREG|al|phot|circ|concl|deb|dest|dupl|éd|écon|incl?|ital|jur|juris|jurispr|larg|lex|législ|longit|(?-i)RR|(?-i)ÉÉm|(?-i)EExc|métr|méd|néol|obs|plur|préf|prog|publ|trib|trim|suiv|(?-i)LL|env|élem|ér|ét|hon|hypexp|conj|coop|ch|alph|anglic|app|pr|collab|paragr|sect|para|commiss|coord|dép|dir|gér|secour|sén|gén|abrév|adj|adr|anon|append|av|auj|bibl|bibliogr|bdc|boul|bull|bur|caar|cat|cell|chap|cir|compl|cf|corres|dest|dict|div|dom|dr|édif|éd|électr|élém|encycl|fig|fl|graph|hist|hyp|ill|imm|imp|impr|incl|inc|ind|in[gtvf]|jur|lat|litt|liq|loc|liv|livr|méd|mém|pl|réd|rel|sc|suiv|sup|suppl|trad|univ|mus|pharm|soc|pol|compt|urb|act|confect|exp|réal|prov|introd|inv|tial|enr|ép|équiv|esp|étym|excl|exc|ap|arr|arch|adv|al|anc|angl|ann|gest|gouv|prés|rect|représ|resp|scrut|vol|coll|réf|id|sqq?|janv|fév|avr|juill|oct|nov|déc|admin</beforebreak>
5285
+ <afterbreak>\p{Ll}.*</afterbreak>
5286
+ </rule>
5287
+ <rule break="no">
5288
+ <beforebreak>\p{Ll}.*</beforebreak>
5289
+ <afterbreak>ambass|cuil|p|liv|assoc|bibl|oct|déc|jan|fév|avr|juil|sept|nov|ENREG|al|circ|concl|deb|dest|dupl|éd|écon|incl?|ital|jur|juris|jurispr|larg|lex|législ|longit|(?-i)RR|(?-i)ÉÉm|(?-i)EExc|métr|méd|néol|obs|plur|préf|prog|publ|trib|trim|suiv|(?-i)LL|env|élem|ér|ét|hon|hypexp|conj|coop|ch|alph|anglic|app|pr|collab|paragr|sect|para|commiss|coord|dép|dir|gér|secour|sén|gén|abrév|adj|adr|anon|append|av|auj|bibl|bibliogr|bdc|boul|bull|bur|caar|cat|cell|chap|cir|compl|cf|corres|dest|dict|div|dom|dr|édif|éd|électr|élém|encycl|fig|fl|graph|hist|hyp|ill|imm|imp|impr|incl|inc|ind|in[gtvf]|jur|lat|litt|liq|loc|liv|livr|méd|mém|pl|réd|rel|sc|suiv|sup|suppl|trad|univ|mus|pharm|soc|pol|compt|urb|act|confect|exp|réal|prov|introd|inv|tial|enr|ép|équiv|esp|étym|excl|exc|ap|arr|arch|adv|al|anc|angl|ann|gest|gouv|prés|rect|représ|resp|scrut|vol|coll|réf|id|sqq?|janv|fév|avr|juill|oct|nov|déc|admin</afterbreak>
5290
+ </rule>
5291
+ <rule break="no">
5292
+ <beforebreak>.*°C</beforebreak>
5293
+ <afterbreak>de</afterbreak>
5294
+ </rule>
5265
5295
  <rule break="yes">
5266
5296
  <beforebreak>[\.!?][\s\u00A0][»”’"'›][\s\u00A0]</beforebreak>
5267
5297
  <afterbreak>[«“‘‹"'\p{Lu}]</afterbreak>
@@ -5270,7 +5300,7 @@
5270
5300
  <beforebreak>Yahoo![\s\u00A0]</beforebreak>
5271
5301
  <afterbreak>\p{Ll}</afterbreak>
5272
5302
  </rule>
5273
- <!-- !? + lowercase -->
5303
+ <!-- !? + lowercase -->
5274
5304
  <rule break="no">
5275
5305
  <beforebreak>(\!|\?)[\s\u00A0]</beforebreak>
5276
5306
  <afterbreak>\p{Ll}</afterbreak>
@@ -5648,7 +5678,7 @@
5648
5678
  </rule>
5649
5679
  <!-- abbreviation with proper noun: проф. Грицько, о. Лісове -->
5650
5680
  <rule break="no">
5651
- <beforebreak>\b([Аа]кад|[Пп]роф|[Дд]оц|[Аа]сист|[Рр]еж|[Аа]рх|[Сс]вв?|о|ім|упоряд|чл\.-кор|[Пп]реп)\.[\h\v]*</beforebreak>
5681
+ <beforebreak>\b(ап|[Аа]кад|[Пп]роф|[Дд]оц|[Аа]сист|[Рр]еж|[Аа]рх|[Сс]вв?|о|оз|ім|інж|упоряд|чл\.-кор|[Пп]реп)\.[\h\v]*</beforebreak>
5652
5682
  <afterbreak>[\h\v]*[А-ЯІЇЄҐA-Z]</afterbreak>
5653
5683
  </rule>
5654
5684
  <rule break="no">
@@ -5996,7 +6026,7 @@
5996
6026
  </rule>
5997
6027
  <!-- Abbreviations that cannot finish sentences-->
5998
6028
  <rule break="no">
5999
- <beforebreak>\b(a|Ab|abrev|absol|acad|Açor|A\. ?D|add|adj|adv|advers|Aeron|afér|Agric|Álg|aprox|[Aa]rts?|Artilh|auxil|av|Av)\.\s?</beforebreak>
6029
+ <beforebreak>\b(a|Ab|abr|abrev|absol|acad|Açor|A\. ?D|add|adj|adv|advers|Aeron|afér|Agric|ago|Álg|aprox|[Aa]rts?|Artilh|auxil|av|Av)\.\s?</beforebreak>
6000
6030
  <afterbreak></afterbreak>
6001
6031
  </rule>
6002
6032
  <rule break="no">
@@ -6008,7 +6038,7 @@
6008
6038
  <afterbreak></afterbreak>
6009
6039
  </rule>
6010
6040
  <rule break="no">
6011
- <beforebreak>\b(D|def|dem|deprec|deriv|det|disj|[Dd]ra?s?)\.\s?</beforebreak>
6041
+ <beforebreak>\b(D|def|dem|deprec|deriv|det|dez|disj|[Dd]ra?s?)\.\s?</beforebreak>
6012
6042
  <afterbreak></afterbreak>
6013
6043
  </rule>
6014
6044
  <rule break="no">
@@ -6020,7 +6050,7 @@
6020
6050
  <afterbreak>\p{Ll}</afterbreak>
6021
6051
  </rule>
6022
6052
  <rule break="no">
6023
- <beforebreak>\b(f|fam|Farm|fem|fig|fin|fl|fr|frac)\.\s?</beforebreak>
6053
+ <beforebreak>\b(f|fam|Farm|fem|fev|fig|fin|fl|fr|frac)\.\s?</beforebreak>
6024
6054
  <afterbreak></afterbreak>
6025
6055
  </rule>
6026
6056
  <rule break="no">
@@ -6036,7 +6066,7 @@
6036
6066
  <afterbreak></afterbreak>
6037
6067
  </rule>
6038
6068
  <rule break="no">
6039
- <beforebreak>\b(Jorn|Jur)\.\s?</beforebreak>
6069
+ <beforebreak>\b(jan|jul|jun|Jorn|Jur)\.\s?</beforebreak>
6040
6070
  <afterbreak></afterbreak>
6041
6071
  </rule>
6042
6072
  <rule break="no">
@@ -6044,15 +6074,15 @@
6044
6074
  <afterbreak></afterbreak>
6045
6075
  </rule>
6046
6076
  <rule break="no">
6047
- <beforebreak>\b(m|masc|Mat|máx|Mecân|[Mm]ed|Mil|mín|mult|Mús)\.\s?</beforebreak>
6077
+ <beforebreak>\b(m|mai|mar|masc|Mat|máx|Mecân|[Mm]ed|Mil|mín|mult|Mús)\.\s?</beforebreak>
6048
6078
  <afterbreak></afterbreak>
6049
6079
  </rule>
6050
6080
  <rule break="no">
6051
- <beforebreak>\b(n|N|Náut|N.B|neg|neol|num|núm)\.\s?</beforebreak>
6081
+ <beforebreak>\b(n|N|Náut|N.B|neg|neol|nov|num|núm)\.\s?</beforebreak>
6052
6082
  <afterbreak></afterbreak>
6053
6083
  </rule>
6054
6084
  <rule break="no">
6055
- <beforebreak>\b(ord)\.\s?</beforebreak>
6085
+ <beforebreak>\b(ord|out)\.\s?</beforebreak>
6056
6086
  <afterbreak></afterbreak>
6057
6087
  </rule>
6058
6088
  <rule break="no">
@@ -6068,7 +6098,7 @@
6068
6098
  <afterbreak></afterbreak>
6069
6099
  </rule>
6070
6100
  <rule break="no">
6071
- <beforebreak>\b(S|S.A|símb|S. ?M|[Ss]ra?s?|[Ss]rta|suf|superl)\.\s?</beforebreak>
6101
+ <beforebreak>\b(S|S.A|set|símb|S. ?M|[Ss]ra?s?|[Ss]rta|suf|superl)\.\s?</beforebreak>
6072
6102
  <afterbreak></afterbreak>
6073
6103
  </rule>
6074
6104
  <rule break="no">
@@ -6090,7 +6120,7 @@
6090
6120
  <!-- s. XIX; s.IX; sec. XX; séc. XX -->
6091
6121
  <rule break="no">
6092
6122
  <beforebreak>\bs([eé]c)?\.\s?</beforebreak>
6093
- <afterbreak>[IVXVDMCL]+</afterbreak>
6123
+ <afterbreak>[IVXDMCL]+</afterbreak>
6094
6124
  </rule>
6095
6125
  <!-- English abbreviations - but these work globally for all languages -->
6096
6126
  <rule break="no">
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: srx-languagetool
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.7.0
4
+ version: 0.8.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Aaron Madlon-Kay
8
8
  autorequire:
9
9
  bindir: exe
10
10
  cert_chain: []
11
- date: 2022-07-04 00:00:00.000000000 Z
11
+ date: 2022-09-29 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: srx