srx-languagetool 0.10.0 → 0.11.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/CHANGELOG.md +4 -0
- data/Gemfile.lock +1 -1
- data/lib/srx/languagetool/version.rb +1 -1
- data/lib/srx/segment.srx +31 -3
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: e0a06f5751cf7cff07ccd1325c123c311e24d067e63a15cca3e0ee4e1c9fe9a4
|
4
|
+
data.tar.gz: c019c0245332deca27f493f0e8e5482cb60e5bd6e81783e594e7629a0b3e7edd
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 2e45b12a8d3c92acea434dec2cef44eb3c94020612c159db520147cd1b47a987b5a79742cc55fad93fbcdffde6c2594130ab75a4910cd8c2a17e2f99d45fe8d1
|
7
|
+
data.tar.gz: 87c2ed74cda5f578b79cc649f62c04e3c6b63ebeca07b6451cfb94ebe45ab16398c719828ca76d4258f92140ad8eb43c7f9ebd299e07f12b8839bb81fe34efe5
|
data/CHANGELOG.md
CHANGED
data/Gemfile.lock
CHANGED
data/lib/srx/segment.srx
CHANGED
@@ -5,7 +5,7 @@
|
|
5
5
|
<formathandle type="end" include="yes"></formathandle>
|
6
6
|
<formathandle type="isolated" include="no"></formathandle>
|
7
7
|
<okpsrx:options oneSegmentIncludesAll="no" trimLeadingWhitespaces="no" trimTrailingWhitespaces="no" useJavaRegex="yes" useIcu4JBreakRules="no" treatIsolatedCodesAsWhitespace="no"></okpsrx:options>
|
8
|
-
<okpsrx:sample language="nl" useMappedRules="yes">De
|
8
|
+
<okpsrx:sample language="nl" useMappedRules="yes">De les is in jul. en aug. op maandagavond.</okpsrx:sample>
|
9
9
|
<okpsrx:rangeRule></okpsrx:rangeRule>
|
10
10
|
</header>
|
11
11
|
<body>
|
@@ -1540,6 +1540,14 @@
|
|
1540
1540
|
</rule>
|
1541
1541
|
</languagerule>
|
1542
1542
|
<languagerule languagerulename="Dutch">
|
1543
|
+
<rule break="yes">
|
1544
|
+
<beforebreak>(^| )O\.\s</beforebreak>
|
1545
|
+
<afterbreak>([A-Z][a-z]{1,3}[ ,:;.!?]|Indië|Wanneer|Kunnen|Sorry)</afterbreak>
|
1546
|
+
</rule>
|
1547
|
+
<rule break="yes">
|
1548
|
+
<beforebreak>\sEd[.]\s</beforebreak>
|
1549
|
+
<afterbreak>([A-Z][a-z]{1,3}|Wanneer|Misschien|Daarna|Zoals|Zelfs|Bedankt|Zullen|Vooral|Volgens|Vervolgens)(\s|[,:;])</afterbreak>
|
1550
|
+
</rule>
|
1543
1551
|
<rule break="no">
|
1544
1552
|
<beforebreak>\b(sp|SP)</beforebreak>
|
1545
1553
|
<afterbreak>\.[aA]\b</afterbreak>
|
@@ -1645,6 +1653,14 @@
|
|
1645
1653
|
<beforebreak>\b(prov|pseud|psych|qty|red|ref|resp|soc|st|tab|tel|temp|prof|tk)\.\s</beforebreak>
|
1646
1654
|
<afterbreak></afterbreak>
|
1647
1655
|
</rule>
|
1656
|
+
<rule break="yes">
|
1657
|
+
<beforebreak>\sgraden C\.\s</beforebreak>
|
1658
|
+
<afterbreak>[A-Z]</afterbreak>
|
1659
|
+
</rule>
|
1660
|
+
<rule break="yes">
|
1661
|
+
<beforebreak>°C\.\s</beforebreak>
|
1662
|
+
<afterbreak>[A-Z][a-z]</afterbreak>
|
1663
|
+
</rule>
|
1648
1664
|
<rule break="no">
|
1649
1665
|
<beforebreak>\b([A-Z]|Adr|Chr|Fr|Fred|IJ|Jac|Joh|Ph|St|Th|Tj|v|v\.(\s)?d)\.(\s)?</beforebreak>
|
1650
1666
|
<afterbreak>\p{Lu}</afterbreak>
|
@@ -1693,6 +1709,10 @@
|
|
1693
1709
|
<beforebreak>\b\p{L}\.</beforebreak>
|
1694
1710
|
<afterbreak>\p{L}\.</afterbreak>
|
1695
1711
|
</rule>
|
1712
|
+
<rule break="yes">
|
1713
|
+
<beforebreak>\sik\.\s</beforebreak>
|
1714
|
+
<afterbreak>ik\s</afterbreak>
|
1715
|
+
</rule>
|
1696
1716
|
<rule break="no">
|
1697
1717
|
<beforebreak>[\.\s]\p{L}{1,2}\.\s</beforebreak>
|
1698
1718
|
<afterbreak>[\p{N}\p{Ll}]</afterbreak>
|
@@ -1746,6 +1766,14 @@
|
|
1746
1766
|
<beforebreak>\s[A-Z].+!\s</beforebreak>
|
1747
1767
|
<afterbreak>[a-z]</afterbreak>
|
1748
1768
|
</rule>
|
1769
|
+
<rule break="no">
|
1770
|
+
<beforebreak>\b(jan|mrt|mar|jun|jul|aug|sept|okt|sep|spt|nov|dec|.*opp)\.\s</beforebreak>
|
1771
|
+
<afterbreak>[a-z]</afterbreak>
|
1772
|
+
</rule>
|
1773
|
+
<rule break="no">
|
1774
|
+
<beforebreak>Groen!\s</beforebreak>
|
1775
|
+
<afterbreak>[a-z]</afterbreak>
|
1776
|
+
</rule>
|
1749
1777
|
<rule break="yes">
|
1750
1778
|
<beforebreak>[.!?…][’'"\u00BB\u2019\u201D\u203A\u00AB\p{Pe}\u0002¹²³]*\s</beforebreak>
|
1751
1779
|
<afterbreak></afterbreak>
|
@@ -5030,7 +5058,7 @@
|
|
5030
5058
|
</rule>
|
5031
5059
|
<!-- German abbreviations -->
|
5032
5060
|
<rule break="no">
|
5033
|
-
<beforebreak>\b(betr|Geb|Stk|ggü|Mag|mtl|[Pp]arl|Bsp|versch|[Ss]tellv|d|Übers|usw|[Bb]zw|Ab[hkst]|[Aa]bzü?gl|[Ll]tda|[Ee]inschl|[Vv]mtl|Ev|bezgl|Abzw|[Vv]sl|ahd|Akk|aktual|[Öö]ffentl|prof|allg|alltagsspr|altdt|alttest|amerikan|Anh|Ank|Anm|Art|[Aa]utom|Auftragsnr|Az|Bat|bayr|Bde?|bearb|Bed|Bem|bes|bez|Bez|Bhf|bspw|btto|bw|Dtl|Dez)\.[\u00A0\s]{1,2}</beforebreak>
|
5061
|
+
<beforebreak>\b(betr|Geb|Stk|ggü|Mag|mtl|[Pp]arl|Bsp|versch|[Dd]iesbzgl|[Dd]bzgl|[Ss]tellv|d|Übers|usw|[Bb]zw|Ab[hkst]|[Aa]bzü?gl|\d+-tlg|tlg|ggfls|[Ll]tda|[Ee]inschl|[Vv]mtl|Ev|bezgl|lit|Abzw|[Vv]sl|ahd|Akk|aktual|[Öö]ffentl|prof|allg|alltagsspr|altdt|alttest|amerikan|Anh|Ank|Anm|Art|[Aa]utom|Auftragsnr|Az|Bat|bayr|Bde?|bearb|Bed|Bem|bes|bez|Bez|Bhf|Blvd|bspw|btto|bw|Dtl|Dez|[Jj]gdfr|[Ee]ff)\.[\u00A0\s]{1,2}</beforebreak>
|
5034
5062
|
<afterbreak></afterbreak>
|
5035
5063
|
</rule>
|
5036
5064
|
<rule break="no">
|
@@ -6568,7 +6596,7 @@
|
|
6568
6596
|
</rule>
|
6569
6597
|
<!-- German abbreviations -->
|
6570
6598
|
<rule break="no">
|
6571
|
-
<beforebreak>\b(versch|d|Übers|usw|Ab[hkts]|ahd|Akk|aktual|allg|alltagsspr|altdt|alttest|amerikan|Anh|Ank|Anm|Art|Az|Bat|bayr|Bd|Bde|bearb|Bed|Bem|bes|bez|Bez|Bhf|bspw|btto|bw|bzw)\.\s</beforebreak>
|
6599
|
+
<beforebreak>\b(versch|d|Übers|usw|Ab[hkts]|ahd|Akk|aktual|allg|alltagsspr|altdt|alttest|amerikan|Anh|Ank|Anm|Art|Az|Bat|bayr|Bd|Bde|bearb|Bed|Bem|bes|bez|Bez|Bhf|bspw|btto|bw|bzw|pot)\.\s</beforebreak>
|
6572
6600
|
<afterbreak></afterbreak>
|
6573
6601
|
</rule>
|
6574
6602
|
<!--Српске скраћенице-->
|
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: srx-languagetool
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.10.0
|
4
|
+
version: 0.11.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Aaron Madlon-Kay
|
8
8
|
autorequire:
|
9
9
|
bindir: exe
|
10
10
|
cert_chain: []
|
11
|
-
date: 2023-03
|
11
|
+
date: 2023-07-03 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: srx
|