pragmatic_segmenter_server 0.0.2 → 0.0.4

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
- SHA1:
3
- metadata.gz: 21b427165d4f9fc6809d1b7fc54ce4deb2471965
4
- data.tar.gz: 5aa4b6fff20a032d79ca12841e2c1c8209784e05
2
+ SHA256:
3
+ metadata.gz: cbbfa81ea6f9f89d46a43592d074b1dfce290e92025df05dfa404c834ba823d5
4
+ data.tar.gz: a8a5de048c216ed3e8714a51268301013e839962d04681323f0c2d9693735cd9
5
5
  SHA512:
6
- metadata.gz: 67f0ace7f6000cadeee63268481e7e8568b2cadc9f8c9aba3acae2d52b1659456a46f9e4245e78e55f9418add4de84442084c3bf52a6dc80eccfc0d1f90a768f
7
- data.tar.gz: 5e9330d0e2c943f1d49d4cdc6de30eef2985d9b5f638c8801e5e6d6e14a33cd3c5e06af30d654f94c9c2dfb8973456955c68ac41480c74834f2ca8bf2fc08122
6
+ metadata.gz: 26bf50391aa511334e76690fce663b9b405f66e4ef31b691afce77cfcc10c20d98487441bd979a0bcc5620d2d27903471b0e7743c9c702d370361c46aa007c69
7
+ data.tar.gz: 6efc4d1754da81a31a27b80bf290f697d4ab09896a729136587438a12ebc75ebcac9533fca477f13ab39d3f8f4274f1cbba6e884333419d8acc4c94f20308606
@@ -2,6 +2,7 @@ require 'pragmatic_segmenter'
2
2
 
3
3
 
4
4
  def segment(text, lang, segmentByNewline)
5
+
5
6
  newLineRegex = /((?: *[\n\r\t]+ *)+)/
6
7
  mask = ''
7
8
  segments = []
@@ -11,17 +12,22 @@ def segment(text, lang, segmentByNewline)
11
12
  else
12
13
  textParts = [text]
13
14
  end
14
-
15
+
15
16
  textParts.each do |textPart|
16
17
  if segmentByNewline && textPart.match(newLineRegex)
17
18
  mask += textPart
18
19
  else
20
+ if textPart == ""
21
+ next
22
+ end
19
23
  ps = PragmaticSegmenter::Segmenter.new(text: textPart, language: lang, clean:false)
20
24
  ps.segment.each do |segment|
21
25
  segments.push(segment)
22
26
  end
23
27
  mask += textPart.gsub(Regexp.new(ps.segment.map { |string| Regexp.escape(string) }.join("|")), "{}")
28
+
24
29
  end
30
+
25
31
  end
26
32
 
27
33
  return segments, mask
@@ -61,5 +61,5 @@ post '/segment' do
61
61
  })
62
62
  end
63
63
 
64
- puts results.to_json
64
+ results.to_json
65
65
  end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: pragmatic_segmenter_server
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.0.2
4
+ version: 0.0.4
5
5
  platform: ruby
6
6
  authors:
7
7
  - Laurent Bié
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2020-01-07 00:00:00.000000000 Z
11
+ date: 2023-01-26 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: sinatra
@@ -66,7 +66,7 @@ dependencies:
66
66
  - - '='
67
67
  - !ruby/object:Gem::Version
68
68
  version: 0.3.18
69
- description: A HTTP server for pragmatic segmenter
69
+ description: An HTTP server for pragmatic segmenter
70
70
  email: l.bie@pangeanic.com
71
71
  executables: []
72
72
  extensions: []
@@ -93,8 +93,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
93
93
  - !ruby/object:Gem::Version
94
94
  version: '0'
95
95
  requirements: []
96
- rubyforge_project:
97
- rubygems_version: 2.5.2.1
96
+ rubygems_version: 3.1.2
98
97
  signing_key:
99
98
  specification_version: 4
100
99
  summary: A server for pragmatic segmenter