anystyle-parser 0.4.4 → 0.4.5
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/HISTORY.md +2 -2
- data/lib/anystyle/parser/parser.rb +4 -9
- data/lib/anystyle/parser/version.rb +1 -1
- metadata +1 -1
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: bc18ecd238c51394c2a34f8ec45c9ece02eaaeeb
|
4
|
+
data.tar.gz: 7e26461b65683e798ca4a6e166d1691d6ff2db7a
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: a6afa20d3b20068d49d773c90677a8a4f815e05b86e9cf50c0bf32489a8e51c7b51d7358389ad6bca3d628c81f4d30ab4ab8e7406bef73bc07de26c77d427ac6
|
7
|
+
data.tar.gz: 6ecaaa31b450b68fdcc5fd04b5d34dbca250604408163a482e783cf6d70061fba9a0cd56220fbb5ebcb8a66befd6cc320385970f4d58bcf0555de622024c9591
|
data/HISTORY.md
CHANGED
(diff body not captured)
data/lib/anystyle/parser/parser.rb
CHANGED
@@ -63,9 +63,7 @@ module Anystyle
|
|
63
63
|
|
64
64
|
# Returns an array of label/segment pairs for each line in the passed-in string.
|
65
65
|
def label(input, labelled = false)
|
66
|
-
|
67
|
-
|
68
|
-
model.label(prepare(string, labelled)).map! do |sequence|
|
66
|
+
model.label(prepare(input, labelled)).map! do |sequence|
|
69
67
|
sequence.inject([]) do |ts, (token, label)|
|
70
68
|
token, label = token[/^\S+/], label.to_sym
|
71
69
|
if (prev = ts[-1]) && prev[0] == label
|
@@ -139,14 +137,12 @@ module Anystyle
|
|
139
137
|
end
|
140
138
|
|
141
139
|
def train(input = options[:training_data], truncate = true)
|
142
|
-
string = input_to_s(input)
|
143
|
-
|
144
140
|
if truncate
|
145
141
|
@model = Wapiti::Model.new(options.reject { |k,_| k == :model })
|
146
142
|
end
|
147
143
|
|
148
|
-
unless
|
149
|
-
@model.train(prepare(
|
144
|
+
unless input.nil? || input.empty?
|
145
|
+
@model.train(prepare(input, true))
|
150
146
|
end
|
151
147
|
|
152
148
|
@model.path = options[:model]
|
@@ -161,9 +157,8 @@ module Anystyle
|
|
161
157
|
end
|
162
158
|
|
163
159
|
def test(input)
|
164
|
-
string = input_to_s(input)
|
165
160
|
model.options.check!
|
166
|
-
model.label(prepare(
|
161
|
+
model.label(prepare(input, true))
|
167
162
|
end
|
168
163
|
|
169
164
|
def normalize(hash)
|