anystyle-parser 0.4.4 → 0.4.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/HISTORY.md +2 -2
- data/lib/anystyle/parser/parser.rb +4 -9
- data/lib/anystyle/parser/version.rb +1 -1
- metadata +1 -1
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: bc18ecd238c51394c2a34f8ec45c9ece02eaaeeb
|
4
|
+
data.tar.gz: 7e26461b65683e798ca4a6e166d1691d6ff2db7a
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: a6afa20d3b20068d49d773c90677a8a4f815e05b86e9cf50c0bf32489a8e51c7b51d7358389ad6bca3d628c81f4d30ab4ab8e7406bef73bc07de26c77d427ac6
|
7
|
+
data.tar.gz: 6ecaaa31b450b68fdcc5fd04b5d34dbca250604408163a482e783cf6d70061fba9a0cd56220fbb5ebcb8a66befd6cc320385970f4d58bcf0555de622024c9591
|
data/HISTORY.md
CHANGED
data/lib/anystyle/parser/parser.rb
CHANGED
@@ -63,9 +63,7 @@ module Anystyle
|
|
63
63
|
|
64
64
|
# Returns an array of label/segment pairs for each line in the passed-in string.
|
65
65
|
def label(input, labelled = false)
|
66
|
-
|
67
|
-
|
68
|
-
model.label(prepare(string, labelled)).map! do |sequence|
|
66
|
+
model.label(prepare(input, labelled)).map! do |sequence|
|
69
67
|
sequence.inject([]) do |ts, (token, label)|
|
70
68
|
token, label = token[/^\S+/], label.to_sym
|
71
69
|
if (prev = ts[-1]) && prev[0] == label
|
@@ -139,14 +137,12 @@ module Anystyle
|
|
139
137
|
end
|
140
138
|
|
141
139
|
def train(input = options[:training_data], truncate = true)
|
142
|
-
string = input_to_s(input)
|
143
|
-
|
144
140
|
if truncate
|
145
141
|
@model = Wapiti::Model.new(options.reject { |k,_| k == :model })
|
146
142
|
end
|
147
143
|
|
148
|
-
unless string.empty?
|
149
|
-
@model.train(prepare(string, true))
|
144
|
+
unless input.nil? || input.empty?
|
145
|
+
@model.train(prepare(input, true))
|
150
146
|
end
|
151
147
|
|
152
148
|
@model.path = options[:model]
|
@@ -161,9 +157,8 @@ module Anystyle
|
|
161
157
|
end
|
162
158
|
|
163
159
|
def test(input)
|
164
|
-
string = input_to_s(input)
|
165
160
|
model.options.check!
|
166
|
-
model.label(prepare(string, true))
|
161
|
+
model.label(prepare(input, true))
|
167
162
|
end
|
168
163
|
|
169
164
|
def normalize(hash)
|