treat 0.2.0 → 0.2.5
Sign up to get free protection for your applications and to get access to all the features.
- data/TODO +3 -0
- data/lib/economist/hungarys_troubles.txt +46 -0
- data/lib/economist/indias_slowdown.txt +15 -0
- data/lib/economist/merkozy_rides_again.txt +24 -0
- data/lib/economist/prada_is_not_walmart.txt +9 -0
- data/lib/ferret/_11.cfs +0 -0
- data/lib/ferret/_14.cfs +0 -0
- data/lib/ferret/_p.cfs +0 -0
- data/lib/ferret/_s.cfs +0 -0
- data/lib/ferret/_v.cfs +0 -0
- data/lib/ferret/_y.cfs +0 -0
- data/lib/ferret/segments +0 -0
- data/lib/ferret/segments_15 +0 -0
- data/lib/treat/buildable.rb +10 -4
- data/lib/treat/categories.rb +2 -1
- data/lib/treat/delegatable.rb +2 -1
- data/lib/treat/doable.rb +3 -2
- data/lib/treat/entities/collection.rb +2 -9
- data/lib/treat/entities/entity.rb +13 -14
- data/lib/treat/entities.rb +5 -4
- data/lib/treat/extractors/coreferences/stanford.rb +1 -0
- data/lib/treat/extractors/topic_words/lda.rb +2 -15
- data/lib/treat/formatters/readers/autoselect.rb +0 -1
- data/lib/treat/formatters/unserializers/yaml.rb +2 -0
- data/lib/treat/formatters.rb +0 -7
- data/lib/treat/group.rb +4 -2
- data/lib/treat/languages/english.rb +1 -1
- data/lib/treat/lexicalizers/tag/brill.rb +17 -15
- data/lib/treat/lexicalizers/tag/lingua.rb +11 -6
- data/lib/treat/lexicalizers/tag/stanford.rb +28 -36
- data/lib/treat/lexicalizers.rb +1 -2
- data/lib/treat/processors/parsers/enju.rb +7 -5
- data/lib/treat/processors/parsers/stanford.rb +3 -1
- data/lib/treat/retrievers/indexers/ferret.rb +28 -0
- data/lib/treat/retrievers/searchers/ferret.rb +53 -0
- data/lib/treat/retrievers.rb +17 -0
- data/lib/treat/visitable.rb +1 -1
- data/lib/treat.rb +17 -16
- metadata +50 -30
- data/lib/economist/hose_and_dry.doc +0 -0
- data/lib/economist/hungarys_troubles.abw +0 -70
- data/lib/economist/republican_nomination.pdf +0 -0
- data/lib/economist/saving_the_euro.odt +0 -0
- data/lib/economist/zero_sum.html +0 -91
- data/lib/treat/lexicalizers/tag/tagger.rb +0 -29
@@ -1,29 +0,0 @@
module Treat
  module Lexicalizers
    module Tag
      # Precondition checks and word-level delegation for the 'tag' annotator.
      #
      # NOTE(review): concrete taggers presumably subclass this and call
      # +super+ before doing the actual tagging -- confirm against callers.
      class Tagger
        # Validates that +entity+ can be tagged and, for a word, delegates
        # tagging to its enclosing sentence or phrase.
        #
        # @param entity the entity to tag; only Sentence, Phrase and Word
        #   entities are treated specially here.
        # @param options [Hash] not inspected here; only forwarded on the
        #   recursive call.
        # @return [Object, nil] for a word with a parent, whatever is stored
        #   under +features[:tag]+ after delegation (may be nil);
        #   +:isolated_word+ for a word without a parent; nil otherwise.
        # @raise [Treat::Exception] if a sentence or phrase has no children.
        def self.tag(entity, options = {})
          if (entity.is_a?(Treat::Entities::Sentence) ||
              entity.is_a?(Treat::Entities::Phrase)) &&
             !entity.has_children?
            raise Treat::Exception,
                  "Annotator 'tag' requires processor 'tokenize'."
          end

          return unless entity.is_a?(Treat::Entities::Word)
          return :isolated_word unless entity.has_parent?

          # Both lookups are performed up front, sentence first, and the
          # sentence wins when both are present.
          sentence = entity.parent_sentence
          phrase = entity.parent_phrase
          container = sentence || phrase

          # Dispatched through the receiver, so an overriding subclass's
          # own +tag+ is the one that gets re-entered.
          tag(container, options) if container

          entity.features[:tag]
        end
      end
    end
  end
end