treat 0.2.0 → 0.2.5

Sign up to get free protection for your applications and to get access to all the features.
Files changed (45)
  1. data/TODO +3 -0
  2. data/lib/economist/hungarys_troubles.txt +46 -0
  3. data/lib/economist/indias_slowdown.txt +15 -0
  4. data/lib/economist/merkozy_rides_again.txt +24 -0
  5. data/lib/economist/prada_is_not_walmart.txt +9 -0
  6. data/lib/ferret/_11.cfs +0 -0
  7. data/lib/ferret/_14.cfs +0 -0
  8. data/lib/ferret/_p.cfs +0 -0
  9. data/lib/ferret/_s.cfs +0 -0
  10. data/lib/ferret/_v.cfs +0 -0
  11. data/lib/ferret/_y.cfs +0 -0
  12. data/lib/ferret/segments +0 -0
  13. data/lib/ferret/segments_15 +0 -0
  14. data/lib/treat/buildable.rb +10 -4
  15. data/lib/treat/categories.rb +2 -1
  16. data/lib/treat/delegatable.rb +2 -1
  17. data/lib/treat/doable.rb +3 -2
  18. data/lib/treat/entities/collection.rb +2 -9
  19. data/lib/treat/entities/entity.rb +13 -14
  20. data/lib/treat/entities.rb +5 -4
  21. data/lib/treat/extractors/coreferences/stanford.rb +1 -0
  22. data/lib/treat/extractors/topic_words/lda.rb +2 -15
  23. data/lib/treat/formatters/readers/autoselect.rb +0 -1
  24. data/lib/treat/formatters/unserializers/yaml.rb +2 -0
  25. data/lib/treat/formatters.rb +0 -7
  26. data/lib/treat/group.rb +4 -2
  27. data/lib/treat/languages/english.rb +1 -1
  28. data/lib/treat/lexicalizers/tag/brill.rb +17 -15
  29. data/lib/treat/lexicalizers/tag/lingua.rb +11 -6
  30. data/lib/treat/lexicalizers/tag/stanford.rb +28 -36
  31. data/lib/treat/lexicalizers.rb +1 -2
  32. data/lib/treat/processors/parsers/enju.rb +7 -5
  33. data/lib/treat/processors/parsers/stanford.rb +3 -1
  34. data/lib/treat/retrievers/indexers/ferret.rb +28 -0
  35. data/lib/treat/retrievers/searchers/ferret.rb +53 -0
  36. data/lib/treat/retrievers.rb +17 -0
  37. data/lib/treat/visitable.rb +1 -1
  38. data/lib/treat.rb +17 -16
  39. metadata +50 -30
  40. data/lib/economist/hose_and_dry.doc +0 -0
  41. data/lib/economist/hungarys_troubles.abw +0 -70
  42. data/lib/economist/republican_nomination.pdf +0 -0
  43. data/lib/economist/saving_the_euro.odt +0 -0
  44. data/lib/economist/zero_sum.html +0 -91
  45. data/lib/treat/lexicalizers/tag/tagger.rb +0 -29
@@ -1,29 +0,0 @@
1
- module Treat
2
- module Lexicalizers
3
- module Tag
4
- class Tagger
5
- def self.tag(entity, options = {})
6
- if (entity.is_a?(Treat::Entities::Sentence) ||
7
- entity.is_a?(Treat::Entities::Phrase)) &&
8
- !entity.has_children?
9
- raise Treat::Exception,
10
- "Annotator 'tag' requires processor 'tokenize'."
11
- elsif entity.is_a?(Treat::Entities::Word)
12
- if entity.has_parent?
13
- ps = entity.parent_sentence
14
- pp = entity.parent_phrase
15
- if ps
16
- self.tag(ps, options)
17
- elsif pp
18
- self.tag(pp, options)
19
- end
20
- return entity.features[:tag]
21
- else
22
- return :isolated_word
23
- end
24
- end
25
- end
26
- end
27
- end
28
- end
29
- end