treat 0.2.0 → 0.2.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (45)
  1. data/TODO +3 -0
  2. data/lib/economist/hungarys_troubles.txt +46 -0
  3. data/lib/economist/indias_slowdown.txt +15 -0
  4. data/lib/economist/merkozy_rides_again.txt +24 -0
  5. data/lib/economist/prada_is_not_walmart.txt +9 -0
  6. data/lib/ferret/_11.cfs +0 -0
  7. data/lib/ferret/_14.cfs +0 -0
  8. data/lib/ferret/_p.cfs +0 -0
  9. data/lib/ferret/_s.cfs +0 -0
  10. data/lib/ferret/_v.cfs +0 -0
  11. data/lib/ferret/_y.cfs +0 -0
  12. data/lib/ferret/segments +0 -0
  13. data/lib/ferret/segments_15 +0 -0
  14. data/lib/treat/buildable.rb +10 -4
  15. data/lib/treat/categories.rb +2 -1
  16. data/lib/treat/delegatable.rb +2 -1
  17. data/lib/treat/doable.rb +3 -2
  18. data/lib/treat/entities/collection.rb +2 -9
  19. data/lib/treat/entities/entity.rb +13 -14
  20. data/lib/treat/entities.rb +5 -4
  21. data/lib/treat/extractors/coreferences/stanford.rb +1 -0
  22. data/lib/treat/extractors/topic_words/lda.rb +2 -15
  23. data/lib/treat/formatters/readers/autoselect.rb +0 -1
  24. data/lib/treat/formatters/unserializers/yaml.rb +2 -0
  25. data/lib/treat/formatters.rb +0 -7
  26. data/lib/treat/group.rb +4 -2
  27. data/lib/treat/languages/english.rb +1 -1
  28. data/lib/treat/lexicalizers/tag/brill.rb +17 -15
  29. data/lib/treat/lexicalizers/tag/lingua.rb +11 -6
  30. data/lib/treat/lexicalizers/tag/stanford.rb +28 -36
  31. data/lib/treat/lexicalizers.rb +1 -2
  32. data/lib/treat/processors/parsers/enju.rb +7 -5
  33. data/lib/treat/processors/parsers/stanford.rb +3 -1
  34. data/lib/treat/retrievers/indexers/ferret.rb +28 -0
  35. data/lib/treat/retrievers/searchers/ferret.rb +53 -0
  36. data/lib/treat/retrievers.rb +17 -0
  37. data/lib/treat/visitable.rb +1 -1
  38. data/lib/treat.rb +17 -16
  39. metadata +50 -30
  40. data/lib/economist/hose_and_dry.doc +0 -0
  41. data/lib/economist/hungarys_troubles.abw +0 -70
  42. data/lib/economist/republican_nomination.pdf +0 -0
  43. data/lib/economist/saving_the_euro.odt +0 -0
  44. data/lib/economist/zero_sum.html +0 -91
  45. data/lib/treat/lexicalizers/tag/tagger.rb +0 -29
@@ -1,29 +0,0 @@
1
- module Treat
2
- module Lexicalizers
3
- module Tag
4
- class Tagger
5
- def self.tag(entity, options = {})
6
- if (entity.is_a?(Treat::Entities::Sentence) ||
7
- entity.is_a?(Treat::Entities::Phrase)) &&
8
- !entity.has_children?
9
- raise Treat::Exception,
10
- "Annotator 'tag' requires processor 'tokenize'."
11
- elsif entity.is_a?(Treat::Entities::Word)
12
- if entity.has_parent?
13
- ps = entity.parent_sentence
14
- pp = entity.parent_phrase
15
- if ps
16
- self.tag(ps, options)
17
- elsif pp
18
- self.tag(pp, options)
19
- end
20
- return entity.features[:tag]
21
- else
22
- return :isolated_word
23
- end
24
- end
25
- end
26
- end
27
- end
28
- end
29
- end